diff --git "a/wandb/run-20220328_170142-by95ehra/files/wandb-summary.json" "b/wandb/run-20220328_170142-by95ehra/files/wandb-summary.json" --- "a/wandb/run-20220328_170142-by95ehra/files/wandb-summary.json" +++ "b/wandb/run-20220328_170142-by95ehra/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.1177, "train/learning_rate": 5.557377049180327e-05, "train/epoch": 9.01, "train/global_step": 1000, "_runtime": 23313, "_timestamp": 1648510215, "_step": 1001, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 4.0, 11.0, 12.0, 20.0, 24.0, 32.0, 39.0, 71.0, 74.0, 94.0, 117.0, 103.0, 81.0, 77.0, 69.0, 54.0, 32.0, 26.0, 18.0, 10.0, 14.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6982321739196777, -1.651377558708191, -1.604522943496704, -1.5576683282852173, -1.5108137130737305, -1.4639590978622437, -1.4171044826507568, -1.37024986743927, -1.3233952522277832, -1.2765406370162964, -1.2296860218048096, -1.1828314065933228, -1.135976791381836, -1.0891221761703491, -1.0422675609588623, -0.9954129457473755, -0.9485583305358887, -0.9017037153244019, -0.854849100112915, -0.8079944849014282, -0.7611398696899414, -0.7142852544784546, -0.6674306392669678, -0.620576024055481, -0.5737214088439941, -0.5268667936325073, -0.4800121784210205, -0.4331575632095337, -0.3863029479980469, -0.33944833278656006, -0.29259371757507324, -0.24573910236358643, -0.19888460636138916, -0.15202999114990234, -0.10517537593841553, -0.05832076072692871, -0.011466145515441895, 0.03538846969604492, 0.08224308490753174, 0.12909770011901855, 0.17595231533050537, 0.2228069305419922, 0.269661545753479, 0.3165161609649658, 0.36337077617645264, 0.41022539138793945, 0.45708000659942627, 0.5039346218109131, 0.5507892370223999, 0.5976438522338867, 0.6444984674453735, 0.6913530826568604, 0.7382076978683472, 0.785062313079834, 0.8319169282913208, 0.8787715435028076, 0.9256261587142944, 0.9724807739257812, 1.019335389137268, 1.0661900043487549, 1.1130446195602417, 1.1598992347717285, 1.2067538499832153, 1.2536084651947021, 1.300463080406189]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 11.0, 6.0, 10.0, 15.0, 18.0, 19.0, 18.0, 17.0, 31.0, 24.0, 42.0, 24.0, 37.0, 26.0, 42.0, 31.0, 38.0, 47.0, 29.0, 31.0, 33.0, 45.0, 35.0, 46.0, 32.0, 38.0, 24.0, 29.0, 27.0, 27.0, 24.0, 15.0, 16.0, 12.0, 16.0, 14.0, 12.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.7940231561660767, -0.7693271636962891, -0.7446311712265015, -0.7199351787567139, -0.6952391862869263, -0.6705431938171387, -0.6458472013473511, -0.6211512088775635, -0.5964552164077759, -0.5717592239379883, -0.5470632314682007, -0.5223672389984131, -0.4976712465286255, -0.4729752540588379, -0.4482792615890503, -0.4235832691192627, -0.3988872766494751, -0.3741912841796875, -0.3494952917098999, -0.3247992992401123, -0.3001033067703247, -0.2754073143005371, -0.2507113218307495, -0.22601532936096191, -0.20131933689117432, -0.17662334442138672, -0.15192735195159912, -0.12723135948181152, -0.10253536701202393, -0.07783937454223633, -0.05314338207244873, -0.028447389602661133, -0.0037513375282287598, 0.020944654941558838, 0.045640647411346436, 0.07033663988113403, 0.09503263235092163, 0.11972862482070923, 0.14442461729049683, 0.16912060976028442, 0.19381660223007202, 0.21851259469985962, 0.24320858716964722, 0.2679045796394348, 0.2926005721092224, 0.31729656457901, 0.3419925570487976, 0.3666885495185852, 0.3913845419883728, 0.4160805344581604, 0.440776526927948, 0.4654725193977356, 0.4901685118675232, 0.5148645043373108, 0.5395604968070984, 0.564256489276886, 0.5889524817466736, 0.6136484742164612, 0.6383444666862488, 0.6630404591560364, 0.687736451625824, 0.7124324440956116, 0.7371284365653992, 0.7618244290351868, 0.7865204215049744]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [4.0, 3.0, 5.0, 2.0, 8.0, 6.0, 11.0, 18.0, 13.0, 32.0, 34.0, 69.0, 81.0, 108.0, 143.0, 216.0, 333.0, 489.0, 724.0, 1109.0, 1788.0, 2812.0, 5143.0, 11100.0, 35137.0, 253462.0, 1494864.0, 1929695.0, 381752.0, 49243.0, 12019.0, 5573.0, 3088.0, 1833.0, 1142.0, 771.0, 406.0, 331.0, 220.0, 153.0, 105.0, 72.0, 55.0, 38.0, 15.0, 28.0, 13.0, 14.0, 9.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.755859375, -2.654144287109375, -2.55242919921875, -2.450714111328125, -2.3489990234375, -2.247283935546875, -2.14556884765625, -2.043853759765625, -1.942138671875, -1.840423583984375, -1.73870849609375, -1.636993408203125, -1.5352783203125, -1.433563232421875, -1.33184814453125, -1.230133056640625, -1.12841796875, -1.026702880859375, -0.92498779296875, -0.823272705078125, -0.7215576171875, -0.619842529296875, -0.51812744140625, -0.416412353515625, -0.314697265625, -0.212982177734375, -0.11126708984375, -0.009552001953125, 0.0921630859375, 0.193878173828125, 0.29559326171875, 0.397308349609375, 0.4990234375, 0.600738525390625, 0.70245361328125, 0.804168701171875, 0.9058837890625, 1.007598876953125, 1.10931396484375, 1.211029052734375, 1.312744140625, 1.414459228515625, 1.51617431640625, 1.617889404296875, 1.7196044921875, 1.821319580078125, 1.92303466796875, 2.024749755859375, 2.12646484375, 2.228179931640625, 2.32989501953125, 2.431610107421875, 2.5333251953125, 2.635040283203125, 2.73675537109375, 2.838470458984375, 2.940185546875, 3.041900634765625, 3.14361572265625, 3.245330810546875, 3.3470458984375, 3.448760986328125, 3.55047607421875, 3.652191162109375, 3.75390625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 5.0, 6.0, 5.0, 8.0, 15.0, 13.0, 14.0, 22.0, 24.0, 29.0, 21.0, 38.0, 26.0, 51.0, 35.0, 32.0, 49.0, 40.0, 36.0, 35.0, 45.0, 51.0, 41.0, 46.0, 38.0, 28.0, 27.0, 32.0, 31.0, 26.0, 18.0, 12.0, 25.0, 19.0, 17.0, 8.0, 8.0, 8.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.779296875, -1.717010498046875, -1.65472412109375, -1.592437744140625, -1.5301513671875, -1.467864990234375, -1.40557861328125, -1.343292236328125, -1.281005859375, -1.218719482421875, -1.15643310546875, -1.094146728515625, -1.0318603515625, -0.969573974609375, -0.90728759765625, -0.845001220703125, -0.78271484375, -0.720428466796875, -0.65814208984375, -0.595855712890625, -0.5335693359375, -0.471282958984375, -0.40899658203125, -0.346710205078125, -0.284423828125, -0.222137451171875, -0.15985107421875, -0.097564697265625, -0.0352783203125, 0.027008056640625, 0.08929443359375, 0.151580810546875, 0.2138671875, 0.276153564453125, 0.33843994140625, 0.400726318359375, 0.4630126953125, 0.525299072265625, 0.58758544921875, 0.649871826171875, 0.712158203125, 0.774444580078125, 0.83673095703125, 0.899017333984375, 0.9613037109375, 1.023590087890625, 1.08587646484375, 1.148162841796875, 1.21044921875, 1.272735595703125, 1.33502197265625, 1.397308349609375, 1.4595947265625, 1.521881103515625, 1.58416748046875, 1.646453857421875, 1.708740234375, 1.771026611328125, 1.83331298828125, 1.895599365234375, 1.9578857421875, 2.020172119140625, 2.08245849609375, 2.144744873046875, 2.20703125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 11.0, 14.0, 35.0, 69.0, 190.0, 1104.0, 72219.0, 4115758.0, 4331.0, 374.0, 83.0, 35.0, 24.0, 9.0, 8.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.015625, -23.333984375, -22.65234375, -21.970703125, -21.2890625, -20.607421875, -19.92578125, -19.244140625, -18.5625, -17.880859375, -17.19921875, -16.517578125, -15.8359375, -15.154296875, -14.47265625, -13.791015625, -13.109375, -12.427734375, -11.74609375, -11.064453125, -10.3828125, -9.701171875, -9.01953125, -8.337890625, -7.65625, -6.974609375, -6.29296875, -5.611328125, -4.9296875, -4.248046875, -3.56640625, -2.884765625, -2.203125, -1.521484375, -0.83984375, -0.158203125, 0.5234375, 1.205078125, 1.88671875, 2.568359375, 3.25, 3.931640625, 4.61328125, 5.294921875, 5.9765625, 6.658203125, 7.33984375, 8.021484375, 8.703125, 9.384765625, 10.06640625, 10.748046875, 11.4296875, 12.111328125, 12.79296875, 13.474609375, 14.15625, 14.837890625, 15.51953125, 16.201171875, 16.8828125, 17.564453125, 18.24609375, 18.927734375, 19.609375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 10.0, 17.0, 16.0, 31.0, 34.0, 73.0, 111.0, 172.0, 353.0, 783.0, 1166.0, 610.0, 289.0, 158.0, 71.0, 62.0, 29.0, 12.0, 17.0, 13.0, 9.0, 5.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4169921875, -1.3744964599609375, -1.332000732421875, -1.2895050048828125, -1.24700927734375, -1.2045135498046875, -1.162017822265625, -1.1195220947265625, -1.0770263671875, -1.0345306396484375, -0.992034912109375, -0.9495391845703125, -0.90704345703125, -0.8645477294921875, -0.822052001953125, -0.7795562744140625, -0.737060546875, -0.6945648193359375, -0.652069091796875, -0.6095733642578125, -0.56707763671875, -0.5245819091796875, -0.482086181640625, -0.4395904541015625, -0.3970947265625, -0.3545989990234375, -0.312103271484375, -0.2696075439453125, -0.22711181640625, -0.1846160888671875, -0.142120361328125, -0.0996246337890625, -0.05712890625, -0.0146331787109375, 0.027862548828125, 0.0703582763671875, 0.11285400390625, 0.1553497314453125, 0.197845458984375, 0.2403411865234375, 0.2828369140625, 0.3253326416015625, 0.367828369140625, 0.4103240966796875, 0.45281982421875, 0.4953155517578125, 0.537811279296875, 0.5803070068359375, 0.622802734375, 0.6652984619140625, 0.707794189453125, 0.7502899169921875, 0.79278564453125, 0.8352813720703125, 0.877777099609375, 0.9202728271484375, 0.9627685546875, 1.0052642822265625, 1.047760009765625, 1.0902557373046875, 1.13275146484375, 1.1752471923828125, 1.217742919921875, 1.2602386474609375, 1.302734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 2.0, 7.0, 15.0, 5.0, 12.0, 19.0, 22.0, 31.0, 25.0, 47.0, 40.0, 45.0, 76.0, 58.0, 75.0, 69.0, 54.0, 69.0, 55.0, 58.0, 45.0, 32.0, 15.0, 26.0, 20.0, 15.0, 13.0, 12.0, 4.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4160919189453125, -2.338754892349243, -2.261418104171753, -2.1840810775756836, -2.1067442893981934, -2.029407262802124, -1.9520702362060547, -1.874733328819275, -1.7973964214324951, -1.7200595140457153, -1.6427226066589355, -1.5653855800628662, -1.4880486726760864, -1.4107117652893066, -1.3333747386932373, -1.2560378313064575, -1.1787009239196777, -1.101364016532898, -1.0240271091461182, -0.9466900825500488, -0.869353175163269, -0.7920162677764893, -0.7146793007850647, -0.6373423337936401, -0.5600054264068604, -0.4826684892177582, -0.405331552028656, -0.32799461483955383, -0.25065767765045166, -0.1733207404613495, -0.09598380327224731, -0.018646836280822754, 0.05869007110595703, 0.1360270082950592, 0.21336394548416138, 0.29070088267326355, 0.3680378198623657, 0.4453747570514679, 0.5227116942405701, 0.6000486612319946, 0.6773855686187744, 0.7547224760055542, 0.8320594429969788, 0.9093964099884033, 0.9867333173751831, 1.064070224761963, 1.1414072513580322, 1.218744158744812, 1.2960810661315918, 1.3734179735183716, 1.4507548809051514, 1.5280919075012207, 1.6054288148880005, 1.6827657222747803, 1.7601027488708496, 1.8374396562576294, 1.9147765636444092, 1.992113471031189, 2.0694503784179688, 2.146787405014038, 2.2241244316101074, 2.3014612197875977, 2.378798246383667, 2.4561352729797363, 2.5334720611572266]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 6.0, 5.0, 7.0, 7.0, 14.0, 12.0, 13.0, 21.0, 22.0, 21.0, 22.0, 24.0, 18.0, 25.0, 42.0, 28.0, 30.0, 37.0, 35.0, 32.0, 46.0, 38.0, 38.0, 31.0, 43.0, 43.0, 28.0, 34.0, 23.0, 23.0, 31.0, 27.0, 16.0, 17.0, 29.0, 16.0, 11.0, 10.0, 11.0, 10.0, 5.0, 11.0, 10.0, 2.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.5252161026000977, -1.4722870588302612, -1.4193580150604248, -1.3664289712905884, -1.313499927520752, -1.2605708837509155, -1.207641839981079, -1.1547127962112427, -1.1017837524414062, -1.0488547086715698, -0.9959256649017334, -0.942996621131897, -0.8900675773620605, -0.8371385335922241, -0.7842094898223877, -0.7312804460525513, -0.6783514022827148, -0.6254223585128784, -0.572493314743042, -0.5195642709732056, -0.46663522720336914, -0.4137061834335327, -0.3607771396636963, -0.30784809589385986, -0.25491905212402344, -0.201990008354187, -0.14906096458435059, -0.09613192081451416, -0.043202877044677734, 0.009726166725158691, 0.06265521049499512, 0.11558425426483154, 0.16851329803466797, 0.2214423418045044, 0.2743713855743408, 0.32730042934417725, 0.38022947311401367, 0.4331585168838501, 0.4860875606536865, 0.539016604423523, 0.5919456481933594, 0.6448746919631958, 0.6978037357330322, 0.7507327795028687, 0.8036618232727051, 0.8565908670425415, 0.9095199108123779, 0.9624489545822144, 1.0153779983520508, 1.0683070421218872, 1.1212360858917236, 1.17416512966156, 1.2270941734313965, 1.280023217201233, 1.3329522609710693, 1.3858813047409058, 1.4388103485107422, 1.4917393922805786, 1.544668436050415, 1.5975974798202515, 1.650526523590088, 1.7034555673599243, 1.7563846111297607, 1.8093136548995972, 1.8622426986694336]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 10.0, 22.0, 26.0, 35.0, 37.0, 71.0, 113.0, 180.0, 268.0, 426.0, 663.0, 1009.0, 1680.0, 2860.0, 4783.0, 8412.0, 15122.0, 28238.0, 53580.0, 103487.0, 196989.0, 266994.0, 171798.0, 89652.0, 46017.0, 24477.0, 13384.0, 7520.0, 4223.0, 2459.0, 1473.0, 875.0, 619.0, 357.0, 237.0, 143.0, 113.0, 69.0, 30.0, 29.0, 16.0, 20.0, 13.0, 8.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.7880859375, -0.765167236328125, -0.74224853515625, -0.719329833984375, -0.6964111328125, -0.673492431640625, -0.65057373046875, -0.627655029296875, -0.604736328125, -0.581817626953125, -0.55889892578125, -0.535980224609375, -0.5130615234375, -0.490142822265625, -0.46722412109375, -0.444305419921875, -0.42138671875, -0.398468017578125, -0.37554931640625, -0.352630615234375, -0.3297119140625, -0.306793212890625, -0.28387451171875, -0.260955810546875, -0.238037109375, -0.215118408203125, -0.19219970703125, -0.169281005859375, -0.1463623046875, -0.123443603515625, -0.10052490234375, -0.077606201171875, -0.0546875, -0.031768798828125, -0.00885009765625, 0.014068603515625, 0.0369873046875, 0.059906005859375, 0.08282470703125, 0.105743408203125, 0.128662109375, 0.151580810546875, 0.17449951171875, 0.197418212890625, 0.2203369140625, 0.243255615234375, 0.26617431640625, 0.289093017578125, 0.31201171875, 0.334930419921875, 0.35784912109375, 0.380767822265625, 0.4036865234375, 0.426605224609375, 0.44952392578125, 0.472442626953125, 0.495361328125, 0.518280029296875, 0.54119873046875, 0.564117431640625, 0.5870361328125, 0.609954833984375, 0.63287353515625, 0.655792236328125, 0.6787109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 2.0, 6.0, 7.0, 7.0, 8.0, 12.0, 13.0, 18.0, 11.0, 18.0, 21.0, 28.0, 28.0, 27.0, 41.0, 32.0, 42.0, 45.0, 47.0, 49.0, 52.0, 43.0, 46.0, 42.0, 39.0, 44.0, 34.0, 31.0, 36.0, 25.0, 20.0, 21.0, 17.0, 10.0, 15.0, 11.0, 12.0, 9.0, 12.0, 4.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26953125, -1.22235107421875, -1.1751708984375, -1.12799072265625, -1.080810546875, -1.03363037109375, -0.9864501953125, -0.93927001953125, -0.89208984375, -0.84490966796875, -0.7977294921875, -0.75054931640625, -0.703369140625, -0.65618896484375, -0.6090087890625, -0.56182861328125, -0.5146484375, -0.46746826171875, -0.4202880859375, -0.37310791015625, -0.325927734375, -0.27874755859375, -0.2315673828125, -0.18438720703125, -0.13720703125, -0.09002685546875, -0.0428466796875, 0.00433349609375, 0.051513671875, 0.09869384765625, 0.1458740234375, 0.19305419921875, 0.240234375, 0.28741455078125, 0.3345947265625, 0.38177490234375, 0.428955078125, 0.47613525390625, 0.5233154296875, 0.57049560546875, 0.61767578125, 0.66485595703125, 0.7120361328125, 0.75921630859375, 0.806396484375, 0.85357666015625, 0.9007568359375, 0.94793701171875, 0.9951171875, 1.04229736328125, 1.0894775390625, 1.13665771484375, 1.183837890625, 1.23101806640625, 1.2781982421875, 1.32537841796875, 1.37255859375, 1.41973876953125, 1.4669189453125, 1.51409912109375, 1.561279296875, 1.60845947265625, 1.6556396484375, 1.70281982421875, 1.75]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 15.0, 12.0, 17.0, 32.0, 33.0, 62.0, 74.0, 128.0, 193.0, 288.0, 464.0, 703.0, 1278.0, 2151.0, 4019.0, 7694.0, 15403.0, 32524.0, 70982.0, 159869.0, 294964.0, 242945.0, 115665.0, 51133.0, 23396.0, 11391.0, 5792.0, 3010.0, 1669.0, 999.0, 592.0, 360.0, 205.0, 139.0, 113.0, 68.0, 51.0, 37.0, 20.0, 20.0, 6.0, 7.0, 7.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74365234375, -0.7202606201171875, -0.696868896484375, -0.6734771728515625, -0.65008544921875, -0.6266937255859375, -0.603302001953125, -0.5799102783203125, -0.5565185546875, -0.5331268310546875, -0.509735107421875, -0.4863433837890625, -0.46295166015625, -0.4395599365234375, -0.416168212890625, -0.3927764892578125, -0.369384765625, -0.3459930419921875, -0.322601318359375, -0.2992095947265625, -0.27581787109375, -0.2524261474609375, -0.229034423828125, -0.2056427001953125, -0.1822509765625, -0.1588592529296875, -0.135467529296875, -0.1120758056640625, -0.08868408203125, -0.0652923583984375, -0.041900634765625, -0.0185089111328125, 0.0048828125, 0.0282745361328125, 0.051666259765625, 0.0750579833984375, 0.09844970703125, 0.1218414306640625, 0.145233154296875, 0.1686248779296875, 0.1920166015625, 0.2154083251953125, 0.238800048828125, 0.2621917724609375, 0.28558349609375, 0.3089752197265625, 0.332366943359375, 0.3557586669921875, 0.379150390625, 0.4025421142578125, 0.425933837890625, 0.4493255615234375, 0.47271728515625, 0.4961090087890625, 0.519500732421875, 0.5428924560546875, 0.5662841796875, 0.5896759033203125, 0.613067626953125, 0.6364593505859375, 0.65985107421875, 0.6832427978515625, 0.706634521484375, 0.7300262451171875, 0.75341796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 5.0, 3.0, 8.0, 13.0, 12.0, 13.0, 17.0, 16.0, 25.0, 23.0, 26.0, 21.0, 35.0, 20.0, 32.0, 42.0, 37.0, 44.0, 38.0, 50.0, 53.0, 32.0, 44.0, 50.0, 40.0, 46.0, 26.0, 29.0, 39.0, 25.0, 28.0, 18.0, 28.0, 12.0, 9.0, 7.0, 9.0, 7.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-3.134765625, -3.03961181640625, -2.9444580078125, -2.84930419921875, -2.754150390625, -2.65899658203125, -2.5638427734375, -2.46868896484375, -2.37353515625, -2.27838134765625, -2.1832275390625, -2.08807373046875, -1.992919921875, -1.89776611328125, -1.8026123046875, -1.70745849609375, -1.6123046875, -1.51715087890625, -1.4219970703125, -1.32684326171875, -1.231689453125, -1.13653564453125, -1.0413818359375, -0.94622802734375, -0.85107421875, -0.75592041015625, -0.6607666015625, -0.56561279296875, -0.470458984375, -0.37530517578125, -0.2801513671875, -0.18499755859375, -0.08984375, 0.00531005859375, 0.1004638671875, 0.19561767578125, 0.290771484375, 0.38592529296875, 0.4810791015625, 0.57623291015625, 0.67138671875, 0.76654052734375, 0.8616943359375, 0.95684814453125, 1.052001953125, 1.14715576171875, 1.2423095703125, 1.33746337890625, 1.4326171875, 1.52777099609375, 1.6229248046875, 1.71807861328125, 1.813232421875, 1.90838623046875, 2.0035400390625, 2.09869384765625, 2.19384765625, 2.28900146484375, 2.3841552734375, 2.47930908203125, 2.574462890625, 2.66961669921875, 2.7647705078125, 2.85992431640625, 2.955078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 8.0, 5.0, 10.0, 12.0, 20.0, 19.0, 37.0, 60.0, 79.0, 118.0, 192.0, 328.0, 528.0, 979.0, 2254.0, 7072.0, 46388.0, 671507.0, 289266.0, 21671.0, 4387.0, 1570.0, 845.0, 464.0, 247.0, 171.0, 92.0, 67.0, 56.0, 30.0, 23.0, 16.0, 12.0, 12.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6676483154296875, -0.647308349609375, -0.6269683837890625, -0.60662841796875, -0.5862884521484375, -0.565948486328125, -0.5456085205078125, -0.5252685546875, -0.5049285888671875, -0.484588623046875, -0.4642486572265625, -0.44390869140625, -0.4235687255859375, -0.403228759765625, -0.3828887939453125, -0.362548828125, -0.3422088623046875, -0.321868896484375, -0.3015289306640625, -0.28118896484375, -0.2608489990234375, -0.240509033203125, -0.2201690673828125, -0.1998291015625, -0.1794891357421875, -0.159149169921875, -0.1388092041015625, -0.11846923828125, -0.0981292724609375, -0.077789306640625, -0.0574493408203125, -0.037109375, -0.0167694091796875, 0.003570556640625, 0.0239105224609375, 0.04425048828125, 0.0645904541015625, 0.084930419921875, 0.1052703857421875, 0.1256103515625, 0.1459503173828125, 0.166290283203125, 0.1866302490234375, 0.20697021484375, 0.2273101806640625, 0.247650146484375, 0.2679901123046875, 0.288330078125, 0.3086700439453125, 0.329010009765625, 0.3493499755859375, 0.36968994140625, 0.3900299072265625, 0.410369873046875, 0.4307098388671875, 0.4510498046875, 0.4713897705078125, 0.491729736328125, 0.5120697021484375, 0.53240966796875, 0.5527496337890625, 0.573089599609375, 0.5934295654296875, 0.61376953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 4.0, 8.0, 7.0, 15.0, 29.0, 51.0, 65.0, 101.0, 154.0, 159.0, 144.0, 84.0, 55.0, 30.0, 31.0, 17.0, 20.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002949237823486328, -0.0002832375466823578, -0.00027155131101608276, -0.00025986507534980774, -0.0002481788396835327, -0.0002364926040172577, -0.00022480636835098267, -0.00021312013268470764, -0.00020143389701843262, -0.0001897476613521576, -0.00017806142568588257, -0.00016637519001960754, -0.00015468895435333252, -0.0001430027186870575, -0.00013131648302078247, -0.00011963024735450745, -0.00010794401168823242, -9.62577760219574e-05, -8.457154035568237e-05, -7.288530468940735e-05, -6.119906902313232e-05, -4.95128333568573e-05, -3.7826597690582275e-05, -2.614036202430725e-05, -1.4454126358032227e-05, -2.767890691757202e-06, 8.918344974517822e-06, 2.0604580640792847e-05, 3.229081630706787e-05, 4.3977051973342896e-05, 5.566328763961792e-05, 6.734952330589294e-05, 7.903575897216797e-05, 9.072199463844299e-05, 0.00010240823030471802, 0.00011409446597099304, 0.00012578070163726807, 0.0001374669373035431, 0.00014915317296981812, 0.00016083940863609314, 0.00017252564430236816, 0.0001842118799686432, 0.0001958981156349182, 0.00020758435130119324, 0.00021927058696746826, 0.00023095682263374329, 0.0002426430583000183, 0.00025432929396629333, 0.00026601552963256836, 0.0002777017652988434, 0.0002893880009651184, 0.00030107423663139343, 0.00031276047229766846, 0.0003244467079639435, 0.0003361329436302185, 0.00034781917929649353, 0.00035950541496276855, 0.0003711916506290436, 0.0003828778862953186, 0.00039456412196159363, 0.00040625035762786865, 0.0004179365932941437, 0.0004296228289604187, 0.0004413090646266937, 0.00045299530029296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 8.0, 8.0, 20.0, 12.0, 25.0, 41.0, 45.0, 82.0, 87.0, 131.0, 202.0, 270.0, 389.0, 523.0, 879.0, 1340.0, 2273.0, 4957.0, 13336.0, 58022.0, 393063.0, 473034.0, 71771.0, 15891.0, 5460.0, 2486.0, 1394.0, 883.0, 589.0, 361.0, 280.0, 187.0, 138.0, 103.0, 65.0, 47.0, 34.0, 28.0, 24.0, 21.0, 10.0, 13.0, 6.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429443359375, -0.4151573181152344, -0.40087127685546875, -0.3865852355957031, -0.3722991943359375, -0.3580131530761719, -0.34372711181640625, -0.3294410705566406, -0.315155029296875, -0.3008689880371094, -0.28658294677734375, -0.2722969055175781, -0.2580108642578125, -0.24372482299804688, -0.22943878173828125, -0.21515274047851562, -0.20086669921875, -0.18658065795898438, -0.17229461669921875, -0.15800857543945312, -0.1437225341796875, -0.12943649291992188, -0.11515045166015625, -0.10086441040039062, -0.086578369140625, -0.07229232788085938, -0.05800628662109375, -0.043720245361328125, -0.0294342041015625, -0.015148162841796875, -0.00086212158203125, 0.013423919677734375, 0.0277099609375, 0.041996002197265625, 0.05628204345703125, 0.07056808471679688, 0.0848541259765625, 0.09914016723632812, 0.11342620849609375, 0.12771224975585938, 0.141998291015625, 0.15628433227539062, 0.17057037353515625, 0.18485641479492188, 0.1991424560546875, 0.21342849731445312, 0.22771453857421875, 0.24200057983398438, 0.25628662109375, 0.2705726623535156, 0.28485870361328125, 0.2991447448730469, 0.3134307861328125, 0.3277168273925781, 0.34200286865234375, 0.3562889099121094, 0.370574951171875, 0.3848609924316406, 0.39914703369140625, 0.4134330749511719, 0.4277191162109375, 0.4420051574707031, 0.45629119873046875, 0.4705772399902344, 0.48486328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 4.0, 11.0, 14.0, 29.0, 40.0, 64.0, 93.0, 105.0, 133.0, 121.0, 117.0, 96.0, 67.0, 36.0, 19.0, 14.0, 10.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1915283203125, -0.18604087829589844, -0.18055343627929688, -0.1750659942626953, -0.16957855224609375, -0.1640911102294922, -0.15860366821289062, -0.15311622619628906, -0.1476287841796875, -0.14214134216308594, -0.13665390014648438, -0.1311664581298828, -0.12567901611328125, -0.12019157409667969, -0.11470413208007812, -0.10921669006347656, -0.103729248046875, -0.09824180603027344, -0.09275436401367188, -0.08726692199707031, -0.08177947998046875, -0.07629203796386719, -0.07080459594726562, -0.06531715393066406, -0.0598297119140625, -0.05434226989746094, -0.048854827880859375, -0.04336738586425781, -0.03787994384765625, -0.03239250183105469, -0.026905059814453125, -0.021417617797851562, -0.01593017578125, -0.010442733764648438, -0.004955291748046875, 0.0005321502685546875, 0.00601959228515625, 0.011507034301757812, 0.016994476318359375, 0.022481918334960938, 0.0279693603515625, 0.03345680236816406, 0.038944244384765625, 0.04443168640136719, 0.04991912841796875, 0.05540657043457031, 0.060894012451171875, 0.06638145446777344, 0.071868896484375, 0.07735633850097656, 0.08284378051757812, 0.08833122253417969, 0.09381866455078125, 0.09930610656738281, 0.10479354858398438, 0.11028099060058594, 0.1157684326171875, 0.12125587463378906, 0.12674331665039062, 0.1322307586669922, 0.13771820068359375, 0.1432056427001953, 0.14869308471679688, 0.15418052673339844, 0.15966796875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 6.0, 3.0, 5.0, 9.0, 12.0, 18.0, 23.0, 25.0, 39.0, 47.0, 82.0, 85.0, 111.0, 99.0, 105.0, 79.0, 79.0, 49.0, 37.0, 28.0, 22.0, 10.0, 8.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6781560182571411, -1.5998300313949585, -1.5215039253234863, -1.4431779384613037, -1.364851951599121, -1.2865259647369385, -1.2081998586654663, -1.1298738718032837, -1.0515477657318115, -0.9732217192649841, -0.8948957324028015, -0.8165696859359741, -0.7382436990737915, -0.6599176526069641, -0.5815916061401367, -0.5032656192779541, -0.4249396324157715, -0.3466136157512665, -0.2682875990867615, -0.18996155261993408, -0.11163553595542908, -0.03330951929092407, 0.04501652717590332, 0.12334251403808594, 0.20166856050491333, 0.27999457716941833, 0.35832059383392334, 0.43664664030075073, 0.5149726867675781, 0.5932986736297607, 0.6716247200965881, 0.7499507069587708, 0.8282766342163086, 0.906602680683136, 0.9849286675453186, 1.063254714012146, 1.1415807008743286, 1.2199068069458008, 1.2982327938079834, 1.376558780670166, 1.4548847675323486, 1.5332107543945312, 1.6115368604660034, 1.689862847328186, 1.7681888341903687, 1.8465149402618408, 1.9248409271240234, 2.003166913986206, 2.0814929008483887, 2.1598188877105713, 2.238144874572754, 2.3164710998535156, 2.3947970867156982, 2.473123073577881, 2.5514490604400635, 2.629775047302246, 2.708101272583008, 2.7864272594451904, 2.864753246307373, 2.9430794715881348, 3.0214054584503174, 3.0997314453125, 3.1780574321746826, 3.2563834190368652, 3.334709405899048]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 8.0, 2.0, 6.0, 9.0, 9.0, 10.0, 20.0, 23.0, 19.0, 16.0, 21.0, 22.0, 25.0, 38.0, 33.0, 41.0, 43.0, 40.0, 33.0, 44.0, 31.0, 40.0, 50.0, 41.0, 42.0, 32.0, 41.0, 27.0, 29.0, 37.0, 23.0, 18.0, 15.0, 18.0, 17.0, 16.0, 15.0, 7.0, 7.0, 3.0, 9.0, 5.0, 2.0, 4.0, 4.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1356970071792603, -1.0936849117279053, -1.0516726970672607, -1.0096604824066162, -0.9676483869552612, -0.9256362318992615, -0.8836240768432617, -0.841611921787262, -0.7995997667312622, -0.7575876116752625, -0.7155754566192627, -0.6735633015632629, -0.6315511465072632, -0.5895389914512634, -0.5475268363952637, -0.5055146813392639, -0.46350252628326416, -0.4214903712272644, -0.37947821617126465, -0.3374660611152649, -0.29545390605926514, -0.2534417510032654, -0.21142959594726562, -0.16941744089126587, -0.1274052858352661, -0.08539313077926636, -0.0433809757232666, -0.0013688206672668457, 0.04064333438873291, 0.08265548944473267, 0.12466764450073242, 0.16667979955673218, 0.20869183540344238, 0.25070399045944214, 0.2927161455154419, 0.33472830057144165, 0.3767404556274414, 0.41875261068344116, 0.4607647657394409, 0.5027769207954407, 0.5447890758514404, 0.5868012309074402, 0.6288133859634399, 0.6708255410194397, 0.7128376960754395, 0.7548498511314392, 0.796862006187439, 0.8388741612434387, 0.8808863162994385, 0.9228984713554382, 0.964910626411438, 1.006922721862793, 1.0489349365234375, 1.090947151184082, 1.132959246635437, 1.174971342086792, 1.2169835567474365, 1.258995771408081, 1.301007866859436, 1.343019962310791, 1.3850321769714355, 1.42704439163208, 1.469056487083435, 1.51106858253479, 1.5530807971954346]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 9.0, 7.0, 12.0, 12.0, 12.0, 21.0, 14.0, 29.0, 37.0, 41.0, 63.0, 79.0, 74.0, 115.0, 133.0, 187.0, 246.0, 331.0, 412.0, 605.0, 815.0, 1139.0, 1732.0, 2703.0, 4822.0, 10274.0, 32918.0, 194597.0, 638040.0, 115614.0, 23175.0, 8167.0, 4069.0, 2487.0, 1547.0, 1037.0, 741.0, 529.0, 407.0, 278.0, 213.0, 170.0, 137.0, 121.0, 87.0, 73.0, 51.0, 43.0, 30.0, 23.0, 19.0, 17.0, 7.0, 13.0, 10.0, 6.0, 5.0, 2.0, 4.0, 4.0, 1.0], "bins": [-0.9267578125, -0.897216796875, -0.86767578125, -0.838134765625, -0.80859375, -0.779052734375, -0.74951171875, -0.719970703125, -0.6904296875, -0.660888671875, -0.63134765625, -0.601806640625, -0.572265625, -0.542724609375, -0.51318359375, -0.483642578125, -0.4541015625, -0.424560546875, -0.39501953125, -0.365478515625, -0.3359375, -0.306396484375, -0.27685546875, -0.247314453125, -0.2177734375, -0.188232421875, -0.15869140625, -0.129150390625, -0.099609375, -0.070068359375, -0.04052734375, -0.010986328125, 0.0185546875, 0.048095703125, 0.07763671875, 0.107177734375, 0.13671875, 0.166259765625, 0.19580078125, 0.225341796875, 0.2548828125, 0.284423828125, 0.31396484375, 0.343505859375, 0.373046875, 0.402587890625, 0.43212890625, 0.461669921875, 0.4912109375, 0.520751953125, 0.55029296875, 0.579833984375, 0.609375, 0.638916015625, 0.66845703125, 0.697998046875, 0.7275390625, 0.757080078125, 0.78662109375, 0.816162109375, 0.845703125, 0.875244140625, 0.90478515625, 0.934326171875, 0.9638671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 7.0, 4.0, 9.0, 13.0, 14.0, 14.0, 11.0, 17.0, 28.0, 17.0, 21.0, 33.0, 36.0, 33.0, 30.0, 43.0, 43.0, 33.0, 29.0, 64.0, 28.0, 42.0, 41.0, 27.0, 45.0, 35.0, 35.0, 17.0, 30.0, 26.0, 21.0, 29.0, 14.0, 7.0, 12.0, 17.0, 13.0, 13.0, 6.0, 8.0, 5.0, 6.0, 7.0, 1.0, 2.0, 5.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.109375, -2.039581298828125, -1.96978759765625, -1.899993896484375, -1.8302001953125, -1.760406494140625, -1.69061279296875, -1.620819091796875, -1.551025390625, -1.481231689453125, -1.41143798828125, -1.341644287109375, -1.2718505859375, -1.202056884765625, -1.13226318359375, -1.062469482421875, -0.99267578125, -0.922882080078125, -0.85308837890625, -0.783294677734375, -0.7135009765625, -0.643707275390625, -0.57391357421875, -0.504119873046875, -0.434326171875, -0.364532470703125, -0.29473876953125, -0.224945068359375, -0.1551513671875, -0.085357666015625, -0.01556396484375, 0.054229736328125, 0.1240234375, 0.193817138671875, 0.26361083984375, 0.333404541015625, 0.4031982421875, 0.472991943359375, 0.54278564453125, 0.612579345703125, 0.682373046875, 0.752166748046875, 0.82196044921875, 0.891754150390625, 0.9615478515625, 1.031341552734375, 1.10113525390625, 1.170928955078125, 1.24072265625, 1.310516357421875, 1.38031005859375, 1.450103759765625, 1.5198974609375, 1.589691162109375, 1.65948486328125, 1.729278564453125, 1.799072265625, 1.868865966796875, 1.93865966796875, 2.008453369140625, 2.0782470703125, 2.148040771484375, 2.21783447265625, 2.287628173828125, 2.357421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 14.0, 20.0, 28.0, 24.0, 41.0, 44.0, 80.0, 120.0, 172.0, 227.0, 385.0, 746.0, 1181.0, 2309.0, 5624.0, 18106.0, 192172.0, 766301.0, 44250.0, 9232.0, 3542.0, 1632.0, 865.0, 491.0, 294.0, 176.0, 121.0, 82.0, 59.0, 54.0, 31.0, 21.0, 18.0, 14.0, 12.0, 12.0, 8.0, 8.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0], "bins": [-1.970703125, -1.91778564453125, -1.8648681640625, -1.81195068359375, -1.759033203125, -1.70611572265625, -1.6531982421875, -1.60028076171875, -1.54736328125, -1.49444580078125, -1.4415283203125, -1.38861083984375, -1.335693359375, -1.28277587890625, -1.2298583984375, -1.17694091796875, -1.1240234375, -1.07110595703125, -1.0181884765625, -0.96527099609375, -0.912353515625, -0.85943603515625, -0.8065185546875, -0.75360107421875, -0.70068359375, -0.64776611328125, -0.5948486328125, -0.54193115234375, -0.489013671875, -0.43609619140625, -0.3831787109375, -0.33026123046875, -0.27734375, -0.22442626953125, -0.1715087890625, -0.11859130859375, -0.065673828125, -0.01275634765625, 0.0401611328125, 0.09307861328125, 0.14599609375, 0.19891357421875, 0.2518310546875, 0.30474853515625, 0.357666015625, 0.41058349609375, 0.4635009765625, 0.51641845703125, 0.5693359375, 0.62225341796875, 0.6751708984375, 0.72808837890625, 0.781005859375, 0.83392333984375, 0.8868408203125, 0.93975830078125, 0.99267578125, 1.04559326171875, 1.0985107421875, 1.15142822265625, 1.204345703125, 1.25726318359375, 1.3101806640625, 1.36309814453125, 1.416015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 6.0, 6.0, 7.0, 5.0, 11.0, 19.0, 19.0, 11.0, 23.0, 25.0, 31.0, 18.0, 41.0, 36.0, 32.0, 51.0, 42.0, 40.0, 49.0, 51.0, 60.0, 47.0, 58.0, 34.0, 42.0, 45.0, 26.0, 22.0, 20.0, 28.0, 20.0, 17.0, 8.0, 6.0, 9.0, 9.0, 5.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0], "bins": [-3.32421875, -3.2357177734375, -3.147216796875, -3.0587158203125, -2.97021484375, -2.8817138671875, -2.793212890625, -2.7047119140625, -2.6162109375, -2.5277099609375, -2.439208984375, -2.3507080078125, -2.26220703125, -2.1737060546875, -2.085205078125, -1.9967041015625, -1.908203125, -1.8197021484375, -1.731201171875, -1.6427001953125, -1.55419921875, -1.4656982421875, -1.377197265625, -1.2886962890625, -1.2001953125, -1.1116943359375, -1.023193359375, -0.9346923828125, -0.84619140625, -0.7576904296875, -0.669189453125, -0.5806884765625, -0.4921875, -0.4036865234375, -0.315185546875, -0.2266845703125, -0.13818359375, -0.0496826171875, 0.038818359375, 0.1273193359375, 0.2158203125, 0.3043212890625, 0.392822265625, 0.4813232421875, 0.56982421875, 0.6583251953125, 0.746826171875, 0.8353271484375, 0.923828125, 1.0123291015625, 1.100830078125, 1.1893310546875, 1.27783203125, 1.3663330078125, 1.454833984375, 1.5433349609375, 1.6318359375, 1.7203369140625, 1.808837890625, 1.8973388671875, 1.98583984375, 2.0743408203125, 2.162841796875, 2.2513427734375, 2.33984375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 1.0, 2.0, 10.0, 7.0, 20.0, 16.0, 18.0, 23.0, 34.0, 47.0, 60.0, 107.0, 168.0, 249.0, 436.0, 743.0, 1417.0, 2806.0, 6814.0, 21629.0, 257636.0, 712861.0, 28339.0, 8145.0, 3216.0, 1635.0, 811.0, 473.0, 272.0, 145.0, 129.0, 85.0, 60.0, 38.0, 30.0, 12.0, 17.0, 13.0, 11.0, 6.0, 3.0, 4.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61083984375, -0.5911941528320312, -0.5715484619140625, -0.5519027709960938, -0.532257080078125, -0.5126113891601562, -0.4929656982421875, -0.47332000732421875, -0.45367431640625, -0.43402862548828125, -0.4143829345703125, -0.39473724365234375, -0.375091552734375, -0.35544586181640625, -0.3358001708984375, -0.31615447998046875, -0.2965087890625, -0.27686309814453125, -0.2572174072265625, -0.23757171630859375, -0.217926025390625, -0.19828033447265625, -0.1786346435546875, -0.15898895263671875, -0.13934326171875, -0.11969757080078125, -0.1000518798828125, -0.08040618896484375, -0.060760498046875, -0.04111480712890625, -0.0214691162109375, -0.00182342529296875, 0.017822265625, 0.03746795654296875, 0.0571136474609375, 0.07675933837890625, 0.096405029296875, 0.11605072021484375, 0.1356964111328125, 0.15534210205078125, 0.17498779296875, 0.19463348388671875, 0.2142791748046875, 0.23392486572265625, 0.253570556640625, 0.27321624755859375, 0.2928619384765625, 0.31250762939453125, 0.3321533203125, 0.35179901123046875, 0.3714447021484375, 0.39109039306640625, 0.410736083984375, 0.43038177490234375, 0.4500274658203125, 0.46967315673828125, 0.48931884765625, 0.5089645385742188, 0.5286102294921875, 0.5482559204101562, 0.567901611328125, 0.5875473022460938, 0.6071929931640625, 0.6268386840820312, 0.646484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 7.0, 4.0, 5.0, 11.0, 30.0, 62.0, 150.0, 432.0, 173.0, 58.0, 24.0, 12.0, 12.0, 9.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010144710540771484, -9.760819375514984e-05, -9.376928210258484e-05, -8.993037045001984e-05, -8.609145879745483e-05, -8.225254714488983e-05, -7.841363549232483e-05, -7.457472383975983e-05, -7.073581218719482e-05, -6.689690053462982e-05, -6.305798888206482e-05, -5.921907722949982e-05, -5.5380165576934814e-05, -5.154125392436981e-05, -4.770234227180481e-05, -4.386343061923981e-05, -4.0024518966674805e-05, -3.61856073141098e-05, -3.23466956615448e-05, -2.8507784008979797e-05, -2.4668872356414795e-05, -2.0829960703849792e-05, -1.699104905128479e-05, -1.3152137398719788e-05, -9.313225746154785e-06, -5.474314093589783e-06, -1.6354024410247803e-06, 2.203509211540222e-06, 6.042420864105225e-06, 9.881332516670227e-06, 1.372024416923523e-05, 1.7559155821800232e-05, 2.1398067474365234e-05, 2.5236979126930237e-05, 2.907589077949524e-05, 3.291480243206024e-05, 3.6753714084625244e-05, 4.0592625737190247e-05, 4.443153738975525e-05, 4.827044904232025e-05, 5.2109360694885254e-05, 5.5948272347450256e-05, 5.978718400001526e-05, 6.362609565258026e-05, 6.746500730514526e-05, 7.130391895771027e-05, 7.514283061027527e-05, 7.898174226284027e-05, 8.282065391540527e-05, 8.665956556797028e-05, 9.049847722053528e-05, 9.433738887310028e-05, 9.817630052566528e-05, 0.00010201521217823029, 0.00010585412383079529, 0.00010969303548336029, 0.00011353194713592529, 0.0001173708587884903, 0.0001212097704410553, 0.0001250486820936203, 0.0001288875937461853, 0.0001327265053987503, 0.0001365654170513153, 0.0001404043287038803, 0.0001442432403564453]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 10.0, 18.0, 21.0, 34.0, 30.0, 52.0, 71.0, 97.0, 150.0, 190.0, 280.0, 423.0, 567.0, 900.0, 1446.0, 2336.0, 4073.0, 7740.0, 18268.0, 63796.0, 678086.0, 208717.0, 34651.0, 12176.0, 5734.0, 3120.0, 1909.0, 1187.0, 754.0, 503.0, 384.0, 238.0, 158.0, 118.0, 86.0, 55.0, 40.0, 35.0, 28.0, 16.0, 7.0, 6.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.277099609375, -0.2674713134765625, -0.257843017578125, -0.2482147216796875, -0.23858642578125, -0.2289581298828125, -0.219329833984375, -0.2097015380859375, -0.2000732421875, -0.1904449462890625, -0.180816650390625, -0.1711883544921875, -0.16156005859375, -0.1519317626953125, -0.142303466796875, -0.1326751708984375, -0.123046875, -0.1134185791015625, -0.103790283203125, -0.0941619873046875, -0.08453369140625, -0.0749053955078125, -0.065277099609375, -0.0556488037109375, -0.0460205078125, -0.0363922119140625, -0.026763916015625, -0.0171356201171875, -0.00750732421875, 0.0021209716796875, 0.011749267578125, 0.0213775634765625, 0.031005859375, 0.0406341552734375, 0.050262451171875, 0.0598907470703125, 0.06951904296875, 0.0791473388671875, 0.088775634765625, 0.0984039306640625, 0.1080322265625, 0.1176605224609375, 0.127288818359375, 0.1369171142578125, 0.14654541015625, 0.1561737060546875, 0.165802001953125, 0.1754302978515625, 0.18505859375, 0.1946868896484375, 0.204315185546875, 0.2139434814453125, 0.22357177734375, 0.2332000732421875, 0.242828369140625, 0.2524566650390625, 0.2620849609375, 0.2717132568359375, 0.281341552734375, 0.2909698486328125, 0.30059814453125, 0.3102264404296875, 0.319854736328125, 0.3294830322265625, 0.339111328125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 5.0, 12.0, 14.0, 5.0, 12.0, 16.0, 27.0, 39.0, 54.0, 89.0, 208.0, 208.0, 93.0, 48.0, 42.0, 31.0, 23.0, 17.0, 11.0, 5.0, 2.0, 1.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.177001953125, -0.1718006134033203, -0.16659927368164062, -0.16139793395996094, -0.15619659423828125, -0.15099525451660156, -0.14579391479492188, -0.1405925750732422, -0.1353912353515625, -0.1301898956298828, -0.12498855590820312, -0.11978721618652344, -0.11458587646484375, -0.10938453674316406, -0.10418319702148438, -0.09898185729980469, -0.093780517578125, -0.08857917785644531, -0.08337783813476562, -0.07817649841308594, -0.07297515869140625, -0.06777381896972656, -0.06257247924804688, -0.05737113952636719, -0.0521697998046875, -0.04696846008300781, -0.041767120361328125, -0.03656578063964844, -0.03136444091796875, -0.026163101196289062, -0.020961761474609375, -0.015760421752929688, -0.01055908203125, -0.0053577423095703125, -0.000156402587890625, 0.0050449371337890625, 0.01024627685546875, 0.015447616577148438, 0.020648956298828125, 0.025850296020507812, 0.0310516357421875, 0.03625297546386719, 0.041454315185546875, 0.04665565490722656, 0.05185699462890625, 0.05705833435058594, 0.062259674072265625, 0.06746101379394531, 0.072662353515625, 0.07786369323730469, 0.08306503295898438, 0.08826637268066406, 0.09346771240234375, 0.09866905212402344, 0.10387039184570312, 0.10907173156738281, 0.1142730712890625, 0.11947441101074219, 0.12467575073242188, 0.12987709045410156, 0.13507843017578125, 0.14027976989746094, 0.14548110961914062, 0.1506824493408203, 0.1558837890625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 13.0, 20.0, 53.0, 128.0, 218.0, 246.0, 175.0, 88.0, 34.0, 22.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15004825592041, -14.848811149597168, -14.547574043273926, -14.246337890625, -13.945100784301758, -13.643863677978516, -13.342626571655273, -13.041389465332031, -12.740152359008789, -12.438915252685547, -12.137678146362305, -11.836441993713379, -11.535204887390137, -11.233967781066895, -10.932730674743652, -10.63149356842041, -10.330257415771484, -10.029020309448242, -9.727783203125, -9.426547050476074, -9.125309944152832, -8.82407283782959, -8.522835731506348, -8.221598625183105, -7.9203619956970215, -7.619124889373779, -7.317888259887695, -7.016651153564453, -6.715414047241211, -6.414177417755127, -6.112940311431885, -5.811703681945801, -5.510465621948242, -5.209228515625, -4.907991886138916, -4.606754779815674, -4.30551815032959, -4.004281044006348, -3.7030439376831055, -3.4018070697784424, -3.1005702018737793, -2.799333333969116, -2.498096466064453, -2.196859359741211, -1.8956224918365479, -1.5943856239318848, -1.2931486368179321, -0.9919116497039795, -0.6906747817993164, -0.38943785429000854, -0.08820092678070068, 0.21303600072860718, 0.514272928237915, 0.8155097961425781, 1.1167467832565308, 1.4179837703704834, 1.7192206382751465, 2.0204575061798096, 2.3216943740844727, 2.622931480407715, 2.924168348312378, 3.225405216217041, 3.526642322540283, 3.8278791904449463, 4.129116058349609]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 4.0, 6.0, 7.0, 7.0, 11.0, 14.0, 6.0, 21.0, 12.0, 16.0, 16.0, 15.0, 17.0, 21.0, 23.0, 45.0, 33.0, 31.0, 18.0, 34.0, 39.0, 40.0, 28.0, 38.0, 37.0, 35.0, 40.0, 31.0, 32.0, 29.0, 31.0, 25.0, 26.0, 28.0, 23.0, 25.0, 18.0, 18.0, 15.0, 16.0, 11.0, 11.0, 6.0, 8.0, 5.0, 5.0, 5.0, 2.0, 8.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.2388625144958496, -3.131962776184082, -3.0250630378723145, -2.918163299560547, -2.8112635612487793, -2.7043638229370117, -2.597464084625244, -2.4905643463134766, -2.383664608001709, -2.2767648696899414, -2.169865131378174, -2.0629653930664062, -1.9560656547546387, -1.849165916442871, -1.7422661781311035, -1.635366439819336, -1.528466820716858, -1.4215670824050903, -1.3146673440933228, -1.2077676057815552, -1.1008678674697876, -0.9939681887626648, -0.8870684504508972, -0.7801687121391296, -0.6732689738273621, -0.5663692355155945, -0.4594694972038269, -0.3525697886943817, -0.24567005038261414, -0.13877034187316895, -0.03187060356140137, 0.07502913475036621, 0.1819288730621338, 0.28882861137390137, 0.39572834968566895, 0.5026280879974365, 0.6095278263092041, 0.7164275050163269, 0.8233272433280945, 0.9302269816398621, 1.0371267795562744, 1.144026517868042, 1.2509262561798096, 1.3578259944915771, 1.4647257328033447, 1.5716254711151123, 1.6785252094268799, 1.7854249477386475, 1.8923245668411255, 1.999224305152893, 2.106123924255371, 2.2130236625671387, 2.3199234008789062, 2.426823139190674, 2.5337228775024414, 2.640622615814209, 2.7475223541259766, 2.854422092437744, 2.9613218307495117, 3.0682215690612793, 3.175121307373047, 3.2820210456848145, 3.388920783996582, 3.4958205223083496, 3.602720260620117]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 9.0, 17.0, 20.0, 22.0, 28.0, 53.0, 61.0, 99.0, 109.0, 184.0, 257.0, 379.0, 490.0, 685.0, 1033.0, 1567.0, 2376.0, 3968.0, 7701.0, 18670.0, 77515.0, 365979.0, 1572293.0, 1650992.0, 379059.0, 74278.0, 17639.0, 7720.0, 3871.0, 2409.0, 1573.0, 943.0, 673.0, 471.0, 380.0, 221.0, 165.0, 111.0, 86.0, 51.0, 45.0, 32.0, 18.0, 10.0, 12.0, 8.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.26953125, -2.200775146484375, -2.13201904296875, -2.063262939453125, -1.9945068359375, -1.925750732421875, -1.85699462890625, -1.788238525390625, -1.719482421875, -1.650726318359375, -1.58197021484375, -1.513214111328125, -1.4444580078125, -1.375701904296875, -1.30694580078125, -1.238189697265625, -1.16943359375, -1.100677490234375, -1.03192138671875, -0.963165283203125, -0.8944091796875, -0.825653076171875, -0.75689697265625, -0.688140869140625, -0.619384765625, -0.550628662109375, -0.48187255859375, -0.413116455078125, -0.3443603515625, -0.275604248046875, -0.20684814453125, -0.138092041015625, -0.0693359375, -0.000579833984375, 0.06817626953125, 0.136932373046875, 0.2056884765625, 0.274444580078125, 0.34320068359375, 0.411956787109375, 0.480712890625, 0.549468994140625, 0.61822509765625, 0.686981201171875, 0.7557373046875, 0.824493408203125, 0.89324951171875, 0.962005615234375, 1.03076171875, 1.099517822265625, 1.16827392578125, 1.237030029296875, 1.3057861328125, 1.374542236328125, 1.44329833984375, 1.512054443359375, 1.580810546875, 1.649566650390625, 1.71832275390625, 1.787078857421875, 1.8558349609375, 1.924591064453125, 1.99334716796875, 2.062103271484375, 2.130859375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 10.0, 5.0, 9.0, 11.0, 12.0, 15.0, 24.0, 24.0, 25.0, 23.0, 31.0, 37.0, 47.0, 30.0, 43.0, 45.0, 42.0, 46.0, 45.0, 52.0, 44.0, 52.0, 32.0, 35.0, 41.0, 30.0, 22.0, 28.0, 20.0, 19.0, 14.0, 15.0, 10.0, 11.0, 4.0, 7.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.3264617919921875, -1.275970458984375, -1.2254791259765625, -1.17498779296875, -1.1244964599609375, -1.074005126953125, -1.0235137939453125, -0.9730224609375, -0.9225311279296875, -0.872039794921875, -0.8215484619140625, -0.77105712890625, -0.7205657958984375, -0.670074462890625, -0.6195831298828125, -0.569091796875, -0.5186004638671875, -0.468109130859375, -0.4176177978515625, -0.36712646484375, -0.3166351318359375, -0.266143798828125, -0.2156524658203125, -0.1651611328125, -0.1146697998046875, -0.064178466796875, -0.0136871337890625, 0.03680419921875, 0.0872955322265625, 0.137786865234375, 0.1882781982421875, 0.23876953125, 0.2892608642578125, 0.339752197265625, 0.3902435302734375, 0.44073486328125, 0.4912261962890625, 0.541717529296875, 0.5922088623046875, 0.6427001953125, 0.6931915283203125, 0.743682861328125, 0.7941741943359375, 0.84466552734375, 0.8951568603515625, 0.945648193359375, 0.9961395263671875, 1.046630859375, 1.0971221923828125, 1.147613525390625, 1.1981048583984375, 1.24859619140625, 1.2990875244140625, 1.349578857421875, 1.4000701904296875, 1.4505615234375, 1.5010528564453125, 1.551544189453125, 1.6020355224609375, 1.65252685546875, 1.7030181884765625, 1.753509521484375, 1.8040008544921875, 1.8544921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 19.0, 18.0, 34.0, 68.0, 140.0, 559.0, 3888.0, 77587.0, 4071939.0, 36889.0, 2454.0, 433.0, 105.0, 53.0, 24.0, 13.0, 13.0, 3.0, 4.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.75439453125, -8.4228515625, -8.09130859375, -7.759765625, -7.42822265625, -7.0966796875, -6.76513671875, -6.43359375, -6.10205078125, -5.7705078125, -5.43896484375, -5.107421875, -4.77587890625, -4.4443359375, -4.11279296875, -3.78125, -3.44970703125, -3.1181640625, -2.78662109375, -2.455078125, -2.12353515625, -1.7919921875, -1.46044921875, -1.12890625, -0.79736328125, -0.4658203125, -0.13427734375, 0.197265625, 0.52880859375, 0.8603515625, 1.19189453125, 1.5234375, 1.85498046875, 2.1865234375, 2.51806640625, 2.849609375, 3.18115234375, 3.5126953125, 3.84423828125, 4.17578125, 4.50732421875, 4.8388671875, 5.17041015625, 5.501953125, 5.83349609375, 6.1650390625, 6.49658203125, 6.828125, 7.15966796875, 7.4912109375, 7.82275390625, 8.154296875, 8.48583984375, 8.8173828125, 9.14892578125, 9.48046875, 9.81201171875, 10.1435546875, 10.47509765625, 10.806640625, 11.13818359375, 11.4697265625, 11.80126953125, 12.1328125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 1.0, 4.0, 8.0, 15.0, 9.0, 16.0, 15.0, 22.0, 30.0, 44.0, 66.0, 107.0, 158.0, 278.0, 438.0, 676.0, 780.0, 525.0, 297.0, 169.0, 100.0, 78.0, 54.0, 40.0, 26.0, 14.0, 18.0, 14.0, 11.0, 13.0, 8.0, 4.0, 5.0, 5.0, 0.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.95556640625, -0.9275436401367188, -0.8995208740234375, -0.8714981079101562, -0.843475341796875, -0.8154525756835938, -0.7874298095703125, -0.7594070434570312, -0.73138427734375, -0.7033615112304688, -0.6753387451171875, -0.6473159790039062, -0.619293212890625, -0.5912704467773438, -0.5632476806640625, -0.5352249145507812, -0.5072021484375, -0.47917938232421875, -0.4511566162109375, -0.42313385009765625, -0.395111083984375, -0.36708831787109375, -0.3390655517578125, -0.31104278564453125, -0.28302001953125, -0.25499725341796875, -0.2269744873046875, -0.19895172119140625, -0.170928955078125, -0.14290618896484375, -0.1148834228515625, -0.08686065673828125, -0.058837890625, -0.03081512451171875, -0.0027923583984375, 0.02523040771484375, 0.053253173828125, 0.08127593994140625, 0.1092987060546875, 0.13732147216796875, 0.16534423828125, 0.19336700439453125, 0.2213897705078125, 0.24941253662109375, 0.277435302734375, 0.30545806884765625, 0.3334808349609375, 0.36150360107421875, 0.3895263671875, 0.41754913330078125, 0.4455718994140625, 0.47359466552734375, 0.501617431640625, 0.5296401977539062, 0.5576629638671875, 0.5856857299804688, 0.61370849609375, 0.6417312622070312, 0.6697540283203125, 0.6977767944335938, 0.725799560546875, 0.7538223266601562, 0.7818450927734375, 0.8098678588867188, 0.837890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 6.0, 13.0, 13.0, 12.0, 21.0, 27.0, 39.0, 48.0, 53.0, 68.0, 81.0, 100.0, 96.0, 92.0, 64.0, 65.0, 53.0, 45.0, 27.0, 15.0, 12.0, 13.0, 7.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.3531672954559326, -3.265151262283325, -3.1771352291107178, -3.0891191959381104, -3.001103162765503, -2.9130871295928955, -2.825071096420288, -2.7370550632476807, -2.6490390300750732, -2.561022996902466, -2.4730069637298584, -2.384990930557251, -2.2969748973846436, -2.208958864212036, -2.1209428310394287, -2.0329267978668213, -1.9449107646942139, -1.8568947315216064, -1.768878698348999, -1.6808626651763916, -1.5928466320037842, -1.5048305988311768, -1.4168145656585693, -1.328798532485962, -1.2407824993133545, -1.152766466140747, -1.0647504329681396, -0.9767343997955322, -0.8887183666229248, -0.8007023334503174, -0.71268630027771, -0.6246702671051025, -0.5366544723510742, -0.4486384391784668, -0.3606224060058594, -0.27260637283325195, -0.18459033966064453, -0.09657430648803711, -0.008558273315429688, 0.07945775985717773, 0.16747379302978516, 0.2554898262023926, 0.343505859375, 0.4315218925476074, 0.5195379257202148, 0.6075539588928223, 0.6955699920654297, 0.7835860252380371, 0.8716020584106445, 0.959618091583252, 1.0476341247558594, 1.1356501579284668, 1.2236661911010742, 1.3116822242736816, 1.399698257446289, 1.4877142906188965, 1.575730323791504, 1.6637463569641113, 1.7517623901367188, 1.8397784233093262, 1.9277944564819336, 2.015810489654541, 2.1038265228271484, 2.191842555999756, 2.2798585891723633]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 7.0, 10.0, 8.0, 13.0, 15.0, 13.0, 9.0, 31.0, 21.0, 30.0, 24.0, 27.0, 28.0, 35.0, 26.0, 44.0, 37.0, 46.0, 52.0, 52.0, 33.0, 37.0, 30.0, 37.0, 32.0, 36.0, 28.0, 29.0, 23.0, 20.0, 22.0, 19.0, 22.0, 18.0, 9.0, 11.0, 10.0, 11.0, 6.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.6309282779693604, -1.5800631046295166, -1.5291980504989624, -1.4783328771591187, -1.427467703819275, -1.3766026496887207, -1.325737476348877, -1.2748723030090332, -1.2240071296691895, -1.1731419563293457, -1.1222769021987915, -1.0714117288589478, -1.020546555519104, -0.969681441783905, -0.918816328048706, -0.8679511547088623, -0.8170861005783081, -0.7662209868431091, -0.7153558135032654, -0.6644906997680664, -0.6136255264282227, -0.5627604126930237, -0.5118952989578247, -0.46103015542030334, -0.410165011882782, -0.3592998683452606, -0.30843472480773926, -0.2575696110725403, -0.20670446753501892, -0.15583932399749756, -0.10497421026229858, -0.05410906672477722, -0.0032439231872558594, 0.047621212899684906, 0.09848634898662567, 0.14935147762298584, 0.2002166211605072, 0.25108176469802856, 0.30194687843322754, 0.3528120219707489, 0.40367716550827026, 0.4545423090457916, 0.505407452583313, 0.556272566318512, 0.6071376800537109, 0.6580028533935547, 0.7088679671287537, 0.7597330808639526, 0.8105982542037964, 0.8614633679389954, 0.9123285412788391, 0.9631936550140381, 1.0140588283538818, 1.0649240016937256, 1.1157890558242798, 1.1666542291641235, 1.2175192832946777, 1.2683844566345215, 1.3192495107650757, 1.3701146841049194, 1.4209798574447632, 1.4718449115753174, 1.5227100849151611, 1.5735752582550049, 1.6244404315948486]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 1.0, 2.0, 4.0, 4.0, 10.0, 6.0, 6.0, 16.0, 21.0, 29.0, 47.0, 57.0, 102.0, 148.0, 260.0, 391.0, 731.0, 1298.0, 2450.0, 4667.0, 9765.0, 23312.0, 62615.0, 192445.0, 437548.0, 202468.0, 65311.0, 24020.0, 10292.0, 4967.0, 2473.0, 1321.0, 691.0, 394.0, 259.0, 128.0, 99.0, 57.0, 47.0, 25.0, 25.0, 12.0, 10.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.71240234375, -0.6865158081054688, -0.6606292724609375, -0.6347427368164062, -0.608856201171875, -0.5829696655273438, -0.5570831298828125, -0.5311965942382812, -0.50531005859375, -0.47942352294921875, -0.4535369873046875, -0.42765045166015625, -0.401763916015625, -0.37587738037109375, -0.3499908447265625, -0.32410430908203125, -0.2982177734375, -0.27233123779296875, -0.2464447021484375, -0.22055816650390625, -0.194671630859375, -0.16878509521484375, -0.1428985595703125, -0.11701202392578125, -0.09112548828125, -0.06523895263671875, -0.0393524169921875, -0.01346588134765625, 0.012420654296875, 0.03830718994140625, 0.0641937255859375, 0.09008026123046875, 0.115966796875, 0.14185333251953125, 0.1677398681640625, 0.19362640380859375, 0.219512939453125, 0.24539947509765625, 0.2712860107421875, 0.29717254638671875, 0.32305908203125, 0.34894561767578125, 0.3748321533203125, 0.40071868896484375, 0.426605224609375, 0.45249176025390625, 0.4783782958984375, 0.5042648315429688, 0.5301513671875, 0.5560379028320312, 0.5819244384765625, 0.6078109741210938, 0.633697509765625, 0.6595840454101562, 0.6854705810546875, 0.7113571166992188, 0.73724365234375, 0.7631301879882812, 0.7890167236328125, 0.8149032592773438, 0.840789794921875, 0.8666763305664062, 0.8925628662109375, 0.9184494018554688, 0.9443359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 5.0, 4.0, 7.0, 7.0, 9.0, 9.0, 10.0, 13.0, 15.0, 15.0, 13.0, 20.0, 24.0, 33.0, 27.0, 35.0, 33.0, 33.0, 33.0, 39.0, 56.0, 33.0, 54.0, 40.0, 35.0, 37.0, 36.0, 40.0, 36.0, 25.0, 21.0, 25.0, 25.0, 21.0, 17.0, 13.0, 16.0, 10.0, 9.0, 8.0, 9.0, 13.0, 8.0, 6.0, 1.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.0205078125, -0.987030029296875, -0.95355224609375, -0.920074462890625, -0.8865966796875, -0.853118896484375, -0.81964111328125, -0.786163330078125, -0.752685546875, -0.719207763671875, -0.68572998046875, -0.652252197265625, -0.6187744140625, -0.585296630859375, -0.55181884765625, -0.518341064453125, -0.48486328125, -0.451385498046875, -0.41790771484375, -0.384429931640625, -0.3509521484375, -0.317474365234375, -0.28399658203125, -0.250518798828125, -0.217041015625, -0.183563232421875, -0.15008544921875, -0.116607666015625, -0.0831298828125, -0.049652099609375, -0.01617431640625, 0.017303466796875, 0.05078125, 0.084259033203125, 0.11773681640625, 0.151214599609375, 0.1846923828125, 0.218170166015625, 0.25164794921875, 0.285125732421875, 0.318603515625, 0.352081298828125, 0.38555908203125, 0.419036865234375, 0.4525146484375, 0.485992431640625, 0.51947021484375, 0.552947998046875, 0.58642578125, 0.619903564453125, 0.65338134765625, 0.686859130859375, 0.7203369140625, 0.753814697265625, 0.78729248046875, 0.820770263671875, 0.854248046875, 0.887725830078125, 0.92120361328125, 0.954681396484375, 0.9881591796875, 1.021636962890625, 1.05511474609375, 1.088592529296875, 1.1220703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 9.0, 12.0, 16.0, 13.0, 36.0, 38.0, 56.0, 85.0, 112.0, 184.0, 260.0, 396.0, 619.0, 1041.0, 1696.0, 3090.0, 5835.0, 12091.0, 27618.0, 69376.0, 187429.0, 372622.0, 222937.0, 82407.0, 31916.0, 13686.0, 6662.0, 3343.0, 1838.0, 1173.0, 668.0, 414.0, 288.0, 183.0, 109.0, 88.0, 51.0, 47.0, 33.0, 21.0, 21.0, 13.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.568359375, -0.5491485595703125, -0.529937744140625, -0.5107269287109375, -0.49151611328125, -0.4723052978515625, -0.453094482421875, -0.4338836669921875, -0.4146728515625, -0.3954620361328125, -0.376251220703125, -0.3570404052734375, -0.33782958984375, -0.3186187744140625, -0.299407958984375, -0.2801971435546875, -0.260986328125, -0.2417755126953125, -0.222564697265625, -0.2033538818359375, -0.18414306640625, -0.1649322509765625, -0.145721435546875, -0.1265106201171875, -0.1072998046875, -0.0880889892578125, -0.068878173828125, -0.0496673583984375, -0.03045654296875, -0.0112457275390625, 0.007965087890625, 0.0271759033203125, 0.04638671875, 0.0655975341796875, 0.084808349609375, 0.1040191650390625, 0.12322998046875, 0.1424407958984375, 0.161651611328125, 0.1808624267578125, 0.2000732421875, 0.2192840576171875, 0.238494873046875, 0.2577056884765625, 0.27691650390625, 0.2961273193359375, 0.315338134765625, 0.3345489501953125, 0.353759765625, 0.3729705810546875, 0.392181396484375, 0.4113922119140625, 0.43060302734375, 0.4498138427734375, 0.469024658203125, 0.4882354736328125, 0.5074462890625, 0.5266571044921875, 0.545867919921875, 0.5650787353515625, 0.58428955078125, 0.6035003662109375, 0.622711181640625, 0.6419219970703125, 0.6611328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 9.0, 4.0, 3.0, 10.0, 11.0, 9.0, 13.0, 18.0, 28.0, 32.0, 32.0, 29.0, 39.0, 44.0, 46.0, 56.0, 62.0, 51.0, 50.0, 49.0, 55.0, 45.0, 39.0, 41.0, 37.0, 33.0, 28.0, 24.0, 19.0, 19.0, 15.0, 17.0, 11.0, 6.0, 5.0, 4.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.07421875, -2.989471435546875, -2.90472412109375, -2.819976806640625, -2.7352294921875, -2.650482177734375, -2.56573486328125, -2.480987548828125, -2.396240234375, -2.311492919921875, -2.22674560546875, -2.141998291015625, -2.0572509765625, -1.972503662109375, -1.88775634765625, -1.803009033203125, -1.71826171875, -1.633514404296875, -1.54876708984375, -1.464019775390625, -1.3792724609375, -1.294525146484375, -1.20977783203125, -1.125030517578125, -1.040283203125, -0.955535888671875, -0.87078857421875, -0.786041259765625, -0.7012939453125, -0.616546630859375, -0.53179931640625, -0.447052001953125, -0.3623046875, -0.277557373046875, -0.19281005859375, -0.108062744140625, -0.0233154296875, 0.061431884765625, 0.14617919921875, 0.230926513671875, 0.315673828125, 0.400421142578125, 0.48516845703125, 0.569915771484375, 0.6546630859375, 0.739410400390625, 0.82415771484375, 0.908905029296875, 0.99365234375, 1.078399658203125, 1.16314697265625, 1.247894287109375, 1.3326416015625, 1.417388916015625, 1.50213623046875, 1.586883544921875, 1.671630859375, 1.756378173828125, 1.84112548828125, 1.925872802734375, 2.0106201171875, 2.095367431640625, 2.18011474609375, 2.264862060546875, 2.349609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 7.0, 11.0, 18.0, 14.0, 24.0, 41.0, 59.0, 70.0, 103.0, 151.0, 214.0, 388.0, 619.0, 1018.0, 1729.0, 3519.0, 7613.0, 18898.0, 58606.0, 264588.0, 513796.0, 121037.0, 32795.0, 11987.0, 5145.0, 2517.0, 1347.0, 820.0, 488.0, 276.0, 195.0, 129.0, 94.0, 72.0, 39.0, 25.0, 15.0, 25.0, 12.0, 15.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2139892578125, -0.20714378356933594, -0.20029830932617188, -0.1934528350830078, -0.18660736083984375, -0.1797618865966797, -0.17291641235351562, -0.16607093811035156, -0.1592254638671875, -0.15237998962402344, -0.14553451538085938, -0.1386890411376953, -0.13184356689453125, -0.12499809265136719, -0.11815261840820312, -0.11130714416503906, -0.104461669921875, -0.09761619567871094, -0.09077072143554688, -0.08392524719238281, -0.07707977294921875, -0.07023429870605469, -0.06338882446289062, -0.05654335021972656, -0.0496978759765625, -0.04285240173339844, -0.036006927490234375, -0.029161453247070312, -0.02231597900390625, -0.015470504760742188, -0.008625030517578125, -0.0017795562744140625, 0.00506591796875, 0.011911392211914062, 0.018756866455078125, 0.025602340698242188, 0.03244781494140625, 0.03929328918457031, 0.046138763427734375, 0.05298423767089844, 0.0598297119140625, 0.06667518615722656, 0.07352066040039062, 0.08036613464355469, 0.08721160888671875, 0.09405708312988281, 0.10090255737304688, 0.10774803161621094, 0.114593505859375, 0.12143898010253906, 0.12828445434570312, 0.1351299285888672, 0.14197540283203125, 0.1488208770751953, 0.15566635131835938, 0.16251182556152344, 0.1693572998046875, 0.17620277404785156, 0.18304824829101562, 0.1898937225341797, 0.19673919677734375, 0.2035846710205078, 0.21043014526367188, 0.21727561950683594, 0.22412109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 5.0, 4.0, 11.0, 8.0, 12.0, 22.0, 25.0, 42.0, 63.0, 90.0, 130.0, 147.0, 127.0, 100.0, 52.0, 38.0, 32.0, 19.0, 13.0, 10.0, 17.0, 4.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020742416381835938, -0.00020189769566059113, -0.00019637122750282288, -0.00019084475934505463, -0.00018531829118728638, -0.00017979182302951813, -0.00017426535487174988, -0.00016873888671398163, -0.00016321241855621338, -0.00015768595039844513, -0.00015215948224067688, -0.00014663301408290863, -0.00014110654592514038, -0.00013558007776737213, -0.00013005360960960388, -0.00012452714145183563, -0.00011900067329406738, -0.00011347420513629913, -0.00010794773697853088, -0.00010242126882076263, -9.689480066299438e-05, -9.136833250522614e-05, -8.584186434745789e-05, -8.031539618968964e-05, -7.478892803192139e-05, -6.926245987415314e-05, -6.373599171638489e-05, -5.820952355861664e-05, -5.268305540084839e-05, -4.715658724308014e-05, -4.163011908531189e-05, -3.610365092754364e-05, -3.057718276977539e-05, -2.505071461200714e-05, -1.952424645423889e-05, -1.3997778296470642e-05, -8.471310138702393e-06, -2.944841980934143e-06, 2.5816261768341064e-06, 8.108094334602356e-06, 1.3634562492370605e-05, 1.9161030650138855e-05, 2.4687498807907104e-05, 3.0213966965675354e-05, 3.5740435123443604e-05, 4.126690328121185e-05, 4.67933714389801e-05, 5.231983959674835e-05, 5.78463077545166e-05, 6.337277591228485e-05, 6.88992440700531e-05, 7.442571222782135e-05, 7.99521803855896e-05, 8.547864854335785e-05, 9.10051167011261e-05, 9.653158485889435e-05, 0.0001020580530166626, 0.00010758452117443085, 0.0001131109893321991, 0.00011863745748996735, 0.0001241639256477356, 0.00012969039380550385, 0.0001352168619632721, 0.00014074333012104034, 0.0001462697982788086]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 4.0, 4.0, 13.0, 15.0, 12.0, 30.0, 33.0, 47.0, 59.0, 76.0, 109.0, 150.0, 202.0, 330.0, 503.0, 739.0, 1054.0, 1807.0, 2907.0, 4939.0, 8927.0, 18069.0, 42200.0, 119242.0, 369267.0, 311914.0, 95328.0, 35150.0, 15616.0, 7941.0, 4403.0, 2559.0, 1640.0, 998.0, 701.0, 443.0, 309.0, 226.0, 148.0, 113.0, 80.0, 71.0, 44.0, 30.0, 27.0, 23.0, 12.0, 9.0, 10.0, 9.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1715087890625, -0.16613388061523438, -0.16075897216796875, -0.15538406372070312, -0.1500091552734375, -0.14463424682617188, -0.13925933837890625, -0.13388442993164062, -0.128509521484375, -0.12313461303710938, -0.11775970458984375, -0.11238479614257812, -0.1070098876953125, -0.10163497924804688, -0.09626007080078125, -0.09088516235351562, -0.08551025390625, -0.08013534545898438, -0.07476043701171875, -0.06938552856445312, -0.0640106201171875, -0.058635711669921875, -0.05326080322265625, -0.047885894775390625, -0.042510986328125, -0.037136077880859375, -0.03176116943359375, -0.026386260986328125, -0.0210113525390625, -0.015636444091796875, -0.01026153564453125, -0.004886627197265625, 0.00048828125, 0.005863189697265625, 0.01123809814453125, 0.016613006591796875, 0.0219879150390625, 0.027362823486328125, 0.03273773193359375, 0.038112640380859375, 0.043487548828125, 0.048862457275390625, 0.05423736572265625, 0.059612274169921875, 0.0649871826171875, 0.07036209106445312, 0.07573699951171875, 0.08111190795898438, 0.08648681640625, 0.09186172485351562, 0.09723663330078125, 0.10261154174804688, 0.1079864501953125, 0.11336135864257812, 0.11873626708984375, 0.12411117553710938, 0.129486083984375, 0.13486099243164062, 0.14023590087890625, 0.14561080932617188, 0.1509857177734375, 0.15636062622070312, 0.16173553466796875, 0.16711044311523438, 0.1724853515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 5.0, 4.0, 2.0, 7.0, 7.0, 10.0, 22.0, 21.0, 24.0, 32.0, 41.0, 58.0, 86.0, 76.0, 83.0, 111.0, 72.0, 72.0, 52.0, 46.0, 26.0, 29.0, 20.0, 25.0, 13.0, 10.0, 4.0, 8.0, 6.0, 1.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06304931640625, -0.06111574172973633, -0.059182167053222656, -0.057248592376708984, -0.05531501770019531, -0.05338144302368164, -0.05144786834716797, -0.0495142936706543, -0.047580718994140625, -0.04564714431762695, -0.04371356964111328, -0.04177999496459961, -0.03984642028808594, -0.037912845611572266, -0.035979270935058594, -0.03404569625854492, -0.03211212158203125, -0.030178546905517578, -0.028244972229003906, -0.026311397552490234, -0.024377822875976562, -0.02244424819946289, -0.02051067352294922, -0.018577098846435547, -0.016643524169921875, -0.014709949493408203, -0.012776374816894531, -0.01084280014038086, -0.008909225463867188, -0.006975650787353516, -0.005042076110839844, -0.003108501434326172, -0.0011749267578125, 0.0007586479187011719, 0.0026922225952148438, 0.004625797271728516, 0.0065593719482421875, 0.00849294662475586, 0.010426521301269531, 0.012360095977783203, 0.014293670654296875, 0.016227245330810547, 0.01816082000732422, 0.02009439468383789, 0.022027969360351562, 0.023961544036865234, 0.025895118713378906, 0.027828693389892578, 0.02976226806640625, 0.03169584274291992, 0.033629417419433594, 0.035562992095947266, 0.03749656677246094, 0.03943014144897461, 0.04136371612548828, 0.04329729080200195, 0.045230865478515625, 0.0471644401550293, 0.04909801483154297, 0.05103158950805664, 0.05296516418457031, 0.054898738861083984, 0.056832313537597656, 0.05876588821411133, 0.060699462890625]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 7.0, 4.0, 8.0, 7.0, 8.0, 17.0, 24.0, 26.0, 60.0, 58.0, 80.0, 83.0, 91.0, 98.0, 80.0, 72.0, 67.0, 53.0, 37.0, 24.0, 28.0, 18.0, 14.0, 3.0, 8.0, 9.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.9908307790756226, -1.9362215995788574, -1.8816124200820923, -1.8270032405853271, -1.7723939418792725, -1.7177847623825073, -1.6631755828857422, -1.608566403388977, -1.553957223892212, -1.4993480443954468, -1.4447388648986816, -1.390129566192627, -1.3355203866958618, -1.2809112071990967, -1.2263020277023315, -1.1716928482055664, -1.1170835494995117, -1.0624743700027466, -1.0078651905059814, -0.9532559514045715, -0.8986467123031616, -0.8440375328063965, -0.7894283533096313, -0.7348191738128662, -0.6802099347114563, -0.6256007552146912, -0.5709915161132812, -0.5163823366165161, -0.4617731273174286, -0.40716391801834106, -0.3525547385215759, -0.2979455292224884, -0.24333643913269043, -0.1887272298336029, -0.13411803543567657, -0.07950884103775024, -0.02489963173866272, 0.029709577560424805, 0.08431875705718994, 0.13892796635627747, 0.193537175655365, 0.24814638495445251, 0.30275559425354004, 0.3573647737503052, 0.4119739830493927, 0.4665831923484802, 0.5211923718452454, 0.5758016109466553, 0.6304107904434204, 0.6850199699401855, 0.7396292090415955, 0.7942383885383606, 0.8488476276397705, 0.9034568071365356, 0.9580659866333008, 1.012675166130066, 1.067284345626831, 1.1218935251235962, 1.1765027046203613, 1.231112003326416, 1.2857211828231812, 1.3403303623199463, 1.3949395418167114, 1.4495487213134766, 1.5041580200195312]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 5.0, 8.0, 11.0, 14.0, 14.0, 12.0, 24.0, 16.0, 28.0, 22.0, 27.0, 25.0, 31.0, 37.0, 29.0, 30.0, 44.0, 33.0, 43.0, 37.0, 50.0, 38.0, 49.0, 31.0, 31.0, 25.0, 30.0, 35.0, 24.0, 18.0, 25.0, 15.0, 23.0, 11.0, 16.0, 8.0, 11.0, 10.0, 10.0, 6.0, 8.0, 3.0, 7.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0005931854248047, -0.969087541103363, -0.9375819563865662, -0.9060763120651245, -0.8745707273483276, -0.843065083026886, -0.8115594387054443, -0.7800538539886475, -0.7485482692718506, -0.7170426249504089, -0.6855370402336121, -0.6540313959121704, -0.6225258111953735, -0.5910201668739319, -0.5595145225524902, -0.5280089378356934, -0.4965032935142517, -0.46499767899513245, -0.4334920644760132, -0.40198642015457153, -0.37048083543777466, -0.338975191116333, -0.30746957659721375, -0.2759639620780945, -0.24445834755897522, -0.21295273303985596, -0.1814471185207367, -0.14994148910045624, -0.11843587458133698, -0.08693026006221771, -0.055424630641937256, -0.023919016122817993, 0.0075865983963012695, 0.03909221664071083, 0.07059783488512039, 0.10210345685482025, 0.13360907137393951, 0.16511468589305878, 0.19662031531333923, 0.2281259298324585, 0.25963154435157776, 0.291137158870697, 0.3226427733898163, 0.35414838790893555, 0.3856540322303772, 0.4171596169471741, 0.4486652612686157, 0.480170875787735, 0.5116764903068542, 0.5431821346282959, 0.5746877193450928, 0.6061933636665344, 0.6376989483833313, 0.669204592704773, 0.7007101774215698, 0.7322158217430115, 0.7637214660644531, 0.7952271103858948, 0.8267326951026917, 0.8582383394241333, 0.8897439241409302, 0.9212495684623718, 0.9527552127838135, 0.9842607975006104, 1.0157663822174072]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 5.0, 19.0, 11.0, 19.0, 28.0, 35.0, 46.0, 60.0, 67.0, 126.0, 140.0, 213.0, 284.0, 437.0, 638.0, 1016.0, 1466.0, 2525.0, 4302.0, 8760.0, 22613.0, 113992.0, 729505.0, 118474.0, 23475.0, 8687.0, 4270.0, 2582.0, 1539.0, 1036.0, 635.0, 459.0, 292.0, 198.0, 167.0, 106.0, 91.0, 63.0, 38.0, 38.0, 15.0, 19.0, 21.0, 10.0, 12.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.4052734375, -1.3620452880859375, -1.318817138671875, -1.2755889892578125, -1.23236083984375, -1.1891326904296875, -1.145904541015625, -1.1026763916015625, -1.0594482421875, -1.0162200927734375, -0.972991943359375, -0.9297637939453125, -0.88653564453125, -0.8433074951171875, -0.800079345703125, -0.7568511962890625, -0.713623046875, -0.6703948974609375, -0.627166748046875, -0.5839385986328125, -0.54071044921875, -0.4974822998046875, -0.454254150390625, -0.4110260009765625, -0.3677978515625, -0.3245697021484375, -0.281341552734375, -0.2381134033203125, -0.19488525390625, -0.1516571044921875, -0.108428955078125, -0.0652008056640625, -0.02197265625, 0.0212554931640625, 0.064483642578125, 0.1077117919921875, 0.15093994140625, 0.1941680908203125, 0.237396240234375, 0.2806243896484375, 0.3238525390625, 0.3670806884765625, 0.410308837890625, 0.4535369873046875, 0.49676513671875, 0.5399932861328125, 0.583221435546875, 0.6264495849609375, 0.669677734375, 0.7129058837890625, 0.756134033203125, 0.7993621826171875, 0.84259033203125, 0.8858184814453125, 0.929046630859375, 0.9722747802734375, 1.0155029296875, 1.0587310791015625, 1.101959228515625, 1.1451873779296875, 1.18841552734375, 1.2316436767578125, 1.274871826171875, 1.3180999755859375, 1.361328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 2.0, 2.0, 8.0, 9.0, 10.0, 15.0, 22.0, 19.0, 21.0, 22.0, 20.0, 30.0, 28.0, 40.0, 33.0, 39.0, 51.0, 45.0, 40.0, 56.0, 49.0, 62.0, 40.0, 40.0, 34.0, 35.0, 22.0, 23.0, 29.0, 27.0, 23.0, 10.0, 24.0, 13.0, 9.0, 9.0, 10.0, 9.0, 4.0, 6.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3828125, -2.308319091796875, -2.23382568359375, -2.159332275390625, -2.0848388671875, -2.010345458984375, -1.93585205078125, -1.861358642578125, -1.786865234375, -1.712371826171875, -1.63787841796875, -1.563385009765625, -1.4888916015625, -1.414398193359375, -1.33990478515625, -1.265411376953125, -1.19091796875, -1.116424560546875, -1.04193115234375, -0.967437744140625, -0.8929443359375, -0.818450927734375, -0.74395751953125, -0.669464111328125, -0.594970703125, -0.520477294921875, -0.44598388671875, -0.371490478515625, -0.2969970703125, -0.222503662109375, -0.14801025390625, -0.073516845703125, 0.0009765625, 0.075469970703125, 0.14996337890625, 0.224456787109375, 0.2989501953125, 0.373443603515625, 0.44793701171875, 0.522430419921875, 0.596923828125, 0.671417236328125, 0.74591064453125, 0.820404052734375, 0.8948974609375, 0.969390869140625, 1.04388427734375, 1.118377685546875, 1.19287109375, 1.267364501953125, 1.34185791015625, 1.416351318359375, 1.4908447265625, 1.565338134765625, 1.63983154296875, 1.714324951171875, 1.788818359375, 1.863311767578125, 1.93780517578125, 2.012298583984375, 2.0867919921875, 2.161285400390625, 2.23577880859375, 2.310272216796875, 2.384765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 12.0, 11.0, 12.0, 11.0, 18.0, 17.0, 22.0, 19.0, 34.0, 71.0, 79.0, 114.0, 259.0, 774.0, 6273.0, 1024550.0, 14481.0, 1014.0, 303.0, 123.0, 85.0, 46.0, 36.0, 37.0, 24.0, 20.0, 18.0, 14.0, 13.0, 8.0, 8.0, 6.0, 9.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9375, -7.7012939453125, -7.465087890625, -7.2288818359375, -6.99267578125, -6.7564697265625, -6.520263671875, -6.2840576171875, -6.0478515625, -5.8116455078125, -5.575439453125, -5.3392333984375, -5.10302734375, -4.8668212890625, -4.630615234375, -4.3944091796875, -4.158203125, -3.9219970703125, -3.685791015625, -3.4495849609375, -3.21337890625, -2.9771728515625, -2.740966796875, -2.5047607421875, -2.2685546875, -2.0323486328125, -1.796142578125, -1.5599365234375, -1.32373046875, -1.0875244140625, -0.851318359375, -0.6151123046875, -0.37890625, -0.1427001953125, 0.093505859375, 0.3297119140625, 0.56591796875, 0.8021240234375, 1.038330078125, 1.2745361328125, 1.5107421875, 1.7469482421875, 1.983154296875, 2.2193603515625, 2.45556640625, 2.6917724609375, 2.927978515625, 3.1641845703125, 3.400390625, 3.6365966796875, 3.872802734375, 4.1090087890625, 4.34521484375, 4.5814208984375, 4.817626953125, 5.0538330078125, 5.2900390625, 5.5262451171875, 5.762451171875, 5.9986572265625, 6.23486328125, 6.4710693359375, 6.707275390625, 6.9434814453125, 7.1796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 4.0, 11.0, 13.0, 11.0, 8.0, 15.0, 20.0, 15.0, 22.0, 20.0, 35.0, 40.0, 47.0, 55.0, 42.0, 43.0, 47.0, 56.0, 63.0, 47.0, 49.0, 41.0, 40.0, 37.0, 28.0, 34.0, 22.0, 17.0, 26.0, 12.0, 16.0, 10.0, 7.0, 7.0, 4.0, 8.0, 9.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.20703125, -3.116729736328125, -3.02642822265625, -2.936126708984375, -2.8458251953125, -2.755523681640625, -2.66522216796875, -2.574920654296875, -2.484619140625, -2.394317626953125, -2.30401611328125, -2.213714599609375, -2.1234130859375, -2.033111572265625, -1.94281005859375, -1.852508544921875, -1.76220703125, -1.671905517578125, -1.58160400390625, -1.491302490234375, -1.4010009765625, -1.310699462890625, -1.22039794921875, -1.130096435546875, -1.039794921875, -0.949493408203125, -0.85919189453125, -0.768890380859375, -0.6785888671875, -0.588287353515625, -0.49798583984375, -0.407684326171875, -0.3173828125, -0.227081298828125, -0.13677978515625, -0.046478271484375, 0.0438232421875, 0.134124755859375, 0.22442626953125, 0.314727783203125, 0.405029296875, 0.495330810546875, 0.58563232421875, 0.675933837890625, 0.7662353515625, 0.856536865234375, 0.94683837890625, 1.037139892578125, 1.12744140625, 1.217742919921875, 1.30804443359375, 1.398345947265625, 1.4886474609375, 1.578948974609375, 1.66925048828125, 1.759552001953125, 1.849853515625, 1.940155029296875, 2.03045654296875, 2.120758056640625, 2.2110595703125, 2.301361083984375, 2.39166259765625, 2.481964111328125, 2.572265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 13.0, 25.0, 34.0, 74.0, 246.0, 1112.0, 12556.0, 999263.0, 32899.0, 1801.0, 303.0, 103.0, 46.0, 17.0, 16.0, 12.0, 12.0, 3.0, 3.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.73046875, -1.67205810546875, -1.6136474609375, -1.55523681640625, -1.496826171875, -1.43841552734375, -1.3800048828125, -1.32159423828125, -1.26318359375, -1.20477294921875, -1.1463623046875, -1.08795166015625, -1.029541015625, -0.97113037109375, -0.9127197265625, -0.85430908203125, -0.7958984375, -0.73748779296875, -0.6790771484375, -0.62066650390625, -0.562255859375, -0.50384521484375, -0.4454345703125, -0.38702392578125, -0.32861328125, -0.27020263671875, -0.2117919921875, -0.15338134765625, -0.094970703125, -0.03656005859375, 0.0218505859375, 0.08026123046875, 0.138671875, 0.19708251953125, 0.2554931640625, 0.31390380859375, 0.372314453125, 0.43072509765625, 0.4891357421875, 0.54754638671875, 0.60595703125, 0.66436767578125, 0.7227783203125, 0.78118896484375, 0.839599609375, 0.89801025390625, 0.9564208984375, 1.01483154296875, 1.0732421875, 1.13165283203125, 1.1900634765625, 1.24847412109375, 1.306884765625, 1.36529541015625, 1.4237060546875, 1.48211669921875, 1.54052734375, 1.59893798828125, 1.6573486328125, 1.71575927734375, 1.774169921875, 1.83258056640625, 1.8909912109375, 1.94940185546875, 2.0078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 5.0, 3.0, 3.0, 2.0, 12.0, 11.0, 23.0, 30.0, 51.0, 97.0, 216.0, 257.0, 130.0, 70.0, 26.0, 19.0, 11.0, 13.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.212162017822266e-05, -6.886385381221771e-05, -6.560608744621277e-05, -6.234832108020782e-05, -5.909055471420288e-05, -5.583278834819794e-05, -5.257502198219299e-05, -4.931725561618805e-05, -4.6059489250183105e-05, -4.280172288417816e-05, -3.954395651817322e-05, -3.6286190152168274e-05, -3.302842378616333e-05, -2.9770657420158386e-05, -2.6512891054153442e-05, -2.32551246881485e-05, -1.9997358322143555e-05, -1.673959195613861e-05, -1.3481825590133667e-05, -1.0224059224128723e-05, -6.966292858123779e-06, -3.7085264921188354e-06, -4.507601261138916e-07, 2.8070062398910522e-06, 6.064772605895996e-06, 9.32253897190094e-06, 1.2580305337905884e-05, 1.5838071703910828e-05, 1.909583806991577e-05, 2.2353604435920715e-05, 2.561137080192566e-05, 2.8869137167930603e-05, 3.212690353393555e-05, 3.538466989994049e-05, 3.8642436265945435e-05, 4.190020263195038e-05, 4.515796899795532e-05, 4.8415735363960266e-05, 5.167350172996521e-05, 5.4931268095970154e-05, 5.81890344619751e-05, 6.144680082798004e-05, 6.470456719398499e-05, 6.796233355998993e-05, 7.122009992599487e-05, 7.447786629199982e-05, 7.773563265800476e-05, 8.09933990240097e-05, 8.425116539001465e-05, 8.750893175601959e-05, 9.076669812202454e-05, 9.402446448802948e-05, 9.728223085403442e-05, 0.00010053999722003937, 0.00010379776358604431, 0.00010705552995204926, 0.0001103132963180542, 0.00011357106268405914, 0.00011682882905006409, 0.00012008659541606903, 0.00012334436178207397, 0.00012660212814807892, 0.00012985989451408386, 0.0001331176608800888, 0.00013637542724609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 9.0, 13.0, 27.0, 25.0, 64.0, 196.0, 425.0, 1761.0, 10819.0, 376152.0, 642989.0, 13154.0, 1998.0, 526.0, 184.0, 97.0, 41.0, 17.0, 18.0, 9.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.359375, -1.3270416259765625, -1.294708251953125, -1.2623748779296875, -1.23004150390625, -1.1977081298828125, -1.165374755859375, -1.1330413818359375, -1.1007080078125, -1.0683746337890625, -1.036041259765625, -1.0037078857421875, -0.97137451171875, -0.9390411376953125, -0.906707763671875, -0.8743743896484375, -0.842041015625, -0.8097076416015625, -0.777374267578125, -0.7450408935546875, -0.71270751953125, -0.6803741455078125, -0.648040771484375, -0.6157073974609375, -0.5833740234375, -0.5510406494140625, -0.518707275390625, -0.4863739013671875, -0.45404052734375, -0.4217071533203125, -0.389373779296875, -0.3570404052734375, -0.32470703125, -0.2923736572265625, -0.260040283203125, -0.2277069091796875, -0.19537353515625, -0.1630401611328125, -0.130706787109375, -0.0983734130859375, -0.0660400390625, -0.0337066650390625, -0.001373291015625, 0.0309600830078125, 0.06329345703125, 0.0956268310546875, 0.127960205078125, 0.1602935791015625, 0.192626953125, 0.2249603271484375, 0.257293701171875, 0.2896270751953125, 0.32196044921875, 0.3542938232421875, 0.386627197265625, 0.4189605712890625, 0.4512939453125, 0.4836273193359375, 0.515960693359375, 0.5482940673828125, 0.58062744140625, 0.6129608154296875, 0.645294189453125, 0.6776275634765625, 0.7099609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 17.0, 23.0, 24.0, 20.0, 41.0, 75.0, 121.0, 230.0, 174.0, 64.0, 53.0, 40.0, 19.0, 22.0, 17.0, 14.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.201171875, -0.1943645477294922, -0.18755722045898438, -0.18074989318847656, -0.17394256591796875, -0.16713523864746094, -0.16032791137695312, -0.1535205841064453, -0.1467132568359375, -0.1399059295654297, -0.13309860229492188, -0.12629127502441406, -0.11948394775390625, -0.11267662048339844, -0.10586929321289062, -0.09906196594238281, -0.092254638671875, -0.08544731140136719, -0.07863998413085938, -0.07183265686035156, -0.06502532958984375, -0.05821800231933594, -0.051410675048828125, -0.04460334777832031, -0.0377960205078125, -0.030988693237304688, -0.024181365966796875, -0.017374038696289062, -0.01056671142578125, -0.0037593841552734375, 0.003047943115234375, 0.009855270385742188, 0.01666259765625, 0.023469924926757812, 0.030277252197265625, 0.03708457946777344, 0.04389190673828125, 0.05069923400878906, 0.057506561279296875, 0.06431388854980469, 0.0711212158203125, 0.07792854309082031, 0.08473587036132812, 0.09154319763183594, 0.09835052490234375, 0.10515785217285156, 0.11196517944335938, 0.11877250671386719, 0.125579833984375, 0.1323871612548828, 0.13919448852539062, 0.14600181579589844, 0.15280914306640625, 0.15961647033691406, 0.16642379760742188, 0.1732311248779297, 0.1800384521484375, 0.1868457794189453, 0.19365310668945312, 0.20046043395996094, 0.20726776123046875, 0.21407508850097656, 0.22088241577148438, 0.2276897430419922, 0.2344970703125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 27.0, 119.0, 520.0, 285.0, 54.0, 7.0, 3.0], "bins": [-39.530670166015625, -38.8690071105957, -38.20734405517578, -37.545677185058594, -36.88401412963867, -36.22235107421875, -35.56068801879883, -34.899024963378906, -34.23735809326172, -33.5756950378418, -32.914031982421875, -32.25236511230469, -31.590702056884766, -30.929039001464844, -30.26737403869629, -29.605710983276367, -28.944047927856445, -28.282384872436523, -27.62071990966797, -26.959056854248047, -26.297391891479492, -25.63572883605957, -24.974063873291016, -24.312400817871094, -23.650737762451172, -22.98907470703125, -22.327409744262695, -21.665746688842773, -21.00408172607422, -20.342418670654297, -19.680753707885742, -19.01909065246582, -18.3574275970459, -17.695764541625977, -17.034099578857422, -16.3724365234375, -15.710771560668945, -15.049108505249023, -14.387444496154785, -13.725780487060547, -13.064115524291992, -12.402451515197754, -11.740787506103516, -11.079123497009277, -10.417459487915039, -9.755796432495117, -9.094132423400879, -8.43246841430664, -7.7708048820495605, -7.109140872955322, -6.447477340698242, -5.785813331604004, -5.124149322509766, -4.462485313415527, -3.800821542739868, -3.139157772064209, -2.4774937629699707, -1.815829873085022, -1.1541659832000732, -0.4925020933151245, 0.16916179656982422, 0.8308258056640625, 1.4924895763397217, 2.154153347015381, 2.815817356109619]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 10.0, 10.0, 13.0, 9.0, 14.0, 17.0, 27.0, 26.0, 29.0, 28.0, 30.0, 33.0, 35.0, 36.0, 40.0, 46.0, 49.0, 50.0, 50.0, 56.0, 37.0, 40.0, 52.0, 24.0, 32.0, 35.0, 18.0, 21.0, 22.0, 14.0, 22.0, 19.0, 13.0, 8.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1127829551696777, -2.9984607696533203, -2.884138822555542, -2.7698166370391846, -2.655494451522827, -2.541172504425049, -2.4268503189086914, -2.312528133392334, -2.1982059478759766, -2.083883762359619, -1.9695616960525513, -1.8552396297454834, -1.740917444229126, -1.626595377922058, -1.5122733116149902, -1.3979511260986328, -1.283629059791565, -1.169306993484497, -1.0549848079681396, -0.9406627416610718, -0.8263405561447144, -0.7120184898376465, -0.5976963639259338, -0.4833742380142212, -0.36905211210250854, -0.2547299861907959, -0.14040787518024445, -0.026085764169692993, 0.08823636174201965, 0.2025584578514099, 0.31688058376312256, 0.4312027096748352, 0.5455248355865479, 0.6598469614982605, 0.7741690874099731, 0.888491153717041, 1.0028133392333984, 1.1171354055404663, 1.2314574718475342, 1.3457796573638916, 1.460101842880249, 1.574423909187317, 1.6887460947036743, 1.8030681610107422, 1.9173903465270996, 2.031712532043457, 2.1460344791412354, 2.2603566646575928, 2.374678611755371, 2.4890007972717285, 2.603322744369507, 2.7176449298858643, 2.8319671154022217, 2.9462890625, 3.0606112480163574, 3.174933433532715, 3.2892556190490723, 3.4035778045654297, 3.517899751663208, 3.6322219371795654, 3.746544122695923, 3.860866069793701, 3.9751882553100586, 4.089510440826416, 4.203832626342773]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 11.0, 11.0, 30.0, 24.0, 35.0, 38.0, 58.0, 78.0, 118.0, 168.0, 275.0, 429.0, 733.0, 1271.0, 2220.0, 4499.0, 12473.0, 78818.0, 1121400.0, 2696247.0, 237757.0, 24338.0, 6659.0, 2946.0, 1419.0, 774.0, 455.0, 326.0, 198.0, 156.0, 98.0, 59.0, 36.0, 25.0, 22.0, 13.0, 9.0, 7.0, 12.0, 6.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.796875, -3.689056396484375, -3.58123779296875, -3.473419189453125, -3.3656005859375, -3.257781982421875, -3.14996337890625, -3.042144775390625, -2.934326171875, -2.826507568359375, -2.71868896484375, -2.610870361328125, -2.5030517578125, -2.395233154296875, -2.28741455078125, -2.179595947265625, -2.07177734375, -1.963958740234375, -1.85614013671875, -1.748321533203125, -1.6405029296875, -1.532684326171875, -1.42486572265625, -1.317047119140625, -1.209228515625, -1.101409912109375, -0.99359130859375, -0.885772705078125, -0.7779541015625, -0.670135498046875, -0.56231689453125, -0.454498291015625, -0.3466796875, -0.238861083984375, -0.13104248046875, -0.023223876953125, 0.0845947265625, 0.192413330078125, 0.30023193359375, 0.408050537109375, 0.515869140625, 0.623687744140625, 0.73150634765625, 0.839324951171875, 0.9471435546875, 1.054962158203125, 1.16278076171875, 1.270599365234375, 1.37841796875, 1.486236572265625, 1.59405517578125, 1.701873779296875, 1.8096923828125, 1.917510986328125, 2.02532958984375, 2.133148193359375, 2.240966796875, 2.348785400390625, 2.45660400390625, 2.564422607421875, 2.6722412109375, 2.780059814453125, 2.88787841796875, 2.995697021484375, 3.103515625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 0.0, 7.0, 7.0, 3.0, 10.0, 10.0, 8.0, 10.0, 18.0, 21.0, 23.0, 34.0, 27.0, 27.0, 26.0, 44.0, 47.0, 51.0, 50.0, 36.0, 56.0, 41.0, 50.0, 39.0, 49.0, 52.0, 33.0, 42.0, 36.0, 23.0, 20.0, 20.0, 17.0, 20.0, 6.0, 9.0, 6.0, 5.0, 3.0, 5.0, 3.0, 2.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5400390625, -1.4932403564453125, -1.446441650390625, -1.3996429443359375, -1.35284423828125, -1.3060455322265625, -1.259246826171875, -1.2124481201171875, -1.1656494140625, -1.1188507080078125, -1.072052001953125, -1.0252532958984375, -0.97845458984375, -0.9316558837890625, -0.884857177734375, -0.8380584716796875, -0.791259765625, -0.7444610595703125, -0.697662353515625, -0.6508636474609375, -0.60406494140625, -0.5572662353515625, -0.510467529296875, -0.4636688232421875, -0.4168701171875, -0.3700714111328125, -0.323272705078125, -0.2764739990234375, -0.22967529296875, -0.1828765869140625, -0.136077880859375, -0.0892791748046875, -0.04248046875, 0.0043182373046875, 0.051116943359375, 0.0979156494140625, 0.14471435546875, 0.1915130615234375, 0.238311767578125, 0.2851104736328125, 0.3319091796875, 0.3787078857421875, 0.425506591796875, 0.4723052978515625, 0.51910400390625, 0.5659027099609375, 0.612701416015625, 0.6595001220703125, 0.706298828125, 0.7530975341796875, 0.799896240234375, 0.8466949462890625, 0.89349365234375, 0.9402923583984375, 0.987091064453125, 1.0338897705078125, 1.0806884765625, 1.1274871826171875, 1.174285888671875, 1.2210845947265625, 1.26788330078125, 1.3146820068359375, 1.361480712890625, 1.4082794189453125, 1.455078125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 9.0, 7.0, 7.0, 13.0, 12.0, 22.0, 30.0, 61.0, 99.0, 176.0, 313.0, 717.0, 1587.0, 4443.0, 17318.0, 168149.0, 3814817.0, 162101.0, 16936.0, 4436.0, 1530.0, 725.0, 337.0, 165.0, 93.0, 62.0, 34.0, 18.0, 13.0, 15.0, 11.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.765625, -3.628662109375, -3.49169921875, -3.354736328125, -3.2177734375, -3.080810546875, -2.94384765625, -2.806884765625, -2.669921875, -2.532958984375, -2.39599609375, -2.259033203125, -2.1220703125, -1.985107421875, -1.84814453125, -1.711181640625, -1.57421875, -1.437255859375, -1.30029296875, -1.163330078125, -1.0263671875, -0.889404296875, -0.75244140625, -0.615478515625, -0.478515625, -0.341552734375, -0.20458984375, -0.067626953125, 0.0693359375, 0.206298828125, 0.34326171875, 0.480224609375, 0.6171875, 0.754150390625, 0.89111328125, 1.028076171875, 1.1650390625, 1.302001953125, 1.43896484375, 1.575927734375, 1.712890625, 1.849853515625, 1.98681640625, 2.123779296875, 2.2607421875, 2.397705078125, 2.53466796875, 2.671630859375, 2.80859375, 2.945556640625, 3.08251953125, 3.219482421875, 3.3564453125, 3.493408203125, 3.63037109375, 3.767333984375, 3.904296875, 4.041259765625, 4.17822265625, 4.315185546875, 4.4521484375, 4.589111328125, 4.72607421875, 4.863037109375, 5.0]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 3.0, 4.0, 7.0, 11.0, 8.0, 18.0, 22.0, 23.0, 30.0, 61.0, 90.0, 164.0, 304.0, 486.0, 857.0, 817.0, 511.0, 252.0, 142.0, 87.0, 51.0, 28.0, 26.0, 18.0, 12.0, 11.0, 4.0, 9.0, 1.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0556640625, -1.0245361328125, -0.993408203125, -0.9622802734375, -0.93115234375, -0.9000244140625, -0.868896484375, -0.8377685546875, -0.806640625, -0.7755126953125, -0.744384765625, -0.7132568359375, -0.68212890625, -0.6510009765625, -0.619873046875, -0.5887451171875, -0.5576171875, -0.5264892578125, -0.495361328125, -0.4642333984375, -0.43310546875, -0.4019775390625, -0.370849609375, -0.3397216796875, -0.30859375, -0.2774658203125, -0.246337890625, -0.2152099609375, -0.18408203125, -0.1529541015625, -0.121826171875, -0.0906982421875, -0.0595703125, -0.0284423828125, 0.002685546875, 0.0338134765625, 0.06494140625, 0.0960693359375, 0.127197265625, 0.1583251953125, 0.189453125, 0.2205810546875, 0.251708984375, 0.2828369140625, 0.31396484375, 0.3450927734375, 0.376220703125, 0.4073486328125, 0.4384765625, 0.4696044921875, 0.500732421875, 0.5318603515625, 0.56298828125, 0.5941162109375, 0.625244140625, 0.6563720703125, 0.6875, 0.7186279296875, 0.749755859375, 0.7808837890625, 0.81201171875, 0.8431396484375, 0.874267578125, 0.9053955078125, 0.9365234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 4.0, 7.0, 8.0, 15.0, 19.0, 21.0, 43.0, 48.0, 61.0, 78.0, 85.0, 104.0, 107.0, 96.0, 76.0, 63.0, 48.0, 24.0, 23.0, 20.0, 11.0, 5.0, 9.0, 10.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.513014554977417, -3.425304651260376, -3.337594747543335, -3.249885082244873, -3.162175178527832, -3.074465274810791, -2.98675537109375, -2.899045467376709, -2.811335563659668, -2.723625659942627, -2.635915756225586, -2.548205852508545, -2.460496187210083, -2.372786283493042, -2.285076379776001, -2.19736647605896, -2.109656810760498, -2.021946907043457, -1.9342371225357056, -1.8465272188186646, -1.758817434310913, -1.671107530593872, -1.583397626876831, -1.49568772315979, -1.4079779386520386, -1.3202680349349976, -1.232558250427246, -1.144848346710205, -1.057138442993164, -0.9694286584854126, -0.8817187547683716, -0.7940089106559753, -0.706298828125, -0.6185889840126038, -0.5308791399002075, -0.4431692361831665, -0.35545939207077026, -0.267749547958374, -0.180039644241333, -0.09232980012893677, -0.004619956016540527, 0.0830899029970169, 0.17079976201057434, 0.25850963592529297, 0.3462194800376892, 0.43392932415008545, 0.5216392278671265, 0.6093490719795227, 0.697058916091919, 0.7847687602043152, 0.8724786043167114, 0.9601885080337524, 1.047898292541504, 1.135608196258545, 1.223318099975586, 1.311028003692627, 1.3987377882003784, 1.4864476919174194, 1.574157476425171, 1.661867380142212, 1.749577283859253, 1.8372870683670044, 1.9249969720840454, 2.012706756591797, 2.100416660308838]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 4.0, 8.0, 7.0, 11.0, 15.0, 12.0, 18.0, 18.0, 26.0, 29.0, 16.0, 28.0, 29.0, 37.0, 48.0, 30.0, 48.0, 56.0, 46.0, 46.0, 45.0, 45.0, 40.0, 36.0, 52.0, 24.0, 34.0, 24.0, 33.0, 25.0, 21.0, 23.0, 16.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.542176604270935, -1.4889832735061646, -1.435789942741394, -1.3825966119766235, -1.3294031620025635, -1.276209831237793, -1.2230165004730225, -1.169823169708252, -1.1166298389434814, -1.063436508178711, -1.0102431774139404, -0.9570497870445251, -0.9038564562797546, -0.8506631255149841, -0.7974697351455688, -0.7442764043807983, -0.6910830736160278, -0.6378897428512573, -0.5846964120864868, -0.5315030217170715, -0.478309690952301, -0.4251163601875305, -0.3719229996204376, -0.3187296390533447, -0.2655363082885742, -0.21234296262264252, -0.15914961695671082, -0.10595627129077911, -0.05276292562484741, 0.0004304051399230957, 0.05362376570701599, 0.10681712627410889, 0.16001033782958984, 0.21320368349552155, 0.26639702916145325, 0.31959038972854614, 0.37278372049331665, 0.42597705125808716, 0.47917041182518005, 0.532363772392273, 0.5855571031570435, 0.638750433921814, 0.6919437646865845, 0.7451371550559998, 0.7983304858207703, 0.8515238165855408, 0.904717206954956, 0.9579105377197266, 1.011103868484497, 1.0642971992492676, 1.117490530014038, 1.1706838607788086, 1.223877191543579, 1.2770705223083496, 1.3302639722824097, 1.3834573030471802, 1.4366506338119507, 1.4898439645767212, 1.5430372953414917, 1.5962306261062622, 1.6494240760803223, 1.7026174068450928, 1.7558107376098633, 1.8090040683746338, 1.8621973991394043]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 3.0, 4.0, 8.0, 6.0, 20.0, 31.0, 30.0, 65.0, 82.0, 170.0, 354.0, 782.0, 1770.0, 4779.0, 13552.0, 44733.0, 241386.0, 604829.0, 97617.0, 24599.0, 8344.0, 3036.0, 1204.0, 568.0, 238.0, 124.0, 72.0, 28.0, 20.0, 21.0, 14.0, 6.0, 7.0, 8.0, 5.0, 5.0, 6.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1376953125, -1.1024322509765625, -1.067169189453125, -1.0319061279296875, -0.99664306640625, -0.9613800048828125, -0.926116943359375, -0.8908538818359375, -0.8555908203125, -0.8203277587890625, -0.785064697265625, -0.7498016357421875, -0.71453857421875, -0.6792755126953125, -0.644012451171875, -0.6087493896484375, -0.573486328125, -0.5382232666015625, -0.502960205078125, -0.4676971435546875, -0.43243408203125, -0.3971710205078125, -0.361907958984375, -0.3266448974609375, -0.2913818359375, -0.2561187744140625, -0.220855712890625, -0.1855926513671875, -0.15032958984375, -0.1150665283203125, -0.079803466796875, -0.0445404052734375, -0.00927734375, 0.0259857177734375, 0.061248779296875, 0.0965118408203125, 0.13177490234375, 0.1670379638671875, 0.202301025390625, 0.2375640869140625, 0.2728271484375, 0.3080902099609375, 0.343353271484375, 0.3786163330078125, 0.41387939453125, 0.4491424560546875, 0.484405517578125, 0.5196685791015625, 0.554931640625, 0.5901947021484375, 0.625457763671875, 0.6607208251953125, 0.69598388671875, 0.7312469482421875, 0.766510009765625, 0.8017730712890625, 0.8370361328125, 0.8722991943359375, 0.907562255859375, 0.9428253173828125, 0.97808837890625, 1.0133514404296875, 1.048614501953125, 1.0838775634765625, 1.119140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 10.0, 15.0, 16.0, 23.0, 31.0, 28.0, 39.0, 58.0, 60.0, 69.0, 67.0, 98.0, 88.0, 68.0, 75.0, 58.0, 44.0, 44.0, 37.0, 37.0, 12.0, 7.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -0.9990234375, -0.943359375, -0.8876953125, -0.83203125, -0.7763671875, -0.720703125, -0.6650390625, -0.609375, -0.5537109375, -0.498046875, -0.4423828125, -0.38671875, -0.3310546875, -0.275390625, -0.2197265625, -0.1640625, -0.1083984375, -0.052734375, 0.0029296875, 0.05859375, 0.1142578125, 0.169921875, 0.2255859375, 0.28125, 0.3369140625, 0.392578125, 0.4482421875, 0.50390625, 0.5595703125, 0.615234375, 0.6708984375, 0.7265625, 0.7822265625, 0.837890625, 0.8935546875, 0.94921875, 1.0048828125, 1.060546875, 1.1162109375, 1.171875, 1.2275390625, 1.283203125, 1.3388671875, 1.39453125, 1.4501953125, 1.505859375, 1.5615234375, 1.6171875, 1.6728515625, 1.728515625, 1.7841796875, 1.83984375, 1.8955078125, 1.951171875, 2.0068359375, 2.0625, 2.1181640625, 2.173828125, 2.2294921875, 2.28515625, 2.3408203125, 2.396484375, 2.4521484375, 2.5078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 11.0, 12.0, 9.0, 25.0, 31.0, 49.0, 48.0, 77.0, 125.0, 190.0, 241.0, 402.0, 572.0, 981.0, 1572.0, 2609.0, 4730.0, 8528.0, 16858.0, 35077.0, 81820.0, 225758.0, 386250.0, 161816.0, 62943.0, 27787.0, 13506.0, 6969.0, 3770.0, 2182.0, 1292.0, 802.0, 506.0, 309.0, 212.0, 151.0, 110.0, 59.0, 44.0, 27.0, 27.0, 12.0, 16.0, 10.0, 3.0, 8.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.40283203125, -0.3903770446777344, -0.37792205810546875, -0.3654670715332031, -0.3530120849609375, -0.3405570983886719, -0.32810211181640625, -0.3156471252441406, -0.303192138671875, -0.2907371520996094, -0.27828216552734375, -0.2658271789550781, -0.2533721923828125, -0.24091720581054688, -0.22846221923828125, -0.21600723266601562, -0.20355224609375, -0.19109725952148438, -0.17864227294921875, -0.16618728637695312, -0.1537322998046875, -0.14127731323242188, -0.12882232666015625, -0.11636734008789062, -0.103912353515625, -0.09145736694335938, -0.07900238037109375, -0.06654739379882812, -0.0540924072265625, -0.041637420654296875, -0.02918243408203125, -0.016727447509765625, -0.0042724609375, 0.008182525634765625, 0.02063751220703125, 0.033092498779296875, 0.0455474853515625, 0.058002471923828125, 0.07045745849609375, 0.08291244506835938, 0.095367431640625, 0.10782241821289062, 0.12027740478515625, 0.13273239135742188, 0.1451873779296875, 0.15764236450195312, 0.17009735107421875, 0.18255233764648438, 0.19500732421875, 0.20746231079101562, 0.21991729736328125, 0.23237228393554688, 0.2448272705078125, 0.2572822570800781, 0.26973724365234375, 0.2821922302246094, 0.294647216796875, 0.3071022033691406, 0.31955718994140625, 0.3320121765136719, 0.3444671630859375, 0.3569221496582031, 0.36937713623046875, 0.3818321228027344, 0.394287109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 1.0, 5.0, 4.0, 2.0, 9.0, 15.0, 12.0, 15.0, 26.0, 31.0, 29.0, 44.0, 42.0, 56.0, 54.0, 74.0, 64.0, 70.0, 65.0, 49.0, 62.0, 54.0, 48.0, 26.0, 32.0, 31.0, 24.0, 17.0, 14.0, 5.0, 5.0, 3.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9453125, -1.870819091796875, -1.79632568359375, -1.721832275390625, -1.6473388671875, -1.572845458984375, -1.49835205078125, -1.423858642578125, -1.349365234375, -1.274871826171875, -1.20037841796875, -1.125885009765625, -1.0513916015625, -0.976898193359375, -0.90240478515625, -0.827911376953125, -0.75341796875, -0.678924560546875, -0.60443115234375, -0.529937744140625, -0.4554443359375, -0.380950927734375, -0.30645751953125, -0.231964111328125, -0.157470703125, -0.082977294921875, -0.00848388671875, 0.066009521484375, 0.1405029296875, 0.214996337890625, 0.28948974609375, 0.363983154296875, 0.4384765625, 0.512969970703125, 0.58746337890625, 0.661956787109375, 0.7364501953125, 0.810943603515625, 0.88543701171875, 0.959930419921875, 1.034423828125, 1.108917236328125, 1.18341064453125, 1.257904052734375, 1.3323974609375, 1.406890869140625, 1.48138427734375, 1.555877685546875, 1.63037109375, 1.704864501953125, 1.77935791015625, 1.853851318359375, 1.9283447265625, 2.002838134765625, 2.07733154296875, 2.151824951171875, 2.226318359375, 2.300811767578125, 2.37530517578125, 2.449798583984375, 2.5242919921875, 2.598785400390625, 2.67327880859375, 2.747772216796875, 2.822265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 10.0, 10.0, 19.0, 35.0, 34.0, 40.0, 67.0, 71.0, 120.0, 237.0, 301.0, 617.0, 945.0, 1992.0, 3941.0, 9020.0, 25878.0, 111436.0, 540507.0, 276307.0, 50463.0, 14724.0, 5651.0, 2730.0, 1381.0, 781.0, 454.0, 261.0, 161.0, 87.0, 70.0, 58.0, 34.0, 24.0, 17.0, 17.0, 17.0, 10.0, 6.0, 2.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.18603515625, -0.18017578125, -0.17431640625, -0.16845703125, -0.16259765625, -0.15673828125, -0.15087890625, -0.14501953125, -0.13916015625, -0.13330078125, -0.12744140625, -0.12158203125, -0.11572265625, -0.10986328125, -0.10400390625, -0.09814453125, -0.09228515625, -0.08642578125, -0.08056640625, -0.07470703125, -0.06884765625, -0.06298828125, -0.05712890625, -0.05126953125, -0.04541015625, -0.03955078125, -0.03369140625, -0.02783203125, -0.02197265625, -0.01611328125, -0.01025390625, -0.00439453125, 0.00146484375, 0.00732421875, 0.01318359375, 0.01904296875, 0.02490234375, 0.03076171875, 0.03662109375, 0.04248046875, 0.04833984375, 0.05419921875, 0.06005859375, 0.06591796875, 0.07177734375, 0.07763671875, 0.08349609375, 0.08935546875, 0.09521484375, 0.10107421875, 0.10693359375, 0.11279296875, 0.11865234375, 0.12451171875, 0.13037109375, 0.13623046875, 0.14208984375, 0.14794921875, 0.15380859375, 0.15966796875, 0.16552734375, 0.17138671875, 0.17724609375, 0.18310546875, 0.18896484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 17.0, 14.0, 18.0, 45.0, 33.0, 68.0, 122.0, 143.0, 184.0, 143.0, 65.0, 45.0, 25.0, 21.0, 13.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012826919555664062, -0.00012353435158729553, -0.00011879950761795044, -0.00011406466364860535, -0.00010932981967926025, -0.00010459497570991516, -9.986013174057007e-05, -9.512528777122498e-05, -9.039044380187988e-05, -8.565559983253479e-05, -8.09207558631897e-05, -7.61859118938446e-05, -7.145106792449951e-05, -6.671622395515442e-05, -6.198137998580933e-05, -5.7246536016464233e-05, -5.251169204711914e-05, -4.777684807777405e-05, -4.3042004108428955e-05, -3.830716013908386e-05, -3.357231616973877e-05, -2.8837472200393677e-05, -2.4102628231048584e-05, -1.936778426170349e-05, -1.4632940292358398e-05, -9.898096323013306e-06, -5.163252353668213e-06, -4.284083843231201e-07, 4.306435585021973e-06, 9.041279554367065e-06, 1.3776123523712158e-05, 1.851096749305725e-05, 2.3245811462402344e-05, 2.7980655431747437e-05, 3.271549940109253e-05, 3.745034337043762e-05, 4.2185187339782715e-05, 4.692003130912781e-05, 5.16548752784729e-05, 5.638971924781799e-05, 6.112456321716309e-05, 6.585940718650818e-05, 7.059425115585327e-05, 7.532909512519836e-05, 8.006393909454346e-05, 8.479878306388855e-05, 8.953362703323364e-05, 9.426847100257874e-05, 9.900331497192383e-05, 0.00010373815894126892, 0.00010847300291061401, 0.0001132078468799591, 0.0001179426908493042, 0.0001226775348186493, 0.00012741237878799438, 0.00013214722275733948, 0.00013688206672668457, 0.00014161691069602966, 0.00014635175466537476, 0.00015108659863471985, 0.00015582144260406494, 0.00016055628657341003, 0.00016529113054275513, 0.00017002597451210022, 0.0001747608184814453]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 9.0, 7.0, 7.0, 5.0, 14.0, 16.0, 25.0, 39.0, 48.0, 70.0, 81.0, 114.0, 189.0, 242.0, 407.0, 574.0, 972.0, 1496.0, 2537.0, 4538.0, 9016.0, 20762.0, 59538.0, 227653.0, 469539.0, 169300.0, 46539.0, 16901.0, 7653.0, 4039.0, 2308.0, 1433.0, 783.0, 514.0, 342.0, 251.0, 176.0, 125.0, 81.0, 52.0, 41.0, 32.0, 24.0, 15.0, 13.0, 8.0, 12.0, 4.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.162353515625, -0.15749168395996094, -0.15262985229492188, -0.1477680206298828, -0.14290618896484375, -0.1380443572998047, -0.13318252563476562, -0.12832069396972656, -0.1234588623046875, -0.11859703063964844, -0.11373519897460938, -0.10887336730957031, -0.10401153564453125, -0.09914970397949219, -0.09428787231445312, -0.08942604064941406, -0.084564208984375, -0.07970237731933594, -0.07484054565429688, -0.06997871398925781, -0.06511688232421875, -0.06025505065917969, -0.055393218994140625, -0.05053138732910156, -0.0456695556640625, -0.04080772399902344, -0.035945892333984375, -0.031084060668945312, -0.02622222900390625, -0.021360397338867188, -0.016498565673828125, -0.011636734008789062, -0.00677490234375, -0.0019130706787109375, 0.002948760986328125, 0.0078105926513671875, 0.01267242431640625, 0.017534255981445312, 0.022396087646484375, 0.027257919311523438, 0.0321197509765625, 0.03698158264160156, 0.041843414306640625, 0.04670524597167969, 0.05156707763671875, 0.05642890930175781, 0.061290740966796875, 0.06615257263183594, 0.071014404296875, 0.07587623596191406, 0.08073806762695312, 0.08559989929199219, 0.09046173095703125, 0.09532356262207031, 0.10018539428710938, 0.10504722595214844, 0.1099090576171875, 0.11477088928222656, 0.11963272094726562, 0.12449455261230469, 0.12935638427734375, 0.1342182159423828, 0.13908004760742188, 0.14394187927246094, 0.1488037109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 1.0, 2.0, 6.0, 7.0, 2.0, 8.0, 5.0, 18.0, 11.0, 29.0, 33.0, 59.0, 56.0, 85.0, 96.0, 106.0, 107.0, 105.0, 66.0, 41.0, 32.0, 32.0, 26.0, 14.0, 7.0, 4.0, 7.0, 4.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051055908203125, -0.049384117126464844, -0.04771232604980469, -0.04604053497314453, -0.044368743896484375, -0.04269695281982422, -0.04102516174316406, -0.039353370666503906, -0.03768157958984375, -0.036009788513183594, -0.03433799743652344, -0.03266620635986328, -0.030994415283203125, -0.02932262420654297, -0.027650833129882812, -0.025979042053222656, -0.0243072509765625, -0.022635459899902344, -0.020963668823242188, -0.01929187774658203, -0.017620086669921875, -0.01594829559326172, -0.014276504516601562, -0.012604713439941406, -0.01093292236328125, -0.009261131286621094, -0.0075893402099609375, -0.005917549133300781, -0.004245758056640625, -0.0025739669799804688, -0.0009021759033203125, 0.0007696151733398438, 0.00244140625, 0.004113197326660156, 0.0057849884033203125, 0.007456779479980469, 0.009128570556640625, 0.010800361633300781, 0.012472152709960938, 0.014143943786621094, 0.01581573486328125, 0.017487525939941406, 0.019159317016601562, 0.02083110809326172, 0.022502899169921875, 0.02417469024658203, 0.025846481323242188, 0.027518272399902344, 0.0291900634765625, 0.030861854553222656, 0.03253364562988281, 0.03420543670654297, 0.035877227783203125, 0.03754901885986328, 0.03922080993652344, 0.040892601013183594, 0.04256439208984375, 0.044236183166503906, 0.04590797424316406, 0.04757976531982422, 0.049251556396484375, 0.05092334747314453, 0.05259513854980469, 0.054266929626464844, 0.055938720703125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 3.0, 8.0, 6.0, 18.0, 13.0, 32.0, 37.0, 55.0, 74.0, 92.0, 125.0, 100.0, 118.0, 96.0, 58.0, 42.0, 33.0, 25.0, 14.0, 8.0, 11.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7162421941757202, -1.6597799062728882, -1.6033176183700562, -1.5468553304672241, -1.490393042564392, -1.43393075466156, -1.377468466758728, -1.321006178855896, -1.264543890953064, -1.208081603050232, -1.1516193151474, -1.0951570272445679, -1.0386947393417358, -0.9822324514389038, -0.9257701635360718, -0.8693078756332397, -0.8128455877304077, -0.7563832998275757, -0.6999210119247437, -0.6434587240219116, -0.5869964361190796, -0.5305341482162476, -0.4740718603134155, -0.4176095724105835, -0.36114728450775146, -0.30468499660491943, -0.2482227087020874, -0.19176042079925537, -0.13529813289642334, -0.07883584499359131, -0.022373557090759277, 0.034088730812072754, 0.09055089950561523, 0.14701318740844727, 0.2034754753112793, 0.25993776321411133, 0.31640005111694336, 0.3728623390197754, 0.4293246269226074, 0.48578691482543945, 0.5422492027282715, 0.5987114906311035, 0.6551737785339355, 0.7116360664367676, 0.7680983543395996, 0.8245606422424316, 0.8810229301452637, 0.9374852180480957, 0.9939475059509277, 1.0504097938537598, 1.1068720817565918, 1.1633343696594238, 1.2197966575622559, 1.276258945465088, 1.33272123336792, 1.389183521270752, 1.445645809173584, 1.502108097076416, 1.558570384979248, 1.61503267288208, 1.671494960784912, 1.7279572486877441, 1.7844195365905762, 1.8408818244934082, 1.8973441123962402]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 13.0, 15.0, 16.0, 23.0, 37.0, 45.0, 39.0, 46.0, 66.0, 81.0, 89.0, 74.0, 68.0, 76.0, 65.0, 55.0, 50.0, 43.0, 26.0, 28.0, 18.0, 5.0, 5.0, 9.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.026350736618042, -0.9734401106834412, -0.9205294847488403, -0.8676189184188843, -0.8147082924842834, -0.7617976665496826, -0.7088870406150818, -0.655976414680481, -0.6030658483505249, -0.5501552224159241, -0.49724462628364563, -0.4443340003490448, -0.39142340421676636, -0.3385127782821655, -0.2856021523475647, -0.23269155621528625, -0.17978090047836304, -0.1268702894449234, -0.07395967096090317, -0.021049052476882935, 0.0318615585565567, 0.08477216958999634, 0.13768279552459717, 0.1905933916568756, 0.24350401759147644, 0.29641464352607727, 0.3493252396583557, 0.40223586559295654, 0.4551464915275574, 0.5080571174621582, 0.5609676837921143, 0.6138783097267151, 0.6667889356613159, 0.7196995615959167, 0.7726101875305176, 0.8255207538604736, 0.8784313797950745, 0.9313420057296753, 0.9842526316642761, 1.037163257598877, 1.090073823928833, 1.142984390258789, 1.1958950757980347, 1.2488056421279907, 1.3017163276672363, 1.3546268939971924, 1.4075374603271484, 1.460448145866394, 1.5133588314056396, 1.5662693977355957, 1.6191800832748413, 1.6720906496047974, 1.725001335144043, 1.777911901473999, 1.830822467803955, 1.8837331533432007, 1.9366437196731567, 1.9895542860031128, 2.0424649715423584, 2.0953755378723145, 2.1482861042022705, 2.2011966705322266, 2.2541074752807617, 2.3070180416107178, 2.359928607940674]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 1.0, 14.0, 10.0, 25.0, 25.0, 28.0, 55.0, 62.0, 94.0, 123.0, 207.0, 265.0, 345.0, 526.0, 822.0, 1146.0, 1768.0, 2706.0, 4422.0, 8017.0, 15830.0, 37824.0, 123136.0, 547042.0, 205484.0, 53515.0, 20599.0, 9617.0, 5356.0, 3164.0, 2034.0, 1326.0, 934.0, 555.0, 426.0, 323.0, 238.0, 142.0, 114.0, 75.0, 52.0, 30.0, 26.0, 17.0, 15.0, 10.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.017578125, -0.985443115234375, -0.95330810546875, -0.921173095703125, -0.8890380859375, -0.856903076171875, -0.82476806640625, -0.792633056640625, -0.760498046875, -0.728363037109375, -0.69622802734375, -0.664093017578125, -0.6319580078125, -0.599822998046875, -0.56768798828125, -0.535552978515625, -0.50341796875, -0.471282958984375, -0.43914794921875, -0.407012939453125, -0.3748779296875, -0.342742919921875, -0.31060791015625, -0.278472900390625, -0.246337890625, -0.214202880859375, -0.18206787109375, -0.149932861328125, -0.1177978515625, -0.085662841796875, -0.05352783203125, -0.021392822265625, 0.0107421875, 0.042877197265625, 0.07501220703125, 0.107147216796875, 0.1392822265625, 0.171417236328125, 0.20355224609375, 0.235687255859375, 0.267822265625, 0.299957275390625, 0.33209228515625, 0.364227294921875, 0.3963623046875, 0.428497314453125, 0.46063232421875, 0.492767333984375, 0.52490234375, 0.557037353515625, 0.58917236328125, 0.621307373046875, 0.6534423828125, 0.685577392578125, 0.71771240234375, 0.749847412109375, 0.781982421875, 0.814117431640625, 0.84625244140625, 0.878387451171875, 0.9105224609375, 0.942657470703125, 0.97479248046875, 1.006927490234375, 1.0390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 14.0, 10.0, 10.0, 22.0, 25.0, 38.0, 41.0, 43.0, 55.0, 69.0, 77.0, 79.0, 86.0, 67.0, 90.0, 67.0, 52.0, 43.0, 34.0, 29.0, 16.0, 10.0, 10.0, 5.0, 7.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28515625, -2.18115234375, -2.0771484375, -1.97314453125, -1.869140625, -1.76513671875, -1.6611328125, -1.55712890625, -1.453125, -1.34912109375, -1.2451171875, -1.14111328125, -1.037109375, -0.93310546875, -0.8291015625, -0.72509765625, -0.62109375, -0.51708984375, -0.4130859375, -0.30908203125, -0.205078125, -0.10107421875, 0.0029296875, 0.10693359375, 0.2109375, 0.31494140625, 0.4189453125, 0.52294921875, 0.626953125, 0.73095703125, 0.8349609375, 0.93896484375, 1.04296875, 1.14697265625, 1.2509765625, 1.35498046875, 1.458984375, 1.56298828125, 1.6669921875, 1.77099609375, 1.875, 1.97900390625, 2.0830078125, 2.18701171875, 2.291015625, 2.39501953125, 2.4990234375, 2.60302734375, 2.70703125, 2.81103515625, 2.9150390625, 3.01904296875, 3.123046875, 3.22705078125, 3.3310546875, 3.43505859375, 3.5390625, 3.64306640625, 3.7470703125, 3.85107421875, 3.955078125, 4.05908203125, 4.1630859375, 4.26708984375, 4.37109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 3.0, 7.0, 11.0, 8.0, 12.0, 17.0, 18.0, 21.0, 24.0, 31.0, 40.0, 39.0, 45.0, 88.0, 119.0, 636.0, 8420.0, 994516.0, 42276.0, 1603.0, 205.0, 77.0, 52.0, 47.0, 48.0, 25.0, 35.0, 18.0, 11.0, 17.0, 17.0, 14.0, 13.0, 12.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-8.3515625, -8.10382080078125, -7.8560791015625, -7.60833740234375, -7.360595703125, -7.11285400390625, -6.8651123046875, -6.61737060546875, -6.36962890625, -6.12188720703125, -5.8741455078125, -5.62640380859375, -5.378662109375, -5.13092041015625, -4.8831787109375, -4.63543701171875, -4.3876953125, -4.13995361328125, -3.8922119140625, -3.64447021484375, -3.396728515625, -3.14898681640625, -2.9012451171875, -2.65350341796875, -2.40576171875, -2.15802001953125, -1.9102783203125, -1.66253662109375, -1.414794921875, -1.16705322265625, -0.9193115234375, -0.67156982421875, -0.423828125, -0.17608642578125, 0.0716552734375, 0.31939697265625, 0.567138671875, 0.81488037109375, 1.0626220703125, 1.31036376953125, 1.55810546875, 1.80584716796875, 2.0535888671875, 2.30133056640625, 2.549072265625, 2.79681396484375, 3.0445556640625, 3.29229736328125, 3.5400390625, 3.78778076171875, 4.0355224609375, 4.28326416015625, 4.531005859375, 4.77874755859375, 5.0264892578125, 5.27423095703125, 5.52197265625, 5.76971435546875, 6.0174560546875, 6.26519775390625, 6.512939453125, 6.76068115234375, 7.0084228515625, 7.25616455078125, 7.50390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 11.0, 7.0, 12.0, 15.0, 20.0, 22.0, 25.0, 25.0, 32.0, 37.0, 31.0, 50.0, 42.0, 48.0, 46.0, 52.0, 47.0, 51.0, 41.0, 38.0, 38.0, 43.0, 31.0, 36.0, 26.0, 32.0, 22.0, 23.0, 18.0, 19.0, 15.0, 9.0, 8.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.8883056640625, -1.821533203125, -1.7547607421875, -1.68798828125, -1.6212158203125, -1.554443359375, -1.4876708984375, -1.4208984375, -1.3541259765625, -1.287353515625, -1.2205810546875, -1.15380859375, -1.0870361328125, -1.020263671875, -0.9534912109375, -0.88671875, -0.8199462890625, -0.753173828125, -0.6864013671875, -0.61962890625, -0.5528564453125, -0.486083984375, -0.4193115234375, -0.3525390625, -0.2857666015625, -0.218994140625, -0.1522216796875, -0.08544921875, -0.0186767578125, 0.048095703125, 0.1148681640625, 0.181640625, 0.2484130859375, 0.315185546875, 0.3819580078125, 0.44873046875, 0.5155029296875, 0.582275390625, 0.6490478515625, 0.7158203125, 0.7825927734375, 0.849365234375, 0.9161376953125, 0.98291015625, 1.0496826171875, 1.116455078125, 1.1832275390625, 1.25, 1.3167724609375, 1.383544921875, 1.4503173828125, 1.51708984375, 1.5838623046875, 1.650634765625, 1.7174072265625, 1.7841796875, 1.8509521484375, 1.917724609375, 1.9844970703125, 2.05126953125, 2.1180419921875, 2.184814453125, 2.2515869140625, 2.318359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 4.0, 7.0, 3.0, 4.0, 19.0, 30.0, 54.0, 92.0, 172.0, 387.0, 1057.0, 4290.0, 45112.0, 964552.0, 27935.0, 3269.0, 848.0, 345.0, 157.0, 77.0, 45.0, 28.0, 22.0, 15.0, 12.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9736328125, -0.9259796142578125, -0.878326416015625, -0.8306732177734375, -0.78302001953125, -0.7353668212890625, -0.687713623046875, -0.6400604248046875, -0.5924072265625, -0.5447540283203125, -0.497100830078125, -0.4494476318359375, -0.40179443359375, -0.3541412353515625, -0.306488037109375, -0.2588348388671875, -0.211181640625, -0.1635284423828125, -0.115875244140625, -0.0682220458984375, -0.02056884765625, 0.0270843505859375, 0.074737548828125, 0.1223907470703125, 0.1700439453125, 0.2176971435546875, 0.265350341796875, 0.3130035400390625, 0.36065673828125, 0.4083099365234375, 0.455963134765625, 0.5036163330078125, 0.55126953125, 0.5989227294921875, 0.646575927734375, 0.6942291259765625, 0.74188232421875, 0.7895355224609375, 0.837188720703125, 0.8848419189453125, 0.9324951171875, 0.9801483154296875, 1.027801513671875, 1.0754547119140625, 1.12310791015625, 1.1707611083984375, 1.218414306640625, 1.2660675048828125, 1.313720703125, 1.3613739013671875, 1.409027099609375, 1.4566802978515625, 1.50433349609375, 1.5519866943359375, 1.599639892578125, 1.6472930908203125, 1.6949462890625, 1.7425994873046875, 1.790252685546875, 1.8379058837890625, 1.88555908203125, 1.9332122802734375, 1.980865478515625, 2.0285186767578125, 2.076171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 12.0, 27.0, 33.0, 75.0, 151.0, 322.0, 184.0, 88.0, 47.0, 20.0, 7.0, 9.0, 3.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022733211517333984, -0.00022200308740139008, -0.0002166740596294403, -0.00021134503185749054, -0.00020601600408554077, -0.000200686976313591, -0.00019535794854164124, -0.00019002892076969147, -0.0001846998929977417, -0.00017937086522579193, -0.00017404183745384216, -0.0001687128096818924, -0.00016338378190994263, -0.00015805475413799286, -0.0001527257263660431, -0.00014739669859409332, -0.00014206767082214355, -0.0001367386430501938, -0.00013140961527824402, -0.00012608058750629425, -0.00012075155973434448, -0.00011542253196239471, -0.00011009350419044495, -0.00010476447641849518, -9.943544864654541e-05, -9.410642087459564e-05, -8.877739310264587e-05, -8.34483653306961e-05, -7.811933755874634e-05, -7.279030978679657e-05, -6.74612820148468e-05, -6.213225424289703e-05, -5.6803226470947266e-05, -5.14741986989975e-05, -4.614517092704773e-05, -4.081614315509796e-05, -3.548711538314819e-05, -3.0158087611198425e-05, -2.4829059839248657e-05, -1.950003206729889e-05, -1.4171004295349121e-05, -8.841976523399353e-06, -3.512948751449585e-06, 1.816079020500183e-06, 7.145106792449951e-06, 1.247413456439972e-05, 1.7803162336349487e-05, 2.3132190108299255e-05, 2.8461217880249023e-05, 3.379024565219879e-05, 3.911927342414856e-05, 4.444830119609833e-05, 4.9777328968048096e-05, 5.5106356739997864e-05, 6.043538451194763e-05, 6.57644122838974e-05, 7.109344005584717e-05, 7.642246782779694e-05, 8.17514955997467e-05, 8.708052337169647e-05, 9.240955114364624e-05, 9.773857891559601e-05, 0.00010306760668754578, 0.00010839663445949554, 0.00011372566223144531]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 9.0, 5.0, 4.0, 13.0, 20.0, 29.0, 41.0, 86.0, 95.0, 144.0, 244.0, 495.0, 904.0, 1809.0, 4231.0, 13512.0, 101330.0, 818044.0, 86986.0, 12631.0, 4084.0, 1754.0, 853.0, 499.0, 259.0, 169.0, 94.0, 56.0, 46.0, 29.0, 24.0, 21.0, 13.0, 10.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.849609375, -0.8242263793945312, -0.7988433837890625, -0.7734603881835938, -0.748077392578125, -0.7226943969726562, -0.6973114013671875, -0.6719284057617188, -0.64654541015625, -0.6211624145507812, -0.5957794189453125, -0.5703964233398438, -0.545013427734375, -0.5196304321289062, -0.4942474365234375, -0.46886444091796875, -0.4434814453125, -0.41809844970703125, -0.3927154541015625, -0.36733245849609375, -0.341949462890625, -0.31656646728515625, -0.2911834716796875, -0.26580047607421875, -0.24041748046875, -0.21503448486328125, -0.1896514892578125, -0.16426849365234375, -0.138885498046875, -0.11350250244140625, -0.0881195068359375, -0.06273651123046875, -0.037353515625, -0.01197052001953125, 0.0134124755859375, 0.03879547119140625, 0.064178466796875, 0.08956146240234375, 0.1149444580078125, 0.14032745361328125, 0.16571044921875, 0.19109344482421875, 0.2164764404296875, 0.24185943603515625, 0.267242431640625, 0.29262542724609375, 0.3180084228515625, 0.34339141845703125, 0.3687744140625, 0.39415740966796875, 0.4195404052734375, 0.44492340087890625, 0.470306396484375, 0.49568939208984375, 0.5210723876953125, 0.5464553833007812, 0.57183837890625, 0.5972213745117188, 0.6226043701171875, 0.6479873657226562, 0.673370361328125, 0.6987533569335938, 0.7241363525390625, 0.7495193481445312, 0.77490234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 19.0, 33.0, 58.0, 118.0, 143.0, 235.0, 137.0, 101.0, 62.0, 34.0, 15.0, 12.0, 7.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4111328125, -0.39762115478515625, -0.3841094970703125, -0.37059783935546875, -0.357086181640625, -0.34357452392578125, -0.3300628662109375, -0.31655120849609375, -0.30303955078125, -0.28952789306640625, -0.2760162353515625, -0.26250457763671875, -0.248992919921875, -0.23548126220703125, -0.2219696044921875, -0.20845794677734375, -0.1949462890625, -0.18143463134765625, -0.1679229736328125, -0.15441131591796875, -0.140899658203125, -0.12738800048828125, -0.1138763427734375, -0.10036468505859375, -0.08685302734375, -0.07334136962890625, -0.0598297119140625, -0.04631805419921875, -0.032806396484375, -0.01929473876953125, -0.0057830810546875, 0.00772857666015625, 0.021240234375, 0.03475189208984375, 0.0482635498046875, 0.06177520751953125, 0.075286865234375, 0.08879852294921875, 0.1023101806640625, 0.11582183837890625, 0.12933349609375, 0.14284515380859375, 0.1563568115234375, 0.16986846923828125, 0.183380126953125, 0.19689178466796875, 0.2104034423828125, 0.22391510009765625, 0.2374267578125, 0.25093841552734375, 0.2644500732421875, 0.27796173095703125, 0.291473388671875, 0.30498504638671875, 0.3184967041015625, 0.33200836181640625, 0.34552001953125, 0.35903167724609375, 0.3725433349609375, 0.38605499267578125, 0.399566650390625, 0.41307830810546875, 0.4265899658203125, 0.44010162353515625, 0.45361328125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 5.0, 20.0, 47.0, 104.0, 233.0, 313.0, 179.0, 65.0, 24.0, 17.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6970584392547607, -2.3720474243164062, -2.0470364093780518, -1.7220252752304077, -1.3970142602920532, -1.0720032453536987, -0.7469921112060547, -0.4219810962677002, -0.0969700813293457, 0.22804096341133118, 0.5530520081520081, 0.8780630826950073, 1.2030740976333618, 1.5280851125717163, 1.8530962467193604, 2.178107261657715, 2.5031182765960693, 2.828129291534424, 3.1531403064727783, 3.478151321411133, 3.8031625747680664, 4.128173351287842, 4.453184604644775, 4.778195381164551, 5.103206634521484, 5.428217887878418, 5.753228664398193, 6.078239917755127, 6.403250694274902, 6.728261947631836, 7.0532732009887695, 7.378283977508545, 7.703295707702637, 8.02830696105957, 8.353318214416504, 8.678328514099121, 9.003339767456055, 9.328351020812988, 9.653362274169922, 9.978372573852539, 10.303383827209473, 10.628395080566406, 10.95340633392334, 11.278416633605957, 11.60342788696289, 11.928439140319824, 12.253450393676758, 12.578460693359375, 12.903472900390625, 13.228484153747559, 13.553495407104492, 13.87850570678711, 14.203516960144043, 14.528528213500977, 14.85353946685791, 15.178550720214844, 15.503561019897461, 15.828572273254395, 16.153583526611328, 16.478593826293945, 16.803606033325195, 17.128616333007812, 17.45362663269043, 17.77863883972168, 18.103649139404297]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 8.0, 6.0, 9.0, 6.0, 8.0, 18.0, 16.0, 15.0, 23.0, 26.0, 19.0, 39.0, 27.0, 44.0, 55.0, 53.0, 59.0, 42.0, 44.0, 51.0, 59.0, 49.0, 42.0, 47.0, 38.0, 43.0, 28.0, 22.0, 17.0, 23.0, 18.0, 7.0, 13.0, 7.0, 8.0, 4.0, 6.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0049030780792236, -2.897496461868286, -2.7900896072387695, -2.682682991027832, -2.5752763748168945, -2.467869758605957, -2.3604631423950195, -2.253056287765503, -2.1456496715545654, -2.038243055343628, -1.9308363199234009, -1.8234295845031738, -1.7160229682922363, -1.6086163520812988, -1.5012096166610718, -1.3938028812408447, -1.2863962650299072, -1.1789896488189697, -1.0715829133987427, -0.9641762375831604, -0.8567695617675781, -0.7493628859519958, -0.6419562101364136, -0.5345495343208313, -0.427142858505249, -0.31973618268966675, -0.21232950687408447, -0.1049228310585022, 0.002483844757080078, 0.10989052057266235, 0.21729719638824463, 0.3247038722038269, 0.4321105480194092, 0.5395172238349915, 0.6469238996505737, 0.754330575466156, 0.8617372512817383, 0.9691439270973206, 1.0765506029129028, 1.1839573383331299, 1.2913639545440674, 1.3987705707550049, 1.506177306175232, 1.613584041595459, 1.7209906578063965, 1.828397274017334, 1.935804009437561, 2.043210744857788, 2.1506173610687256, 2.258023977279663, 2.3654308319091797, 2.472837448120117, 2.5802440643310547, 2.687650680541992, 2.7950572967529297, 2.9024641513824463, 3.009870767593384, 3.1172773838043213, 3.224684238433838, 3.3320908546447754, 3.439497470855713, 3.5469040870666504, 3.654310703277588, 3.7617175579071045, 3.869124174118042]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 11.0, 12.0, 15.0, 19.0, 24.0, 32.0, 53.0, 77.0, 85.0, 104.0, 142.0, 163.0, 217.0, 251.0, 365.0, 598.0, 906.0, 1427.0, 2432.0, 5175.0, 17227.0, 102406.0, 881280.0, 2528036.0, 563739.0, 67542.0, 11799.0, 4112.0, 2031.0, 1225.0, 758.0, 527.0, 382.0, 302.0, 185.0, 126.0, 91.0, 87.0, 63.0, 53.0, 49.0, 31.0, 24.0, 15.0, 17.0, 15.0, 15.0, 10.0, 7.0, 4.0, 1.0, 8.0, 3.0, 3.0, 3.0, 3.0], "bins": [-2.390625, -2.314483642578125, -2.23834228515625, -2.162200927734375, -2.0860595703125, -2.009918212890625, -1.93377685546875, -1.857635498046875, -1.781494140625, -1.705352783203125, -1.62921142578125, -1.553070068359375, -1.4769287109375, -1.400787353515625, -1.32464599609375, -1.248504638671875, -1.17236328125, -1.096221923828125, -1.02008056640625, -0.943939208984375, -0.8677978515625, -0.791656494140625, -0.71551513671875, -0.639373779296875, -0.563232421875, -0.487091064453125, -0.41094970703125, -0.334808349609375, -0.2586669921875, -0.182525634765625, -0.10638427734375, -0.030242919921875, 0.0458984375, 0.122039794921875, 0.19818115234375, 0.274322509765625, 0.3504638671875, 0.426605224609375, 0.50274658203125, 0.578887939453125, 0.655029296875, 0.731170654296875, 0.80731201171875, 0.883453369140625, 0.9595947265625, 1.035736083984375, 1.11187744140625, 1.188018798828125, 1.26416015625, 1.340301513671875, 1.41644287109375, 1.492584228515625, 1.5687255859375, 1.644866943359375, 1.72100830078125, 1.797149658203125, 1.873291015625, 1.949432373046875, 2.02557373046875, 2.101715087890625, 2.1778564453125, 2.253997802734375, 2.33013916015625, 2.406280517578125, 2.482421875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 8.0, 5.0, 9.0, 11.0, 19.0, 10.0, 16.0, 30.0, 18.0, 18.0, 44.0, 32.0, 38.0, 37.0, 37.0, 38.0, 49.0, 57.0, 40.0, 35.0, 45.0, 52.0, 43.0, 37.0, 34.0, 40.0, 27.0, 25.0, 17.0, 21.0, 20.0, 15.0, 15.0, 11.0, 9.0, 9.0, 7.0, 4.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4345703125, -1.3902435302734375, -1.345916748046875, -1.3015899658203125, -1.25726318359375, -1.2129364013671875, -1.168609619140625, -1.1242828369140625, -1.0799560546875, -1.0356292724609375, -0.991302490234375, -0.9469757080078125, -0.90264892578125, -0.8583221435546875, -0.813995361328125, -0.7696685791015625, -0.725341796875, -0.6810150146484375, -0.636688232421875, -0.5923614501953125, -0.54803466796875, -0.5037078857421875, -0.459381103515625, -0.4150543212890625, -0.3707275390625, -0.3264007568359375, -0.282073974609375, -0.2377471923828125, -0.19342041015625, -0.1490936279296875, -0.104766845703125, -0.0604400634765625, -0.01611328125, 0.0282135009765625, 0.072540283203125, 0.1168670654296875, 0.16119384765625, 0.2055206298828125, 0.249847412109375, 0.2941741943359375, 0.3385009765625, 0.3828277587890625, 0.427154541015625, 0.4714813232421875, 0.51580810546875, 0.5601348876953125, 0.604461669921875, 0.6487884521484375, 0.693115234375, 0.7374420166015625, 0.781768798828125, 0.8260955810546875, 0.87042236328125, 0.9147491455078125, 0.959075927734375, 1.0034027099609375, 1.0477294921875, 1.0920562744140625, 1.136383056640625, 1.1807098388671875, 1.22503662109375, 1.2693634033203125, 1.313690185546875, 1.3580169677734375, 1.40234375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 8.0, 13.0, 20.0, 42.0, 52.0, 138.0, 250.0, 543.0, 1417.0, 4287.0, 18573.0, 195568.0, 3747551.0, 200162.0, 18682.0, 4402.0, 1457.0, 592.0, 240.0, 132.0, 64.0, 42.0, 16.0, 13.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1796875, -4.073883056640625, -3.96807861328125, -3.862274169921875, -3.7564697265625, -3.650665283203125, -3.54486083984375, -3.439056396484375, -3.333251953125, -3.227447509765625, -3.12164306640625, -3.015838623046875, -2.9100341796875, -2.804229736328125, -2.69842529296875, -2.592620849609375, -2.48681640625, -2.381011962890625, -2.27520751953125, -2.169403076171875, -2.0635986328125, -1.957794189453125, -1.85198974609375, -1.746185302734375, -1.640380859375, -1.534576416015625, -1.42877197265625, -1.322967529296875, -1.2171630859375, -1.111358642578125, -1.00555419921875, -0.899749755859375, -0.7939453125, -0.688140869140625, -0.58233642578125, -0.476531982421875, -0.3707275390625, -0.264923095703125, -0.15911865234375, -0.053314208984375, 0.052490234375, 0.158294677734375, 0.26409912109375, 0.369903564453125, 0.4757080078125, 0.581512451171875, 0.68731689453125, 0.793121337890625, 0.89892578125, 1.004730224609375, 1.11053466796875, 1.216339111328125, 1.3221435546875, 1.427947998046875, 1.53375244140625, 1.639556884765625, 1.745361328125, 1.851165771484375, 1.95697021484375, 2.062774658203125, 2.1685791015625, 2.274383544921875, 2.38018798828125, 2.485992431640625, 2.591796875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 6.0, 10.0, 14.0, 19.0, 27.0, 33.0, 54.0, 85.0, 127.0, 248.0, 438.0, 608.0, 751.0, 595.0, 397.0, 222.0, 142.0, 77.0, 65.0, 37.0, 34.0, 16.0, 9.0, 11.0, 11.0, 5.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6650390625, -0.6416778564453125, -0.618316650390625, -0.5949554443359375, -0.57159423828125, -0.5482330322265625, -0.524871826171875, -0.5015106201171875, -0.4781494140625, -0.4547882080078125, -0.431427001953125, -0.4080657958984375, -0.38470458984375, -0.3613433837890625, -0.337982177734375, -0.3146209716796875, -0.291259765625, -0.2678985595703125, -0.244537353515625, -0.2211761474609375, -0.19781494140625, -0.1744537353515625, -0.151092529296875, -0.1277313232421875, -0.1043701171875, -0.0810089111328125, -0.057647705078125, -0.0342864990234375, -0.01092529296875, 0.0124359130859375, 0.035797119140625, 0.0591583251953125, 0.08251953125, 0.1058807373046875, 0.129241943359375, 0.1526031494140625, 0.17596435546875, 0.1993255615234375, 0.222686767578125, 0.2460479736328125, 0.2694091796875, 0.2927703857421875, 0.316131591796875, 0.3394927978515625, 0.36285400390625, 0.3862152099609375, 0.409576416015625, 0.4329376220703125, 0.456298828125, 0.4796600341796875, 0.503021240234375, 0.5263824462890625, 0.54974365234375, 0.5731048583984375, 0.596466064453125, 0.6198272705078125, 0.6431884765625, 0.6665496826171875, 0.689910888671875, 0.7132720947265625, 0.73663330078125, 0.7599945068359375, 0.783355712890625, 0.8067169189453125, 0.830078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 14.0, 9.0, 15.0, 20.0, 24.0, 23.0, 31.0, 39.0, 45.0, 60.0, 64.0, 84.0, 83.0, 74.0, 100.0, 58.0, 53.0, 53.0, 28.0, 24.0, 17.0, 13.0, 11.0, 10.0, 10.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8108224868774414, -1.7480031251907349, -1.6851836442947388, -1.6223642826080322, -1.5595448017120361, -1.4967254400253296, -1.433906078338623, -1.371086597442627, -1.3082672357559204, -1.2454478740692139, -1.1826283931732178, -1.1198090314865112, -1.0569896697998047, -0.9941701889038086, -0.931350827217102, -0.8685314059257507, -0.8057119846343994, -0.7428925633430481, -0.6800731420516968, -0.6172537803649902, -0.5544343590736389, -0.4916149377822876, -0.42879554629325867, -0.36597615480422974, -0.3031567335128784, -0.2403373271226883, -0.17751792073249817, -0.11469851434230804, -0.05187910795211792, 0.010940313339233398, 0.07375970482826233, 0.13657909631729126, 0.19939851760864258, 0.2622179388999939, 0.3250373303890228, 0.38785672187805176, 0.4506761431694031, 0.5134955644607544, 0.5763149261474609, 0.6391343474388123, 0.7019537687301636, 0.7647731900215149, 0.8275926113128662, 0.8904119729995728, 0.9532313942909241, 1.0160508155822754, 1.078870177268982, 1.1416895389556885, 1.2045090198516846, 1.2673283815383911, 1.3301478624343872, 1.3929672241210938, 1.4557867050170898, 1.5186060667037964, 1.581425428390503, 1.644244909286499, 1.7070642709732056, 1.769883632659912, 1.8327031135559082, 1.8955224752426147, 1.9583418369293213, 2.0211613178253174, 2.0839807987213135, 2.1468000411987305, 2.2096195220947266]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 7.0, 4.0, 8.0, 6.0, 10.0, 7.0, 13.0, 10.0, 15.0, 19.0, 10.0, 16.0, 25.0, 39.0, 22.0, 28.0, 41.0, 38.0, 44.0, 45.0, 31.0, 45.0, 38.0, 49.0, 40.0, 37.0, 29.0, 24.0, 37.0, 30.0, 33.0, 35.0, 34.0, 18.0, 16.0, 17.0, 16.0, 11.0, 10.0, 8.0, 4.0, 9.0, 7.0, 1.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.416862964630127, -1.375201940536499, -1.3335410356521606, -1.2918800115585327, -1.2502191066741943, -1.2085580825805664, -1.1668970584869385, -1.1252360343933105, -1.0835751295089722, -1.0419141054153442, -1.0002532005310059, -0.9585921764373779, -0.9169312119483948, -0.8752702474594116, -0.8336092233657837, -0.7919482588768005, -0.7502872943878174, -0.7086263298988342, -0.6669653654098511, -0.6253043413162231, -0.58364337682724, -0.5419824123382568, -0.5003213882446289, -0.45866042375564575, -0.4169994592666626, -0.37533849477767944, -0.3336775004863739, -0.29201650619506836, -0.2503555417060852, -0.20869456231594086, -0.1670335829257965, -0.12537258863449097, -0.08371162414550781, -0.042050644755363464, -0.0003896653652191162, 0.04127131402492523, 0.08293229341506958, 0.12459327280521393, 0.16625425219535828, 0.20791524648666382, 0.24957621097564697, 0.2912371754646301, 0.33289816975593567, 0.3745591640472412, 0.41622012853622437, 0.4578810930252075, 0.49954208731651306, 0.5412030816078186, 0.5828640460968018, 0.6245250105857849, 0.6661859750747681, 0.707846999168396, 0.7495079636573792, 0.7911689281463623, 0.8328299522399902, 0.8744909167289734, 0.9161518812179565, 0.9578128457069397, 0.9994738101959229, 1.0411348342895508, 1.0827958583831787, 1.124456763267517, 1.166117787361145, 1.2077786922454834, 1.2494397163391113]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 13.0, 11.0, 25.0, 33.0, 61.0, 97.0, 241.0, 380.0, 913.0, 1902.0, 4693.0, 12713.0, 54116.0, 734344.0, 201335.0, 24453.0, 7710.0, 2961.0, 1226.0, 626.0, 313.0, 164.0, 75.0, 55.0, 26.0, 22.0, 18.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.29296875, -1.254669189453125, -1.21636962890625, -1.178070068359375, -1.1397705078125, -1.101470947265625, -1.06317138671875, -1.024871826171875, -0.986572265625, -0.948272705078125, -0.90997314453125, -0.871673583984375, -0.8333740234375, -0.795074462890625, -0.75677490234375, -0.718475341796875, -0.68017578125, -0.641876220703125, -0.60357666015625, -0.565277099609375, -0.5269775390625, -0.488677978515625, -0.45037841796875, -0.412078857421875, -0.373779296875, -0.335479736328125, -0.29718017578125, -0.258880615234375, -0.2205810546875, -0.182281494140625, -0.14398193359375, -0.105682373046875, -0.0673828125, -0.029083251953125, 0.00921630859375, 0.047515869140625, 0.0858154296875, 0.124114990234375, 0.16241455078125, 0.200714111328125, 0.239013671875, 0.277313232421875, 0.31561279296875, 0.353912353515625, 0.3922119140625, 0.430511474609375, 0.46881103515625, 0.507110595703125, 0.54541015625, 0.583709716796875, 0.62200927734375, 0.660308837890625, 0.6986083984375, 0.736907958984375, 0.77520751953125, 0.813507080078125, 0.851806640625, 0.890106201171875, 0.92840576171875, 0.966705322265625, 1.0050048828125, 1.043304443359375, 1.08160400390625, 1.119903564453125, 1.158203125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 10.0, 18.0, 11.0, 24.0, 23.0, 33.0, 38.0, 43.0, 60.0, 62.0, 71.0, 66.0, 79.0, 69.0, 50.0, 43.0, 58.0, 35.0, 54.0, 37.0, 28.0, 18.0, 11.0, 13.0, 10.0, 6.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88330078125, -0.8438644409179688, -0.8044281005859375, -0.7649917602539062, -0.725555419921875, -0.6861190795898438, -0.6466827392578125, -0.6072463989257812, -0.56781005859375, -0.5283737182617188, -0.4889373779296875, -0.44950103759765625, -0.410064697265625, -0.37062835693359375, -0.3311920166015625, -0.29175567626953125, -0.2523193359375, -0.21288299560546875, -0.1734466552734375, -0.13401031494140625, -0.094573974609375, -0.05513763427734375, -0.0157012939453125, 0.02373504638671875, 0.06317138671875, 0.10260772705078125, 0.1420440673828125, 0.18148040771484375, 0.220916748046875, 0.26035308837890625, 0.2997894287109375, 0.33922576904296875, 0.378662109375, 0.41809844970703125, 0.4575347900390625, 0.49697113037109375, 0.536407470703125, 0.5758438110351562, 0.6152801513671875, 0.6547164916992188, 0.69415283203125, 0.7335891723632812, 0.7730255126953125, 0.8124618530273438, 0.851898193359375, 0.8913345336914062, 0.9307708740234375, 0.9702072143554688, 1.0096435546875, 1.0490798950195312, 1.0885162353515625, 1.1279525756835938, 1.167388916015625, 1.2068252563476562, 1.2462615966796875, 1.2856979370117188, 1.32513427734375, 1.3645706176757812, 1.4040069580078125, 1.4434432983398438, 1.482879638671875, 1.5223159790039062, 1.5617523193359375, 1.6011886596679688, 1.640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 8.0, 3.0, 6.0, 6.0, 17.0, 20.0, 25.0, 41.0, 65.0, 90.0, 126.0, 201.0, 286.0, 406.0, 656.0, 979.0, 1589.0, 2768.0, 4835.0, 8822.0, 16944.0, 35915.0, 90356.0, 267321.0, 372340.0, 143313.0, 51979.0, 23015.0, 11303.0, 6115.0, 3442.0, 2003.0, 1187.0, 791.0, 511.0, 317.0, 219.0, 165.0, 116.0, 79.0, 63.0, 32.0, 23.0, 22.0, 12.0, 7.0, 10.0, 1.0, 4.0, 1.0, 4.0, 1.0, 2.0], "bins": [-0.31982421875, -0.3107414245605469, -0.30165863037109375, -0.2925758361816406, -0.2834930419921875, -0.2744102478027344, -0.26532745361328125, -0.2562446594238281, -0.247161865234375, -0.23807907104492188, -0.22899627685546875, -0.21991348266601562, -0.2108306884765625, -0.20174789428710938, -0.19266510009765625, -0.18358230590820312, -0.17449951171875, -0.16541671752929688, -0.15633392333984375, -0.14725112915039062, -0.1381683349609375, -0.12908554077148438, -0.12000274658203125, -0.11091995239257812, -0.101837158203125, -0.09275436401367188, -0.08367156982421875, -0.07458877563476562, -0.0655059814453125, -0.056423187255859375, -0.04734039306640625, -0.038257598876953125, -0.0291748046875, -0.020092010498046875, -0.01100921630859375, -0.001926422119140625, 0.0071563720703125, 0.016239166259765625, 0.02532196044921875, 0.034404754638671875, 0.043487548828125, 0.052570343017578125, 0.06165313720703125, 0.07073593139648438, 0.0798187255859375, 0.08890151977539062, 0.09798431396484375, 0.10706710815429688, 0.11614990234375, 0.12523269653320312, 0.13431549072265625, 0.14339828491210938, 0.1524810791015625, 0.16156387329101562, 0.17064666748046875, 0.17972946166992188, 0.188812255859375, 0.19789505004882812, 0.20697784423828125, 0.21606063842773438, 0.2251434326171875, 0.23422622680664062, 0.24330902099609375, 0.2523918151855469, 0.261474609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 9.0, 10.0, 15.0, 8.0, 21.0, 24.0, 30.0, 34.0, 39.0, 41.0, 57.0, 53.0, 38.0, 49.0, 55.0, 63.0, 64.0, 48.0, 39.0, 40.0, 47.0, 44.0, 27.0, 31.0, 31.0, 14.0, 9.0, 9.0, 7.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6396484375, -1.5795440673828125, -1.519439697265625, -1.4593353271484375, -1.39923095703125, -1.3391265869140625, -1.279022216796875, -1.2189178466796875, -1.1588134765625, -1.0987091064453125, -1.038604736328125, -0.9785003662109375, -0.91839599609375, -0.8582916259765625, -0.798187255859375, -0.7380828857421875, -0.677978515625, -0.6178741455078125, -0.557769775390625, -0.4976654052734375, -0.43756103515625, -0.3774566650390625, -0.317352294921875, -0.2572479248046875, -0.1971435546875, -0.1370391845703125, -0.076934814453125, -0.0168304443359375, 0.04327392578125, 0.1033782958984375, 0.163482666015625, 0.2235870361328125, 0.28369140625, 0.3437957763671875, 0.403900146484375, 0.4640045166015625, 0.52410888671875, 0.5842132568359375, 0.644317626953125, 0.7044219970703125, 0.7645263671875, 0.8246307373046875, 0.884735107421875, 0.9448394775390625, 1.00494384765625, 1.0650482177734375, 1.125152587890625, 1.1852569580078125, 1.245361328125, 1.3054656982421875, 1.365570068359375, 1.4256744384765625, 1.48577880859375, 1.5458831787109375, 1.605987548828125, 1.6660919189453125, 1.7261962890625, 1.7863006591796875, 1.846405029296875, 1.9065093994140625, 1.96661376953125, 2.0267181396484375, 2.086822509765625, 2.1469268798828125, 2.20703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 4.0, 6.0, 13.0, 18.0, 28.0, 42.0, 47.0, 70.0, 88.0, 167.0, 283.0, 439.0, 672.0, 1180.0, 2137.0, 3860.0, 7794.0, 16823.0, 41834.0, 124473.0, 361771.0, 319869.0, 102729.0, 34988.0, 14394.0, 6708.0, 3397.0, 1899.0, 1089.0, 663.0, 405.0, 203.0, 156.0, 102.0, 59.0, 41.0, 38.0, 20.0, 9.0, 10.0, 8.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.079833984375, -0.07716560363769531, -0.07449722290039062, -0.07182884216308594, -0.06916046142578125, -0.06649208068847656, -0.06382369995117188, -0.06115531921386719, -0.0584869384765625, -0.05581855773925781, -0.053150177001953125, -0.05048179626464844, -0.04781341552734375, -0.04514503479003906, -0.042476654052734375, -0.03980827331542969, -0.037139892578125, -0.03447151184082031, -0.031803131103515625, -0.029134750366210938, -0.02646636962890625, -0.023797988891601562, -0.021129608154296875, -0.018461227416992188, -0.0157928466796875, -0.013124465942382812, -0.010456085205078125, -0.0077877044677734375, -0.00511932373046875, -0.0024509429931640625, 0.000217437744140625, 0.0028858184814453125, 0.00555419921875, 0.008222579956054688, 0.010890960693359375, 0.013559341430664062, 0.01622772216796875, 0.018896102905273438, 0.021564483642578125, 0.024232864379882812, 0.0269012451171875, 0.029569625854492188, 0.032238006591796875, 0.03490638732910156, 0.03757476806640625, 0.04024314880371094, 0.042911529541015625, 0.04557991027832031, 0.048248291015625, 0.05091667175292969, 0.053585052490234375, 0.05625343322753906, 0.05892181396484375, 0.06159019470214844, 0.06425857543945312, 0.06692695617675781, 0.0695953369140625, 0.07226371765136719, 0.07493209838867188, 0.07760047912597656, 0.08026885986328125, 0.08293724060058594, 0.08560562133789062, 0.08827400207519531, 0.0909423828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 17.0, 15.0, 18.0, 29.0, 51.0, 65.0, 92.0, 114.0, 128.0, 105.0, 95.0, 65.0, 41.0, 30.0, 29.0, 19.0, 12.0, 12.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.176399230957031e-05, -6.942637264728546e-05, -6.708875298500061e-05, -6.475113332271576e-05, -6.241351366043091e-05, -6.007589399814606e-05, -5.7738274335861206e-05, -5.5400654673576355e-05, -5.3063035011291504e-05, -5.072541534900665e-05, -4.83877956867218e-05, -4.605017602443695e-05, -4.37125563621521e-05, -4.137493669986725e-05, -3.90373170375824e-05, -3.6699697375297546e-05, -3.4362077713012695e-05, -3.2024458050727844e-05, -2.9686838388442993e-05, -2.7349218726158142e-05, -2.501159906387329e-05, -2.267397940158844e-05, -2.033635973930359e-05, -1.7998740077018738e-05, -1.5661120414733887e-05, -1.3323500752449036e-05, -1.0985881090164185e-05, -8.648261427879333e-06, -6.310641765594482e-06, -3.973022103309631e-06, -1.6354024410247803e-06, 7.022172212600708e-07, 3.039836883544922e-06, 5.377456545829773e-06, 7.715076208114624e-06, 1.0052695870399475e-05, 1.2390315532684326e-05, 1.4727935194969177e-05, 1.706555485725403e-05, 1.940317451953888e-05, 2.174079418182373e-05, 2.407841384410858e-05, 2.6416033506393433e-05, 2.8753653168678284e-05, 3.1091272830963135e-05, 3.3428892493247986e-05, 3.576651215553284e-05, 3.810413181781769e-05, 4.044175148010254e-05, 4.277937114238739e-05, 4.511699080467224e-05, 4.745461046695709e-05, 4.979223012924194e-05, 5.2129849791526794e-05, 5.4467469453811646e-05, 5.6805089116096497e-05, 5.914270877838135e-05, 6.14803284406662e-05, 6.381794810295105e-05, 6.61555677652359e-05, 6.849318742752075e-05, 7.08308070898056e-05, 7.316842675209045e-05, 7.55060464143753e-05, 7.784366607666016e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 8.0, 4.0, 12.0, 13.0, 19.0, 25.0, 30.0, 68.0, 80.0, 131.0, 194.0, 342.0, 624.0, 1171.0, 2258.0, 4635.0, 10312.0, 27167.0, 92578.0, 389316.0, 382450.0, 90793.0, 26763.0, 10218.0, 4579.0, 2146.0, 1090.0, 623.0, 336.0, 204.0, 119.0, 72.0, 59.0, 29.0, 29.0, 19.0, 12.0, 12.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12103271484375, -0.1171274185180664, -0.11322212219238281, -0.10931682586669922, -0.10541152954101562, -0.10150623321533203, -0.09760093688964844, -0.09369564056396484, -0.08979034423828125, -0.08588504791259766, -0.08197975158691406, -0.07807445526123047, -0.07416915893554688, -0.07026386260986328, -0.06635856628417969, -0.062453269958496094, -0.0585479736328125, -0.054642677307128906, -0.05073738098144531, -0.04683208465576172, -0.042926788330078125, -0.03902149200439453, -0.03511619567871094, -0.031210899353027344, -0.02730560302734375, -0.023400306701660156, -0.019495010375976562, -0.015589714050292969, -0.011684417724609375, -0.007779121398925781, -0.0038738250732421875, 3.147125244140625e-05, 0.003936767578125, 0.007842063903808594, 0.011747360229492188, 0.01565265655517578, 0.019557952880859375, 0.02346324920654297, 0.027368545532226562, 0.031273841857910156, 0.03517913818359375, 0.039084434509277344, 0.04298973083496094, 0.04689502716064453, 0.050800323486328125, 0.05470561981201172, 0.05861091613769531, 0.0625162124633789, 0.0664215087890625, 0.0703268051147461, 0.07423210144042969, 0.07813739776611328, 0.08204269409179688, 0.08594799041748047, 0.08985328674316406, 0.09375858306884766, 0.09766387939453125, 0.10156917572021484, 0.10547447204589844, 0.10937976837158203, 0.11328506469726562, 0.11719036102294922, 0.12109565734863281, 0.1250009536743164, 0.12890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 8.0, 2.0, 8.0, 9.0, 16.0, 7.0, 12.0, 10.0, 18.0, 24.0, 30.0, 33.0, 52.0, 35.0, 49.0, 43.0, 55.0, 63.0, 63.0, 53.0, 54.0, 59.0, 47.0, 38.0, 27.0, 33.0, 23.0, 26.0, 12.0, 14.0, 7.0, 16.0, 11.0, 10.0, 2.0, 7.0, 3.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.025909423828125, -0.025172948837280273, -0.024436473846435547, -0.02369999885559082, -0.022963523864746094, -0.022227048873901367, -0.02149057388305664, -0.020754098892211914, -0.020017623901367188, -0.01928114891052246, -0.018544673919677734, -0.017808198928833008, -0.01707172393798828, -0.016335248947143555, -0.015598773956298828, -0.014862298965454102, -0.014125823974609375, -0.013389348983764648, -0.012652873992919922, -0.011916399002075195, -0.011179924011230469, -0.010443449020385742, -0.009706974029541016, -0.008970499038696289, -0.008234024047851562, -0.007497549057006836, -0.006761074066162109, -0.006024599075317383, -0.005288124084472656, -0.00455164909362793, -0.003815174102783203, -0.0030786991119384766, -0.00234222412109375, -0.0016057491302490234, -0.0008692741394042969, -0.0001327991485595703, 0.0006036758422851562, 0.0013401508331298828, 0.0020766258239746094, 0.002813100814819336, 0.0035495758056640625, 0.004286050796508789, 0.005022525787353516, 0.005759000778198242, 0.006495475769042969, 0.007231950759887695, 0.007968425750732422, 0.008704900741577148, 0.009441375732421875, 0.010177850723266602, 0.010914325714111328, 0.011650800704956055, 0.012387275695800781, 0.013123750686645508, 0.013860225677490234, 0.014596700668334961, 0.015333175659179688, 0.016069650650024414, 0.01680612564086914, 0.017542600631713867, 0.018279075622558594, 0.01901555061340332, 0.019752025604248047, 0.020488500595092773, 0.0212249755859375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 13.0, 15.0, 28.0, 44.0, 51.0, 92.0, 95.0, 124.0, 127.0, 111.0, 96.0, 58.0, 39.0, 26.0, 22.0, 16.0, 3.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1636282205581665, -1.111046314239502, -1.058464527130127, -1.0058826208114624, -0.9533007144927979, -0.9007188677787781, -0.8481370210647583, -0.7955551147460938, -0.742973268032074, -0.6903914213180542, -0.6378095149993896, -0.5852276682853699, -0.5326458215713501, -0.48006391525268555, -0.42748206853866577, -0.3749001920223236, -0.32231831550598145, -0.2697364389896393, -0.2171545773744583, -0.16457271575927734, -0.11199083924293518, -0.05940896272659302, -0.006827116012573242, 0.04575476050376892, 0.09833663702011108, 0.15091851353645325, 0.20350037515163422, 0.2560822367668152, 0.30866411328315735, 0.3612459897994995, 0.4138278365135193, 0.46640971302986145, 0.5189917087554932, 0.5715735554695129, 0.6241554617881775, 0.6767373085021973, 0.7293192148208618, 0.7819010615348816, 0.8344829082489014, 0.8870648145675659, 0.9396466612815857, 0.9922285079956055, 1.04481041431427, 1.0973923206329346, 1.1499741077423096, 1.2025560140609741, 1.2551379203796387, 1.3077197074890137, 1.3603016138076782, 1.4128835201263428, 1.4654653072357178, 1.5180472135543823, 1.5706291198730469, 1.6232109069824219, 1.6757928133010864, 1.728374719619751, 1.780956506729126, 1.8335384130477905, 1.8861202001571655, 1.93870210647583, 1.9912840127944946, 2.043865919113159, 2.096447706222534, 2.149029493331909, 2.2016115188598633]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 12.0, 17.0, 25.0, 15.0, 27.0, 53.0, 53.0, 73.0, 80.0, 86.0, 93.0, 83.0, 68.0, 79.0, 64.0, 59.0, 29.0, 37.0, 8.0, 13.0, 14.0, 9.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8270987868309021, -0.7772533893585205, -0.7274079322814941, -0.6775625348091125, -0.627717137336731, -0.5778717398643494, -0.5280263423919678, -0.4781808853149414, -0.4283354878425598, -0.3784900903701782, -0.32864466309547424, -0.27879923582077026, -0.22895383834838867, -0.1791084259748459, -0.1292630136013031, -0.07941758632659912, -0.02957218885421753, 0.020273223519325256, 0.07011863589286804, 0.11996404826641083, 0.1698094606399536, 0.2196548730134964, 0.2695002853870392, 0.31934571266174316, 0.36919111013412476, 0.41903650760650635, 0.4688819348812103, 0.5187273621559143, 0.5685727596282959, 0.6184181571006775, 0.6682635545730591, 0.7181090116500854, 0.7679543495178223, 0.8177997469902039, 0.8676451444625854, 0.9174906015396118, 0.9673359990119934, 1.017181396484375, 1.0670268535614014, 1.1168723106384277, 1.1667176485061646, 1.216563105583191, 1.2664084434509277, 1.316253900527954, 1.3660993576049805, 1.4159446954727173, 1.4657901525497437, 1.5156354904174805, 1.5654809474945068, 1.6153264045715332, 1.66517174243927, 1.7150171995162964, 1.7648625373840332, 1.8147079944610596, 1.864553451538086, 1.9143989086151123, 1.9642442464828491, 2.014089584350586, 2.0639350414276123, 2.1137804985046387, 2.163625955581665, 2.2134714126586914, 2.2633166313171387, 2.313162088394165, 2.3630075454711914]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 11.0, 8.0, 15.0, 37.0, 33.0, 64.0, 63.0, 100.0, 175.0, 236.0, 476.0, 746.0, 1351.0, 2576.0, 5525.0, 15953.0, 80616.0, 709161.0, 190723.0, 25710.0, 7759.0, 3280.0, 1562.0, 897.0, 512.0, 333.0, 193.0, 133.0, 105.0, 62.0, 43.0, 27.0, 19.0, 9.0, 16.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7099609375, -1.655975341796875, -1.60198974609375, -1.548004150390625, -1.4940185546875, -1.440032958984375, -1.38604736328125, -1.332061767578125, -1.278076171875, -1.224090576171875, -1.17010498046875, -1.116119384765625, -1.0621337890625, -1.008148193359375, -0.95416259765625, -0.900177001953125, -0.84619140625, -0.792205810546875, -0.73822021484375, -0.684234619140625, -0.6302490234375, -0.576263427734375, -0.52227783203125, -0.468292236328125, -0.414306640625, -0.360321044921875, -0.30633544921875, -0.252349853515625, -0.1983642578125, -0.144378662109375, -0.09039306640625, -0.036407470703125, 0.017578125, 0.071563720703125, 0.12554931640625, 0.179534912109375, 0.2335205078125, 0.287506103515625, 0.34149169921875, 0.395477294921875, 0.449462890625, 0.503448486328125, 0.55743408203125, 0.611419677734375, 0.6654052734375, 0.719390869140625, 0.77337646484375, 0.827362060546875, 0.88134765625, 0.935333251953125, 0.98931884765625, 1.043304443359375, 1.0972900390625, 1.151275634765625, 1.20526123046875, 1.259246826171875, 1.313232421875, 1.367218017578125, 1.42120361328125, 1.475189208984375, 1.5291748046875, 1.583160400390625, 1.63714599609375, 1.691131591796875, 1.7451171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 12.0, 14.0, 16.0, 15.0, 23.0, 24.0, 32.0, 57.0, 61.0, 48.0, 61.0, 71.0, 69.0, 54.0, 63.0, 56.0, 64.0, 48.0, 41.0, 41.0, 21.0, 22.0, 23.0, 11.0, 13.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.734375, -1.66424560546875, -1.5941162109375, -1.52398681640625, -1.453857421875, -1.38372802734375, -1.3135986328125, -1.24346923828125, -1.17333984375, -1.10321044921875, -1.0330810546875, -0.96295166015625, -0.892822265625, -0.82269287109375, -0.7525634765625, -0.68243408203125, -0.6123046875, -0.54217529296875, -0.4720458984375, -0.40191650390625, -0.331787109375, -0.26165771484375, -0.1915283203125, -0.12139892578125, -0.05126953125, 0.01885986328125, 0.0889892578125, 0.15911865234375, 0.229248046875, 0.29937744140625, 0.3695068359375, 0.43963623046875, 0.509765625, 0.57989501953125, 0.6500244140625, 0.72015380859375, 0.790283203125, 0.86041259765625, 0.9305419921875, 1.00067138671875, 1.07080078125, 1.14093017578125, 1.2110595703125, 1.28118896484375, 1.351318359375, 1.42144775390625, 1.4915771484375, 1.56170654296875, 1.6318359375, 1.70196533203125, 1.7720947265625, 1.84222412109375, 1.912353515625, 1.98248291015625, 2.0526123046875, 2.12274169921875, 2.19287109375, 2.26300048828125, 2.3331298828125, 2.40325927734375, 2.473388671875, 2.54351806640625, 2.6136474609375, 2.68377685546875, 2.75390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 6.0, 11.0, 8.0, 14.0, 11.0, 16.0, 19.0, 12.0, 20.0, 23.0, 28.0, 30.0, 34.0, 47.0, 64.0, 77.0, 165.0, 593.0, 3780.0, 105108.0, 926682.0, 9995.0, 1109.0, 224.0, 106.0, 54.0, 37.0, 46.0, 34.0, 27.0, 25.0, 31.0, 17.0, 17.0, 16.0, 13.0, 11.0, 10.0, 5.0, 4.0, 5.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.24609375, -4.09552001953125, -3.9449462890625, -3.79437255859375, -3.643798828125, -3.49322509765625, -3.3426513671875, -3.19207763671875, -3.04150390625, -2.89093017578125, -2.7403564453125, -2.58978271484375, -2.439208984375, -2.28863525390625, -2.1380615234375, -1.98748779296875, -1.8369140625, -1.68634033203125, -1.5357666015625, -1.38519287109375, -1.234619140625, -1.08404541015625, -0.9334716796875, -0.78289794921875, -0.63232421875, -0.48175048828125, -0.3311767578125, -0.18060302734375, -0.030029296875, 0.12054443359375, 0.2711181640625, 0.42169189453125, 0.572265625, 0.72283935546875, 0.8734130859375, 1.02398681640625, 1.174560546875, 1.32513427734375, 1.4757080078125, 1.62628173828125, 1.77685546875, 1.92742919921875, 2.0780029296875, 2.22857666015625, 2.379150390625, 2.52972412109375, 2.6802978515625, 2.83087158203125, 2.9814453125, 3.13201904296875, 3.2825927734375, 3.43316650390625, 3.583740234375, 3.73431396484375, 3.8848876953125, 4.03546142578125, 4.18603515625, 4.33660888671875, 4.4871826171875, 4.63775634765625, 4.788330078125, 4.93890380859375, 5.0894775390625, 5.24005126953125, 5.390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 13.0, 7.0, 12.0, 15.0, 18.0, 21.0, 15.0, 16.0, 24.0, 29.0, 35.0, 23.0, 33.0, 35.0, 49.0, 34.0, 34.0, 54.0, 39.0, 54.0, 44.0, 44.0, 46.0, 25.0, 35.0, 29.0, 27.0, 34.0, 24.0, 21.0, 21.0, 26.0, 11.0, 10.0, 10.0, 8.0, 6.0, 4.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.68359375, -1.6319580078125, -1.580322265625, -1.5286865234375, -1.47705078125, -1.4254150390625, -1.373779296875, -1.3221435546875, -1.2705078125, -1.2188720703125, -1.167236328125, -1.1156005859375, -1.06396484375, -1.0123291015625, -0.960693359375, -0.9090576171875, -0.857421875, -0.8057861328125, -0.754150390625, -0.7025146484375, -0.65087890625, -0.5992431640625, -0.547607421875, -0.4959716796875, -0.4443359375, -0.3927001953125, -0.341064453125, -0.2894287109375, -0.23779296875, -0.1861572265625, -0.134521484375, -0.0828857421875, -0.03125, 0.0203857421875, 0.072021484375, 0.1236572265625, 0.17529296875, 0.2269287109375, 0.278564453125, 0.3302001953125, 0.3818359375, 0.4334716796875, 0.485107421875, 0.5367431640625, 0.58837890625, 0.6400146484375, 0.691650390625, 0.7432861328125, 0.794921875, 0.8465576171875, 0.898193359375, 0.9498291015625, 1.00146484375, 1.0531005859375, 1.104736328125, 1.1563720703125, 1.2080078125, 1.2596435546875, 1.311279296875, 1.3629150390625, 1.41455078125, 1.4661865234375, 1.517822265625, 1.5694580078125, 1.62109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 2.0, 6.0, 3.0, 11.0, 22.0, 33.0, 35.0, 51.0, 95.0, 247.0, 493.0, 1152.0, 3497.0, 18253.0, 537929.0, 464536.0, 16715.0, 3413.0, 1100.0, 468.0, 219.0, 109.0, 62.0, 39.0, 31.0, 15.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50634765625, -0.48431396484375, -0.4622802734375, -0.44024658203125, -0.418212890625, -0.39617919921875, -0.3741455078125, -0.35211181640625, -0.330078125, -0.30804443359375, -0.2860107421875, -0.26397705078125, -0.241943359375, -0.21990966796875, -0.1978759765625, -0.17584228515625, -0.15380859375, -0.13177490234375, -0.1097412109375, -0.08770751953125, -0.065673828125, -0.04364013671875, -0.0216064453125, 0.00042724609375, 0.0224609375, 0.04449462890625, 0.0665283203125, 0.08856201171875, 0.110595703125, 0.13262939453125, 0.1546630859375, 0.17669677734375, 0.19873046875, 0.22076416015625, 0.2427978515625, 0.26483154296875, 0.286865234375, 0.30889892578125, 0.3309326171875, 0.35296630859375, 0.375, 0.39703369140625, 0.4190673828125, 0.44110107421875, 0.463134765625, 0.48516845703125, 0.5072021484375, 0.52923583984375, 0.55126953125, 0.57330322265625, 0.5953369140625, 0.61737060546875, 0.639404296875, 0.66143798828125, 0.6834716796875, 0.70550537109375, 0.7275390625, 0.74957275390625, 0.7716064453125, 0.79364013671875, 0.815673828125, 0.83770751953125, 0.8597412109375, 0.88177490234375, 0.90380859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 12.0, 6.0, 20.0, 26.0, 46.0, 89.0, 126.0, 191.0, 198.0, 114.0, 70.0, 33.0, 19.0, 16.0, 6.0, 12.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00012129545211791992, -0.00011854059994220734, -0.00011578574776649475, -0.00011303089559078217, -0.00011027604341506958, -0.000107521191239357, -0.00010476633906364441, -0.00010201148688793182, -9.925663471221924e-05, -9.650178253650665e-05, -9.374693036079407e-05, -9.099207818508148e-05, -8.82372260093689e-05, -8.548237383365631e-05, -8.272752165794373e-05, -7.997266948223114e-05, -7.721781730651855e-05, -7.446296513080597e-05, -7.170811295509338e-05, -6.89532607793808e-05, -6.619840860366821e-05, -6.344355642795563e-05, -6.068870425224304e-05, -5.7933852076530457e-05, -5.517899990081787e-05, -5.2424147725105286e-05, -4.96692955493927e-05, -4.6914443373680115e-05, -4.415959119796753e-05, -4.1404739022254944e-05, -3.864988684654236e-05, -3.589503467082977e-05, -3.314018249511719e-05, -3.0385330319404602e-05, -2.7630478143692017e-05, -2.487562596797943e-05, -2.2120773792266846e-05, -1.936592161655426e-05, -1.6611069440841675e-05, -1.385621726512909e-05, -1.1101365089416504e-05, -8.346512913703918e-06, -5.591660737991333e-06, -2.8368085622787476e-06, -8.195638656616211e-08, 2.6728957891464233e-06, 5.427747964859009e-06, 8.182600140571594e-06, 1.093745231628418e-05, 1.3692304491996765e-05, 1.644715666770935e-05, 1.9202008843421936e-05, 2.195686101913452e-05, 2.4711713194847107e-05, 2.7466565370559692e-05, 3.0221417546272278e-05, 3.297626972198486e-05, 3.573112189769745e-05, 3.8485974073410034e-05, 4.124082624912262e-05, 4.3995678424835205e-05, 4.675053060054779e-05, 4.9505382776260376e-05, 5.226023495197296e-05, 5.501508712768555e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 4.0, 17.0, 6.0, 11.0, 22.0, 39.0, 72.0, 92.0, 192.0, 333.0, 694.0, 1582.0, 3878.0, 12771.0, 79289.0, 786494.0, 137611.0, 17149.0, 4731.0, 1823.0, 841.0, 381.0, 192.0, 106.0, 65.0, 45.0, 27.0, 15.0, 18.0, 13.0, 10.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.52001953125, -0.5030288696289062, -0.4860382080078125, -0.46904754638671875, -0.452056884765625, -0.43506622314453125, -0.4180755615234375, -0.40108489990234375, -0.38409423828125, -0.36710357666015625, -0.3501129150390625, -0.33312225341796875, -0.316131591796875, -0.29914093017578125, -0.2821502685546875, -0.26515960693359375, -0.2481689453125, -0.23117828369140625, -0.2141876220703125, -0.19719696044921875, -0.180206298828125, -0.16321563720703125, -0.1462249755859375, -0.12923431396484375, -0.11224365234375, -0.09525299072265625, -0.0782623291015625, -0.06127166748046875, -0.044281005859375, -0.02729034423828125, -0.0102996826171875, 0.00669097900390625, 0.023681640625, 0.04067230224609375, 0.0576629638671875, 0.07465362548828125, 0.091644287109375, 0.10863494873046875, 0.1256256103515625, 0.14261627197265625, 0.15960693359375, 0.17659759521484375, 0.1935882568359375, 0.21057891845703125, 0.227569580078125, 0.24456024169921875, 0.2615509033203125, 0.27854156494140625, 0.2955322265625, 0.31252288818359375, 0.3295135498046875, 0.34650421142578125, 0.363494873046875, 0.38048553466796875, 0.3974761962890625, 0.41446685791015625, 0.43145751953125, 0.44844818115234375, 0.4654388427734375, 0.48242950439453125, 0.499420166015625, 0.5164108276367188, 0.5334014892578125, 0.5503921508789062, 0.5673828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 10.0, 7.0, 8.0, 21.0, 25.0, 35.0, 35.0, 66.0, 85.0, 119.0, 135.0, 127.0, 96.0, 63.0, 41.0, 35.0, 20.0, 13.0, 12.0, 4.0, 9.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1953125, -0.1896800994873047, -0.18404769897460938, -0.17841529846191406, -0.17278289794921875, -0.16715049743652344, -0.16151809692382812, -0.1558856964111328, -0.1502532958984375, -0.1446208953857422, -0.13898849487304688, -0.13335609436035156, -0.12772369384765625, -0.12209129333496094, -0.11645889282226562, -0.11082649230957031, -0.105194091796875, -0.09956169128417969, -0.09392929077148438, -0.08829689025878906, -0.08266448974609375, -0.07703208923339844, -0.07139968872070312, -0.06576728820800781, -0.0601348876953125, -0.05450248718261719, -0.048870086669921875, -0.04323768615722656, -0.03760528564453125, -0.03197288513183594, -0.026340484619140625, -0.020708084106445312, -0.01507568359375, -0.009443283081054688, -0.003810882568359375, 0.0018215179443359375, 0.00745391845703125, 0.013086318969726562, 0.018718719482421875, 0.024351119995117188, 0.0299835205078125, 0.03561592102050781, 0.041248321533203125, 0.04688072204589844, 0.05251312255859375, 0.05814552307128906, 0.06377792358398438, 0.06941032409667969, 0.075042724609375, 0.08067512512207031, 0.08630752563476562, 0.09193992614746094, 0.09757232666015625, 0.10320472717285156, 0.10883712768554688, 0.11446952819824219, 0.1201019287109375, 0.1257343292236328, 0.13136672973632812, 0.13699913024902344, 0.14263153076171875, 0.14826393127441406, 0.15389633178710938, 0.1595287322998047, 0.1651611328125]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 16.0, 11.0, 13.0, 25.0, 16.0, 34.0, 49.0, 62.0, 85.0, 81.0, 98.0, 102.0, 106.0, 72.0, 54.0, 44.0, 37.0, 29.0, 19.0, 6.0, 7.0, 5.0, 5.0, 6.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2271065711975098, -2.1438546180725098, -2.060602903366089, -1.9773510694503784, -1.894099235534668, -1.810847282409668, -1.7275954484939575, -1.644343614578247, -1.5610917806625366, -1.4778399467468262, -1.3945881128311157, -1.3113362789154053, -1.2280843257904053, -1.1448326110839844, -1.0615806579589844, -0.9783288240432739, -0.8950769901275635, -0.811825156211853, -0.7285733222961426, -0.6453214287757874, -0.5620695948600769, -0.47881776094436646, -0.3955658972263336, -0.3123140335083008, -0.22906219959259033, -0.1458103507757187, -0.06255850195884705, 0.020693346858024597, 0.10394519567489624, 0.1871970295906067, 0.2704488933086395, 0.35370075702667236, 0.4369525909423828, 0.5202044248580933, 0.6034562587738037, 0.6867081522941589, 0.7699599862098694, 0.8532118201255798, 0.9364637136459351, 1.0197155475616455, 1.102967381477356, 1.1862192153930664, 1.2694710493087769, 1.3527228832244873, 1.4359748363494873, 1.5192265510559082, 1.6024785041809082, 1.6857303380966187, 1.768982172012329, 1.8522340059280396, 1.93548583984375, 2.01873779296875, 2.101989507675171, 2.185241460800171, 2.268493175506592, 2.351745128631592, 2.434997081756592, 2.518249034881592, 2.6015007495880127, 2.6847527027130127, 2.7680044174194336, 2.8512563705444336, 2.9345080852508545, 3.0177600383758545, 3.1010117530822754]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 8.0, 9.0, 12.0, 22.0, 21.0, 14.0, 26.0, 23.0, 32.0, 32.0, 39.0, 48.0, 34.0, 47.0, 39.0, 64.0, 41.0, 62.0, 49.0, 37.0, 35.0, 33.0, 35.0, 28.0, 36.0, 25.0, 26.0, 20.0, 19.0, 20.0, 7.0, 8.0, 12.0, 6.0, 1.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.779217481613159, -2.685767650604248, -2.592317819595337, -2.498867988586426, -2.4054181575775146, -2.3119683265686035, -2.2185182571411133, -2.125068426132202, -2.031618595123291, -1.9381687641143799, -1.8447189331054688, -1.7512691020965576, -1.657819151878357, -1.5643693208694458, -1.4709194898605347, -1.377469539642334, -1.2840198278427124, -1.1905699968338013, -1.0971201658248901, -1.0036702156066895, -0.9102203845977783, -0.8167705535888672, -0.723320722579956, -0.6298708319664001, -0.536421000957489, -0.4429711401462555, -0.349521279335022, -0.25607144832611084, -0.16262158751487732, -0.0691717267036438, 0.024278104305267334, 0.11772799491882324, 0.21117782592773438, 0.3046276867389679, 0.3980775475502014, 0.49152737855911255, 0.5849772691726685, 0.6784271001815796, 0.7718769311904907, 0.8653268218040466, 0.9587766528129578, 1.0522265434265137, 1.1456763744354248, 1.239126205444336, 1.332576036453247, 1.4260258674621582, 1.5194756984710693, 1.61292564868927, 1.7063754796981812, 1.7998253107070923, 1.8932751417160034, 1.986725091934204, 2.0801749229431152, 2.1736247539520264, 2.2670745849609375, 2.3605244159698486, 2.4539742469787598, 2.547424077987671, 2.640873908996582, 2.734323740005493, 2.8277735710144043, 2.9212236404418945, 3.0146732330322266, 3.108123302459717, 3.201573133468628]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 6.0, 11.0, 16.0, 35.0, 42.0, 82.0, 105.0, 204.0, 446.0, 940.0, 3120.0, 22146.0, 1122835.0, 2969094.0, 67752.0, 5163.0, 1281.0, 514.0, 221.0, 120.0, 58.0, 36.0, 15.0, 16.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66015625, -5.534820556640625, -5.40948486328125, -5.284149169921875, -5.1588134765625, -5.033477783203125, -4.90814208984375, -4.782806396484375, -4.657470703125, -4.532135009765625, -4.40679931640625, -4.281463623046875, -4.1561279296875, -4.030792236328125, -3.90545654296875, -3.780120849609375, -3.65478515625, -3.529449462890625, -3.40411376953125, -3.278778076171875, -3.1534423828125, -3.028106689453125, -2.90277099609375, -2.777435302734375, -2.652099609375, -2.526763916015625, -2.40142822265625, -2.276092529296875, -2.1507568359375, -2.025421142578125, -1.90008544921875, -1.774749755859375, -1.6494140625, -1.524078369140625, -1.39874267578125, -1.273406982421875, -1.1480712890625, -1.022735595703125, -0.89739990234375, -0.772064208984375, -0.646728515625, -0.521392822265625, -0.39605712890625, -0.270721435546875, -0.1453857421875, -0.020050048828125, 0.10528564453125, 0.230621337890625, 0.35595703125, 0.481292724609375, 0.60662841796875, 0.731964111328125, 0.8572998046875, 0.982635498046875, 1.10797119140625, 1.233306884765625, 1.358642578125, 1.483978271484375, 1.60931396484375, 1.734649658203125, 1.8599853515625, 1.985321044921875, 2.11065673828125, 2.235992431640625, 2.361328125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 7.0, 2.0, 6.0, 8.0, 7.0, 14.0, 15.0, 20.0, 24.0, 17.0, 21.0, 28.0, 41.0, 46.0, 54.0, 44.0, 51.0, 57.0, 64.0, 43.0, 41.0, 46.0, 60.0, 49.0, 35.0, 38.0, 30.0, 24.0, 19.0, 24.0, 16.0, 11.0, 8.0, 11.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.421875, -1.3794708251953125, -1.337066650390625, -1.2946624755859375, -1.25225830078125, -1.2098541259765625, -1.167449951171875, -1.1250457763671875, -1.0826416015625, -1.0402374267578125, -0.997833251953125, -0.9554290771484375, -0.91302490234375, -0.8706207275390625, -0.828216552734375, -0.7858123779296875, -0.743408203125, -0.7010040283203125, -0.658599853515625, -0.6161956787109375, -0.57379150390625, -0.5313873291015625, -0.488983154296875, -0.4465789794921875, -0.4041748046875, -0.3617706298828125, -0.319366455078125, -0.2769622802734375, -0.23455810546875, -0.1921539306640625, -0.149749755859375, -0.1073455810546875, -0.06494140625, -0.0225372314453125, 0.019866943359375, 0.0622711181640625, 0.10467529296875, 0.1470794677734375, 0.189483642578125, 0.2318878173828125, 0.2742919921875, 0.3166961669921875, 0.359100341796875, 0.4015045166015625, 0.44390869140625, 0.4863128662109375, 0.528717041015625, 0.5711212158203125, 0.613525390625, 0.6559295654296875, 0.698333740234375, 0.7407379150390625, 0.78314208984375, 0.8255462646484375, 0.867950439453125, 0.9103546142578125, 0.9527587890625, 0.9951629638671875, 1.037567138671875, 1.0799713134765625, 1.12237548828125, 1.1647796630859375, 1.207183837890625, 1.2495880126953125, 1.2919921875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 8.0, 11.0, 18.0, 25.0, 31.0, 37.0, 64.0, 96.0, 170.0, 307.0, 893.0, 3514.0, 33618.0, 3730756.0, 411355.0, 10470.0, 1757.0, 535.0, 253.0, 126.0, 76.0, 49.0, 37.0, 15.0, 13.0, 15.0, 7.0, 8.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.29071044921875, -4.1673583984375, -4.04400634765625, -3.920654296875, -3.79730224609375, -3.6739501953125, -3.55059814453125, -3.42724609375, -3.30389404296875, -3.1805419921875, -3.05718994140625, -2.933837890625, -2.81048583984375, -2.6871337890625, -2.56378173828125, -2.4404296875, -2.31707763671875, -2.1937255859375, -2.07037353515625, -1.947021484375, -1.82366943359375, -1.7003173828125, -1.57696533203125, -1.45361328125, -1.33026123046875, -1.2069091796875, -1.08355712890625, -0.960205078125, -0.83685302734375, -0.7135009765625, -0.59014892578125, -0.466796875, -0.34344482421875, -0.2200927734375, -0.09674072265625, 0.026611328125, 0.14996337890625, 0.2733154296875, 0.39666748046875, 0.52001953125, 0.64337158203125, 0.7667236328125, 0.89007568359375, 1.013427734375, 1.13677978515625, 1.2601318359375, 1.38348388671875, 1.5068359375, 1.63018798828125, 1.7535400390625, 1.87689208984375, 2.000244140625, 2.12359619140625, 2.2469482421875, 2.37030029296875, 2.49365234375, 2.61700439453125, 2.7403564453125, 2.86370849609375, 2.987060546875, 3.11041259765625, 3.2337646484375, 3.35711669921875, 3.48046875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 12.0, 24.0, 56.0, 111.0, 233.0, 649.0, 1215.0, 979.0, 427.0, 178.0, 91.0, 34.0, 24.0, 9.0, 11.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6552734375, -0.623779296875, -0.59228515625, -0.560791015625, -0.529296875, -0.497802734375, -0.46630859375, -0.434814453125, -0.4033203125, -0.371826171875, -0.34033203125, -0.308837890625, -0.27734375, -0.245849609375, -0.21435546875, -0.182861328125, -0.1513671875, -0.119873046875, -0.08837890625, -0.056884765625, -0.025390625, 0.006103515625, 0.03759765625, 0.069091796875, 0.1005859375, 0.132080078125, 0.16357421875, 0.195068359375, 0.2265625, 0.258056640625, 0.28955078125, 0.321044921875, 0.3525390625, 0.384033203125, 0.41552734375, 0.447021484375, 0.478515625, 0.510009765625, 0.54150390625, 0.572998046875, 0.6044921875, 0.635986328125, 0.66748046875, 0.698974609375, 0.73046875, 0.761962890625, 0.79345703125, 0.824951171875, 0.8564453125, 0.887939453125, 0.91943359375, 0.950927734375, 0.982421875, 1.013916015625, 1.04541015625, 1.076904296875, 1.1083984375, 1.139892578125, 1.17138671875, 1.202880859375, 1.234375, 1.265869140625, 1.29736328125, 1.328857421875, 1.3603515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 5.0, 6.0, 9.0, 10.0, 15.0, 16.0, 20.0, 25.0, 38.0, 31.0, 43.0, 65.0, 69.0, 79.0, 82.0, 94.0, 68.0, 66.0, 65.0, 50.0, 33.0, 22.0, 20.0, 19.0, 8.0, 7.0, 11.0, 5.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7913415431976318, -1.7379173040390015, -1.684493064880371, -1.6310687065124512, -1.5776444673538208, -1.5242202281951904, -1.47079598903656, -1.4173717498779297, -1.3639473915100098, -1.3105231523513794, -1.257098913192749, -1.203674554824829, -1.1502503156661987, -1.0968260765075684, -1.043401837348938, -0.9899775385856628, -0.9365532994270325, -0.8831290602684021, -0.829704761505127, -0.7762805223464966, -0.7228562235832214, -0.6694319844245911, -0.6160076856613159, -0.5625834465026855, -0.5091592073440552, -0.4557349383831024, -0.40231066942214966, -0.3488864302635193, -0.29546213150024414, -0.24203789234161377, -0.188613623380661, -0.13518935441970825, -0.0817650556564331, -0.028340790420770645, 0.025083474814891815, 0.07850773632526398, 0.13193200528621674, 0.1853562593460083, 0.23878052830696106, 0.2922047972679138, 0.3456290662288666, 0.39905333518981934, 0.4524776041507721, 0.5059018731117249, 0.5593261122703552, 0.6127504110336304, 0.6661746501922607, 0.7195988893508911, 0.7730231881141663, 0.8264474272727966, 0.8798717260360718, 0.9332959651947021, 0.9867202639579773, 1.040144443511963, 1.0935688018798828, 1.1469930410385132, 1.2004172801971436, 1.253841519355774, 1.3072657585144043, 1.3606901168823242, 1.4141143560409546, 1.467538595199585, 1.5209628343582153, 1.5743870735168457, 1.6278114318847656]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 4.0, 9.0, 12.0, 10.0, 19.0, 17.0, 10.0, 29.0, 17.0, 22.0, 24.0, 28.0, 32.0, 32.0, 33.0, 37.0, 42.0, 55.0, 52.0, 38.0, 51.0, 39.0, 49.0, 38.0, 33.0, 38.0, 28.0, 30.0, 27.0, 32.0, 24.0, 18.0, 16.0, 6.0, 12.0, 9.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1734586954116821, -1.1348876953125, -1.0963165760040283, -1.0577454566955566, -1.0191744565963745, -0.9806033968925476, -0.9420323371887207, -0.9034612774848938, -0.8648902177810669, -0.82631915807724, -0.7877480983734131, -0.7491770386695862, -0.7106059789657593, -0.6720349192619324, -0.6334638595581055, -0.5948927998542786, -0.5563217401504517, -0.5177506804466248, -0.47917962074279785, -0.44060856103897095, -0.40203750133514404, -0.36346644163131714, -0.32489538192749023, -0.28632432222366333, -0.24775326251983643, -0.20918220281600952, -0.17061114311218262, -0.1320400834083557, -0.09346902370452881, -0.054897964000701904, -0.016326904296875, 0.022244155406951904, 0.06081533432006836, 0.09938639402389526, 0.13795745372772217, 0.17652851343154907, 0.21509957313537598, 0.2536706328392029, 0.2922416925430298, 0.3308127522468567, 0.3693838119506836, 0.4079548716545105, 0.4465259313583374, 0.4850969910621643, 0.5236680507659912, 0.5622391104698181, 0.600810170173645, 0.6393812298774719, 0.6779522895812988, 0.7165233492851257, 0.7550944089889526, 0.7936654686927795, 0.8322365283966064, 0.8708075881004333, 0.9093786478042603, 0.9479497075080872, 0.9865207672119141, 1.0250918865203857, 1.0636628866195679, 1.10223388671875, 1.1408050060272217, 1.1793761253356934, 1.2179471254348755, 1.2565181255340576, 1.2950892448425293]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 11.0, 12.0, 25.0, 13.0, 25.0, 46.0, 66.0, 90.0, 171.0, 290.0, 489.0, 901.0, 1556.0, 3001.0, 6200.0, 13426.0, 32023.0, 80648.0, 219038.0, 369870.0, 195340.0, 72270.0, 28589.0, 12493.0, 5739.0, 2806.0, 1425.0, 789.0, 435.0, 273.0, 156.0, 99.0, 69.0, 58.0, 30.0, 23.0, 8.0, 7.0, 7.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1812744140625, -0.17531967163085938, -0.16936492919921875, -0.16341018676757812, -0.1574554443359375, -0.15150070190429688, -0.14554595947265625, -0.13959121704101562, -0.133636474609375, -0.12768173217773438, -0.12172698974609375, -0.11577224731445312, -0.1098175048828125, -0.10386276245117188, -0.09790802001953125, -0.09195327758789062, -0.08599853515625, -0.08004379272460938, -0.07408905029296875, -0.06813430786132812, -0.0621795654296875, -0.056224822998046875, -0.05027008056640625, -0.044315338134765625, -0.038360595703125, -0.032405853271484375, -0.02645111083984375, -0.020496368408203125, -0.0145416259765625, -0.008586883544921875, -0.00263214111328125, 0.003322601318359375, 0.00927734375, 0.015232086181640625, 0.02118682861328125, 0.027141571044921875, 0.0330963134765625, 0.039051055908203125, 0.04500579833984375, 0.050960540771484375, 0.056915283203125, 0.06287002563476562, 0.06882476806640625, 0.07477951049804688, 0.0807342529296875, 0.08668899536132812, 0.09264373779296875, 0.09859848022460938, 0.10455322265625, 0.11050796508789062, 0.11646270751953125, 0.12241744995117188, 0.1283721923828125, 0.13432693481445312, 0.14028167724609375, 0.14623641967773438, 0.152191162109375, 0.15814590454101562, 0.16410064697265625, 0.17005538940429688, 0.1760101318359375, 0.18196487426757812, 0.18791961669921875, 0.19387435913085938, 0.1998291015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 8.0, 15.0, 10.0, 15.0, 14.0, 17.0, 29.0, 28.0, 30.0, 21.0, 35.0, 41.0, 44.0, 42.0, 36.0, 49.0, 60.0, 49.0, 54.0, 45.0, 53.0, 38.0, 32.0, 30.0, 26.0, 37.0, 23.0, 28.0, 13.0, 15.0, 14.0, 5.0, 5.0, 7.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7978515625, -0.7707443237304688, -0.7436370849609375, -0.7165298461914062, -0.689422607421875, -0.6623153686523438, -0.6352081298828125, -0.6081008911132812, -0.58099365234375, -0.5538864135742188, -0.5267791748046875, -0.49967193603515625, -0.472564697265625, -0.44545745849609375, -0.4183502197265625, -0.39124298095703125, -0.3641357421875, -0.33702850341796875, -0.3099212646484375, -0.28281402587890625, -0.255706787109375, -0.22859954833984375, -0.2014923095703125, -0.17438507080078125, -0.14727783203125, -0.12017059326171875, -0.0930633544921875, -0.06595611572265625, -0.038848876953125, -0.01174163818359375, 0.0153656005859375, 0.04247283935546875, 0.069580078125, 0.09668731689453125, 0.1237945556640625, 0.15090179443359375, 0.178009033203125, 0.20511627197265625, 0.2322235107421875, 0.25933074951171875, 0.28643798828125, 0.31354522705078125, 0.3406524658203125, 0.36775970458984375, 0.394866943359375, 0.42197418212890625, 0.4490814208984375, 0.47618865966796875, 0.5032958984375, 0.5304031372070312, 0.5575103759765625, 0.5846176147460938, 0.611724853515625, 0.6388320922851562, 0.6659393310546875, 0.6930465698242188, 0.72015380859375, 0.7472610473632812, 0.7743682861328125, 0.8014755249023438, 0.828582763671875, 0.8556900024414062, 0.8827972412109375, 0.9099044799804688, 0.93701171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 9.0, 13.0, 15.0, 20.0, 39.0, 59.0, 64.0, 96.0, 149.0, 268.0, 387.0, 676.0, 1217.0, 2180.0, 4355.0, 9050.0, 20123.0, 45847.0, 113247.0, 260336.0, 315118.0, 159519.0, 64608.0, 27087.0, 11961.0, 5618.0, 2838.0, 1500.0, 791.0, 499.0, 282.0, 201.0, 133.0, 69.0, 66.0, 33.0, 25.0, 19.0, 10.0, 12.0, 9.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1536865234375, -0.1487598419189453, -0.14383316040039062, -0.13890647888183594, -0.13397979736328125, -0.12905311584472656, -0.12412643432617188, -0.11919975280761719, -0.1142730712890625, -0.10934638977050781, -0.10441970825195312, -0.09949302673339844, -0.09456634521484375, -0.08963966369628906, -0.08471298217773438, -0.07978630065917969, -0.074859619140625, -0.06993293762207031, -0.06500625610351562, -0.06007957458496094, -0.05515289306640625, -0.05022621154785156, -0.045299530029296875, -0.04037284851074219, -0.0354461669921875, -0.030519485473632812, -0.025592803955078125, -0.020666122436523438, -0.01573944091796875, -0.010812759399414062, -0.005886077880859375, -0.0009593963623046875, 0.00396728515625, 0.008893966674804688, 0.013820648193359375, 0.018747329711914062, 0.02367401123046875, 0.028600692749023438, 0.033527374267578125, 0.03845405578613281, 0.0433807373046875, 0.04830741882324219, 0.053234100341796875, 0.05816078186035156, 0.06308746337890625, 0.06801414489746094, 0.07294082641601562, 0.07786750793457031, 0.082794189453125, 0.08772087097167969, 0.09264755249023438, 0.09757423400878906, 0.10250091552734375, 0.10742759704589844, 0.11235427856445312, 0.11728096008300781, 0.1222076416015625, 0.1271343231201172, 0.13206100463867188, 0.13698768615722656, 0.14191436767578125, 0.14684104919433594, 0.15176773071289062, 0.1566944122314453, 0.16162109375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 7.0, 15.0, 13.0, 15.0, 27.0, 29.0, 42.0, 24.0, 38.0, 48.0, 43.0, 58.0, 64.0, 61.0, 54.0, 53.0, 61.0, 58.0, 47.0, 44.0, 30.0, 24.0, 22.0, 25.0, 16.0, 20.0, 13.0, 6.0, 14.0, 8.0, 5.0, 0.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.93359375, -1.875396728515625, -1.81719970703125, -1.759002685546875, -1.7008056640625, -1.642608642578125, -1.58441162109375, -1.526214599609375, -1.468017578125, -1.409820556640625, -1.35162353515625, -1.293426513671875, -1.2352294921875, -1.177032470703125, -1.11883544921875, -1.060638427734375, -1.00244140625, -0.944244384765625, -0.88604736328125, -0.827850341796875, -0.7696533203125, -0.711456298828125, -0.65325927734375, -0.595062255859375, -0.536865234375, -0.478668212890625, -0.42047119140625, -0.362274169921875, -0.3040771484375, -0.245880126953125, -0.18768310546875, -0.129486083984375, -0.0712890625, -0.013092041015625, 0.04510498046875, 0.103302001953125, 0.1614990234375, 0.219696044921875, 0.27789306640625, 0.336090087890625, 0.394287109375, 0.452484130859375, 0.51068115234375, 0.568878173828125, 0.6270751953125, 0.685272216796875, 0.74346923828125, 0.801666259765625, 0.85986328125, 0.918060302734375, 0.97625732421875, 1.034454345703125, 1.0926513671875, 1.150848388671875, 1.20904541015625, 1.267242431640625, 1.325439453125, 1.383636474609375, 1.44183349609375, 1.500030517578125, 1.5582275390625, 1.616424560546875, 1.67462158203125, 1.732818603515625, 1.791015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 9.0, 7.0, 12.0, 22.0, 40.0, 54.0, 60.0, 110.0, 166.0, 260.0, 499.0, 941.0, 1729.0, 3774.0, 8849.0, 23578.0, 73514.0, 242579.0, 417381.0, 186681.0, 55700.0, 18755.0, 7208.0, 3199.0, 1503.0, 766.0, 448.0, 250.0, 149.0, 101.0, 60.0, 41.0, 30.0, 19.0, 14.0, 13.0, 4.0, 5.0, 5.0, 1.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06231689453125, -0.06033134460449219, -0.058345794677734375, -0.05636024475097656, -0.05437469482421875, -0.05238914489746094, -0.050403594970703125, -0.04841804504394531, -0.0464324951171875, -0.04444694519042969, -0.042461395263671875, -0.04047584533691406, -0.03849029541015625, -0.03650474548339844, -0.034519195556640625, -0.03253364562988281, -0.030548095703125, -0.028562545776367188, -0.026576995849609375, -0.024591445922851562, -0.02260589599609375, -0.020620346069335938, -0.018634796142578125, -0.016649246215820312, -0.0146636962890625, -0.012678146362304688, -0.010692596435546875, -0.008707046508789062, -0.00672149658203125, -0.0047359466552734375, -0.002750396728515625, -0.0007648468017578125, 0.001220703125, 0.0032062530517578125, 0.005191802978515625, 0.0071773529052734375, 0.00916290283203125, 0.011148452758789062, 0.013134002685546875, 0.015119552612304688, 0.0171051025390625, 0.019090652465820312, 0.021076202392578125, 0.023061752319335938, 0.02504730224609375, 0.027032852172851562, 0.029018402099609375, 0.031003952026367188, 0.032989501953125, 0.03497505187988281, 0.036960601806640625, 0.03894615173339844, 0.04093170166015625, 0.04291725158691406, 0.044902801513671875, 0.04688835144042969, 0.0488739013671875, 0.05085945129394531, 0.052845001220703125, 0.05483055114746094, 0.05681610107421875, 0.05880165100097656, 0.060787200927734375, 0.06277275085449219, 0.06475830078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 6.0, 4.0, 2.0, 6.0, 7.0, 12.0, 14.0, 16.0, 24.0, 31.0, 48.0, 54.0, 55.0, 75.0, 86.0, 91.0, 96.0, 76.0, 82.0, 61.0, 30.0, 41.0, 14.0, 14.0, 7.0, 9.0, 12.0, 5.0, 6.0, 7.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8252601623535156e-05, -2.7004629373550415e-05, -2.5756657123565674e-05, -2.4508684873580933e-05, -2.326071262359619e-05, -2.201274037361145e-05, -2.076476812362671e-05, -1.9516795873641968e-05, -1.8268823623657227e-05, -1.7020851373672485e-05, -1.5772879123687744e-05, -1.4524906873703003e-05, -1.3276934623718262e-05, -1.202896237373352e-05, -1.078099012374878e-05, -9.533017873764038e-06, -8.285045623779297e-06, -7.037073373794556e-06, -5.7891011238098145e-06, -4.541128873825073e-06, -3.293156623840332e-06, -2.045184373855591e-06, -7.972121238708496e-07, 4.507601261138916e-07, 1.6987323760986328e-06, 2.946704626083374e-06, 4.194676876068115e-06, 5.4426491260528564e-06, 6.690621376037598e-06, 7.938593626022339e-06, 9.18656587600708e-06, 1.0434538125991821e-05, 1.1682510375976562e-05, 1.2930482625961304e-05, 1.4178454875946045e-05, 1.5426427125930786e-05, 1.6674399375915527e-05, 1.792237162590027e-05, 1.917034387588501e-05, 2.041831612586975e-05, 2.1666288375854492e-05, 2.2914260625839233e-05, 2.4162232875823975e-05, 2.5410205125808716e-05, 2.6658177375793457e-05, 2.7906149625778198e-05, 2.915412187576294e-05, 3.040209412574768e-05, 3.165006637573242e-05, 3.289803862571716e-05, 3.4146010875701904e-05, 3.5393983125686646e-05, 3.664195537567139e-05, 3.788992762565613e-05, 3.913789987564087e-05, 4.038587212562561e-05, 4.163384437561035e-05, 4.288181662559509e-05, 4.4129788875579834e-05, 4.5377761125564575e-05, 4.6625733375549316e-05, 4.787370562553406e-05, 4.91216778755188e-05, 5.036965012550354e-05, 5.161762237548828e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 12.0, 11.0, 7.0, 14.0, 29.0, 36.0, 60.0, 99.0, 164.0, 272.0, 459.0, 1032.0, 2122.0, 5023.0, 13332.0, 38877.0, 126587.0, 364841.0, 332903.0, 109368.0, 33380.0, 11505.0, 4493.0, 1859.0, 894.0, 483.0, 280.0, 173.0, 78.0, 39.0, 25.0, 31.0, 14.0, 16.0, 7.0, 10.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061553955078125, -0.05942678451538086, -0.05729961395263672, -0.05517244338989258, -0.05304527282714844, -0.0509181022644043, -0.048790931701660156, -0.046663761138916016, -0.044536590576171875, -0.042409420013427734, -0.040282249450683594, -0.03815507888793945, -0.03602790832519531, -0.03390073776245117, -0.03177356719970703, -0.02964639663696289, -0.02751922607421875, -0.02539205551147461, -0.02326488494873047, -0.021137714385986328, -0.019010543823242188, -0.016883373260498047, -0.014756202697753906, -0.012629032135009766, -0.010501861572265625, -0.008374691009521484, -0.006247520446777344, -0.004120349884033203, -0.0019931793212890625, 0.00013399124145507812, 0.0022611618041992188, 0.004388332366943359, 0.0065155029296875, 0.00864267349243164, 0.010769844055175781, 0.012897014617919922, 0.015024185180664062, 0.017151355743408203, 0.019278526306152344, 0.021405696868896484, 0.023532867431640625, 0.025660037994384766, 0.027787208557128906, 0.029914379119873047, 0.03204154968261719, 0.03416872024536133, 0.03629589080810547, 0.03842306137084961, 0.04055023193359375, 0.04267740249633789, 0.04480457305908203, 0.04693174362182617, 0.04905891418457031, 0.05118608474731445, 0.053313255310058594, 0.055440425872802734, 0.057567596435546875, 0.059694766998291016, 0.061821937561035156, 0.0639491081237793, 0.06607627868652344, 0.06820344924926758, 0.07033061981201172, 0.07245779037475586, 0.0745849609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 7.0, 12.0, 15.0, 11.0, 12.0, 23.0, 23.0, 18.0, 29.0, 40.0, 44.0, 51.0, 55.0, 42.0, 66.0, 57.0, 54.0, 66.0, 58.0, 54.0, 54.0, 40.0, 37.0, 26.0, 24.0, 18.0, 14.0, 17.0, 4.0, 13.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0203094482421875, -0.019755244255065918, -0.019201040267944336, -0.018646836280822754, -0.018092632293701172, -0.01753842830657959, -0.016984224319458008, -0.016430020332336426, -0.015875816345214844, -0.015321612358093262, -0.01476740837097168, -0.014213204383850098, -0.013659000396728516, -0.013104796409606934, -0.012550592422485352, -0.01199638843536377, -0.011442184448242188, -0.010887980461120605, -0.010333776473999023, -0.009779572486877441, -0.00922536849975586, -0.008671164512634277, -0.008116960525512695, -0.007562756538391113, -0.007008552551269531, -0.006454348564147949, -0.005900144577026367, -0.005345940589904785, -0.004791736602783203, -0.004237532615661621, -0.003683328628540039, -0.003129124641418457, -0.002574920654296875, -0.002020716667175293, -0.001466512680053711, -0.0009123086929321289, -0.0003581047058105469, 0.00019609928131103516, 0.0007503032684326172, 0.0013045072555541992, 0.0018587112426757812, 0.0024129152297973633, 0.0029671192169189453, 0.0035213232040405273, 0.004075527191162109, 0.004629731178283691, 0.0051839351654052734, 0.0057381391525268555, 0.0062923431396484375, 0.0068465471267700195, 0.0074007511138916016, 0.007954955101013184, 0.008509159088134766, 0.009063363075256348, 0.00961756706237793, 0.010171771049499512, 0.010725975036621094, 0.011280179023742676, 0.011834383010864258, 0.01238858699798584, 0.012942790985107422, 0.013496994972229004, 0.014051198959350586, 0.014605402946472168, 0.01515960693359375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 11.0, 9.0, 19.0, 25.0, 21.0, 46.0, 58.0, 68.0, 94.0, 104.0, 115.0, 118.0, 85.0, 65.0, 45.0, 28.0, 23.0, 11.0, 16.0, 5.0, 5.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3488291501998901, -1.305383563041687, -1.2619378566741943, -1.2184922695159912, -1.1750465631484985, -1.1316009759902954, -1.0881552696228027, -1.0447096824645996, -1.0012640953063965, -0.9578184485435486, -0.9143728017807007, -0.8709272146224976, -0.8274815082550049, -0.7840359210968018, -0.7405902743339539, -0.697144627571106, -0.6536989212036133, -0.6102532744407654, -0.5668076276779175, -0.5233620405197144, -0.47991636395454407, -0.43647071719169617, -0.39302510023117065, -0.34957945346832275, -0.30613380670547485, -0.26268815994262695, -0.21924252808094025, -0.17579689621925354, -0.13235124945640564, -0.08890560269355774, -0.04545998573303223, -0.002014338970184326, 0.041431307792663574, 0.08487694710493088, 0.12832258641719818, 0.1717682182788849, 0.2152138650417328, 0.2586595118045807, 0.3021051287651062, 0.3455507755279541, 0.388996422290802, 0.4324420690536499, 0.4758877158164978, 0.5193333625793457, 0.5627789497375488, 0.6062246561050415, 0.6496702432632446, 0.6931158900260925, 0.7365615367889404, 0.7800071835517883, 0.8234528303146362, 0.8668984174728394, 0.910344123840332, 0.9537897109985352, 0.9972353577613831, 1.040681004524231, 1.0841267108917236, 1.1275722980499268, 1.1710180044174194, 1.2144635915756226, 1.2579092979431152, 1.3013548851013184, 1.3448004722595215, 1.3882461786270142, 1.4316917657852173]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 6.0, 3.0, 9.0, 13.0, 14.0, 20.0, 10.0, 19.0, 23.0, 31.0, 24.0, 25.0, 30.0, 38.0, 38.0, 38.0, 58.0, 61.0, 49.0, 53.0, 48.0, 50.0, 41.0, 40.0, 40.0, 28.0, 31.0, 33.0, 32.0, 20.0, 14.0, 16.0, 10.0, 8.0, 4.0, 2.0, 5.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7549246549606323, -0.7283146977424622, -0.701704740524292, -0.675094723701477, -0.6484847664833069, -0.6218748092651367, -0.5952647924423218, -0.5686548352241516, -0.5420448780059814, -0.5154349207878113, -0.4888249337673187, -0.46221494674682617, -0.435604989528656, -0.40899503231048584, -0.3823850452899933, -0.35577505826950073, -0.32916510105133057, -0.3025551438331604, -0.27594515681266785, -0.2493351846933365, -0.22272521257400513, -0.19611524045467377, -0.1695052683353424, -0.14289529621601105, -0.11628532409667969, -0.08967535197734833, -0.06306537985801697, -0.03645540773868561, -0.009845435619354248, 0.016764536499977112, 0.04337450861930847, 0.06998448073863983, 0.09659439325332642, 0.12320436537265778, 0.14981433749198914, 0.1764243096113205, 0.20303428173065186, 0.22964425384998322, 0.2562542259693146, 0.28286421298980713, 0.3094741702079773, 0.33608412742614746, 0.36269411444664, 0.38930410146713257, 0.41591405868530273, 0.4425240159034729, 0.46913400292396545, 0.495743989944458, 0.5223539471626282, 0.5489639043807983, 0.5755739212036133, 0.6021838784217834, 0.6287938356399536, 0.6554037928581238, 0.682013750076294, 0.7086237668991089, 0.735233724117279, 0.7618436813354492, 0.7884536981582642, 0.8150636553764343, 0.8416736125946045, 0.8682835698127747, 0.8948935270309448, 0.9215035438537598, 0.9481135010719299]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 9.0, 5.0, 11.0, 10.0, 12.0, 30.0, 41.0, 62.0, 100.0, 221.0, 426.0, 1008.0, 3341.0, 18429.0, 329275.0, 656255.0, 32156.0, 4736.0, 1306.0, 553.0, 238.0, 128.0, 65.0, 41.0, 35.0, 15.0, 12.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01953125, -1.952484130859375, -1.88543701171875, -1.818389892578125, -1.7513427734375, -1.684295654296875, -1.61724853515625, -1.550201416015625, -1.483154296875, -1.416107177734375, -1.34906005859375, -1.282012939453125, -1.2149658203125, -1.147918701171875, -1.08087158203125, -1.013824462890625, -0.94677734375, -0.879730224609375, -0.81268310546875, -0.745635986328125, -0.6785888671875, -0.611541748046875, -0.54449462890625, -0.477447509765625, -0.410400390625, -0.343353271484375, -0.27630615234375, -0.209259033203125, -0.1422119140625, -0.075164794921875, -0.00811767578125, 0.058929443359375, 0.1259765625, 0.193023681640625, 0.26007080078125, 0.327117919921875, 0.3941650390625, 0.461212158203125, 0.52825927734375, 0.595306396484375, 0.662353515625, 0.729400634765625, 0.79644775390625, 0.863494873046875, 0.9305419921875, 0.997589111328125, 1.06463623046875, 1.131683349609375, 1.19873046875, 1.265777587890625, 1.33282470703125, 1.399871826171875, 1.4669189453125, 1.533966064453125, 1.60101318359375, 1.668060302734375, 1.735107421875, 1.802154541015625, 1.86920166015625, 1.936248779296875, 2.0032958984375, 2.070343017578125, 2.13739013671875, 2.204437255859375, 2.271484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 9.0, 14.0, 22.0, 35.0, 44.0, 50.0, 67.0, 98.0, 100.0, 116.0, 101.0, 98.0, 66.0, 60.0, 49.0, 22.0, 24.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6279296875, -1.5217437744140625, -1.415557861328125, -1.3093719482421875, -1.20318603515625, -1.0970001220703125, -0.990814208984375, -0.8846282958984375, -0.7784423828125, -0.6722564697265625, -0.566070556640625, -0.4598846435546875, -0.35369873046875, -0.2475128173828125, -0.141326904296875, -0.0351409912109375, 0.071044921875, 0.1772308349609375, 0.283416748046875, 0.3896026611328125, 0.49578857421875, 0.6019744873046875, 0.708160400390625, 0.8143463134765625, 0.9205322265625, 1.0267181396484375, 1.132904052734375, 1.2390899658203125, 1.34527587890625, 1.4514617919921875, 1.557647705078125, 1.6638336181640625, 1.77001953125, 1.8762054443359375, 1.982391357421875, 2.0885772705078125, 2.19476318359375, 2.3009490966796875, 2.407135009765625, 2.5133209228515625, 2.6195068359375, 2.7256927490234375, 2.831878662109375, 2.9380645751953125, 3.04425048828125, 3.1504364013671875, 3.256622314453125, 3.3628082275390625, 3.468994140625, 3.5751800537109375, 3.681365966796875, 3.7875518798828125, 3.89373779296875, 3.9999237060546875, 4.106109619140625, 4.2122955322265625, 4.3184814453125, 4.4246673583984375, 4.530853271484375, 4.6370391845703125, 4.74322509765625, 4.8494110107421875, 4.955596923828125, 5.0617828369140625, 5.16796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 3.0, 6.0, 4.0, 12.0, 7.0, 9.0, 18.0, 19.0, 34.0, 24.0, 62.0, 64.0, 75.0, 100.0, 173.0, 338.0, 924.0, 3654.0, 47879.0, 953721.0, 36531.0, 3147.0, 806.0, 313.0, 169.0, 117.0, 94.0, 59.0, 54.0, 31.0, 29.0, 14.0, 15.0, 10.0, 9.0, 8.0, 5.0, 7.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.37890625, -2.29229736328125, -2.2056884765625, -2.11907958984375, -2.032470703125, -1.94586181640625, -1.8592529296875, -1.77264404296875, -1.68603515625, -1.59942626953125, -1.5128173828125, -1.42620849609375, -1.339599609375, -1.25299072265625, -1.1663818359375, -1.07977294921875, -0.9931640625, -0.90655517578125, -0.8199462890625, -0.73333740234375, -0.646728515625, -0.56011962890625, -0.4735107421875, -0.38690185546875, -0.30029296875, -0.21368408203125, -0.1270751953125, -0.04046630859375, 0.046142578125, 0.13275146484375, 0.2193603515625, 0.30596923828125, 0.392578125, 0.47918701171875, 0.5657958984375, 0.65240478515625, 0.739013671875, 0.82562255859375, 0.9122314453125, 0.99884033203125, 1.08544921875, 1.17205810546875, 1.2586669921875, 1.34527587890625, 1.431884765625, 1.51849365234375, 1.6051025390625, 1.69171142578125, 1.7783203125, 1.86492919921875, 1.9515380859375, 2.03814697265625, 2.124755859375, 2.21136474609375, 2.2979736328125, 2.38458251953125, 2.47119140625, 2.55780029296875, 2.6444091796875, 2.73101806640625, 2.817626953125, 2.90423583984375, 2.9908447265625, 3.07745361328125, 3.1640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 7.0, 10.0, 11.0, 14.0, 15.0, 9.0, 15.0, 14.0, 16.0, 33.0, 25.0, 24.0, 29.0, 33.0, 41.0, 37.0, 38.0, 41.0, 46.0, 44.0, 35.0, 37.0, 40.0, 39.0, 43.0, 36.0, 31.0, 24.0, 31.0, 17.0, 26.0, 18.0, 19.0, 13.0, 19.0, 13.0, 7.0, 6.0, 5.0, 4.0, 7.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.533203125, -1.489593505859375, -1.44598388671875, -1.402374267578125, -1.3587646484375, -1.315155029296875, -1.27154541015625, -1.227935791015625, -1.184326171875, -1.140716552734375, -1.09710693359375, -1.053497314453125, -1.0098876953125, -0.966278076171875, -0.92266845703125, -0.879058837890625, -0.83544921875, -0.791839599609375, -0.74822998046875, -0.704620361328125, -0.6610107421875, -0.617401123046875, -0.57379150390625, -0.530181884765625, -0.486572265625, -0.442962646484375, -0.39935302734375, -0.355743408203125, -0.3121337890625, -0.268524169921875, -0.22491455078125, -0.181304931640625, -0.1376953125, -0.094085693359375, -0.05047607421875, -0.006866455078125, 0.0367431640625, 0.080352783203125, 0.12396240234375, 0.167572021484375, 0.211181640625, 0.254791259765625, 0.29840087890625, 0.342010498046875, 0.3856201171875, 0.429229736328125, 0.47283935546875, 0.516448974609375, 0.56005859375, 0.603668212890625, 0.64727783203125, 0.690887451171875, 0.7344970703125, 0.778106689453125, 0.82171630859375, 0.865325927734375, 0.908935546875, 0.952545166015625, 0.99615478515625, 1.039764404296875, 1.0833740234375, 1.126983642578125, 1.17059326171875, 1.214202880859375, 1.2578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 10.0, 6.0, 14.0, 20.0, 31.0, 59.0, 64.0, 137.0, 250.0, 518.0, 1064.0, 3280.0, 18147.0, 816157.0, 195840.0, 9105.0, 2143.0, 812.0, 365.0, 198.0, 112.0, 80.0, 44.0, 31.0, 19.0, 14.0, 10.0, 5.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0384368896484375, -1.003631591796875, -0.9688262939453125, -0.93402099609375, -0.8992156982421875, -0.864410400390625, -0.8296051025390625, -0.7947998046875, -0.7599945068359375, -0.725189208984375, -0.6903839111328125, -0.65557861328125, -0.6207733154296875, -0.585968017578125, -0.5511627197265625, -0.516357421875, -0.4815521240234375, -0.446746826171875, -0.4119415283203125, -0.37713623046875, -0.3423309326171875, -0.307525634765625, -0.2727203369140625, -0.2379150390625, -0.2031097412109375, -0.168304443359375, -0.1334991455078125, -0.09869384765625, -0.0638885498046875, -0.029083251953125, 0.0057220458984375, 0.04052734375, 0.0753326416015625, 0.110137939453125, 0.1449432373046875, 0.17974853515625, 0.2145538330078125, 0.249359130859375, 0.2841644287109375, 0.3189697265625, 0.3537750244140625, 0.388580322265625, 0.4233856201171875, 0.45819091796875, 0.4929962158203125, 0.527801513671875, 0.5626068115234375, 0.597412109375, 0.6322174072265625, 0.667022705078125, 0.7018280029296875, 0.73663330078125, 0.7714385986328125, 0.806243896484375, 0.8410491943359375, 0.8758544921875, 0.9106597900390625, 0.945465087890625, 0.9802703857421875, 1.01507568359375, 1.0498809814453125, 1.084686279296875, 1.1194915771484375, 1.154296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 10.0, 11.0, 21.0, 22.0, 43.0, 66.0, 119.0, 235.0, 206.0, 108.0, 58.0, 31.0, 18.0, 16.0, 13.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.296966552734375e-05, -7.933378219604492e-05, -7.56978988647461e-05, -7.206201553344727e-05, -6.842613220214844e-05, -6.479024887084961e-05, -6.115436553955078e-05, -5.751848220825195e-05, -5.3882598876953125e-05, -5.02467155456543e-05, -4.661083221435547e-05, -4.297494888305664e-05, -3.933906555175781e-05, -3.5703182220458984e-05, -3.2067298889160156e-05, -2.8431415557861328e-05, -2.47955322265625e-05, -2.1159648895263672e-05, -1.7523765563964844e-05, -1.3887882232666016e-05, -1.0251998901367188e-05, -6.616115570068359e-06, -2.9802322387695312e-06, 6.556510925292969e-07, 4.291534423828125e-06, 7.927417755126953e-06, 1.1563301086425781e-05, 1.519918441772461e-05, 1.8835067749023438e-05, 2.2470951080322266e-05, 2.6106834411621094e-05, 2.9742717742919922e-05, 3.337860107421875e-05, 3.701448440551758e-05, 4.0650367736816406e-05, 4.4286251068115234e-05, 4.792213439941406e-05, 5.155801773071289e-05, 5.519390106201172e-05, 5.882978439331055e-05, 6.246566772460938e-05, 6.61015510559082e-05, 6.973743438720703e-05, 7.337331771850586e-05, 7.700920104980469e-05, 8.064508438110352e-05, 8.428096771240234e-05, 8.791685104370117e-05, 9.1552734375e-05, 9.518861770629883e-05, 9.882450103759766e-05, 0.00010246038436889648, 0.00010609626770019531, 0.00010973215103149414, 0.00011336803436279297, 0.0001170039176940918, 0.00012063980102539062, 0.00012427568435668945, 0.00012791156768798828, 0.0001315474510192871, 0.00013518333435058594, 0.00013881921768188477, 0.0001424551010131836, 0.00014609098434448242, 0.00014972686767578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 4.0, 5.0, 14.0, 16.0, 30.0, 43.0, 73.0, 87.0, 160.0, 314.0, 556.0, 1075.0, 2239.0, 5790.0, 35311.0, 910913.0, 78781.0, 7666.0, 2708.0, 1298.0, 652.0, 345.0, 209.0, 89.0, 71.0, 33.0, 21.0, 15.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1728515625, -1.13897705078125, -1.1051025390625, -1.07122802734375, -1.037353515625, -1.00347900390625, -0.9696044921875, -0.93572998046875, -0.90185546875, -0.86798095703125, -0.8341064453125, -0.80023193359375, -0.766357421875, -0.73248291015625, -0.6986083984375, -0.66473388671875, -0.630859375, -0.59698486328125, -0.5631103515625, -0.52923583984375, -0.495361328125, -0.46148681640625, -0.4276123046875, -0.39373779296875, -0.35986328125, -0.32598876953125, -0.2921142578125, -0.25823974609375, -0.224365234375, -0.19049072265625, -0.1566162109375, -0.12274169921875, -0.0888671875, -0.05499267578125, -0.0211181640625, 0.01275634765625, 0.046630859375, 0.08050537109375, 0.1143798828125, 0.14825439453125, 0.18212890625, 0.21600341796875, 0.2498779296875, 0.28375244140625, 0.317626953125, 0.35150146484375, 0.3853759765625, 0.41925048828125, 0.453125, 0.48699951171875, 0.5208740234375, 0.55474853515625, 0.588623046875, 0.62249755859375, 0.6563720703125, 0.69024658203125, 0.72412109375, 0.75799560546875, 0.7918701171875, 0.82574462890625, 0.859619140625, 0.89349365234375, 0.9273681640625, 0.96124267578125, 0.9951171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 7.0, 3.0, 16.0, 18.0, 37.0, 51.0, 111.0, 186.0, 261.0, 123.0, 85.0, 32.0, 22.0, 13.0, 11.0, 3.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35400390625, -0.3423042297363281, -0.33060455322265625, -0.3189048767089844, -0.3072052001953125, -0.2955055236816406, -0.28380584716796875, -0.2721061706542969, -0.260406494140625, -0.24870681762695312, -0.23700714111328125, -0.22530746459960938, -0.2136077880859375, -0.20190811157226562, -0.19020843505859375, -0.17850875854492188, -0.16680908203125, -0.15510940551757812, -0.14340972900390625, -0.13171005249023438, -0.1200103759765625, -0.10831069946289062, -0.09661102294921875, -0.08491134643554688, -0.073211669921875, -0.061511993408203125, -0.04981231689453125, -0.038112640380859375, -0.0264129638671875, -0.014713287353515625, -0.00301361083984375, 0.008686065673828125, 0.0203857421875, 0.032085418701171875, 0.04378509521484375, 0.055484771728515625, 0.0671844482421875, 0.07888412475585938, 0.09058380126953125, 0.10228347778320312, 0.113983154296875, 0.12568283081054688, 0.13738250732421875, 0.14908218383789062, 0.1607818603515625, 0.17248153686523438, 0.18418121337890625, 0.19588088989257812, 0.20758056640625, 0.21928024291992188, 0.23097991943359375, 0.24267959594726562, 0.2543792724609375, 0.2660789489746094, 0.27777862548828125, 0.2894783020019531, 0.301177978515625, 0.3128776550292969, 0.32457733154296875, 0.3362770080566406, 0.3479766845703125, 0.3596763610839844, 0.37137603759765625, 0.3830757141113281, 0.394775390625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 0.0, 6.0, 7.0, 19.0, 28.0, 42.0, 91.0, 149.0, 220.0, 166.0, 131.0, 66.0, 33.0, 23.0, 15.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.153860569000244, -1.9843436479568481, -1.8148267269134521, -1.6453098058700562, -1.4757928848266602, -1.3062759637832642, -1.1367590427398682, -0.9672421216964722, -0.7977252006530762, -0.6282082796096802, -0.4586913585662842, -0.2891744375228882, -0.11965751647949219, 0.04985940456390381, 0.2193763256072998, 0.3888932466506958, 0.5584101676940918, 0.7279270887374878, 0.8974440097808838, 1.0669609308242798, 1.2364778518676758, 1.4059947729110718, 1.5755116939544678, 1.7450286149978638, 1.9145455360412598, 2.0840625762939453, 2.2535793781280518, 2.423096179962158, 2.5926132202148438, 2.7621302604675293, 2.9316470623016357, 3.101163864135742, 3.2706804275512695, 3.440197467803955, 3.6097142696380615, 3.779231071472168, 3.9487481117248535, 4.118265151977539, 4.287781715393066, 4.457298755645752, 4.6268157958984375, 4.796332836151123, 4.965849876403809, 5.135366439819336, 5.3048834800720215, 5.474400520324707, 5.643917083740234, 5.81343412399292, 5.9829511642456055, 6.152468204498291, 6.321985244750977, 6.491501808166504, 6.6610188484191895, 6.830535888671875, 7.000052452087402, 7.169569492340088, 7.339086532592773, 7.508603572845459, 7.6781206130981445, 7.847637176513672, 8.017154693603516, 8.186671257019043, 8.35618782043457, 8.525705337524414, 8.695221900939941]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 9.0, 13.0, 12.0, 10.0, 16.0, 19.0, 26.0, 19.0, 33.0, 45.0, 52.0, 66.0, 52.0, 74.0, 53.0, 58.0, 56.0, 61.0, 53.0, 52.0, 40.0, 40.0, 30.0, 26.0, 24.0, 22.0, 18.0, 8.0, 3.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6188249588012695, -2.5003929138183594, -2.3819611072540283, -2.263529062271118, -2.145097017288208, -2.026665210723877, -1.9082331657409668, -1.7898011207580566, -1.6713690757751465, -1.5529371500015259, -1.4345051050186157, -1.3160731792449951, -1.197641134262085, -1.0792092084884644, -0.960777223110199, -0.8423452377319336, -0.723913311958313, -0.6054813265800476, -0.4870493412017822, -0.36861738562583923, -0.25018540024757385, -0.13175344467163086, -0.013321459293365479, 0.1051105260848999, 0.22354251146316528, 0.34197449684143066, 0.46040648221969604, 0.5788384675979614, 0.697270393371582, 0.8157023787498474, 0.9341343641281128, 1.0525662899017334, 1.1709983348846436, 1.2894302606582642, 1.4078623056411743, 1.526294231414795, 1.644726276397705, 1.7631582021713257, 1.8815901279449463, 2.0000221729278564, 2.1184542179107666, 2.2368862628936768, 2.355318069458008, 2.473750114440918, 2.592182159423828, 2.7106142044067383, 2.8290460109710693, 2.9474780559539795, 3.0659098625183105, 3.1843419075012207, 3.3027737140655518, 3.421205759048462, 3.539637804031372, 3.658069610595703, 3.7765016555786133, 3.8949337005615234, 4.013365745544434, 4.131797790527344, 4.250229835510254, 4.368661880493164, 4.487093448638916, 4.605525493621826, 4.723957538604736, 4.8423895835876465, 4.960821628570557]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 2.0, 9.0, 9.0, 21.0, 31.0, 49.0, 75.0, 118.0, 302.0, 764.0, 3711.0, 294453.0, 3875978.0, 16500.0, 1461.0, 427.0, 149.0, 100.0, 41.0, 31.0, 17.0, 12.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.86492919921875, -4.6556396484375, -4.44635009765625, -4.237060546875, -4.02777099609375, -3.8184814453125, -3.60919189453125, -3.39990234375, -3.19061279296875, -2.9813232421875, -2.77203369140625, -2.562744140625, -2.35345458984375, -2.1441650390625, -1.93487548828125, -1.7255859375, -1.51629638671875, -1.3070068359375, -1.09771728515625, -0.888427734375, -0.67913818359375, -0.4698486328125, -0.26055908203125, -0.05126953125, 0.15802001953125, 0.3673095703125, 0.57659912109375, 0.785888671875, 0.99517822265625, 1.2044677734375, 1.41375732421875, 1.623046875, 1.83233642578125, 2.0416259765625, 2.25091552734375, 2.460205078125, 2.66949462890625, 2.8787841796875, 3.08807373046875, 3.29736328125, 3.50665283203125, 3.7159423828125, 3.92523193359375, 4.134521484375, 4.34381103515625, 4.5531005859375, 4.76239013671875, 4.9716796875, 5.18096923828125, 5.3902587890625, 5.59954833984375, 5.808837890625, 6.01812744140625, 6.2274169921875, 6.43670654296875, 6.64599609375, 6.85528564453125, 7.0645751953125, 7.27386474609375, 7.483154296875, 7.69244384765625, 7.9017333984375, 8.11102294921875, 8.3203125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 11.0, 7.0, 5.0, 9.0, 12.0, 19.0, 21.0, 22.0, 28.0, 22.0, 38.0, 48.0, 44.0, 37.0, 48.0, 46.0, 54.0, 55.0, 54.0, 64.0, 39.0, 47.0, 44.0, 32.0, 35.0, 29.0, 18.0, 24.0, 21.0, 11.0, 14.0, 6.0, 11.0, 3.0, 7.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.365234375, -1.3252105712890625, -1.285186767578125, -1.2451629638671875, -1.20513916015625, -1.1651153564453125, -1.125091552734375, -1.0850677490234375, -1.0450439453125, -1.0050201416015625, -0.964996337890625, -0.9249725341796875, -0.88494873046875, -0.8449249267578125, -0.804901123046875, -0.7648773193359375, -0.724853515625, -0.6848297119140625, -0.644805908203125, -0.6047821044921875, -0.56475830078125, -0.5247344970703125, -0.484710693359375, -0.4446868896484375, -0.4046630859375, -0.3646392822265625, -0.324615478515625, -0.2845916748046875, -0.24456787109375, -0.2045440673828125, -0.164520263671875, -0.1244964599609375, -0.08447265625, -0.0444488525390625, -0.004425048828125, 0.0355987548828125, 0.07562255859375, 0.1156463623046875, 0.155670166015625, 0.1956939697265625, 0.2357177734375, 0.2757415771484375, 0.315765380859375, 0.3557891845703125, 0.39581298828125, 0.4358367919921875, 0.475860595703125, 0.5158843994140625, 0.555908203125, 0.5959320068359375, 0.635955810546875, 0.6759796142578125, 0.71600341796875, 0.7560272216796875, 0.796051025390625, 0.8360748291015625, 0.8760986328125, 0.9161224365234375, 0.956146240234375, 0.9961700439453125, 1.03619384765625, 1.0762176513671875, 1.116241455078125, 1.1562652587890625, 1.1962890625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 7.0, 12.0, 31.0, 75.0, 151.0, 337.0, 1037.0, 3354.0, 24171.0, 3665836.0, 485726.0, 10296.0, 2104.0, 662.0, 268.0, 95.0, 57.0, 30.0, 15.0, 9.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -2.99163818359375, -2.8660888671875, -2.74053955078125, -2.614990234375, -2.48944091796875, -2.3638916015625, -2.23834228515625, -2.11279296875, -1.98724365234375, -1.8616943359375, -1.73614501953125, -1.610595703125, -1.48504638671875, -1.3594970703125, -1.23394775390625, -1.1083984375, -0.98284912109375, -0.8572998046875, -0.73175048828125, -0.606201171875, -0.48065185546875, -0.3551025390625, -0.22955322265625, -0.10400390625, 0.02154541015625, 0.1470947265625, 0.27264404296875, 0.398193359375, 0.52374267578125, 0.6492919921875, 0.77484130859375, 0.900390625, 1.02593994140625, 1.1514892578125, 1.27703857421875, 1.402587890625, 1.52813720703125, 1.6536865234375, 1.77923583984375, 1.90478515625, 2.03033447265625, 2.1558837890625, 2.28143310546875, 2.406982421875, 2.53253173828125, 2.6580810546875, 2.78363037109375, 2.9091796875, 3.03472900390625, 3.1602783203125, 3.28582763671875, 3.411376953125, 3.53692626953125, 3.6624755859375, 3.78802490234375, 3.91357421875, 4.03912353515625, 4.1646728515625, 4.29022216796875, 4.415771484375, 4.54132080078125, 4.6668701171875, 4.79241943359375, 4.91796875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 6.0, 13.0, 29.0, 43.0, 75.0, 140.0, 264.0, 516.0, 1021.0, 938.0, 497.0, 232.0, 121.0, 69.0, 38.0, 16.0, 10.0, 15.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84228515625, -0.8188247680664062, -0.7953643798828125, -0.7719039916992188, -0.748443603515625, -0.7249832153320312, -0.7015228271484375, -0.6780624389648438, -0.65460205078125, -0.6311416625976562, -0.6076812744140625, -0.5842208862304688, -0.560760498046875, -0.5373001098632812, -0.5138397216796875, -0.49037933349609375, -0.4669189453125, -0.44345855712890625, -0.4199981689453125, -0.39653778076171875, -0.373077392578125, -0.34961700439453125, -0.3261566162109375, -0.30269622802734375, -0.27923583984375, -0.25577545166015625, -0.2323150634765625, -0.20885467529296875, -0.185394287109375, -0.16193389892578125, -0.1384735107421875, -0.11501312255859375, -0.091552734375, -0.06809234619140625, -0.0446319580078125, -0.02117156982421875, 0.002288818359375, 0.02574920654296875, 0.0492095947265625, 0.07266998291015625, 0.09613037109375, 0.11959075927734375, 0.1430511474609375, 0.16651153564453125, 0.189971923828125, 0.21343231201171875, 0.2368927001953125, 0.26035308837890625, 0.2838134765625, 0.30727386474609375, 0.3307342529296875, 0.35419464111328125, 0.377655029296875, 0.40111541748046875, 0.4245758056640625, 0.44803619384765625, 0.47149658203125, 0.49495697021484375, 0.5184173583984375, 0.5418777465820312, 0.565338134765625, 0.5887985229492188, 0.6122589111328125, 0.6357192993164062, 0.6591796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 7.0, 11.0, 4.0, 9.0, 7.0, 20.0, 22.0, 38.0, 20.0, 53.0, 59.0, 84.0, 85.0, 110.0, 95.0, 80.0, 73.0, 61.0, 38.0, 36.0, 17.0, 17.0, 15.0, 7.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8231909275054932, -1.763755202293396, -1.7043195962905884, -1.6448838710784912, -1.5854482650756836, -1.5260125398635864, -1.4665768146514893, -1.4071412086486816, -1.347705602645874, -1.2882698774337769, -1.2288342714309692, -1.169398546218872, -1.1099629402160645, -1.0505272150039673, -0.9910915493965149, -0.9316558837890625, -0.8722201585769653, -0.8127844929695129, -0.7533488273620605, -0.6939131021499634, -0.6344774961471558, -0.5750417709350586, -0.5156061053276062, -0.4561704397201538, -0.3967347741127014, -0.337299108505249, -0.27786344289779663, -0.21842774748802185, -0.15899208188056946, -0.09955641627311707, -0.040120720863342285, 0.019314944744110107, 0.0787506103515625, 0.1381862759590149, 0.19762195646762848, 0.25705763697624207, 0.31649330258369446, 0.37592896819114685, 0.43536466360092163, 0.494800329208374, 0.5542359948158264, 0.6136716604232788, 0.6731073260307312, 0.7325429916381836, 0.7919787168502808, 0.8514143228530884, 0.9108500480651855, 0.9702857136726379, 1.0297213792800903, 1.0891571044921875, 1.1485927104949951, 1.2080284357070923, 1.2674640417099, 1.326899766921997, 1.3863353729248047, 1.4457710981369019, 1.505206823348999, 1.5646425485610962, 1.6240781545639038, 1.683513879776001, 1.7429494857788086, 1.8023852109909058, 1.861820936203003, 1.9212565422058105, 1.9806921482086182]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 10.0, 4.0, 9.0, 17.0, 19.0, 13.0, 13.0, 24.0, 16.0, 23.0, 32.0, 28.0, 34.0, 34.0, 49.0, 50.0, 40.0, 47.0, 44.0, 48.0, 35.0, 52.0, 38.0, 26.0, 45.0, 29.0, 28.0, 26.0, 27.0, 24.0, 18.0, 17.0, 12.0, 10.0, 9.0, 6.0, 9.0, 4.0, 7.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.2771055698394775, -1.2403209209442139, -1.2035361528396606, -1.166751503944397, -1.1299667358398438, -1.09318208694458, -1.0563974380493164, -1.0196127891540527, -0.9828280210494995, -0.9460433125495911, -0.9092586040496826, -0.872473955154419, -0.8356892466545105, -0.798904538154602, -0.7621198892593384, -0.7253351807594299, -0.6885504722595215, -0.651765763759613, -0.6149810552597046, -0.5781964063644409, -0.5414116978645325, -0.504626989364624, -0.46784231066703796, -0.4310576319694519, -0.39427292346954346, -0.357488214969635, -0.32070353627204895, -0.2839188575744629, -0.24713414907455444, -0.2103494554758072, -0.17356476187705994, -0.13678008317947388, -0.09999525547027588, -0.06321056187152863, -0.026425868272781372, 0.010358825325965881, 0.047143518924713135, 0.08392821252346039, 0.12071290612220764, 0.1574975848197937, 0.19428229331970215, 0.2310669869184494, 0.26785168051719666, 0.3046363592147827, 0.34142106771469116, 0.3782057762145996, 0.41499045491218567, 0.45177513360977173, 0.4885598421096802, 0.5253445506095886, 0.5621292591094971, 0.5989139080047607, 0.6356986165046692, 0.6724833250045776, 0.7092679738998413, 0.7460526823997498, 0.7828373908996582, 0.8196220993995667, 0.8564068078994751, 0.8931914567947388, 0.9299761652946472, 0.9667608737945557, 1.0035455226898193, 1.040330171585083, 1.0771149396896362]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 10.0, 7.0, 16.0, 52.0, 123.0, 344.0, 1461.0, 10214.0, 154159.0, 833900.0, 42747.0, 4411.0, 740.0, 207.0, 81.0, 29.0, 16.0, 3.0, 12.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6162109375, -0.590850830078125, -0.56549072265625, -0.540130615234375, -0.5147705078125, -0.489410400390625, -0.46405029296875, -0.438690185546875, -0.413330078125, -0.387969970703125, -0.36260986328125, -0.337249755859375, -0.3118896484375, -0.286529541015625, -0.26116943359375, -0.235809326171875, -0.21044921875, -0.185089111328125, -0.15972900390625, -0.134368896484375, -0.1090087890625, -0.083648681640625, -0.05828857421875, -0.032928466796875, -0.007568359375, 0.017791748046875, 0.04315185546875, 0.068511962890625, 0.0938720703125, 0.119232177734375, 0.14459228515625, 0.169952392578125, 0.1953125, 0.220672607421875, 0.24603271484375, 0.271392822265625, 0.2967529296875, 0.322113037109375, 0.34747314453125, 0.372833251953125, 0.398193359375, 0.423553466796875, 0.44891357421875, 0.474273681640625, 0.4996337890625, 0.524993896484375, 0.55035400390625, 0.575714111328125, 0.60107421875, 0.626434326171875, 0.65179443359375, 0.677154541015625, 0.7025146484375, 0.727874755859375, 0.75323486328125, 0.778594970703125, 0.803955078125, 0.829315185546875, 0.85467529296875, 0.880035400390625, 0.9053955078125, 0.930755615234375, 0.95611572265625, 0.981475830078125, 1.0068359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 8.0, 12.0, 15.0, 13.0, 16.0, 19.0, 29.0, 29.0, 36.0, 44.0, 60.0, 59.0, 58.0, 67.0, 74.0, 69.0, 71.0, 44.0, 60.0, 43.0, 34.0, 37.0, 17.0, 22.0, 9.0, 9.0, 11.0, 8.0, 2.0, 5.0, 5.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.919921875, -0.8831634521484375, -0.846405029296875, -0.8096466064453125, -0.77288818359375, -0.7361297607421875, -0.699371337890625, -0.6626129150390625, -0.6258544921875, -0.5890960693359375, -0.552337646484375, -0.5155792236328125, -0.47882080078125, -0.4420623779296875, -0.405303955078125, -0.3685455322265625, -0.331787109375, -0.2950286865234375, -0.258270263671875, -0.2215118408203125, -0.18475341796875, -0.1479949951171875, -0.111236572265625, -0.0744781494140625, -0.0377197265625, -0.0009613037109375, 0.035797119140625, 0.0725555419921875, 0.10931396484375, 0.1460723876953125, 0.182830810546875, 0.2195892333984375, 0.25634765625, 0.2931060791015625, 0.329864501953125, 0.3666229248046875, 0.40338134765625, 0.4401397705078125, 0.476898193359375, 0.5136566162109375, 0.5504150390625, 0.5871734619140625, 0.623931884765625, 0.6606903076171875, 0.69744873046875, 0.7342071533203125, 0.770965576171875, 0.8077239990234375, 0.844482421875, 0.8812408447265625, 0.917999267578125, 0.9547576904296875, 0.99151611328125, 1.0282745361328125, 1.065032958984375, 1.1017913818359375, 1.1385498046875, 1.1753082275390625, 1.212066650390625, 1.2488250732421875, 1.28558349609375, 1.3223419189453125, 1.359100341796875, 1.3958587646484375, 1.4326171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 10.0, 13.0, 16.0, 19.0, 35.0, 61.0, 105.0, 154.0, 261.0, 488.0, 882.0, 1728.0, 3423.0, 7999.0, 19785.0, 57524.0, 208773.0, 462509.0, 195696.0, 55228.0, 19196.0, 7630.0, 3332.0, 1646.0, 853.0, 470.0, 266.0, 150.0, 114.0, 65.0, 46.0, 19.0, 19.0, 16.0, 9.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.213623046875, -0.20611953735351562, -0.19861602783203125, -0.19111251831054688, -0.1836090087890625, -0.17610549926757812, -0.16860198974609375, -0.16109848022460938, -0.153594970703125, -0.14609146118164062, -0.13858795166015625, -0.13108444213867188, -0.1235809326171875, -0.11607742309570312, -0.10857391357421875, -0.10107040405273438, -0.09356689453125, -0.08606338500976562, -0.07855987548828125, -0.07105636596679688, -0.0635528564453125, -0.056049346923828125, -0.04854583740234375, -0.041042327880859375, -0.033538818359375, -0.026035308837890625, -0.01853179931640625, -0.011028289794921875, -0.0035247802734375, 0.003978729248046875, 0.01148223876953125, 0.018985748291015625, 0.0264892578125, 0.033992767333984375, 0.04149627685546875, 0.048999786376953125, 0.0565032958984375, 0.06400680541992188, 0.07151031494140625, 0.07901382446289062, 0.086517333984375, 0.09402084350585938, 0.10152435302734375, 0.10902786254882812, 0.1165313720703125, 0.12403488159179688, 0.13153839111328125, 0.13904190063476562, 0.14654541015625, 0.15404891967773438, 0.16155242919921875, 0.16905593872070312, 0.1765594482421875, 0.18406295776367188, 0.19156646728515625, 0.19906997680664062, 0.206573486328125, 0.21407699584960938, 0.22158050537109375, 0.22908401489257812, 0.2365875244140625, 0.24409103393554688, 0.25159454345703125, 0.2590980529785156, 0.2666015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 3.0, 9.0, 9.0, 10.0, 10.0, 14.0, 15.0, 14.0, 20.0, 22.0, 30.0, 20.0, 41.0, 35.0, 45.0, 32.0, 55.0, 53.0, 45.0, 45.0, 43.0, 41.0, 41.0, 45.0, 37.0, 44.0, 38.0, 34.0, 27.0, 16.0, 17.0, 11.0, 14.0, 9.0, 3.0, 7.0, 10.0, 5.0, 11.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7841796875, -1.7292938232421875, -1.674407958984375, -1.6195220947265625, -1.56463623046875, -1.5097503662109375, -1.454864501953125, -1.3999786376953125, -1.3450927734375, -1.2902069091796875, -1.235321044921875, -1.1804351806640625, -1.12554931640625, -1.0706634521484375, -1.015777587890625, -0.9608917236328125, -0.906005859375, -0.8511199951171875, -0.796234130859375, -0.7413482666015625, -0.68646240234375, -0.6315765380859375, -0.576690673828125, -0.5218048095703125, -0.4669189453125, -0.4120330810546875, -0.357147216796875, -0.3022613525390625, -0.24737548828125, -0.1924896240234375, -0.137603759765625, -0.0827178955078125, -0.02783203125, 0.0270538330078125, 0.081939697265625, 0.1368255615234375, 0.19171142578125, 0.2465972900390625, 0.301483154296875, 0.3563690185546875, 0.4112548828125, 0.4661407470703125, 0.521026611328125, 0.5759124755859375, 0.63079833984375, 0.6856842041015625, 0.740570068359375, 0.7954559326171875, 0.850341796875, 0.9052276611328125, 0.960113525390625, 1.0149993896484375, 1.06988525390625, 1.1247711181640625, 1.179656982421875, 1.2345428466796875, 1.2894287109375, 1.3443145751953125, 1.399200439453125, 1.4540863037109375, 1.50897216796875, 1.5638580322265625, 1.618743896484375, 1.6736297607421875, 1.728515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 7.0, 11.0, 12.0, 20.0, 21.0, 26.0, 42.0, 52.0, 84.0, 114.0, 181.0, 265.0, 438.0, 730.0, 1195.0, 2106.0, 3950.0, 7817.0, 17386.0, 45553.0, 141797.0, 386624.0, 290643.0, 91811.0, 31343.0, 12809.0, 5993.0, 3160.0, 1720.0, 922.0, 623.0, 387.0, 228.0, 155.0, 95.0, 66.0, 50.0, 35.0, 23.0, 19.0, 15.0, 11.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06341552734375, -0.06135749816894531, -0.059299468994140625, -0.05724143981933594, -0.05518341064453125, -0.05312538146972656, -0.051067352294921875, -0.04900932312011719, -0.0469512939453125, -0.04489326477050781, -0.042835235595703125, -0.04077720642089844, -0.03871917724609375, -0.03666114807128906, -0.034603118896484375, -0.03254508972167969, -0.030487060546875, -0.028429031372070312, -0.026371002197265625, -0.024312973022460938, -0.02225494384765625, -0.020196914672851562, -0.018138885498046875, -0.016080856323242188, -0.0140228271484375, -0.011964797973632812, -0.009906768798828125, -0.007848739624023438, -0.00579071044921875, -0.0037326812744140625, -0.001674652099609375, 0.0003833770751953125, 0.00244140625, 0.0044994354248046875, 0.006557464599609375, 0.008615493774414062, 0.01067352294921875, 0.012731552124023438, 0.014789581298828125, 0.016847610473632812, 0.0189056396484375, 0.020963668823242188, 0.023021697998046875, 0.025079727172851562, 0.02713775634765625, 0.029195785522460938, 0.031253814697265625, 0.03331184387207031, 0.035369873046875, 0.03742790222167969, 0.039485931396484375, 0.04154396057128906, 0.04360198974609375, 0.04566001892089844, 0.047718048095703125, 0.04977607727050781, 0.0518341064453125, 0.05389213562011719, 0.055950164794921875, 0.05800819396972656, 0.06006622314453125, 0.06212425231933594, 0.06418228149414062, 0.06624031066894531, 0.06829833984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 7.0, 10.0, 17.0, 30.0, 25.0, 33.0, 57.0, 73.0, 81.0, 104.0, 94.0, 108.0, 90.0, 78.0, 53.0, 31.0, 24.0, 19.0, 9.0, 12.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.882978439331055e-05, -5.7256780564785004e-05, -5.568377673625946e-05, -5.411077290773392e-05, -5.2537769079208374e-05, -5.096476525068283e-05, -4.939176142215729e-05, -4.7818757593631744e-05, -4.62457537651062e-05, -4.467274993658066e-05, -4.3099746108055115e-05, -4.152674227952957e-05, -3.995373845100403e-05, -3.8380734622478485e-05, -3.680773079395294e-05, -3.52347269654274e-05, -3.3661723136901855e-05, -3.208871930837631e-05, -3.051571547985077e-05, -2.8942711651325226e-05, -2.7369707822799683e-05, -2.579670399427414e-05, -2.4223700165748596e-05, -2.2650696337223053e-05, -2.107769250869751e-05, -1.9504688680171967e-05, -1.7931684851646423e-05, -1.635868102312088e-05, -1.4785677194595337e-05, -1.3212673366069794e-05, -1.163966953754425e-05, -1.0066665709018707e-05, -8.493661880493164e-06, -6.920658051967621e-06, -5.347654223442078e-06, -3.7746503949165344e-06, -2.201646566390991e-06, -6.28642737865448e-07, 9.443610906600952e-07, 2.5173649191856384e-06, 4.090368747711182e-06, 5.663372576236725e-06, 7.236376404762268e-06, 8.809380233287811e-06, 1.0382384061813354e-05, 1.1955387890338898e-05, 1.3528391718864441e-05, 1.5101395547389984e-05, 1.6674399375915527e-05, 1.824740320444107e-05, 1.9820407032966614e-05, 2.1393410861492157e-05, 2.29664146900177e-05, 2.4539418518543243e-05, 2.6112422347068787e-05, 2.768542617559433e-05, 2.9258430004119873e-05, 3.0831433832645416e-05, 3.240443766117096e-05, 3.39774414896965e-05, 3.5550445318222046e-05, 3.712344914674759e-05, 3.869645297527313e-05, 4.0269456803798676e-05, 4.184246063232422e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 14.0, 17.0, 23.0, 40.0, 39.0, 92.0, 147.0, 211.0, 363.0, 634.0, 1285.0, 2530.0, 5310.0, 12624.0, 34264.0, 115310.0, 353939.0, 350609.0, 113800.0, 34078.0, 12510.0, 5406.0, 2471.0, 1221.0, 715.0, 335.0, 185.0, 122.0, 83.0, 44.0, 34.0, 22.0, 13.0, 16.0, 12.0, 6.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.08294677734375, -0.0807638168334961, -0.07858085632324219, -0.07639789581298828, -0.07421493530273438, -0.07203197479248047, -0.06984901428222656, -0.06766605377197266, -0.06548309326171875, -0.06330013275146484, -0.06111717224121094, -0.05893421173095703, -0.056751251220703125, -0.05456829071044922, -0.05238533020019531, -0.050202369689941406, -0.0480194091796875, -0.045836448669433594, -0.04365348815917969, -0.04147052764892578, -0.039287567138671875, -0.03710460662841797, -0.03492164611816406, -0.032738685607910156, -0.03055572509765625, -0.028372764587402344, -0.026189804077148438, -0.02400684356689453, -0.021823883056640625, -0.01964092254638672, -0.017457962036132812, -0.015275001525878906, -0.013092041015625, -0.010909080505371094, -0.008726119995117188, -0.006543159484863281, -0.004360198974609375, -0.0021772384643554688, 5.7220458984375e-06, 0.0021886825561523438, 0.00437164306640625, 0.006554603576660156, 0.008737564086914062, 0.010920524597167969, 0.013103485107421875, 0.015286445617675781, 0.017469406127929688, 0.019652366638183594, 0.0218353271484375, 0.024018287658691406, 0.026201248168945312, 0.02838420867919922, 0.030567169189453125, 0.03275012969970703, 0.03493309020996094, 0.037116050720214844, 0.03929901123046875, 0.041481971740722656, 0.04366493225097656, 0.04584789276123047, 0.048030853271484375, 0.05021381378173828, 0.05239677429199219, 0.054579734802246094, 0.0567626953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 6.0, 8.0, 11.0, 10.0, 10.0, 20.0, 21.0, 26.0, 30.0, 43.0, 35.0, 62.0, 53.0, 75.0, 56.0, 58.0, 63.0, 49.0, 58.0, 50.0, 48.0, 31.0, 32.0, 21.0, 25.0, 21.0, 9.0, 14.0, 7.0, 5.0, 6.0, 7.0, 5.0, 1.0, 3.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0168914794921875, -0.016341686248779297, -0.015791893005371094, -0.01524209976196289, -0.014692306518554688, -0.014142513275146484, -0.013592720031738281, -0.013042926788330078, -0.012493133544921875, -0.011943340301513672, -0.011393547058105469, -0.010843753814697266, -0.010293960571289062, -0.00974416732788086, -0.009194374084472656, -0.008644580841064453, -0.00809478759765625, -0.007544994354248047, -0.006995201110839844, -0.006445407867431641, -0.0058956146240234375, -0.005345821380615234, -0.004796028137207031, -0.004246234893798828, -0.003696441650390625, -0.003146648406982422, -0.0025968551635742188, -0.0020470619201660156, -0.0014972686767578125, -0.0009474754333496094, -0.00039768218994140625, 0.00015211105346679688, 0.000701904296875, 0.0012516975402832031, 0.0018014907836914062, 0.0023512840270996094, 0.0029010772705078125, 0.0034508705139160156, 0.004000663757324219, 0.004550457000732422, 0.005100250244140625, 0.005650043487548828, 0.006199836730957031, 0.006749629974365234, 0.0072994232177734375, 0.00784921646118164, 0.008399009704589844, 0.008948802947998047, 0.00949859619140625, 0.010048389434814453, 0.010598182678222656, 0.01114797592163086, 0.011697769165039062, 0.012247562408447266, 0.012797355651855469, 0.013347148895263672, 0.013896942138671875, 0.014446735382080078, 0.014996528625488281, 0.015546321868896484, 0.016096115112304688, 0.01664590835571289, 0.017195701599121094, 0.017745494842529297, 0.0182952880859375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 16.0, 21.0, 33.0, 78.0, 162.0, 287.0, 222.0, 107.0, 45.0, 24.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4738221168518066, -1.3661812543869019, -1.258540391921997, -1.1508996486663818, -1.043258786201477, -0.9356179237365723, -0.8279771208763123, -0.7203363180160522, -0.6126954555511475, -0.5050545930862427, -0.39741379022598267, -0.28977295756340027, -0.18213212490081787, -0.07449126243591309, 0.033149540424346924, 0.14079034328460693, 0.24843120574951172, 0.3560720384120941, 0.4637128710746765, 0.5713536739349365, 0.6789945363998413, 0.7866353988647461, 0.8942762017250061, 1.0019170045852661, 1.109557867050171, 1.2171987295150757, 1.3248395919799805, 1.4324803352355957, 1.5401211977005005, 1.6477620601654053, 1.7554028034210205, 1.8630436658859253, 1.97068452835083, 2.0783252716064453, 2.1859662532806396, 2.293606996536255, 2.401247978210449, 2.5088887214660645, 2.6165294647216797, 2.724170207977295, 2.8318111896514893, 2.9394519329071045, 3.047092914581299, 3.154733657836914, 3.2623744010925293, 3.3700153827667236, 3.477656126022339, 3.585297107696533, 3.6929378509521484, 3.8005785942077637, 3.908219575881958, 4.015860557556152, 4.123501300811768, 4.231142044067383, 4.338782787322998, 4.446423530578613, 4.554064750671387, 4.661705493927002, 4.769346237182617, 4.876987457275391, 4.984628200531006, 5.092268943786621, 5.199909687042236, 5.307550430297852, 5.415191173553467]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 7.0, 3.0, 11.0, 13.0, 10.0, 25.0, 17.0, 26.0, 18.0, 39.0, 37.0, 42.0, 66.0, 63.0, 58.0, 67.0, 69.0, 59.0, 62.0, 47.0, 45.0, 43.0, 38.0, 35.0, 21.0, 21.0, 16.0, 9.0, 8.0, 9.0, 5.0, 2.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8897004723548889, -0.8552725315093994, -0.8208446502685547, -0.7864167094230652, -0.7519888281822205, -0.717560887336731, -0.6831330060958862, -0.6487050652503967, -0.6142771244049072, -0.5798491835594177, -0.545421302318573, -0.5109933614730835, -0.47656548023223877, -0.44213753938674927, -0.40770962834358215, -0.37328171730041504, -0.3388538360595703, -0.3044259250164032, -0.2699980139732361, -0.23557008802890778, -0.20114217698574066, -0.16671426594257355, -0.13228633999824524, -0.09785842895507812, -0.06343051791191101, -0.029002603143453598, 0.005425311625003815, 0.039853230118751526, 0.07428114116191864, 0.10870905220508575, 0.14313697814941406, 0.17756488919258118, 0.21199274063110352, 0.24642065167427063, 0.28084856271743774, 0.31527650356292725, 0.349704384803772, 0.3841323256492615, 0.4185602366924286, 0.4529881477355957, 0.4874160587787628, 0.5218439698219299, 0.5562719106674194, 0.5906997919082642, 0.6251277327537537, 0.6595556139945984, 0.6939835548400879, 0.7284114360809326, 0.7628393769264221, 0.7972673177719116, 0.8316951990127563, 0.8661231398582458, 0.9005510210990906, 0.9349789619445801, 0.9694068431854248, 1.0038347244262695, 1.0382627248764038, 1.0726906061172485, 1.1071186065673828, 1.1415464878082275, 1.1759743690490723, 1.210402250289917, 1.2448302507400513, 1.279258131980896, 1.3136860132217407]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 6.0, 9.0, 13.0, 37.0, 51.0, 140.0, 364.0, 1147.0, 6624.0, 712731.0, 320721.0, 5155.0, 960.0, 313.0, 142.0, 63.0, 30.0, 17.0, 9.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.98828125, -5.84881591796875, -5.7093505859375, -5.56988525390625, -5.430419921875, -5.29095458984375, -5.1514892578125, -5.01202392578125, -4.87255859375, -4.73309326171875, -4.5936279296875, -4.45416259765625, -4.314697265625, -4.17523193359375, -4.0357666015625, -3.89630126953125, -3.7568359375, -3.61737060546875, -3.4779052734375, -3.33843994140625, -3.198974609375, -3.05950927734375, -2.9200439453125, -2.78057861328125, -2.64111328125, -2.50164794921875, -2.3621826171875, -2.22271728515625, -2.083251953125, -1.94378662109375, -1.8043212890625, -1.66485595703125, -1.525390625, -1.38592529296875, -1.2464599609375, -1.10699462890625, -0.967529296875, -0.82806396484375, -0.6885986328125, -0.54913330078125, -0.40966796875, -0.27020263671875, -0.1307373046875, 0.00872802734375, 0.148193359375, 0.28765869140625, 0.4271240234375, 0.56658935546875, 0.7060546875, 0.84552001953125, 0.9849853515625, 1.12445068359375, 1.263916015625, 1.40338134765625, 1.5428466796875, 1.68231201171875, 1.82177734375, 1.96124267578125, 2.1007080078125, 2.24017333984375, 2.379638671875, 2.51910400390625, 2.6585693359375, 2.79803466796875, 2.9375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 13.0, 20.0, 30.0, 39.0, 65.0, 86.0, 114.0, 115.0, 124.0, 123.0, 95.0, 57.0, 39.0, 26.0, 23.0, 18.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.748046875, -1.623748779296875, -1.49945068359375, -1.375152587890625, -1.2508544921875, -1.126556396484375, -1.00225830078125, -0.877960205078125, -0.753662109375, -0.629364013671875, -0.50506591796875, -0.380767822265625, -0.2564697265625, -0.132171630859375, -0.00787353515625, 0.116424560546875, 0.24072265625, 0.365020751953125, 0.48931884765625, 0.613616943359375, 0.7379150390625, 0.862213134765625, 0.98651123046875, 1.110809326171875, 1.235107421875, 1.359405517578125, 1.48370361328125, 1.608001708984375, 1.7322998046875, 1.856597900390625, 1.98089599609375, 2.105194091796875, 2.2294921875, 2.353790283203125, 2.47808837890625, 2.602386474609375, 2.7266845703125, 2.850982666015625, 2.97528076171875, 3.099578857421875, 3.223876953125, 3.348175048828125, 3.47247314453125, 3.596771240234375, 3.7210693359375, 3.845367431640625, 3.96966552734375, 4.093963623046875, 4.21826171875, 4.342559814453125, 4.46685791015625, 4.591156005859375, 4.7154541015625, 4.839752197265625, 4.96405029296875, 5.088348388671875, 5.212646484375, 5.336944580078125, 5.46124267578125, 5.585540771484375, 5.7098388671875, 5.834136962890625, 5.95843505859375, 6.082733154296875, 6.20703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 12.0, 14.0, 28.0, 56.0, 144.0, 337.0, 1191.0, 7145.0, 994972.0, 41430.0, 2263.0, 557.0, 207.0, 97.0, 38.0, 27.0, 8.0, 11.0, 5.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4921875, -5.33843994140625, -5.1846923828125, -5.03094482421875, -4.877197265625, -4.72344970703125, -4.5697021484375, -4.41595458984375, -4.26220703125, -4.10845947265625, -3.9547119140625, -3.80096435546875, -3.647216796875, -3.49346923828125, -3.3397216796875, -3.18597412109375, -3.0322265625, -2.87847900390625, -2.7247314453125, -2.57098388671875, -2.417236328125, -2.26348876953125, -2.1097412109375, -1.95599365234375, -1.80224609375, -1.64849853515625, -1.4947509765625, -1.34100341796875, -1.187255859375, -1.03350830078125, -0.8797607421875, -0.72601318359375, -0.572265625, -0.41851806640625, -0.2647705078125, -0.11102294921875, 0.042724609375, 0.19647216796875, 0.3502197265625, 0.50396728515625, 0.65771484375, 0.81146240234375, 0.9652099609375, 1.11895751953125, 1.272705078125, 1.42645263671875, 1.5802001953125, 1.73394775390625, 1.8876953125, 2.04144287109375, 2.1951904296875, 2.34893798828125, 2.502685546875, 2.65643310546875, 2.8101806640625, 2.96392822265625, 3.11767578125, 3.27142333984375, 3.4251708984375, 3.57891845703125, 3.732666015625, 3.88641357421875, 4.0401611328125, 4.19390869140625, 4.34765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 3.0, 12.0, 9.0, 18.0, 17.0, 17.0, 18.0, 25.0, 36.0, 33.0, 26.0, 43.0, 45.0, 54.0, 58.0, 50.0, 49.0, 61.0, 47.0, 46.0, 33.0, 39.0, 35.0, 22.0, 30.0, 26.0, 22.0, 27.0, 12.0, 23.0, 12.0, 19.0, 8.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.93939208984375, -1.8787841796875, -1.81817626953125, -1.757568359375, -1.69696044921875, -1.6363525390625, -1.57574462890625, -1.51513671875, -1.45452880859375, -1.3939208984375, -1.33331298828125, -1.272705078125, -1.21209716796875, -1.1514892578125, -1.09088134765625, -1.0302734375, -0.96966552734375, -0.9090576171875, -0.84844970703125, -0.787841796875, -0.72723388671875, -0.6666259765625, -0.60601806640625, -0.54541015625, -0.48480224609375, -0.4241943359375, -0.36358642578125, -0.302978515625, -0.24237060546875, -0.1817626953125, -0.12115478515625, -0.060546875, 6.103515625e-05, 0.0606689453125, 0.12127685546875, 0.181884765625, 0.24249267578125, 0.3031005859375, 0.36370849609375, 0.42431640625, 0.48492431640625, 0.5455322265625, 0.60614013671875, 0.666748046875, 0.72735595703125, 0.7879638671875, 0.84857177734375, 0.9091796875, 0.96978759765625, 1.0303955078125, 1.09100341796875, 1.151611328125, 1.21221923828125, 1.2728271484375, 1.33343505859375, 1.39404296875, 1.45465087890625, 1.5152587890625, 1.57586669921875, 1.636474609375, 1.69708251953125, 1.7576904296875, 1.81829833984375, 1.87890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 9.0, 11.0, 17.0, 20.0, 48.0, 91.0, 216.0, 848.0, 9849.0, 984756.0, 50500.0, 1647.0, 312.0, 134.0, 44.0, 20.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.90966796875, -0.8609695434570312, -0.8122711181640625, -0.7635726928710938, -0.714874267578125, -0.6661758422851562, -0.6174774169921875, -0.5687789916992188, -0.52008056640625, -0.47138214111328125, -0.4226837158203125, -0.37398529052734375, -0.325286865234375, -0.27658843994140625, -0.2278900146484375, -0.17919158935546875, -0.1304931640625, -0.08179473876953125, -0.0330963134765625, 0.01560211181640625, 0.064300537109375, 0.11299896240234375, 0.1616973876953125, 0.21039581298828125, 0.25909423828125, 0.30779266357421875, 0.3564910888671875, 0.40518951416015625, 0.453887939453125, 0.5025863647460938, 0.5512847900390625, 0.5999832153320312, 0.648681640625, 0.6973800659179688, 0.7460784912109375, 0.7947769165039062, 0.843475341796875, 0.8921737670898438, 0.9408721923828125, 0.9895706176757812, 1.03826904296875, 1.0869674682617188, 1.1356658935546875, 1.1843643188476562, 1.233062744140625, 1.2817611694335938, 1.3304595947265625, 1.3791580200195312, 1.4278564453125, 1.4765548706054688, 1.5252532958984375, 1.5739517211914062, 1.622650146484375, 1.6713485717773438, 1.7200469970703125, 1.7687454223632812, 1.81744384765625, 1.8661422729492188, 1.9148406982421875, 1.9635391235351562, 2.012237548828125, 2.0609359741210938, 2.1096343994140625, 2.1583328247070312, 2.20703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 6.0, 8.0, 10.0, 15.0, 23.0, 37.0, 51.0, 77.0, 110.0, 131.0, 147.0, 121.0, 90.0, 65.0, 35.0, 26.0, 15.0, 9.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.872415542602539e-05, -6.586965173482895e-05, -6.301514804363251e-05, -6.0160644352436066e-05, -5.7306140661239624e-05, -5.445163697004318e-05, -5.159713327884674e-05, -4.87426295876503e-05, -4.588812589645386e-05, -4.3033622205257416e-05, -4.0179118514060974e-05, -3.732461482286453e-05, -3.447011113166809e-05, -3.161560744047165e-05, -2.8761103749275208e-05, -2.5906600058078766e-05, -2.3052096366882324e-05, -2.0197592675685883e-05, -1.734308898448944e-05, -1.4488585293293e-05, -1.1634081602096558e-05, -8.779577910900116e-06, -5.925074219703674e-06, -3.0705705285072327e-06, -2.1606683731079102e-07, 2.6384368538856506e-06, 5.492940545082092e-06, 8.347444236278534e-06, 1.1201947927474976e-05, 1.4056451618671417e-05, 1.691095530986786e-05, 1.97654590010643e-05, 2.2619962692260742e-05, 2.5474466383457184e-05, 2.8328970074653625e-05, 3.118347376585007e-05, 3.403797745704651e-05, 3.689248114824295e-05, 3.974698483943939e-05, 4.2601488530635834e-05, 4.5455992221832275e-05, 4.831049591302872e-05, 5.116499960422516e-05, 5.40195032954216e-05, 5.687400698661804e-05, 5.9728510677814484e-05, 6.258301436901093e-05, 6.543751806020737e-05, 6.829202175140381e-05, 7.114652544260025e-05, 7.400102913379669e-05, 7.685553282499313e-05, 7.971003651618958e-05, 8.256454020738602e-05, 8.541904389858246e-05, 8.82735475897789e-05, 9.112805128097534e-05, 9.398255497217178e-05, 9.683705866336823e-05, 9.969156235456467e-05, 0.00010254606604576111, 0.00010540056973695755, 0.00010825507342815399, 0.00011110957711935043, 0.00011396408081054688]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 9.0, 18.0, 15.0, 26.0, 91.0, 253.0, 925.0, 9201.0, 983904.0, 51539.0, 1944.0, 391.0, 131.0, 58.0, 24.0, 12.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.74609375, -1.69268798828125, -1.6392822265625, -1.58587646484375, -1.532470703125, -1.47906494140625, -1.4256591796875, -1.37225341796875, -1.31884765625, -1.26544189453125, -1.2120361328125, -1.15863037109375, -1.105224609375, -1.05181884765625, -0.9984130859375, -0.94500732421875, -0.8916015625, -0.83819580078125, -0.7847900390625, -0.73138427734375, -0.677978515625, -0.62457275390625, -0.5711669921875, -0.51776123046875, -0.46435546875, -0.41094970703125, -0.3575439453125, -0.30413818359375, -0.250732421875, -0.19732666015625, -0.1439208984375, -0.09051513671875, -0.037109375, 0.01629638671875, 0.0697021484375, 0.12310791015625, 0.176513671875, 0.22991943359375, 0.2833251953125, 0.33673095703125, 0.39013671875, 0.44354248046875, 0.4969482421875, 0.55035400390625, 0.603759765625, 0.65716552734375, 0.7105712890625, 0.76397705078125, 0.8173828125, 0.87078857421875, 0.9241943359375, 0.97760009765625, 1.031005859375, 1.08441162109375, 1.1378173828125, 1.19122314453125, 1.24462890625, 1.29803466796875, 1.3514404296875, 1.40484619140625, 1.458251953125, 1.51165771484375, 1.5650634765625, 1.61846923828125, 1.671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 10.0, 6.0, 22.0, 47.0, 89.0, 203.0, 254.0, 193.0, 94.0, 40.0, 18.0, 14.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.430908203125, -0.41674041748046875, -0.4025726318359375, -0.38840484619140625, -0.374237060546875, -0.36006927490234375, -0.3459014892578125, -0.33173370361328125, -0.31756591796875, -0.30339813232421875, -0.2892303466796875, -0.27506256103515625, -0.260894775390625, -0.24672698974609375, -0.2325592041015625, -0.21839141845703125, -0.2042236328125, -0.19005584716796875, -0.1758880615234375, -0.16172027587890625, -0.147552490234375, -0.13338470458984375, -0.1192169189453125, -0.10504913330078125, -0.09088134765625, -0.07671356201171875, -0.0625457763671875, -0.04837799072265625, -0.034210205078125, -0.02004241943359375, -0.0058746337890625, 0.00829315185546875, 0.0224609375, 0.03662872314453125, 0.0507965087890625, 0.06496429443359375, 0.079132080078125, 0.09329986572265625, 0.1074676513671875, 0.12163543701171875, 0.13580322265625, 0.14997100830078125, 0.1641387939453125, 0.17830657958984375, 0.192474365234375, 0.20664215087890625, 0.2208099365234375, 0.23497772216796875, 0.2491455078125, 0.26331329345703125, 0.2774810791015625, 0.29164886474609375, 0.305816650390625, 0.31998443603515625, 0.3341522216796875, 0.34832000732421875, 0.36248779296875, 0.37665557861328125, 0.3908233642578125, 0.40499114990234375, 0.419158935546875, 0.43332672119140625, 0.4474945068359375, 0.46166229248046875, 0.475830078125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 9.0, 6.0, 12.0, 16.0, 12.0, 16.0, 21.0, 37.0, 55.0, 45.0, 84.0, 106.0, 94.0, 132.0, 84.0, 69.0, 53.0, 45.0, 25.0, 24.0, 10.0, 11.0, 6.0, 10.0, 8.0, 1.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.9204657077789307, -2.8390283584594727, -2.7575907707214355, -2.6761534214019775, -2.5947160720825195, -2.5132784843444824, -2.4318411350250244, -2.3504037857055664, -2.2689661979675293, -2.1875288486480713, -2.106091260910034, -2.024653911590576, -1.9432165622711182, -1.8617790937423706, -1.780341625213623, -1.698904275894165, -1.617466926574707, -1.5360294580459595, -1.4545921087265015, -1.373154640197754, -1.291717290878296, -1.2102798223495483, -1.1288423538208008, -1.0474050045013428, -0.9659675359725952, -0.8845301270484924, -0.8030927181243896, -0.7216552495956421, -0.6402178406715393, -0.5587804317474365, -0.47734299302101135, -0.3959055542945862, -0.3144681453704834, -0.23303072154521942, -0.15159329771995544, -0.07015587389469147, 0.01128154993057251, 0.09271895885467529, 0.17415639758110046, 0.25559383630752563, 0.3370312452316284, 0.4184686541557312, 0.49990609288215637, 0.5813435316085815, 0.6627809405326843, 0.7442183494567871, 0.8256558179855347, 0.9070932269096375, 0.9885306358337402, 1.0699681043624878, 1.1514054536819458, 1.2328429222106934, 1.3142802715301514, 1.395717740058899, 1.4771552085876465, 1.5585925579071045, 1.640030026435852, 1.7214674949645996, 1.8029048442840576, 1.8843423128128052, 1.9657797813415527, 2.0472171306610107, 2.1286544799804688, 2.210092067718506, 2.291529417037964]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 8.0, 6.0, 9.0, 18.0, 25.0, 18.0, 30.0, 29.0, 46.0, 35.0, 45.0, 68.0, 59.0, 73.0, 57.0, 65.0, 76.0, 59.0, 46.0, 37.0, 48.0, 37.0, 30.0, 29.0, 16.0, 14.0, 13.0, 7.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8982648849487305, -2.756880521774292, -2.6154961585998535, -2.474111795425415, -2.3327274322509766, -2.191343307495117, -2.0499589443206787, -1.9085745811462402, -1.7671902179718018, -1.6258058547973633, -1.4844214916229248, -1.3430372476577759, -1.2016528844833374, -1.060268521308899, -0.9188842177391052, -0.7774999141693115, -0.636115550994873, -0.49473121762275696, -0.35334688425064087, -0.21196255087852478, -0.07057821750640869, 0.07080614566802979, 0.2121904492378235, 0.3535747528076172, 0.49495911598205566, 0.6363434791564941, 0.7777277827262878, 0.9191120862960815, 1.06049644947052, 1.2018808126449585, 1.3432650566101074, 1.484649419784546, 1.6260337829589844, 1.7674181461334229, 1.9088025093078613, 2.0501868724823, 2.1915712356567383, 2.3329553604125977, 2.474339723587036, 2.6157240867614746, 2.757108449935913, 2.8984928131103516, 3.03987717628479, 3.1812615394592285, 3.322645664215088, 3.4640302658081055, 3.605414390563965, 3.7467987537384033, 3.888183116912842, 4.029567241668701, 4.170951843261719, 4.312335968017578, 4.453720569610596, 4.595104694366455, 4.736489295959473, 4.877873420715332, 5.019257545471191, 5.160641670227051, 5.302026271820068, 5.443410396575928, 5.584794998168945, 5.726179122924805, 5.867563724517822, 6.008947849273682, 6.150332450866699]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 6.0, 5.0, 6.0, 11.0, 11.0, 14.0, 21.0, 30.0, 39.0, 64.0, 75.0, 129.0, 201.0, 327.0, 610.0, 1390.0, 3614.0, 17932.0, 284192.0, 3446205.0, 405749.0, 24892.0, 4715.0, 2051.0, 919.0, 448.0, 229.0, 131.0, 81.0, 56.0, 37.0, 26.0, 20.0, 11.0, 9.0, 9.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.310546875, -2.2296142578125, -2.148681640625, -2.0677490234375, -1.98681640625, -1.9058837890625, -1.824951171875, -1.7440185546875, -1.6630859375, -1.5821533203125, -1.501220703125, -1.4202880859375, -1.33935546875, -1.2584228515625, -1.177490234375, -1.0965576171875, -1.015625, -0.9346923828125, -0.853759765625, -0.7728271484375, -0.69189453125, -0.6109619140625, -0.530029296875, -0.4490966796875, -0.3681640625, -0.2872314453125, -0.206298828125, -0.1253662109375, -0.04443359375, 0.0364990234375, 0.117431640625, 0.1983642578125, 0.279296875, 0.3602294921875, 0.441162109375, 0.5220947265625, 0.60302734375, 0.6839599609375, 0.764892578125, 0.8458251953125, 0.9267578125, 1.0076904296875, 1.088623046875, 1.1695556640625, 1.25048828125, 1.3314208984375, 1.412353515625, 1.4932861328125, 1.57421875, 1.6551513671875, 1.736083984375, 1.8170166015625, 1.89794921875, 1.9788818359375, 2.059814453125, 2.1407470703125, 2.2216796875, 2.3026123046875, 2.383544921875, 2.4644775390625, 2.54541015625, 2.6263427734375, 2.707275390625, 2.7882080078125, 2.869140625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 10.0, 24.0, 27.0, 32.0, 51.0, 52.0, 70.0, 105.0, 95.0, 81.0, 89.0, 74.0, 73.0, 73.0, 43.0, 24.0, 21.0, 12.0, 17.0, 4.0, 2.0, 5.0, 4.0, 2.0, 3.0], "bins": [-3.060546875, -2.997100830078125, -2.93365478515625, -2.870208740234375, -2.8067626953125, -2.743316650390625, -2.67987060546875, -2.616424560546875, -2.552978515625, -2.489532470703125, -2.42608642578125, -2.362640380859375, -2.2991943359375, -2.235748291015625, -2.17230224609375, -2.108856201171875, -2.04541015625, -1.981964111328125, -1.91851806640625, -1.855072021484375, -1.7916259765625, -1.728179931640625, -1.66473388671875, -1.601287841796875, -1.537841796875, -1.474395751953125, -1.41094970703125, -1.347503662109375, -1.2840576171875, -1.220611572265625, -1.15716552734375, -1.093719482421875, -1.0302734375, -0.966827392578125, -0.90338134765625, -0.839935302734375, -0.7764892578125, -0.713043212890625, -0.64959716796875, -0.586151123046875, -0.522705078125, -0.459259033203125, -0.39581298828125, -0.332366943359375, -0.2689208984375, -0.205474853515625, -0.14202880859375, -0.078582763671875, -0.01513671875, 0.048309326171875, 0.11175537109375, 0.175201416015625, 0.2386474609375, 0.302093505859375, 0.36553955078125, 0.428985595703125, 0.492431640625, 0.555877685546875, 0.61932373046875, 0.682769775390625, 0.7462158203125, 0.809661865234375, 0.87310791015625, 0.936553955078125, 1.0]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 10.0, 9.0, 17.0, 14.0, 37.0, 57.0, 84.0, 128.0, 184.0, 327.0, 519.0, 1027.0, 1998.0, 4324.0, 11990.0, 47906.0, 482787.0, 3345498.0, 247675.0, 33016.0, 9348.0, 3577.0, 1669.0, 854.0, 454.0, 256.0, 203.0, 95.0, 63.0, 46.0, 34.0, 20.0, 19.0, 8.0, 6.0, 2.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5546875, -1.506683349609375, -1.45867919921875, -1.410675048828125, -1.3626708984375, -1.314666748046875, -1.26666259765625, -1.218658447265625, -1.170654296875, -1.122650146484375, -1.07464599609375, -1.026641845703125, -0.9786376953125, -0.930633544921875, -0.88262939453125, -0.834625244140625, -0.78662109375, -0.738616943359375, -0.69061279296875, -0.642608642578125, -0.5946044921875, -0.546600341796875, -0.49859619140625, -0.450592041015625, -0.402587890625, -0.354583740234375, -0.30657958984375, -0.258575439453125, -0.2105712890625, -0.162567138671875, -0.11456298828125, -0.066558837890625, -0.0185546875, 0.029449462890625, 0.07745361328125, 0.125457763671875, 0.1734619140625, 0.221466064453125, 0.26947021484375, 0.317474365234375, 0.365478515625, 0.413482666015625, 0.46148681640625, 0.509490966796875, 0.5574951171875, 0.605499267578125, 0.65350341796875, 0.701507568359375, 0.74951171875, 0.797515869140625, 0.84552001953125, 0.893524169921875, 0.9415283203125, 0.989532470703125, 1.03753662109375, 1.085540771484375, 1.133544921875, 1.181549072265625, 1.22955322265625, 1.277557373046875, 1.3255615234375, 1.373565673828125, 1.42156982421875, 1.469573974609375, 1.517578125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 8.0, 16.0, 15.0, 25.0, 24.0, 51.0, 72.0, 133.0, 220.0, 385.0, 574.0, 749.0, 638.0, 405.0, 257.0, 169.0, 105.0, 60.0, 42.0, 25.0, 23.0, 13.0, 8.0, 8.0, 2.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.464599609375, -0.4489860534667969, -0.43337249755859375, -0.4177589416503906, -0.4021453857421875, -0.3865318298339844, -0.37091827392578125, -0.3553047180175781, -0.339691162109375, -0.3240776062011719, -0.30846405029296875, -0.2928504943847656, -0.2772369384765625, -0.2616233825683594, -0.24600982666015625, -0.23039627075195312, -0.21478271484375, -0.19916915893554688, -0.18355560302734375, -0.16794204711914062, -0.1523284912109375, -0.13671493530273438, -0.12110137939453125, -0.10548782348632812, -0.089874267578125, -0.07426071166992188, -0.05864715576171875, -0.043033599853515625, -0.0274200439453125, -0.011806488037109375, 0.00380706787109375, 0.019420623779296875, 0.0350341796875, 0.050647735595703125, 0.06626129150390625, 0.08187484741210938, 0.0974884033203125, 0.11310195922851562, 0.12871551513671875, 0.14432907104492188, 0.159942626953125, 0.17555618286132812, 0.19116973876953125, 0.20678329467773438, 0.2223968505859375, 0.23801040649414062, 0.25362396240234375, 0.2692375183105469, 0.28485107421875, 0.3004646301269531, 0.31607818603515625, 0.3316917419433594, 0.3473052978515625, 0.3629188537597656, 0.37853240966796875, 0.3941459655761719, 0.409759521484375, 0.4253730773925781, 0.44098663330078125, 0.4566001892089844, 0.4722137451171875, 0.4878273010253906, 0.5034408569335938, 0.5190544128417969, 0.53466796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 3.0, 11.0, 9.0, 12.0, 16.0, 34.0, 37.0, 44.0, 57.0, 82.0, 95.0, 123.0, 103.0, 107.0, 67.0, 61.0, 31.0, 27.0, 22.0, 16.0, 9.0, 7.0, 10.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9541956186294556, -1.8948231935501099, -1.8354507684707642, -1.7760783433914185, -1.7167059183120728, -1.657333493232727, -1.597961187362671, -1.5385887622833252, -1.4792163372039795, -1.4198439121246338, -1.360471487045288, -1.3010990619659424, -1.2417266368865967, -1.182354211807251, -1.1229817867279053, -1.0636093616485596, -1.0042369365692139, -0.9448645114898682, -0.8854920864105225, -0.8261196613311768, -0.766747236251831, -0.7073748111724854, -0.6480024456977844, -0.5886300206184387, -0.529257595539093, -0.4698851704597473, -0.4105127453804016, -0.3511403501033783, -0.2917679250240326, -0.2323954999446869, -0.17302310466766357, -0.11365067958831787, -0.05427825450897217, 0.005094163119792938, 0.06446658074855804, 0.12383899092674255, 0.18321141600608826, 0.24258384108543396, 0.3019562363624573, 0.361328661441803, 0.4207010865211487, 0.4800735116004944, 0.5394459366798401, 0.598818302154541, 0.6581907272338867, 0.7175631523132324, 0.7769355773925781, 0.8363080024719238, 0.8956804275512695, 0.9550528526306152, 1.014425277709961, 1.0737977027893066, 1.1331701278686523, 1.192542552947998, 1.2519149780273438, 1.3112874031066895, 1.3706598281860352, 1.4300322532653809, 1.4894046783447266, 1.5487771034240723, 1.608149528503418, 1.6675219535827637, 1.7268943786621094, 1.786266803741455, 1.8456391096115112]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 3.0, 5.0, 7.0, 7.0, 13.0, 20.0, 17.0, 18.0, 17.0, 30.0, 31.0, 29.0, 28.0, 42.0, 51.0, 57.0, 49.0, 59.0, 71.0, 52.0, 57.0, 46.0, 39.0, 31.0, 41.0, 29.0, 28.0, 21.0, 14.0, 18.0, 18.0, 12.0, 7.0, 6.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1175644397735596, -1.0779024362564087, -1.0382405519485474, -0.9985785484313965, -0.9589165449142456, -0.9192546010017395, -0.8795926570892334, -0.8399306535720825, -0.8002687096595764, -0.7606067657470703, -0.7209447622299194, -0.6812828183174133, -0.6416208744049072, -0.6019588708877563, -0.5622969269752502, -0.5226349830627441, -0.48297297954559326, -0.44331100583076477, -0.4036490321159363, -0.3639870882034302, -0.3243251144886017, -0.2846631407737732, -0.2450011819601059, -0.2053392231464386, -0.1656772494316101, -0.12601527571678162, -0.08635331690311432, -0.046691350638866425, -0.00702938437461853, 0.03263258934020996, 0.07229454815387726, 0.11195650696754456, 0.1516183614730835, 0.191280335187912, 0.23094229400157928, 0.2706042528152466, 0.3102662265300751, 0.34992820024490356, 0.38959014415740967, 0.42925211787223816, 0.46891409158706665, 0.5085760354995728, 0.5482380390167236, 0.5878999829292297, 0.6275619268417358, 0.6672239303588867, 0.7068858742713928, 0.7465478181838989, 0.7862098217010498, 0.8258717656135559, 0.8655337691307068, 0.9051957130432129, 0.9448577165603638, 0.9845196604728699, 1.024181604385376, 1.0638436079025269, 1.1035056114196777, 1.1431676149368286, 1.18282949924469, 1.2224915027618408, 1.2621535062789917, 1.3018155097961426, 1.341477394104004, 1.3811393976211548, 1.4208012819290161]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 5.0, 7.0, 3.0, 9.0, 7.0, 15.0, 18.0, 15.0, 16.0, 29.0, 25.0, 43.0, 51.0, 77.0, 122.0, 361.0, 894.0, 2629.0, 9265.0, 45213.0, 329901.0, 550525.0, 87733.0, 15344.0, 3846.0, 1378.0, 446.0, 196.0, 99.0, 62.0, 57.0, 28.0, 25.0, 20.0, 18.0, 13.0, 9.0, 8.0, 7.0, 12.0, 8.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.316650390625, -0.3068084716796875, -0.296966552734375, -0.2871246337890625, -0.27728271484375, -0.2674407958984375, -0.257598876953125, -0.2477569580078125, -0.2379150390625, -0.2280731201171875, -0.218231201171875, -0.2083892822265625, -0.19854736328125, -0.1887054443359375, -0.178863525390625, -0.1690216064453125, -0.1591796875, -0.1493377685546875, -0.139495849609375, -0.1296539306640625, -0.11981201171875, -0.1099700927734375, -0.100128173828125, -0.0902862548828125, -0.0804443359375, -0.0706024169921875, -0.060760498046875, -0.0509185791015625, -0.04107666015625, -0.0312347412109375, -0.021392822265625, -0.0115509033203125, -0.001708984375, 0.0081329345703125, 0.017974853515625, 0.0278167724609375, 0.03765869140625, 0.0475006103515625, 0.057342529296875, 0.0671844482421875, 0.0770263671875, 0.0868682861328125, 0.096710205078125, 0.1065521240234375, 0.11639404296875, 0.1262359619140625, 0.136077880859375, 0.1459197998046875, 0.15576171875, 0.1656036376953125, 0.175445556640625, 0.1852874755859375, 0.19512939453125, 0.2049713134765625, 0.214813232421875, 0.2246551513671875, 0.2344970703125, 0.2443389892578125, 0.254180908203125, 0.2640228271484375, 0.27386474609375, 0.2837066650390625, 0.293548583984375, 0.3033905029296875, 0.313232421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 5.0, 21.0, 30.0, 49.0, 58.0, 97.0, 126.0, 160.0, 156.0, 103.0, 63.0, 52.0, 35.0, 17.0, 7.0, 8.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.154296875, -3.08795166015625, -3.0216064453125, -2.95526123046875, -2.888916015625, -2.82257080078125, -2.7562255859375, -2.68988037109375, -2.62353515625, -2.55718994140625, -2.4908447265625, -2.42449951171875, -2.358154296875, -2.29180908203125, -2.2254638671875, -2.15911865234375, -2.0927734375, -2.02642822265625, -1.9600830078125, -1.89373779296875, -1.827392578125, -1.76104736328125, -1.6947021484375, -1.62835693359375, -1.56201171875, -1.49566650390625, -1.4293212890625, -1.36297607421875, -1.296630859375, -1.23028564453125, -1.1639404296875, -1.09759521484375, -1.03125, -0.96490478515625, -0.8985595703125, -0.83221435546875, -0.765869140625, -0.69952392578125, -0.6331787109375, -0.56683349609375, -0.50048828125, -0.43414306640625, -0.3677978515625, -0.30145263671875, -0.235107421875, -0.16876220703125, -0.1024169921875, -0.03607177734375, 0.0302734375, 0.09661865234375, 0.1629638671875, 0.22930908203125, 0.295654296875, 0.36199951171875, 0.4283447265625, 0.49468994140625, 0.56103515625, 0.62738037109375, 0.6937255859375, 0.76007080078125, 0.826416015625, 0.89276123046875, 0.9591064453125, 1.02545166015625, 1.091796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 2.0, 3.0, 7.0, 8.0, 13.0, 16.0, 20.0, 29.0, 29.0, 66.0, 91.0, 130.0, 231.0, 316.0, 566.0, 964.0, 1922.0, 3874.0, 9119.0, 24534.0, 72144.0, 231511.0, 419048.0, 188609.0, 59000.0, 20840.0, 8259.0, 3403.0, 1667.0, 862.0, 459.0, 263.0, 197.0, 94.0, 79.0, 51.0, 40.0, 24.0, 21.0, 15.0, 16.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.1949462890625, -0.1895923614501953, -0.18423843383789062, -0.17888450622558594, -0.17353057861328125, -0.16817665100097656, -0.16282272338867188, -0.1574687957763672, -0.1521148681640625, -0.1467609405517578, -0.14140701293945312, -0.13605308532714844, -0.13069915771484375, -0.12534523010253906, -0.11999130249023438, -0.11463737487792969, -0.109283447265625, -0.10392951965332031, -0.09857559204101562, -0.09322166442871094, -0.08786773681640625, -0.08251380920410156, -0.07715988159179688, -0.07180595397949219, -0.0664520263671875, -0.06109809875488281, -0.055744171142578125, -0.05039024353027344, -0.04503631591796875, -0.03968238830566406, -0.034328460693359375, -0.028974533081054688, -0.02362060546875, -0.018266677856445312, -0.012912750244140625, -0.0075588226318359375, -0.00220489501953125, 0.0031490325927734375, 0.008502960205078125, 0.013856887817382812, 0.0192108154296875, 0.024564743041992188, 0.029918670654296875, 0.03527259826660156, 0.04062652587890625, 0.04598045349121094, 0.051334381103515625, 0.05668830871582031, 0.062042236328125, 0.06739616394042969, 0.07275009155273438, 0.07810401916503906, 0.08345794677734375, 0.08881187438964844, 0.09416580200195312, 0.09951972961425781, 0.1048736572265625, 0.11022758483886719, 0.11558151245117188, 0.12093544006347656, 0.12628936767578125, 0.13164329528808594, 0.13699722290039062, 0.1423511505126953, 0.147705078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 5.0, 8.0, 8.0, 22.0, 22.0, 14.0, 15.0, 24.0, 31.0, 37.0, 34.0, 49.0, 51.0, 55.0, 51.0, 45.0, 44.0, 62.0, 50.0, 49.0, 34.0, 37.0, 37.0, 33.0, 25.0, 24.0, 28.0, 19.0, 19.0, 7.0, 16.0, 11.0, 6.0, 8.0, 1.0, 4.0, 5.0, 4.0], "bins": [-2.1484375, -2.0975341796875, -2.046630859375, -1.9957275390625, -1.94482421875, -1.8939208984375, -1.843017578125, -1.7921142578125, -1.7412109375, -1.6903076171875, -1.639404296875, -1.5885009765625, -1.53759765625, -1.4866943359375, -1.435791015625, -1.3848876953125, -1.333984375, -1.2830810546875, -1.232177734375, -1.1812744140625, -1.13037109375, -1.0794677734375, -1.028564453125, -0.9776611328125, -0.9267578125, -0.8758544921875, -0.824951171875, -0.7740478515625, -0.72314453125, -0.6722412109375, -0.621337890625, -0.5704345703125, -0.51953125, -0.4686279296875, -0.417724609375, -0.3668212890625, -0.31591796875, -0.2650146484375, -0.214111328125, -0.1632080078125, -0.1123046875, -0.0614013671875, -0.010498046875, 0.0404052734375, 0.09130859375, 0.1422119140625, 0.193115234375, 0.2440185546875, 0.294921875, 0.3458251953125, 0.396728515625, 0.4476318359375, 0.49853515625, 0.5494384765625, 0.600341796875, 0.6512451171875, 0.7021484375, 0.7530517578125, 0.803955078125, 0.8548583984375, 0.90576171875, 0.9566650390625, 1.007568359375, 1.0584716796875, 1.109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 14.0, 10.0, 15.0, 19.0, 36.0, 50.0, 84.0, 139.0, 227.0, 448.0, 1068.0, 2792.0, 10085.0, 53132.0, 440815.0, 466199.0, 57611.0, 10579.0, 2975.0, 1091.0, 500.0, 255.0, 135.0, 89.0, 60.0, 33.0, 28.0, 16.0, 17.0, 6.0, 6.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09307861328125, -0.09025955200195312, -0.08744049072265625, -0.08462142944335938, -0.0818023681640625, -0.07898330688476562, -0.07616424560546875, -0.07334518432617188, -0.070526123046875, -0.06770706176757812, -0.06488800048828125, -0.062068939208984375, -0.0592498779296875, -0.056430816650390625, -0.05361175537109375, -0.050792694091796875, -0.0479736328125, -0.045154571533203125, -0.04233551025390625, -0.039516448974609375, -0.0366973876953125, -0.033878326416015625, -0.03105926513671875, -0.028240203857421875, -0.025421142578125, -0.022602081298828125, -0.01978302001953125, -0.016963958740234375, -0.0141448974609375, -0.011325836181640625, -0.00850677490234375, -0.005687713623046875, -0.00286865234375, -4.9591064453125e-05, 0.00276947021484375, 0.005588531494140625, 0.0084075927734375, 0.011226654052734375, 0.01404571533203125, 0.016864776611328125, 0.019683837890625, 0.022502899169921875, 0.02532196044921875, 0.028141021728515625, 0.0309600830078125, 0.033779144287109375, 0.03659820556640625, 0.039417266845703125, 0.042236328125, 0.045055389404296875, 0.04787445068359375, 0.050693511962890625, 0.0535125732421875, 0.056331634521484375, 0.05915069580078125, 0.061969757080078125, 0.064788818359375, 0.06760787963867188, 0.07042694091796875, 0.07324600219726562, 0.0760650634765625, 0.07888412475585938, 0.08170318603515625, 0.08452224731445312, 0.08734130859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 8.0, 8.0, 11.0, 8.0, 22.0, 28.0, 32.0, 46.0, 63.0, 78.0, 94.0, 110.0, 110.0, 96.0, 75.0, 54.0, 58.0, 23.0, 24.0, 15.0, 13.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.820657730102539e-05, -3.700517117977142e-05, -3.5803765058517456e-05, -3.460235893726349e-05, -3.340095281600952e-05, -3.2199546694755554e-05, -3.099814057350159e-05, -2.979673445224762e-05, -2.8595328330993652e-05, -2.7393922209739685e-05, -2.6192516088485718e-05, -2.499110996723175e-05, -2.3789703845977783e-05, -2.2588297724723816e-05, -2.138689160346985e-05, -2.018548548221588e-05, -1.8984079360961914e-05, -1.7782673239707947e-05, -1.658126711845398e-05, -1.5379860997200012e-05, -1.4178454875946045e-05, -1.2977048754692078e-05, -1.177564263343811e-05, -1.0574236512184143e-05, -9.372830390930176e-06, -8.171424269676208e-06, -6.970018148422241e-06, -5.768612027168274e-06, -4.567205905914307e-06, -3.3657997846603394e-06, -2.164393663406372e-06, -9.629875421524048e-07, 2.384185791015625e-07, 1.4398247003555298e-06, 2.641230821609497e-06, 3.842636942863464e-06, 5.044043064117432e-06, 6.245449185371399e-06, 7.446855306625366e-06, 8.648261427879333e-06, 9.8496675491333e-06, 1.1051073670387268e-05, 1.2252479791641235e-05, 1.3453885912895203e-05, 1.465529203414917e-05, 1.5856698155403137e-05, 1.7058104276657104e-05, 1.8259510397911072e-05, 1.946091651916504e-05, 2.0662322640419006e-05, 2.1863728761672974e-05, 2.306513488292694e-05, 2.4266541004180908e-05, 2.5467947125434875e-05, 2.6669353246688843e-05, 2.787075936794281e-05, 2.9072165489196777e-05, 3.0273571610450745e-05, 3.147497773170471e-05, 3.267638385295868e-05, 3.3877789974212646e-05, 3.5079196095466614e-05, 3.628060221672058e-05, 3.748200833797455e-05, 3.8683414459228516e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 13.0, 20.0, 30.0, 31.0, 73.0, 96.0, 169.0, 303.0, 565.0, 1111.0, 2258.0, 5093.0, 13241.0, 37969.0, 117304.0, 308031.0, 343093.0, 144606.0, 46842.0, 16039.0, 6301.0, 2623.0, 1236.0, 659.0, 327.0, 192.0, 119.0, 73.0, 48.0, 27.0, 17.0, 9.0, 9.0, 3.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0579833984375, -0.056461334228515625, -0.05493927001953125, -0.053417205810546875, -0.0518951416015625, -0.050373077392578125, -0.04885101318359375, -0.047328948974609375, -0.045806884765625, -0.044284820556640625, -0.04276275634765625, -0.041240692138671875, -0.0397186279296875, -0.038196563720703125, -0.03667449951171875, -0.035152435302734375, -0.03363037109375, -0.032108306884765625, -0.03058624267578125, -0.029064178466796875, -0.0275421142578125, -0.026020050048828125, -0.02449798583984375, -0.022975921630859375, -0.021453857421875, -0.019931793212890625, -0.01840972900390625, -0.016887664794921875, -0.0153656005859375, -0.013843536376953125, -0.01232147216796875, -0.010799407958984375, -0.00927734375, -0.007755279541015625, -0.00623321533203125, -0.004711151123046875, -0.0031890869140625, -0.001667022705078125, -0.00014495849609375, 0.001377105712890625, 0.002899169921875, 0.004421234130859375, 0.00594329833984375, 0.007465362548828125, 0.0089874267578125, 0.010509490966796875, 0.01203155517578125, 0.013553619384765625, 0.01507568359375, 0.016597747802734375, 0.01811981201171875, 0.019641876220703125, 0.0211639404296875, 0.022686004638671875, 0.02420806884765625, 0.025730133056640625, 0.027252197265625, 0.028774261474609375, 0.03029632568359375, 0.031818389892578125, 0.0333404541015625, 0.034862518310546875, 0.03638458251953125, 0.037906646728515625, 0.0394287109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 0.0, 3.0, 6.0, 4.0, 9.0, 13.0, 12.0, 12.0, 21.0, 16.0, 25.0, 29.0, 33.0, 49.0, 49.0, 37.0, 53.0, 49.0, 64.0, 58.0, 63.0, 71.0, 56.0, 49.0, 46.0, 35.0, 26.0, 22.0, 20.0, 17.0, 10.0, 8.0, 11.0, 4.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010772705078125, -0.010311126708984375, -0.00984954833984375, -0.009387969970703125, -0.0089263916015625, -0.008464813232421875, -0.00800323486328125, -0.007541656494140625, -0.007080078125, -0.006618499755859375, -0.00615692138671875, -0.005695343017578125, -0.0052337646484375, -0.004772186279296875, -0.00431060791015625, -0.003849029541015625, -0.003387451171875, -0.002925872802734375, -0.00246429443359375, -0.002002716064453125, -0.0015411376953125, -0.001079559326171875, -0.00061798095703125, -0.000156402587890625, 0.00030517578125, 0.000766754150390625, 0.00122833251953125, 0.001689910888671875, 0.0021514892578125, 0.002613067626953125, 0.00307464599609375, 0.003536224365234375, 0.003997802734375, 0.004459381103515625, 0.00492095947265625, 0.005382537841796875, 0.0058441162109375, 0.006305694580078125, 0.00676727294921875, 0.007228851318359375, 0.0076904296875, 0.008152008056640625, 0.00861358642578125, 0.009075164794921875, 0.0095367431640625, 0.009998321533203125, 0.01045989990234375, 0.010921478271484375, 0.011383056640625, 0.011844635009765625, 0.01230621337890625, 0.012767791748046875, 0.0132293701171875, 0.013690948486328125, 0.01415252685546875, 0.014614105224609375, 0.01507568359375, 0.015537261962890625, 0.01599884033203125, 0.016460418701171875, 0.0169219970703125, 0.017383575439453125, 0.01784515380859375, 0.018306732177734375, 0.018768310546875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 15.0, 29.0, 68.0, 175.0, 291.0, 248.0, 102.0, 45.0, 16.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.492897868156433, -1.3916181325912476, -1.2903382778167725, -1.189058542251587, -1.0877788066864014, -0.9864989519119263, -0.8852192163467407, -0.7839394211769104, -0.6826596260070801, -0.5813798308372498, -0.4801000654697418, -0.3788203001022339, -0.27754050493240356, -0.17626070976257324, -0.0749809741973877, 0.026298820972442627, 0.12757861614227295, 0.22885839641094208, 0.3301381766796112, 0.43141794204711914, 0.5326977372169495, 0.6339775323867798, 0.7352572679519653, 0.8365370631217957, 0.937816858291626, 1.0390965938568115, 1.1403764486312866, 1.2416561841964722, 1.3429360389709473, 1.4442157745361328, 1.5454955101013184, 1.646775245666504, 1.7480549812316895, 1.849334716796875, 1.95061457157135, 2.051894187927246, 2.1531741619110107, 2.2544538974761963, 2.355733633041382, 2.4570133686065674, 2.558293342590332, 2.6595730781555176, 2.760852813720703, 2.8621325492858887, 2.9634125232696533, 3.064692258834839, 3.1659719944000244, 3.26725172996521, 3.3685314655303955, 3.469811201095581, 3.5710909366607666, 3.6723709106445312, 3.773650646209717, 3.8749303817749023, 3.976210117340088, 4.077489852905273, 4.178769588470459, 4.2800493240356445, 4.38132905960083, 4.482608795166016, 4.583888530731201, 4.685168266296387, 4.7864484786987305, 4.887728214263916, 4.989007949829102]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 18.0, 21.0, 18.0, 23.0, 34.0, 36.0, 40.0, 44.0, 68.0, 67.0, 59.0, 81.0, 74.0, 70.0, 51.0, 40.0, 47.0, 44.0, 30.0, 21.0, 17.0, 21.0, 10.0, 8.0, 6.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8784547448158264, -0.8474689722061157, -0.816483199596405, -0.7854974269866943, -0.7545115947723389, -0.7235258221626282, -0.6925400495529175, -0.6615542769432068, -0.6305685043334961, -0.5995827317237854, -0.5685969591140747, -0.5376111268997192, -0.5066253542900085, -0.47563958168029785, -0.44465380907058716, -0.41366803646087646, -0.382682204246521, -0.3516964316368103, -0.3207106292247772, -0.28972485661506653, -0.25873905420303345, -0.22775328159332275, -0.19676750898361206, -0.16578172147274017, -0.1347959339618683, -0.1038101464509964, -0.07282436639070511, -0.04183858633041382, -0.010852798819541931, 0.020132988691329956, 0.05111876130104065, 0.08210454881191254, 0.11309027671813965, 0.14407606422901154, 0.17506185173988342, 0.20604762434959412, 0.237033411860466, 0.2680191993713379, 0.2990049719810486, 0.3299907445907593, 0.36097654700279236, 0.39196231961250305, 0.42294812202453613, 0.4539338946342468, 0.4849196672439575, 0.515905499458313, 0.5468912124633789, 0.5778770446777344, 0.6088628172874451, 0.6398485898971558, 0.6708343625068665, 0.7018201351165771, 0.7328059673309326, 0.7637917399406433, 0.794777512550354, 0.8257632851600647, 0.8567490577697754, 0.8877348303794861, 0.9187206029891968, 0.9497064352035522, 0.9806922078132629, 1.0116779804229736, 1.042663812637329, 1.073649525642395, 1.1046353578567505]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 16.0, 10.0, 14.0, 30.0, 52.0, 104.0, 190.0, 402.0, 838.0, 1937.0, 4847.0, 14138.0, 52634.0, 325768.0, 529410.0, 86259.0, 20532.0, 6720.0, 2511.0, 1110.0, 490.0, 230.0, 122.0, 74.0, 24.0, 18.0, 15.0, 9.0, 10.0, 6.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78515625, -0.7582244873046875, -0.731292724609375, -0.7043609619140625, -0.67742919921875, -0.6504974365234375, -0.623565673828125, -0.5966339111328125, -0.5697021484375, -0.5427703857421875, -0.515838623046875, -0.4889068603515625, -0.46197509765625, -0.4350433349609375, -0.408111572265625, -0.3811798095703125, -0.354248046875, -0.3273162841796875, -0.300384521484375, -0.2734527587890625, -0.24652099609375, -0.2195892333984375, -0.192657470703125, -0.1657257080078125, -0.1387939453125, -0.1118621826171875, -0.084930419921875, -0.0579986572265625, -0.03106689453125, -0.0041351318359375, 0.022796630859375, 0.0497283935546875, 0.07666015625, 0.1035919189453125, 0.130523681640625, 0.1574554443359375, 0.18438720703125, 0.2113189697265625, 0.238250732421875, 0.2651824951171875, 0.2921142578125, 0.3190460205078125, 0.345977783203125, 0.3729095458984375, 0.39984130859375, 0.4267730712890625, 0.453704833984375, 0.4806365966796875, 0.507568359375, 0.5345001220703125, 0.561431884765625, 0.5883636474609375, 0.61529541015625, 0.6422271728515625, 0.669158935546875, 0.6960906982421875, 0.7230224609375, 0.7499542236328125, 0.776885986328125, 0.8038177490234375, 0.83074951171875, 0.8576812744140625, 0.884613037109375, 0.9115447998046875, 0.9384765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 6.0, 14.0, 13.0, 13.0, 12.0, 22.0, 32.0, 45.0, 34.0, 55.0, 63.0, 59.0, 68.0, 70.0, 71.0, 73.0, 51.0, 45.0, 45.0, 44.0, 31.0, 29.0, 25.0, 14.0, 15.0, 12.0, 4.0, 5.0, 9.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6064453125, -1.5441436767578125, -1.481842041015625, -1.4195404052734375, -1.35723876953125, -1.2949371337890625, -1.232635498046875, -1.1703338623046875, -1.1080322265625, -1.0457305908203125, -0.983428955078125, -0.9211273193359375, -0.85882568359375, -0.7965240478515625, -0.734222412109375, -0.6719207763671875, -0.609619140625, -0.5473175048828125, -0.485015869140625, -0.4227142333984375, -0.36041259765625, -0.2981109619140625, -0.235809326171875, -0.1735076904296875, -0.1112060546875, -0.0489044189453125, 0.013397216796875, 0.0756988525390625, 0.13800048828125, 0.2003021240234375, 0.262603759765625, 0.3249053955078125, 0.38720703125, 0.4495086669921875, 0.511810302734375, 0.5741119384765625, 0.63641357421875, 0.6987152099609375, 0.761016845703125, 0.8233184814453125, 0.8856201171875, 0.9479217529296875, 1.010223388671875, 1.0725250244140625, 1.13482666015625, 1.1971282958984375, 1.259429931640625, 1.3217315673828125, 1.384033203125, 1.4463348388671875, 1.508636474609375, 1.5709381103515625, 1.63323974609375, 1.6955413818359375, 1.757843017578125, 1.8201446533203125, 1.8824462890625, 1.9447479248046875, 2.007049560546875, 2.0693511962890625, 2.13165283203125, 2.1939544677734375, 2.256256103515625, 2.3185577392578125, 2.380859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 7.0, 5.0, 14.0, 8.0, 11.0, 18.0, 22.0, 29.0, 39.0, 52.0, 88.0, 121.0, 198.0, 356.0, 691.0, 2478.0, 16628.0, 277751.0, 705665.0, 37647.0, 4553.0, 1028.0, 411.0, 225.0, 127.0, 109.0, 56.0, 55.0, 39.0, 34.0, 22.0, 14.0, 13.0, 11.0, 5.0, 3.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.05078125, -1.0106353759765625, -0.970489501953125, -0.9303436279296875, -0.89019775390625, -0.8500518798828125, -0.809906005859375, -0.7697601318359375, -0.7296142578125, -0.6894683837890625, -0.649322509765625, -0.6091766357421875, -0.56903076171875, -0.5288848876953125, -0.488739013671875, -0.4485931396484375, -0.408447265625, -0.3683013916015625, -0.328155517578125, -0.2880096435546875, -0.24786376953125, -0.2077178955078125, -0.167572021484375, -0.1274261474609375, -0.0872802734375, -0.0471343994140625, -0.006988525390625, 0.0331573486328125, 0.07330322265625, 0.1134490966796875, 0.153594970703125, 0.1937408447265625, 0.23388671875, 0.2740325927734375, 0.314178466796875, 0.3543243408203125, 0.39447021484375, 0.4346160888671875, 0.474761962890625, 0.5149078369140625, 0.5550537109375, 0.5951995849609375, 0.635345458984375, 0.6754913330078125, 0.71563720703125, 0.7557830810546875, 0.795928955078125, 0.8360748291015625, 0.876220703125, 0.9163665771484375, 0.956512451171875, 0.9966583251953125, 1.03680419921875, 1.0769500732421875, 1.117095947265625, 1.1572418212890625, 1.1973876953125, 1.2375335693359375, 1.277679443359375, 1.3178253173828125, 1.35797119140625, 1.3981170654296875, 1.438262939453125, 1.4784088134765625, 1.5185546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 3.0, 7.0, 12.0, 20.0, 13.0, 20.0, 23.0, 14.0, 22.0, 21.0, 32.0, 25.0, 28.0, 28.0, 36.0, 33.0, 34.0, 42.0, 28.0, 41.0, 40.0, 30.0, 39.0, 40.0, 32.0, 28.0, 34.0, 34.0, 36.0, 24.0, 11.0, 19.0, 16.0, 18.0, 7.0, 14.0, 14.0, 11.0, 8.0, 6.0, 6.0, 2.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-1.4521484375, -1.409637451171875, -1.36712646484375, -1.324615478515625, -1.2821044921875, -1.239593505859375, -1.19708251953125, -1.154571533203125, -1.112060546875, -1.069549560546875, -1.02703857421875, -0.984527587890625, -0.9420166015625, -0.899505615234375, -0.85699462890625, -0.814483642578125, -0.77197265625, -0.729461669921875, -0.68695068359375, -0.644439697265625, -0.6019287109375, -0.559417724609375, -0.51690673828125, -0.474395751953125, -0.431884765625, -0.389373779296875, -0.34686279296875, -0.304351806640625, -0.2618408203125, -0.219329833984375, -0.17681884765625, -0.134307861328125, -0.091796875, -0.049285888671875, -0.00677490234375, 0.035736083984375, 0.0782470703125, 0.120758056640625, 0.16326904296875, 0.205780029296875, 0.248291015625, 0.290802001953125, 0.33331298828125, 0.375823974609375, 0.4183349609375, 0.460845947265625, 0.50335693359375, 0.545867919921875, 0.58837890625, 0.630889892578125, 0.67340087890625, 0.715911865234375, 0.7584228515625, 0.800933837890625, 0.84344482421875, 0.885955810546875, 0.928466796875, 0.970977783203125, 1.01348876953125, 1.055999755859375, 1.0985107421875, 1.141021728515625, 1.18353271484375, 1.226043701171875, 1.2685546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 5.0, 10.0, 13.0, 22.0, 23.0, 55.0, 145.0, 302.0, 1173.0, 7888.0, 560374.0, 469558.0, 7273.0, 1109.0, 334.0, 129.0, 64.0, 36.0, 15.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -1.00384521484375, -0.9774169921875, -0.95098876953125, -0.924560546875, -0.89813232421875, -0.8717041015625, -0.84527587890625, -0.81884765625, -0.79241943359375, -0.7659912109375, -0.73956298828125, -0.713134765625, -0.68670654296875, -0.6602783203125, -0.63385009765625, -0.607421875, -0.58099365234375, -0.5545654296875, -0.52813720703125, -0.501708984375, -0.47528076171875, -0.4488525390625, -0.42242431640625, -0.39599609375, -0.36956787109375, -0.3431396484375, -0.31671142578125, -0.290283203125, -0.26385498046875, -0.2374267578125, -0.21099853515625, -0.1845703125, -0.15814208984375, -0.1317138671875, -0.10528564453125, -0.078857421875, -0.05242919921875, -0.0260009765625, 0.00042724609375, 0.02685546875, 0.05328369140625, 0.0797119140625, 0.10614013671875, 0.132568359375, 0.15899658203125, 0.1854248046875, 0.21185302734375, 0.23828125, 0.26470947265625, 0.2911376953125, 0.31756591796875, 0.343994140625, 0.37042236328125, 0.3968505859375, 0.42327880859375, 0.44970703125, 0.47613525390625, 0.5025634765625, 0.52899169921875, 0.555419921875, 0.58184814453125, 0.6082763671875, 0.63470458984375, 0.6611328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 9.0, 11.0, 24.0, 44.0, 91.0, 194.0, 263.0, 172.0, 101.0, 48.0, 20.0, 16.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00016307830810546875, -0.00015956629067659378, -0.0001560542732477188, -0.00015254225581884384, -0.00014903023838996887, -0.0001455182209610939, -0.00014200620353221893, -0.00013849418610334396, -0.000134982168674469, -0.00013147015124559402, -0.00012795813381671906, -0.00012444611638784409, -0.00012093409895896912, -0.00011742208153009415, -0.00011391006410121918, -0.00011039804667234421, -0.00010688602924346924, -0.00010337401181459427, -9.98619943857193e-05, -9.634997695684433e-05, -9.283795952796936e-05, -8.932594209909439e-05, -8.581392467021942e-05, -8.230190724134445e-05, -7.878988981246948e-05, -7.527787238359451e-05, -7.176585495471954e-05, -6.825383752584457e-05, -6.47418200969696e-05, -6.122980266809464e-05, -5.7717785239219666e-05, -5.4205767810344696e-05, -5.0693750381469727e-05, -4.718173295259476e-05, -4.366971552371979e-05, -4.015769809484482e-05, -3.664568066596985e-05, -3.313366323709488e-05, -2.962164580821991e-05, -2.610962837934494e-05, -2.259761095046997e-05, -1.9085593521595e-05, -1.5573576092720032e-05, -1.2061558663845062e-05, -8.549541234970093e-06, -5.037523806095123e-06, -1.5255063772201538e-06, 1.9865110516548157e-06, 5.498528480529785e-06, 9.010545909404755e-06, 1.2522563338279724e-05, 1.6034580767154694e-05, 1.9546598196029663e-05, 2.3058615624904633e-05, 2.6570633053779602e-05, 3.008265048265457e-05, 3.359466791152954e-05, 3.710668534040451e-05, 4.061870276927948e-05, 4.413072019815445e-05, 4.764273762702942e-05, 5.115475505590439e-05, 5.466677248477936e-05, 5.817878991365433e-05, 6.16908073425293e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 9.0, 17.0, 23.0, 42.0, 85.0, 198.0, 419.0, 1092.0, 3044.0, 15968.0, 550345.0, 458188.0, 14372.0, 2953.0, 1026.0, 400.0, 164.0, 78.0, 44.0, 24.0, 15.0, 15.0, 6.0, 3.0, 3.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5843276977539062, -0.5641632080078125, -0.5439987182617188, -0.523834228515625, -0.5036697387695312, -0.4835052490234375, -0.46334075927734375, -0.44317626953125, -0.42301177978515625, -0.4028472900390625, -0.38268280029296875, -0.362518310546875, -0.34235382080078125, -0.3221893310546875, -0.30202484130859375, -0.2818603515625, -0.26169586181640625, -0.2415313720703125, -0.22136688232421875, -0.201202392578125, -0.18103790283203125, -0.1608734130859375, -0.14070892333984375, -0.12054443359375, -0.10037994384765625, -0.0802154541015625, -0.06005096435546875, -0.039886474609375, -0.01972198486328125, 0.0004425048828125, 0.02060699462890625, 0.040771484375, 0.06093597412109375, 0.0811004638671875, 0.10126495361328125, 0.121429443359375, 0.14159393310546875, 0.1617584228515625, 0.18192291259765625, 0.20208740234375, 0.22225189208984375, 0.2424163818359375, 0.26258087158203125, 0.282745361328125, 0.30290985107421875, 0.3230743408203125, 0.34323883056640625, 0.3634033203125, 0.38356781005859375, 0.4037322998046875, 0.42389678955078125, 0.444061279296875, 0.46422576904296875, 0.4843902587890625, 0.5045547485351562, 0.52471923828125, 0.5448837280273438, 0.5650482177734375, 0.5852127075195312, 0.605377197265625, 0.6255416870117188, 0.6457061767578125, 0.6658706665039062, 0.68603515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 5.0, 15.0, 29.0, 28.0, 67.0, 104.0, 153.0, 176.0, 148.0, 90.0, 57.0, 48.0, 29.0, 13.0, 9.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.216552734375, -0.2100696563720703, -0.20358657836914062, -0.19710350036621094, -0.19062042236328125, -0.18413734436035156, -0.17765426635742188, -0.1711711883544922, -0.1646881103515625, -0.1582050323486328, -0.15172195434570312, -0.14523887634277344, -0.13875579833984375, -0.13227272033691406, -0.12578964233398438, -0.11930656433105469, -0.112823486328125, -0.10634040832519531, -0.09985733032226562, -0.09337425231933594, -0.08689117431640625, -0.08040809631347656, -0.07392501831054688, -0.06744194030761719, -0.0609588623046875, -0.05447578430175781, -0.047992706298828125, -0.04150962829589844, -0.03502655029296875, -0.028543472290039062, -0.022060394287109375, -0.015577316284179688, -0.00909423828125, -0.0026111602783203125, 0.003871917724609375, 0.010354995727539062, 0.01683807373046875, 0.023321151733398438, 0.029804229736328125, 0.03628730773925781, 0.0427703857421875, 0.04925346374511719, 0.055736541748046875, 0.06221961975097656, 0.06870269775390625, 0.07518577575683594, 0.08166885375976562, 0.08815193176269531, 0.094635009765625, 0.10111808776855469, 0.10760116577148438, 0.11408424377441406, 0.12056732177734375, 0.12705039978027344, 0.13353347778320312, 0.1400165557861328, 0.1464996337890625, 0.1529827117919922, 0.15946578979492188, 0.16594886779785156, 0.17243194580078125, 0.17891502380371094, 0.18539810180664062, 0.1918811798095703, 0.1983642578125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 13.0, 35.0, 90.0, 233.0, 311.0, 195.0, 79.0, 22.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.189291000366211, -10.975666999816895, -10.762042999267578, -10.548418998718262, -10.334795951843262, -10.121171951293945, -9.907547950744629, -9.693923950195312, -9.480299949645996, -9.26667594909668, -9.053051948547363, -8.839427947998047, -8.625804901123047, -8.41218090057373, -8.198556900024414, -7.984932899475098, -7.771308898925781, -7.557684898376465, -7.344061374664307, -7.13043737411499, -6.916813373565674, -6.703189849853516, -6.489565849304199, -6.275941848754883, -6.062318325042725, -5.848694324493408, -5.63507080078125, -5.421446800231934, -5.207822799682617, -4.994198799133301, -4.780575275421143, -4.566951274871826, -4.35332727432251, -4.139703273773193, -3.926079511642456, -3.7124557495117188, -3.4988317489624023, -3.285207986831665, -3.0715842247009277, -2.8579602241516113, -2.644336223602295, -2.4307124614715576, -2.217088460922241, -2.003464698791504, -1.7898406982421875, -1.5762169361114502, -1.3625930547714233, -1.1489691734313965, -0.9353454113006592, -0.7217215299606323, -0.5080976486206055, -0.2944738268852234, -0.08084994554519653, 0.13277387619018555, 0.3463977575302124, 0.5600216388702393, 0.7736455202102661, 0.987269401550293, 1.2008932828903198, 1.4145171642303467, 1.628140926361084, 1.8417648077011108, 2.0553886890411377, 2.269012451171875, 2.4826364517211914]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 6.0, 6.0, 10.0, 9.0, 16.0, 9.0, 18.0, 13.0, 22.0, 25.0, 25.0, 28.0, 27.0, 51.0, 43.0, 50.0, 49.0, 35.0, 43.0, 41.0, 46.0, 36.0, 34.0, 43.0, 36.0, 33.0, 33.0, 31.0, 22.0, 18.0, 19.0, 17.0, 21.0, 13.0, 12.0, 9.0, 10.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.9308040142059326, -2.8450233936309814, -2.7592430114746094, -2.673462390899658, -2.587681770324707, -2.501901149749756, -2.4161205291748047, -2.3303401470184326, -2.2445595264434814, -2.1587789058685303, -2.072998523712158, -1.987217903137207, -1.9014372825622559, -1.8156566619873047, -1.729876160621643, -1.6440956592559814, -1.5583150386810303, -1.472534418106079, -1.3867539167404175, -1.3009734153747559, -1.2151927947998047, -1.1294121742248535, -1.043631672859192, -0.9578511118888855, -0.8720705509185791, -0.7862899899482727, -0.7005094289779663, -0.6147288680076599, -0.5289483070373535, -0.4431677460670471, -0.3573871850967407, -0.2716066241264343, -0.18582582473754883, -0.10004526376724243, -0.014264702796936035, 0.07151585817337036, 0.15729641914367676, 0.24307698011398315, 0.32885754108428955, 0.41463810205459595, 0.5004186630249023, 0.5861992239952087, 0.6719797849655151, 0.7577603459358215, 0.8435409069061279, 0.9293214678764343, 1.0151020288467407, 1.1008825302124023, 1.1866631507873535, 1.2724437713623047, 1.3582242727279663, 1.444004774093628, 1.529785394668579, 1.6155660152435303, 1.701346516609192, 1.7871270179748535, 1.8729076385498047, 1.9586882591247559, 2.044468879699707, 2.130249261856079, 2.2160298824310303, 2.3018105030059814, 2.3875908851623535, 2.4733715057373047, 2.559152126312256]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 10.0, 5.0, 12.0, 15.0, 10.0, 26.0, 48.0, 43.0, 74.0, 116.0, 186.0, 307.0, 621.0, 1415.0, 4961.0, 40397.0, 1737134.0, 2350566.0, 50571.0, 4923.0, 1343.0, 562.0, 296.0, 211.0, 96.0, 96.0, 53.0, 39.0, 42.0, 19.0, 16.0, 15.0, 12.0, 8.0, 5.0, 6.0, 4.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.65234375, -2.564056396484375, -2.47576904296875, -2.387481689453125, -2.2991943359375, -2.210906982421875, -2.12261962890625, -2.034332275390625, -1.946044921875, -1.857757568359375, -1.76947021484375, -1.681182861328125, -1.5928955078125, -1.504608154296875, -1.41632080078125, -1.328033447265625, -1.23974609375, -1.151458740234375, -1.06317138671875, -0.974884033203125, -0.8865966796875, -0.798309326171875, -0.71002197265625, -0.621734619140625, -0.533447265625, -0.445159912109375, -0.35687255859375, -0.268585205078125, -0.1802978515625, -0.092010498046875, -0.00372314453125, 0.084564208984375, 0.1728515625, 0.261138916015625, 0.34942626953125, 0.437713623046875, 0.5260009765625, 0.614288330078125, 0.70257568359375, 0.790863037109375, 0.879150390625, 0.967437744140625, 1.05572509765625, 1.144012451171875, 1.2322998046875, 1.320587158203125, 1.40887451171875, 1.497161865234375, 1.58544921875, 1.673736572265625, 1.76202392578125, 1.850311279296875, 1.9385986328125, 2.026885986328125, 2.11517333984375, 2.203460693359375, 2.291748046875, 2.380035400390625, 2.46832275390625, 2.556610107421875, 2.6448974609375, 2.733184814453125, 2.82147216796875, 2.909759521484375, 2.998046875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 7.0, 8.0, 10.0, 16.0, 14.0, 15.0, 31.0, 36.0, 36.0, 49.0, 55.0, 55.0, 78.0, 74.0, 65.0, 66.0, 49.0, 52.0, 59.0, 52.0, 34.0, 23.0, 30.0, 19.0, 11.0, 13.0, 9.0, 1.0, 4.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.103515625, -1.065704345703125, -1.02789306640625, -0.990081787109375, -0.9522705078125, -0.914459228515625, -0.87664794921875, -0.838836669921875, -0.801025390625, -0.763214111328125, -0.72540283203125, -0.687591552734375, -0.6497802734375, -0.611968994140625, -0.57415771484375, -0.536346435546875, -0.49853515625, -0.460723876953125, -0.42291259765625, -0.385101318359375, -0.3472900390625, -0.309478759765625, -0.27166748046875, -0.233856201171875, -0.196044921875, -0.158233642578125, -0.12042236328125, -0.082611083984375, -0.0447998046875, -0.006988525390625, 0.03082275390625, 0.068634033203125, 0.1064453125, 0.144256591796875, 0.18206787109375, 0.219879150390625, 0.2576904296875, 0.295501708984375, 0.33331298828125, 0.371124267578125, 0.408935546875, 0.446746826171875, 0.48455810546875, 0.522369384765625, 0.5601806640625, 0.597991943359375, 0.63580322265625, 0.673614501953125, 0.71142578125, 0.749237060546875, 0.78704833984375, 0.824859619140625, 0.8626708984375, 0.900482177734375, 0.93829345703125, 0.976104736328125, 1.013916015625, 1.051727294921875, 1.08953857421875, 1.127349853515625, 1.1651611328125, 1.202972412109375, 1.24078369140625, 1.278594970703125, 1.31640625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 15.0, 16.0, 21.0, 31.0, 42.0, 82.0, 124.0, 187.0, 294.0, 651.0, 1146.0, 2372.0, 6067.0, 20888.0, 141848.0, 3112060.0, 835255.0, 53922.0, 11684.0, 3831.0, 1677.0, 838.0, 473.0, 279.0, 166.0, 88.0, 74.0, 35.0, 33.0, 11.0, 22.0, 10.0, 13.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.822265625, -1.7740325927734375, -1.725799560546875, -1.6775665283203125, -1.62933349609375, -1.5811004638671875, -1.532867431640625, -1.4846343994140625, -1.4364013671875, -1.3881683349609375, -1.339935302734375, -1.2917022705078125, -1.24346923828125, -1.1952362060546875, -1.147003173828125, -1.0987701416015625, -1.050537109375, -1.0023040771484375, -0.954071044921875, -0.9058380126953125, -0.85760498046875, -0.8093719482421875, -0.761138916015625, -0.7129058837890625, -0.6646728515625, -0.6164398193359375, -0.568206787109375, -0.5199737548828125, -0.47174072265625, -0.4235076904296875, -0.375274658203125, -0.3270416259765625, -0.27880859375, -0.2305755615234375, -0.182342529296875, -0.1341094970703125, -0.08587646484375, -0.0376434326171875, 0.010589599609375, 0.0588226318359375, 0.1070556640625, 0.1552886962890625, 0.203521728515625, 0.2517547607421875, 0.29998779296875, 0.3482208251953125, 0.396453857421875, 0.4446868896484375, 0.492919921875, 0.5411529541015625, 0.589385986328125, 0.6376190185546875, 0.68585205078125, 0.7340850830078125, 0.782318115234375, 0.8305511474609375, 0.8787841796875, 0.9270172119140625, 0.975250244140625, 1.0234832763671875, 1.07171630859375, 1.1199493408203125, 1.168182373046875, 1.2164154052734375, 1.2646484375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 7.0, 13.0, 25.0, 24.0, 27.0, 54.0, 75.0, 138.0, 281.0, 512.0, 734.0, 832.0, 546.0, 318.0, 182.0, 106.0, 57.0, 44.0, 29.0, 15.0, 12.0, 11.0, 1.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5625, -0.5459938049316406, -0.5294876098632812, -0.5129814147949219, -0.4964752197265625, -0.4799690246582031, -0.46346282958984375, -0.4469566345214844, -0.430450439453125, -0.4139442443847656, -0.39743804931640625, -0.3809318542480469, -0.3644256591796875, -0.3479194641113281, -0.33141326904296875, -0.3149070739746094, -0.29840087890625, -0.2818946838378906, -0.26538848876953125, -0.24888229370117188, -0.2323760986328125, -0.21586990356445312, -0.19936370849609375, -0.18285751342773438, -0.166351318359375, -0.14984512329101562, -0.13333892822265625, -0.11683273315429688, -0.1003265380859375, -0.08382034301757812, -0.06731414794921875, -0.050807952880859375, -0.0343017578125, -0.017795562744140625, -0.00128936767578125, 0.015216827392578125, 0.0317230224609375, 0.048229217529296875, 0.06473541259765625, 0.08124160766601562, 0.097747802734375, 0.11425399780273438, 0.13076019287109375, 0.14726638793945312, 0.1637725830078125, 0.18027877807617188, 0.19678497314453125, 0.21329116821289062, 0.22979736328125, 0.24630355834960938, 0.26280975341796875, 0.2793159484863281, 0.2958221435546875, 0.3123283386230469, 0.32883453369140625, 0.3453407287597656, 0.361846923828125, 0.3783531188964844, 0.39485931396484375, 0.4113655090332031, 0.4278717041015625, 0.4443778991699219, 0.46088409423828125, 0.4773902893066406, 0.493896484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 8.0, 18.0, 24.0, 38.0, 51.0, 94.0, 127.0, 170.0, 159.0, 112.0, 82.0, 42.0, 36.0, 17.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7463443279266357, -3.6642932891845703, -3.582242250442505, -3.5001912117004395, -3.418140172958374, -3.3360891342163086, -3.254038095474243, -3.1719870567321777, -3.089935779571533, -3.0078847408294678, -2.9258337020874023, -2.843782663345337, -2.7617316246032715, -2.679680585861206, -2.5976295471191406, -2.515578269958496, -2.4335274696350098, -2.3514764308929443, -2.269425392150879, -2.1873743534088135, -2.105323314666748, -2.0232722759246826, -1.9412211179733276, -1.8591700792312622, -1.7771190404891968, -1.6950680017471313, -1.613016963005066, -1.5309659242630005, -1.4489147663116455, -1.36686372756958, -1.2848126888275146, -1.2027616500854492, -1.1207103729248047, -1.0386593341827393, -0.9566082954406738, -0.8745571970939636, -0.7925061583518982, -0.7104551196098328, -0.6284040212631226, -0.5463529825210571, -0.4643019437789917, -0.38225090503692627, -0.30019983649253845, -0.21814878284931183, -0.1360977292060852, -0.054046690464019775, 0.028004378080368042, 0.11005544662475586, 0.1921064853668213, 0.2741575241088867, 0.35620859265327454, 0.43825966119766235, 0.5203106999397278, 0.6023617386817932, 0.6844128370285034, 0.7664638757705688, 0.8485149145126343, 0.9305659532546997, 1.0126169919967651, 1.0946680307388306, 1.1767191886901855, 1.258770227432251, 1.3408212661743164, 1.4228723049163818, 1.5049233436584473]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 8.0, 6.0, 6.0, 14.0, 16.0, 19.0, 19.0, 21.0, 27.0, 41.0, 33.0, 52.0, 51.0, 60.0, 49.0, 53.0, 55.0, 57.0, 48.0, 58.0, 39.0, 31.0, 52.0, 28.0, 31.0, 22.0, 21.0, 19.0, 13.0, 16.0, 9.0, 3.0, 3.0, 6.0, 1.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2287441492080688, -1.19148588180542, -1.154227614402771, -1.1169694662094116, -1.0797111988067627, -1.0424529314041138, -1.0051946640014648, -0.9679363965988159, -0.9306781888008118, -0.8934199213981628, -0.8561617136001587, -0.8189034461975098, -0.7816451787948608, -0.7443869709968567, -0.7071287035942078, -0.6698704957962036, -0.6326122283935547, -0.5953539609909058, -0.5580957531929016, -0.5208374857902527, -0.48357924818992615, -0.4463210105895996, -0.4090627431869507, -0.37180450558662415, -0.3345462679862976, -0.29728803038597107, -0.26002979278564453, -0.2227715253829956, -0.18551328778266907, -0.14825505018234253, -0.1109967976808548, -0.07373854517936707, -0.03648042678833008, 0.0007778182625770569, 0.03803606331348419, 0.07529430836439133, 0.11255255341529846, 0.149810791015625, 0.18706904351711273, 0.22432729601860046, 0.261585533618927, 0.29884377121925354, 0.3361020088195801, 0.373360276222229, 0.41061851382255554, 0.4478767514228821, 0.485135018825531, 0.5223932266235352, 0.5596514940261841, 0.596909761428833, 0.6341679692268372, 0.6714262366294861, 0.7086844444274902, 0.7459427118301392, 0.7832009792327881, 0.820459246635437, 0.8577174544334412, 0.8949757218360901, 0.9322339296340942, 0.9694921970367432, 1.006750464439392, 1.044008731842041, 1.0812668800354004, 1.1185251474380493, 1.1557834148406982]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 12.0, 5.0, 13.0, 12.0, 18.0, 21.0, 39.0, 44.0, 100.0, 169.0, 252.0, 477.0, 981.0, 1930.0, 4701.0, 12043.0, 38586.0, 145271.0, 443814.0, 290810.0, 74327.0, 21300.0, 7596.0, 3017.0, 1361.0, 703.0, 364.0, 182.0, 142.0, 72.0, 52.0, 29.0, 27.0, 28.0, 14.0, 12.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1920166015625, -0.1855640411376953, -0.17911148071289062, -0.17265892028808594, -0.16620635986328125, -0.15975379943847656, -0.15330123901367188, -0.1468486785888672, -0.1403961181640625, -0.1339435577392578, -0.12749099731445312, -0.12103843688964844, -0.11458587646484375, -0.10813331604003906, -0.10168075561523438, -0.09522819519042969, -0.088775634765625, -0.08232307434082031, -0.07587051391601562, -0.06941795349121094, -0.06296539306640625, -0.05651283264160156, -0.050060272216796875, -0.04360771179199219, -0.0371551513671875, -0.030702590942382812, -0.024250030517578125, -0.017797470092773438, -0.01134490966796875, -0.0048923492431640625, 0.001560211181640625, 0.008012771606445312, 0.01446533203125, 0.020917892456054688, 0.027370452880859375, 0.03382301330566406, 0.04027557373046875, 0.04672813415527344, 0.053180694580078125, 0.05963325500488281, 0.0660858154296875, 0.07253837585449219, 0.07899093627929688, 0.08544349670410156, 0.09189605712890625, 0.09834861755371094, 0.10480117797851562, 0.11125373840332031, 0.117706298828125, 0.12415885925292969, 0.13061141967773438, 0.13706398010253906, 0.14351654052734375, 0.14996910095214844, 0.15642166137695312, 0.1628742218017578, 0.1693267822265625, 0.1757793426513672, 0.18223190307617188, 0.18868446350097656, 0.19513702392578125, 0.20158958435058594, 0.20804214477539062, 0.2144947052001953, 0.220947265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 6.0, 6.0, 11.0, 7.0, 5.0, 11.0, 20.0, 23.0, 29.0, 30.0, 34.0, 45.0, 63.0, 52.0, 66.0, 46.0, 52.0, 72.0, 55.0, 47.0, 52.0, 50.0, 29.0, 38.0, 29.0, 28.0, 23.0, 11.0, 15.0, 10.0, 10.0, 6.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9228515625, -0.8954696655273438, -0.8680877685546875, -0.8407058715820312, -0.813323974609375, -0.7859420776367188, -0.7585601806640625, -0.7311782836914062, -0.70379638671875, -0.6764144897460938, -0.6490325927734375, -0.6216506958007812, -0.594268798828125, -0.5668869018554688, -0.5395050048828125, -0.5121231079101562, -0.4847412109375, -0.45735931396484375, -0.4299774169921875, -0.40259552001953125, -0.375213623046875, -0.34783172607421875, -0.3204498291015625, -0.29306793212890625, -0.26568603515625, -0.23830413818359375, -0.2109222412109375, -0.18354034423828125, -0.156158447265625, -0.12877655029296875, -0.1013946533203125, -0.07401275634765625, -0.046630859375, -0.01924896240234375, 0.0081329345703125, 0.03551483154296875, 0.062896728515625, 0.09027862548828125, 0.1176605224609375, 0.14504241943359375, 0.17242431640625, 0.19980621337890625, 0.2271881103515625, 0.25457000732421875, 0.281951904296875, 0.30933380126953125, 0.3367156982421875, 0.36409759521484375, 0.3914794921875, 0.41886138916015625, 0.4462432861328125, 0.47362518310546875, 0.501007080078125, 0.5283889770507812, 0.5557708740234375, 0.5831527709960938, 0.61053466796875, 0.6379165649414062, 0.6652984619140625, 0.6926803588867188, 0.720062255859375, 0.7474441528320312, 0.7748260498046875, 0.8022079467773438, 0.82958984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 7.0, 10.0, 13.0, 19.0, 39.0, 54.0, 59.0, 97.0, 138.0, 208.0, 292.0, 472.0, 733.0, 1328.0, 2226.0, 4038.0, 7904.0, 16683.0, 35268.0, 79018.0, 175199.0, 290214.0, 229538.0, 110500.0, 49142.0, 22346.0, 10696.0, 5401.0, 2785.0, 1546.0, 950.0, 525.0, 337.0, 234.0, 158.0, 109.0, 82.0, 47.0, 28.0, 31.0, 24.0, 8.0, 7.0, 12.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.12103271484375, -0.11744022369384766, -0.11384773254394531, -0.11025524139404297, -0.10666275024414062, -0.10307025909423828, -0.09947776794433594, -0.0958852767944336, -0.09229278564453125, -0.0887002944946289, -0.08510780334472656, -0.08151531219482422, -0.07792282104492188, -0.07433032989501953, -0.07073783874511719, -0.06714534759521484, -0.0635528564453125, -0.059960365295410156, -0.05636787414550781, -0.05277538299560547, -0.049182891845703125, -0.04559040069580078, -0.04199790954589844, -0.038405418395996094, -0.03481292724609375, -0.031220436096191406, -0.027627944946289062, -0.02403545379638672, -0.020442962646484375, -0.01685047149658203, -0.013257980346679688, -0.009665489196777344, -0.006072998046875, -0.0024805068969726562, 0.0011119842529296875, 0.004704475402832031, 0.008296966552734375, 0.011889457702636719, 0.015481948852539062, 0.019074440002441406, 0.02266693115234375, 0.026259422302246094, 0.029851913452148438, 0.03344440460205078, 0.037036895751953125, 0.04062938690185547, 0.04422187805175781, 0.047814369201660156, 0.0514068603515625, 0.054999351501464844, 0.05859184265136719, 0.06218433380126953, 0.06577682495117188, 0.06936931610107422, 0.07296180725097656, 0.0765542984008789, 0.08014678955078125, 0.0837392807006836, 0.08733177185058594, 0.09092426300048828, 0.09451675415039062, 0.09810924530029297, 0.10170173645019531, 0.10529422760009766, 0.10888671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 10.0, 10.0, 13.0, 18.0, 20.0, 12.0, 27.0, 21.0, 25.0, 30.0, 44.0, 31.0, 32.0, 53.0, 43.0, 38.0, 46.0, 42.0, 52.0, 39.0, 53.0, 41.0, 36.0, 45.0, 32.0, 31.0, 21.0, 22.0, 20.0, 12.0, 11.0, 16.0, 6.0, 5.0, 6.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4189453125, -1.376251220703125, -1.33355712890625, -1.290863037109375, -1.2481689453125, -1.205474853515625, -1.16278076171875, -1.120086669921875, -1.077392578125, -1.034698486328125, -0.99200439453125, -0.949310302734375, -0.9066162109375, -0.863922119140625, -0.82122802734375, -0.778533935546875, -0.73583984375, -0.693145751953125, -0.65045166015625, -0.607757568359375, -0.5650634765625, -0.522369384765625, -0.47967529296875, -0.436981201171875, -0.394287109375, -0.351593017578125, -0.30889892578125, -0.266204833984375, -0.2235107421875, -0.180816650390625, -0.13812255859375, -0.095428466796875, -0.052734375, -0.010040283203125, 0.03265380859375, 0.075347900390625, 0.1180419921875, 0.160736083984375, 0.20343017578125, 0.246124267578125, 0.288818359375, 0.331512451171875, 0.37420654296875, 0.416900634765625, 0.4595947265625, 0.502288818359375, 0.54498291015625, 0.587677001953125, 0.63037109375, 0.673065185546875, 0.71575927734375, 0.758453369140625, 0.8011474609375, 0.843841552734375, 0.88653564453125, 0.929229736328125, 0.971923828125, 1.014617919921875, 1.05731201171875, 1.100006103515625, 1.1427001953125, 1.185394287109375, 1.22808837890625, 1.270782470703125, 1.3134765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 10.0, 16.0, 11.0, 19.0, 28.0, 42.0, 68.0, 96.0, 177.0, 313.0, 518.0, 987.0, 2099.0, 4519.0, 12020.0, 40884.0, 172163.0, 454875.0, 265997.0, 64574.0, 17430.0, 6113.0, 2560.0, 1339.0, 684.0, 384.0, 239.0, 144.0, 72.0, 49.0, 43.0, 27.0, 17.0, 13.0, 3.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.055206298828125, -0.05340576171875, -0.051605224609375, -0.0498046875, -0.048004150390625, -0.04620361328125, -0.044403076171875, -0.0426025390625, -0.040802001953125, -0.03900146484375, -0.037200927734375, -0.035400390625, -0.033599853515625, -0.03179931640625, -0.029998779296875, -0.0281982421875, -0.026397705078125, -0.02459716796875, -0.022796630859375, -0.02099609375, -0.019195556640625, -0.01739501953125, -0.015594482421875, -0.0137939453125, -0.011993408203125, -0.01019287109375, -0.008392333984375, -0.006591796875, -0.004791259765625, -0.00299072265625, -0.001190185546875, 0.0006103515625, 0.002410888671875, 0.00421142578125, 0.006011962890625, 0.0078125, 0.009613037109375, 0.01141357421875, 0.013214111328125, 0.0150146484375, 0.016815185546875, 0.01861572265625, 0.020416259765625, 0.022216796875, 0.024017333984375, 0.02581787109375, 0.027618408203125, 0.0294189453125, 0.031219482421875, 0.03302001953125, 0.034820556640625, 0.03662109375, 0.038421630859375, 0.04022216796875, 0.042022705078125, 0.0438232421875, 0.045623779296875, 0.04742431640625, 0.049224853515625, 0.051025390625, 0.052825927734375, 0.05462646484375, 0.056427001953125, 0.0582275390625, 0.060028076171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 13.0, 11.0, 9.0, 18.0, 18.0, 18.0, 20.0, 42.0, 53.0, 61.0, 63.0, 90.0, 86.0, 104.0, 69.0, 82.0, 59.0, 31.0, 36.0, 38.0, 21.0, 10.0, 8.0, 10.0, 9.0, 4.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.325939178466797e-05, -3.231316804885864e-05, -3.1366944313049316e-05, -3.042072057723999e-05, -2.9474496841430664e-05, -2.8528273105621338e-05, -2.7582049369812012e-05, -2.6635825634002686e-05, -2.568960189819336e-05, -2.4743378162384033e-05, -2.3797154426574707e-05, -2.285093069076538e-05, -2.1904706954956055e-05, -2.095848321914673e-05, -2.0012259483337402e-05, -1.9066035747528076e-05, -1.811981201171875e-05, -1.7173588275909424e-05, -1.6227364540100098e-05, -1.528114080429077e-05, -1.4334917068481445e-05, -1.3388693332672119e-05, -1.2442469596862793e-05, -1.1496245861053467e-05, -1.055002212524414e-05, -9.603798389434814e-06, -8.657574653625488e-06, -7.711350917816162e-06, -6.765127182006836e-06, -5.81890344619751e-06, -4.872679710388184e-06, -3.926455974578857e-06, -2.9802322387695312e-06, -2.034008502960205e-06, -1.087784767150879e-06, -1.4156103134155273e-07, 8.046627044677734e-07, 1.7508864402770996e-06, 2.6971101760864258e-06, 3.643333911895752e-06, 4.589557647705078e-06, 5.535781383514404e-06, 6.4820051193237305e-06, 7.428228855133057e-06, 8.374452590942383e-06, 9.320676326751709e-06, 1.0266900062561035e-05, 1.1213123798370361e-05, 1.2159347534179688e-05, 1.3105571269989014e-05, 1.405179500579834e-05, 1.4998018741607666e-05, 1.5944242477416992e-05, 1.689046621322632e-05, 1.7836689949035645e-05, 1.878291368484497e-05, 1.9729137420654297e-05, 2.0675361156463623e-05, 2.162158489227295e-05, 2.2567808628082275e-05, 2.35140323638916e-05, 2.4460256099700928e-05, 2.5406479835510254e-05, 2.635270357131958e-05, 2.7298927307128906e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 7.0, 12.0, 12.0, 12.0, 32.0, 26.0, 39.0, 56.0, 107.0, 104.0, 189.0, 275.0, 395.0, 683.0, 1061.0, 1919.0, 3654.0, 7326.0, 15207.0, 35352.0, 87712.0, 202933.0, 304879.0, 216979.0, 96221.0, 39227.0, 17001.0, 7746.0, 3983.0, 2139.0, 1184.0, 757.0, 437.0, 296.0, 169.0, 127.0, 70.0, 53.0, 54.0, 30.0, 23.0, 22.0, 14.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.041290283203125, -0.04009532928466797, -0.03890037536621094, -0.037705421447753906, -0.036510467529296875, -0.035315513610839844, -0.03412055969238281, -0.03292560577392578, -0.03173065185546875, -0.03053569793701172, -0.029340744018554688, -0.028145790100097656, -0.026950836181640625, -0.025755882263183594, -0.024560928344726562, -0.02336597442626953, -0.0221710205078125, -0.02097606658935547, -0.019781112670898438, -0.018586158752441406, -0.017391204833984375, -0.016196250915527344, -0.015001296997070312, -0.013806343078613281, -0.01261138916015625, -0.011416435241699219, -0.010221481323242188, -0.009026527404785156, -0.007831573486328125, -0.006636619567871094, -0.0054416656494140625, -0.004246711730957031, -0.0030517578125, -0.0018568038940429688, -0.0006618499755859375, 0.0005331039428710938, 0.001728057861328125, 0.0029230117797851562, 0.0041179656982421875, 0.005312919616699219, 0.00650787353515625, 0.007702827453613281, 0.008897781372070312, 0.010092735290527344, 0.011287689208984375, 0.012482643127441406, 0.013677597045898438, 0.014872550964355469, 0.0160675048828125, 0.01726245880126953, 0.018457412719726562, 0.019652366638183594, 0.020847320556640625, 0.022042274475097656, 0.023237228393554688, 0.02443218231201172, 0.02562713623046875, 0.02682209014892578, 0.028017044067382812, 0.029211997985839844, 0.030406951904296875, 0.031601905822753906, 0.03279685974121094, 0.03399181365966797, 0.035186767578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 4.0, 6.0, 7.0, 13.0, 18.0, 16.0, 13.0, 23.0, 34.0, 30.0, 33.0, 45.0, 24.0, 47.0, 45.0, 53.0, 46.0, 51.0, 52.0, 39.0, 42.0, 42.0, 36.0, 34.0, 33.0, 31.0, 16.0, 25.0, 26.0, 17.0, 14.0, 14.0, 11.0, 8.0, 8.0, 4.0, 3.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0105438232421875, -0.01016700267791748, -0.009790182113647461, -0.009413361549377441, -0.009036540985107422, -0.008659720420837402, -0.008282899856567383, -0.007906079292297363, -0.007529258728027344, -0.007152438163757324, -0.006775617599487305, -0.006398797035217285, -0.006021976470947266, -0.005645155906677246, -0.0052683353424072266, -0.004891514778137207, -0.0045146942138671875, -0.004137873649597168, -0.0037610530853271484, -0.003384232521057129, -0.0030074119567871094, -0.00263059139251709, -0.0022537708282470703, -0.0018769502639770508, -0.0015001296997070312, -0.0011233091354370117, -0.0007464885711669922, -0.00036966800689697266, 7.152557373046875e-06, 0.0003839731216430664, 0.0007607936859130859, 0.0011376142501831055, 0.001514434814453125, 0.0018912553787231445, 0.002268075942993164, 0.0026448965072631836, 0.003021717071533203, 0.0033985376358032227, 0.003775358200073242, 0.004152178764343262, 0.004528999328613281, 0.004905819892883301, 0.00528264045715332, 0.00565946102142334, 0.006036281585693359, 0.006413102149963379, 0.0067899227142333984, 0.007166743278503418, 0.0075435638427734375, 0.007920384407043457, 0.008297204971313477, 0.008674025535583496, 0.009050846099853516, 0.009427666664123535, 0.009804487228393555, 0.010181307792663574, 0.010558128356933594, 0.010934948921203613, 0.011311769485473633, 0.011688590049743652, 0.012065410614013672, 0.012442231178283691, 0.012819051742553711, 0.01319587230682373, 0.01357269287109375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 4.0, 7.0, 13.0, 28.0, 60.0, 102.0, 217.0, 252.0, 172.0, 82.0, 35.0, 22.0, 4.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0], "bins": [-4.247142791748047, -4.165737152099609, -4.084331512451172, -4.002925872802734, -3.9215199947357178, -3.8401143550872803, -3.7587084770202637, -3.677302837371826, -3.5958971977233887, -3.514491558074951, -3.4330856800079346, -3.351680040359497, -3.2702744007110596, -3.188868761062622, -3.1074628829956055, -3.026057243347168, -2.9446516036987305, -2.863245964050293, -2.7818400859832764, -2.700434446334839, -2.6190288066864014, -2.537623167037964, -2.4562172889709473, -2.3748116493225098, -2.293405771255493, -2.2120001316070557, -2.130594253540039, -2.0491886138916016, -1.967782974243164, -1.886377215385437, -1.80497145652771, -1.7235658168792725, -1.642160177230835, -1.560754418373108, -1.4793487787246704, -1.3979430198669434, -1.3165373802185059, -1.2351316213607788, -1.1537258625030518, -1.0723202228546143, -0.9909145832061768, -0.9095088839530945, -0.8281031847000122, -0.7466974258422852, -0.6652917861938477, -0.5838860273361206, -0.5024803280830383, -0.42107462882995605, -0.3396689295768738, -0.2582632303237915, -0.17685751616954803, -0.09545180201530457, -0.01404610276222229, 0.06735959649085999, 0.14876532554626465, 0.23017102479934692, 0.3115767240524292, 0.3929824233055115, 0.47438812255859375, 0.5557938814163208, 0.6371995210647583, 0.7186052799224854, 0.8000109791755676, 0.8814166784286499, 0.9628223776817322]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 9.0, 9.0, 18.0, 8.0, 19.0, 24.0, 36.0, 30.0, 45.0, 60.0, 69.0, 69.0, 65.0, 67.0, 57.0, 71.0, 55.0, 49.0, 45.0, 47.0, 36.0, 22.0, 27.0, 10.0, 20.0, 11.0, 0.0, 5.0, 4.0, 5.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8462040424346924, -0.8155025839805603, -0.7848011255264282, -0.7540996670722961, -0.7233982086181641, -0.692696750164032, -0.6619952917098999, -0.631293773651123, -0.6005923748016357, -0.5698909163475037, -0.5391894578933716, -0.5084879994392395, -0.4777865409851074, -0.44708508253097534, -0.4163835942745209, -0.3856821358203888, -0.3549806475639343, -0.32427918910980225, -0.29357773065567017, -0.2628762722015381, -0.2321747988462448, -0.20147334039211273, -0.17077186703681946, -0.14007040858268738, -0.1093689501285553, -0.07866749167442322, -0.04796602576971054, -0.017264559864997864, 0.013436898589134216, 0.044138357043266296, 0.07483983039855957, 0.10554128885269165, 0.13624274730682373, 0.1669442057609558, 0.1976456642150879, 0.22834713757038116, 0.25904858112335205, 0.28975003957748413, 0.3204515278339386, 0.3511529862880707, 0.38185444474220276, 0.41255590319633484, 0.4432573616504669, 0.4739588499069214, 0.5046603083610535, 0.5353617668151855, 0.5660632252693176, 0.5967646837234497, 0.6274661421775818, 0.6581676006317139, 0.688869059085846, 0.719570517539978, 0.7502719759941101, 0.7809734344482422, 0.811674952507019, 0.8423763513565063, 0.8730778694152832, 0.9037793278694153, 0.9344807863235474, 0.9651822447776794, 0.9958837032318115, 1.0265852212905884, 1.0572866201400757, 1.0879881381988525, 1.1186895370483398]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 1.0, 7.0, 10.0, 9.0, 7.0, 11.0, 18.0, 17.0, 28.0, 52.0, 89.0, 124.0, 178.0, 325.0, 514.0, 986.0, 1715.0, 3399.0, 7416.0, 18290.0, 52164.0, 208577.0, 539677.0, 147089.0, 40119.0, 14711.0, 6265.0, 3098.0, 1585.0, 840.0, 479.0, 269.0, 140.0, 114.0, 65.0, 54.0, 41.0, 25.0, 15.0, 7.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.541473388671875, -0.52239990234375, -0.503326416015625, -0.4842529296875, -0.465179443359375, -0.44610595703125, -0.427032470703125, -0.407958984375, -0.388885498046875, -0.36981201171875, -0.350738525390625, -0.3316650390625, -0.312591552734375, -0.29351806640625, -0.274444580078125, -0.25537109375, -0.236297607421875, -0.21722412109375, -0.198150634765625, -0.1790771484375, -0.160003662109375, -0.14093017578125, -0.121856689453125, -0.102783203125, -0.083709716796875, -0.06463623046875, -0.045562744140625, -0.0264892578125, -0.007415771484375, 0.01165771484375, 0.030731201171875, 0.0498046875, 0.068878173828125, 0.08795166015625, 0.107025146484375, 0.1260986328125, 0.145172119140625, 0.16424560546875, 0.183319091796875, 0.202392578125, 0.221466064453125, 0.24053955078125, 0.259613037109375, 0.2786865234375, 0.297760009765625, 0.31683349609375, 0.335906982421875, 0.35498046875, 0.374053955078125, 0.39312744140625, 0.412200927734375, 0.4312744140625, 0.450347900390625, 0.46942138671875, 0.488494873046875, 0.507568359375, 0.526641845703125, 0.54571533203125, 0.564788818359375, 0.5838623046875, 0.602935791015625, 0.62200927734375, 0.641082763671875, 0.66015625]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 3.0, 5.0, 12.0, 5.0, 7.0, 7.0, 10.0, 11.0, 11.0, 27.0, 23.0, 22.0, 24.0, 50.0, 48.0, 55.0, 54.0, 47.0, 55.0, 54.0, 52.0, 39.0, 42.0, 45.0, 51.0, 36.0, 36.0, 24.0, 28.0, 20.0, 22.0, 11.0, 11.0, 9.0, 13.0, 5.0, 6.0, 5.0, 7.0, 5.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6015625, -1.553924560546875, -1.50628662109375, -1.458648681640625, -1.4110107421875, -1.363372802734375, -1.31573486328125, -1.268096923828125, -1.220458984375, -1.172821044921875, -1.12518310546875, -1.077545166015625, -1.0299072265625, -0.982269287109375, -0.93463134765625, -0.886993408203125, -0.83935546875, -0.791717529296875, -0.74407958984375, -0.696441650390625, -0.6488037109375, -0.601165771484375, -0.55352783203125, -0.505889892578125, -0.458251953125, -0.410614013671875, -0.36297607421875, -0.315338134765625, -0.2677001953125, -0.220062255859375, -0.17242431640625, -0.124786376953125, -0.0771484375, -0.029510498046875, 0.01812744140625, 0.065765380859375, 0.1134033203125, 0.161041259765625, 0.20867919921875, 0.256317138671875, 0.303955078125, 0.351593017578125, 0.39923095703125, 0.446868896484375, 0.4945068359375, 0.542144775390625, 0.58978271484375, 0.637420654296875, 0.68505859375, 0.732696533203125, 0.78033447265625, 0.827972412109375, 0.8756103515625, 0.923248291015625, 0.97088623046875, 1.018524169921875, 1.066162109375, 1.113800048828125, 1.16143798828125, 1.209075927734375, 1.2567138671875, 1.304351806640625, 1.35198974609375, 1.399627685546875, 1.447265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 10.0, 14.0, 14.0, 24.0, 47.0, 55.0, 60.0, 96.0, 141.0, 253.0, 547.0, 1570.0, 7441.0, 75756.0, 871618.0, 80045.0, 7805.0, 1654.0, 605.0, 272.0, 145.0, 94.0, 78.0, 54.0, 36.0, 25.0, 15.0, 13.0, 16.0, 10.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.408203125, -1.366180419921875, -1.32415771484375, -1.282135009765625, -1.2401123046875, -1.198089599609375, -1.15606689453125, -1.114044189453125, -1.072021484375, -1.029998779296875, -0.98797607421875, -0.945953369140625, -0.9039306640625, -0.861907958984375, -0.81988525390625, -0.777862548828125, -0.73583984375, -0.693817138671875, -0.65179443359375, -0.609771728515625, -0.5677490234375, -0.525726318359375, -0.48370361328125, -0.441680908203125, -0.399658203125, -0.357635498046875, -0.31561279296875, -0.273590087890625, -0.2315673828125, -0.189544677734375, -0.14752197265625, -0.105499267578125, -0.0634765625, -0.021453857421875, 0.02056884765625, 0.062591552734375, 0.1046142578125, 0.146636962890625, 0.18865966796875, 0.230682373046875, 0.272705078125, 0.314727783203125, 0.35675048828125, 0.398773193359375, 0.4407958984375, 0.482818603515625, 0.52484130859375, 0.566864013671875, 0.60888671875, 0.650909423828125, 0.69293212890625, 0.734954833984375, 0.7769775390625, 0.819000244140625, 0.86102294921875, 0.903045654296875, 0.945068359375, 0.987091064453125, 1.02911376953125, 1.071136474609375, 1.1131591796875, 1.155181884765625, 1.19720458984375, 1.239227294921875, 1.28125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 4.0, 7.0, 8.0, 6.0, 5.0, 10.0, 16.0, 18.0, 15.0, 16.0, 23.0, 26.0, 29.0, 32.0, 31.0, 30.0, 23.0, 38.0, 37.0, 36.0, 37.0, 46.0, 28.0, 39.0, 40.0, 32.0, 33.0, 34.0, 39.0, 36.0, 25.0, 22.0, 31.0, 22.0, 19.0, 10.0, 16.0, 11.0, 13.0, 10.0, 4.0, 10.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 2.0, 4.0], "bins": [-1.5126953125, -1.4703216552734375, -1.427947998046875, -1.3855743408203125, -1.34320068359375, -1.3008270263671875, -1.258453369140625, -1.2160797119140625, -1.1737060546875, -1.1313323974609375, -1.088958740234375, -1.0465850830078125, -1.00421142578125, -0.9618377685546875, -0.919464111328125, -0.8770904541015625, -0.834716796875, -0.7923431396484375, -0.749969482421875, -0.7075958251953125, -0.66522216796875, -0.6228485107421875, -0.580474853515625, -0.5381011962890625, -0.4957275390625, -0.4533538818359375, -0.410980224609375, -0.3686065673828125, -0.32623291015625, -0.2838592529296875, -0.241485595703125, -0.1991119384765625, -0.15673828125, -0.1143646240234375, -0.071990966796875, -0.0296173095703125, 0.01275634765625, 0.0551300048828125, 0.097503662109375, 0.1398773193359375, 0.1822509765625, 0.2246246337890625, 0.266998291015625, 0.3093719482421875, 0.35174560546875, 0.3941192626953125, 0.436492919921875, 0.4788665771484375, 0.521240234375, 0.5636138916015625, 0.605987548828125, 0.6483612060546875, 0.69073486328125, 0.7331085205078125, 0.775482177734375, 0.8178558349609375, 0.8602294921875, 0.9026031494140625, 0.944976806640625, 0.9873504638671875, 1.02972412109375, 1.0720977783203125, 1.114471435546875, 1.1568450927734375, 1.19921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 8.0, 17.0, 34.0, 58.0, 90.0, 203.0, 384.0, 1199.0, 7082.0, 292719.0, 733124.0, 11155.0, 1563.0, 460.0, 204.0, 96.0, 54.0, 34.0, 20.0, 18.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.96142578125, -0.9374465942382812, -0.9134674072265625, -0.8894882202148438, -0.865509033203125, -0.8415298461914062, -0.8175506591796875, -0.7935714721679688, -0.76959228515625, -0.7456130981445312, -0.7216339111328125, -0.6976547241210938, -0.673675537109375, -0.6496963500976562, -0.6257171630859375, -0.6017379760742188, -0.5777587890625, -0.5537796020507812, -0.5298004150390625, -0.5058212280273438, -0.481842041015625, -0.45786285400390625, -0.4338836669921875, -0.40990447998046875, -0.38592529296875, -0.36194610595703125, -0.3379669189453125, -0.31398773193359375, -0.290008544921875, -0.26602935791015625, -0.2420501708984375, -0.21807098388671875, -0.194091796875, -0.17011260986328125, -0.1461334228515625, -0.12215423583984375, -0.098175048828125, -0.07419586181640625, -0.0502166748046875, -0.02623748779296875, -0.00225830078125, 0.02172088623046875, 0.0457000732421875, 0.06967926025390625, 0.093658447265625, 0.11763763427734375, 0.1416168212890625, 0.16559600830078125, 0.1895751953125, 0.21355438232421875, 0.2375335693359375, 0.26151275634765625, 0.285491943359375, 0.30947113037109375, 0.3334503173828125, 0.35742950439453125, 0.38140869140625, 0.40538787841796875, 0.4293670654296875, 0.45334625244140625, 0.477325439453125, 0.5013046264648438, 0.5252838134765625, 0.5492630004882812, 0.5732421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 19.0, 32.0, 74.0, 118.0, 251.0, 246.0, 126.0, 60.0, 44.0, 18.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015044212341308594, -0.000146377831697464, -0.00014231353998184204, -0.0001382492482662201, -0.00013418495655059814, -0.0001301206648349762, -0.00012605637311935425, -0.0001219920814037323, -0.00011792778968811035, -0.0001138634979724884, -0.00010979920625686646, -0.00010573491454124451, -0.00010167062282562256, -9.760633111000061e-05, -9.354203939437866e-05, -8.947774767875671e-05, -8.541345596313477e-05, -8.134916424751282e-05, -7.728487253189087e-05, -7.322058081626892e-05, -6.915628910064697e-05, -6.509199738502502e-05, -6.1027705669403076e-05, -5.696341395378113e-05, -5.289912223815918e-05, -4.883483052253723e-05, -4.477053880691528e-05, -4.0706247091293335e-05, -3.664195537567139e-05, -3.257766366004944e-05, -2.851337194442749e-05, -2.4449080228805542e-05, -2.0384788513183594e-05, -1.6320496797561646e-05, -1.2256205081939697e-05, -8.191913366317749e-06, -4.127621650695801e-06, -6.332993507385254e-08, 4.000961780548096e-06, 8.065253496170044e-06, 1.2129545211791992e-05, 1.619383692741394e-05, 2.025812864303589e-05, 2.4322420358657837e-05, 2.8386712074279785e-05, 3.2451003789901733e-05, 3.651529550552368e-05, 4.057958722114563e-05, 4.464387893676758e-05, 4.8708170652389526e-05, 5.2772462368011475e-05, 5.683675408363342e-05, 6.090104579925537e-05, 6.496533751487732e-05, 6.902962923049927e-05, 7.309392094612122e-05, 7.715821266174316e-05, 8.122250437736511e-05, 8.528679609298706e-05, 8.935108780860901e-05, 9.341537952423096e-05, 9.74796712398529e-05, 0.00010154396295547485, 0.0001056082546710968, 0.00010967254638671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 5.0, 21.0, 21.0, 28.0, 51.0, 89.0, 182.0, 409.0, 977.0, 2815.0, 11908.0, 157594.0, 831414.0, 34433.0, 5610.0, 1690.0, 651.0, 310.0, 139.0, 82.0, 47.0, 28.0, 10.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.443603515625, -0.4245338439941406, -0.40546417236328125, -0.3863945007324219, -0.3673248291015625, -0.3482551574707031, -0.32918548583984375, -0.3101158142089844, -0.291046142578125, -0.2719764709472656, -0.25290679931640625, -0.23383712768554688, -0.2147674560546875, -0.19569778442382812, -0.17662811279296875, -0.15755844116210938, -0.13848876953125, -0.11941909790039062, -0.10034942626953125, -0.08127975463867188, -0.0622100830078125, -0.043140411376953125, -0.02407073974609375, -0.005001068115234375, 0.014068603515625, 0.033138275146484375, 0.05220794677734375, 0.07127761840820312, 0.0903472900390625, 0.10941696166992188, 0.12848663330078125, 0.14755630493164062, 0.1666259765625, 0.18569564819335938, 0.20476531982421875, 0.22383499145507812, 0.2429046630859375, 0.2619743347167969, 0.28104400634765625, 0.3001136779785156, 0.319183349609375, 0.3382530212402344, 0.35732269287109375, 0.3763923645019531, 0.3954620361328125, 0.4145317077636719, 0.43360137939453125, 0.4526710510253906, 0.47174072265625, 0.4908103942871094, 0.5098800659179688, 0.5289497375488281, 0.5480194091796875, 0.5670890808105469, 0.5861587524414062, 0.6052284240722656, 0.624298095703125, 0.6433677673339844, 0.6624374389648438, 0.6815071105957031, 0.7005767822265625, 0.7196464538574219, 0.7387161254882812, 0.7577857971191406, 0.77685546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 10.0, 13.0, 7.0, 16.0, 22.0, 43.0, 76.0, 99.0, 183.0, 190.0, 121.0, 78.0, 46.0, 29.0, 17.0, 6.0, 10.0, 10.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.2724609375, -0.2660026550292969, -0.25954437255859375, -0.2530860900878906, -0.2466278076171875, -0.24016952514648438, -0.23371124267578125, -0.22725296020507812, -0.220794677734375, -0.21433639526367188, -0.20787811279296875, -0.20141983032226562, -0.1949615478515625, -0.18850326538085938, -0.18204498291015625, -0.17558670043945312, -0.16912841796875, -0.16267013549804688, -0.15621185302734375, -0.14975357055664062, -0.1432952880859375, -0.13683700561523438, -0.13037872314453125, -0.12392044067382812, -0.117462158203125, -0.11100387573242188, -0.10454559326171875, -0.09808731079101562, -0.0916290283203125, -0.08517074584960938, -0.07871246337890625, -0.07225418090820312, -0.0657958984375, -0.059337615966796875, -0.05287933349609375, -0.046421051025390625, -0.0399627685546875, -0.033504486083984375, -0.02704620361328125, -0.020587921142578125, -0.014129638671875, -0.007671356201171875, -0.00121307373046875, 0.005245208740234375, 0.0117034912109375, 0.018161773681640625, 0.02462005615234375, 0.031078338623046875, 0.03753662109375, 0.043994903564453125, 0.05045318603515625, 0.056911468505859375, 0.0633697509765625, 0.06982803344726562, 0.07628631591796875, 0.08274459838867188, 0.089202880859375, 0.09566116333007812, 0.10211944580078125, 0.10857772827148438, 0.1150360107421875, 0.12149429321289062, 0.12795257568359375, 0.13441085815429688, 0.140869140625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 13.0, 34.0, 114.0, 282.0, 314.0, 161.0, 56.0, 12.0, 9.0, 4.0, 2.0, 2.0], "bins": [-13.127320289611816, -12.893108367919922, -12.658896446228027, -12.424684524536133, -12.190472602844238, -11.956260681152344, -11.722049713134766, -11.487837791442871, -11.253625869750977, -11.019413948059082, -10.785202026367188, -10.550990104675293, -10.316778182983398, -10.08256721496582, -9.84835433959961, -9.614143371582031, -9.37993049621582, -9.145718574523926, -8.911506652832031, -8.677294731140137, -8.443082809448242, -8.208871841430664, -7.974659442901611, -7.740447521209717, -7.5062360763549805, -7.272024154663086, -7.037812232971191, -6.803600311279297, -6.5693888664245605, -6.335176944732666, -6.1009650230407715, -5.866753101348877, -5.632541656494141, -5.398329734802246, -5.164117813110352, -4.929905891418457, -4.695694446563721, -4.461482524871826, -4.227270603179932, -3.993058681488037, -3.758847236633301, -3.5246353149414062, -3.290423631668091, -3.0562117099761963, -2.822000026702881, -2.5877881050109863, -2.353576183319092, -2.1193642616271973, -1.8851525783538818, -1.6509407758712769, -1.4167289733886719, -1.1825170516967773, -0.9483052492141724, -0.7140934467315674, -0.47988152503967285, -0.24566972255706787, -0.01145792007446289, 0.22275391221046448, 0.45696574449539185, 0.6911776065826416, 0.9253894090652466, 1.1596012115478516, 1.393813133239746, 1.628024935722351, 1.862236738204956]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 2.0, 5.0, 16.0, 10.0, 14.0, 10.0, 12.0, 15.0, 11.0, 23.0, 23.0, 30.0, 23.0, 22.0, 29.0, 21.0, 34.0, 26.0, 34.0, 34.0, 31.0, 30.0, 27.0, 35.0, 33.0, 35.0, 32.0, 26.0, 28.0, 33.0, 28.0, 29.0, 33.0, 26.0, 26.0, 23.0, 14.0, 18.0, 17.0, 14.0, 5.0, 9.0, 6.0, 6.0, 5.0, 4.0, 7.0, 3.0, 3.0, 5.0, 5.0, 1.0, 3.0, 5.0], "bins": [-2.1108129024505615, -2.0463504791259766, -1.981887936592102, -1.917425513267517, -1.8529629707336426, -1.7885005474090576, -1.7240381240844727, -1.6595757007598877, -1.5951131582260132, -1.5306507349014282, -1.4661881923675537, -1.4017257690429688, -1.3372633457183838, -1.2728008031845093, -1.2083383798599243, -1.1438758373260498, -1.0794134140014648, -1.0149509906768799, -0.9504884481430054, -0.8860260248184204, -0.8215635418891907, -0.7571010589599609, -0.692638635635376, -0.6281761527061462, -0.5637136697769165, -0.49925118684768677, -0.4347887337207794, -0.37032628059387207, -0.30586379766464233, -0.2414013147354126, -0.17693886160850525, -0.1124764084815979, -0.048014163970947266, 0.016448304057121277, 0.08091077208518982, 0.14537324011325836, 0.2098357081413269, 0.27429819107055664, 0.338760644197464, 0.40322309732437134, 0.4676855802536011, 0.5321480631828308, 0.5966105461120605, 0.6610729694366455, 0.7255354523658752, 0.789997935295105, 0.8544603586196899, 0.9189228415489197, 0.9833853244781494, 1.0478477478027344, 1.1123102903366089, 1.1767727136611938, 1.2412352561950684, 1.3056976795196533, 1.3701601028442383, 1.4346225261688232, 1.4990850687026978, 1.5635474920272827, 1.6280100345611572, 1.6924724578857422, 1.7569348812103271, 1.8213974237442017, 1.8858598470687866, 1.9503223896026611, 2.014784812927246]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 11.0, 4.0, 6.0, 9.0, 30.0, 27.0, 27.0, 57.0, 85.0, 112.0, 193.0, 306.0, 567.0, 1167.0, 2884.0, 9317.0, 80128.0, 2947349.0, 1107046.0, 35589.0, 5533.0, 1813.0, 834.0, 467.0, 255.0, 182.0, 98.0, 70.0, 34.0, 23.0, 21.0, 14.0, 4.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.220703125, -2.143707275390625, -2.06671142578125, -1.989715576171875, -1.9127197265625, -1.835723876953125, -1.75872802734375, -1.681732177734375, -1.604736328125, -1.527740478515625, -1.45074462890625, -1.373748779296875, -1.2967529296875, -1.219757080078125, -1.14276123046875, -1.065765380859375, -0.98876953125, -0.911773681640625, -0.83477783203125, -0.757781982421875, -0.6807861328125, -0.603790283203125, -0.52679443359375, -0.449798583984375, -0.372802734375, -0.295806884765625, -0.21881103515625, -0.141815185546875, -0.0648193359375, 0.012176513671875, 0.08917236328125, 0.166168212890625, 0.2431640625, 0.320159912109375, 0.39715576171875, 0.474151611328125, 0.5511474609375, 0.628143310546875, 0.70513916015625, 0.782135009765625, 0.859130859375, 0.936126708984375, 1.01312255859375, 1.090118408203125, 1.1671142578125, 1.244110107421875, 1.32110595703125, 1.398101806640625, 1.47509765625, 1.552093505859375, 1.62908935546875, 1.706085205078125, 1.7830810546875, 1.860076904296875, 1.93707275390625, 2.014068603515625, 2.091064453125, 2.168060302734375, 2.24505615234375, 2.322052001953125, 2.3990478515625, 2.476043701171875, 2.55303955078125, 2.630035400390625, 2.70703125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 10.0, 11.0, 11.0, 18.0, 27.0, 33.0, 42.0, 65.0, 70.0, 67.0, 78.0, 85.0, 75.0, 78.0, 72.0, 62.0, 53.0, 35.0, 31.0, 28.0, 8.0, 14.0, 14.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.06170654296875, -1.0169677734375, -0.97222900390625, -0.927490234375, -0.88275146484375, -0.8380126953125, -0.79327392578125, -0.74853515625, -0.70379638671875, -0.6590576171875, -0.61431884765625, -0.569580078125, -0.52484130859375, -0.4801025390625, -0.43536376953125, -0.390625, -0.34588623046875, -0.3011474609375, -0.25640869140625, -0.211669921875, -0.16693115234375, -0.1221923828125, -0.07745361328125, -0.03271484375, 0.01202392578125, 0.0567626953125, 0.10150146484375, 0.146240234375, 0.19097900390625, 0.2357177734375, 0.28045654296875, 0.3251953125, 0.36993408203125, 0.4146728515625, 0.45941162109375, 0.504150390625, 0.54888916015625, 0.5936279296875, 0.63836669921875, 0.68310546875, 0.72784423828125, 0.7725830078125, 0.81732177734375, 0.862060546875, 0.90679931640625, 0.9515380859375, 0.99627685546875, 1.041015625, 1.08575439453125, 1.1304931640625, 1.17523193359375, 1.219970703125, 1.26470947265625, 1.3094482421875, 1.35418701171875, 1.39892578125, 1.44366455078125, 1.4884033203125, 1.53314208984375, 1.577880859375, 1.62261962890625, 1.6673583984375, 1.71209716796875, 1.7568359375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 13.0, 17.0, 23.0, 37.0, 65.0, 103.0, 227.0, 526.0, 1438.0, 5082.0, 29958.0, 1881080.0, 2235320.0, 32447.0, 5285.0, 1569.0, 554.0, 253.0, 136.0, 53.0, 34.0, 20.0, 18.0, 8.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.591796875, -1.51226806640625, -1.4327392578125, -1.35321044921875, -1.273681640625, -1.19415283203125, -1.1146240234375, -1.03509521484375, -0.95556640625, -0.87603759765625, -0.7965087890625, -0.71697998046875, -0.637451171875, -0.55792236328125, -0.4783935546875, -0.39886474609375, -0.3193359375, -0.23980712890625, -0.1602783203125, -0.08074951171875, -0.001220703125, 0.07830810546875, 0.1578369140625, 0.23736572265625, 0.31689453125, 0.39642333984375, 0.4759521484375, 0.55548095703125, 0.635009765625, 0.71453857421875, 0.7940673828125, 0.87359619140625, 0.953125, 1.03265380859375, 1.1121826171875, 1.19171142578125, 1.271240234375, 1.35076904296875, 1.4302978515625, 1.50982666015625, 1.58935546875, 1.66888427734375, 1.7484130859375, 1.82794189453125, 1.907470703125, 1.98699951171875, 2.0665283203125, 2.14605712890625, 2.2255859375, 2.30511474609375, 2.3846435546875, 2.46417236328125, 2.543701171875, 2.62322998046875, 2.7027587890625, 2.78228759765625, 2.86181640625, 2.94134521484375, 3.0208740234375, 3.10040283203125, 3.179931640625, 3.25946044921875, 3.3389892578125, 3.41851806640625, 3.498046875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 10.0, 11.0, 12.0, 17.0, 30.0, 55.0, 91.0, 157.0, 384.0, 828.0, 1035.0, 726.0, 370.0, 136.0, 76.0, 51.0, 28.0, 21.0, 7.0, 10.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.8466796875, -0.8261985778808594, -0.8057174682617188, -0.7852363586425781, -0.7647552490234375, -0.7442741394042969, -0.7237930297851562, -0.7033119201660156, -0.682830810546875, -0.6623497009277344, -0.6418685913085938, -0.6213874816894531, -0.6009063720703125, -0.5804252624511719, -0.5599441528320312, -0.5394630432128906, -0.51898193359375, -0.4985008239746094, -0.47801971435546875, -0.4575386047363281, -0.4370574951171875, -0.4165763854980469, -0.39609527587890625, -0.3756141662597656, -0.355133056640625, -0.3346519470214844, -0.31417083740234375, -0.2936897277832031, -0.2732086181640625, -0.2527275085449219, -0.23224639892578125, -0.21176528930664062, -0.1912841796875, -0.17080307006835938, -0.15032196044921875, -0.12984085083007812, -0.1093597412109375, -0.08887863159179688, -0.06839752197265625, -0.047916412353515625, -0.027435302734375, -0.006954193115234375, 0.01352691650390625, 0.034008026123046875, 0.0544891357421875, 0.07497024536132812, 0.09545135498046875, 0.11593246459960938, 0.13641357421875, 0.15689468383789062, 0.17737579345703125, 0.19785690307617188, 0.2183380126953125, 0.23881912231445312, 0.25930023193359375, 0.2797813415527344, 0.300262451171875, 0.3207435607910156, 0.34122467041015625, 0.3617057800292969, 0.3821868896484375, 0.4026679992675781, 0.42314910888671875, 0.4436302185058594, 0.464111328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 4.0, 9.0, 8.0, 13.0, 29.0, 51.0, 89.0, 100.0, 162.0, 168.0, 121.0, 120.0, 54.0, 24.0, 21.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3088536262512207, -3.229905366897583, -3.1509573459625244, -3.0720090866088867, -2.993060827255249, -2.9141125679016113, -2.8351645469665527, -2.756216287612915, -2.6772680282592773, -2.5983197689056396, -2.519371747970581, -2.4404234886169434, -2.3614752292633057, -2.282526969909668, -2.2035789489746094, -2.1246306896209717, -2.045682668685913, -1.966734528541565, -1.8877862691879272, -1.808838129043579, -1.7298898696899414, -1.6509417295455933, -1.5719935894012451, -1.4930453300476074, -1.4140971899032593, -1.3351490497589111, -1.2562007904052734, -1.1772526502609253, -1.0983045101165771, -1.0193562507629395, -0.9404081106185913, -0.8614599108695984, -0.7825114727020264, -0.7035632729530334, -0.6246150732040405, -0.5456669330596924, -0.46671873331069946, -0.38777053356170654, -0.308822363615036, -0.22987419366836548, -0.15092599391937256, -0.07197780907154083, 0.0069703757762908936, 0.08591856062412262, 0.16486674547195435, 0.24381494522094727, 0.3227631151676178, 0.40171128511428833, 0.48065948486328125, 0.5596076846122742, 0.6385558843612671, 0.7175040245056152, 0.7964522242546082, 0.8754004240036011, 0.9543485641479492, 1.033296823501587, 1.112244963645935, 1.1911931037902832, 1.270141363143921, 1.349089503288269, 1.4280376434326172, 1.5069859027862549, 1.585934042930603, 1.6648821830749512, 1.7438304424285889]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 7.0, 3.0, 6.0, 10.0, 14.0, 14.0, 9.0, 15.0, 18.0, 23.0, 29.0, 24.0, 35.0, 36.0, 38.0, 52.0, 43.0, 52.0, 50.0, 50.0, 48.0, 51.0, 48.0, 42.0, 42.0, 41.0, 36.0, 32.0, 27.0, 20.0, 16.0, 10.0, 9.0, 8.0, 6.0, 9.0, 3.0, 4.0, 4.0, 5.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8334425687789917, -0.801851212978363, -0.7702597975730896, -0.7386684417724609, -0.7070770859718323, -0.6754857301712036, -0.6438943147659302, -0.6123029589653015, -0.5807116031646729, -0.5491202473640442, -0.5175288319587708, -0.4859374761581421, -0.4543461203575134, -0.4227547347545624, -0.39116334915161133, -0.35957199335098267, -0.32798057794570923, -0.2963891923427582, -0.2647978365421295, -0.23320645093917847, -0.2016150802373886, -0.17002370953559875, -0.1384323239326477, -0.10684095323085785, -0.075249582529068, -0.04365820810198784, -0.012066833674907684, 0.01952454447746277, 0.051115915179252625, 0.08270728588104248, 0.11429867148399353, 0.1458900421857834, 0.17748141288757324, 0.2090727835893631, 0.24066415429115295, 0.272255539894104, 0.30384689569473267, 0.3354382812976837, 0.36702966690063477, 0.3986210227012634, 0.4302124083042145, 0.4618037939071655, 0.4933951497077942, 0.5249865055084229, 0.5565779209136963, 0.588169276714325, 0.6197606325149536, 0.651352047920227, 0.6829434037208557, 0.7145347595214844, 0.7461261749267578, 0.7777175307273865, 0.8093088865280151, 0.8409003019332886, 0.8724916577339172, 0.9040830135345459, 0.9356744289398193, 0.967265784740448, 0.9988572001457214, 1.03044855594635, 1.0620399713516235, 1.0936312675476074, 1.1252226829528809, 1.1568140983581543, 1.1884053945541382]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 13.0, 19.0, 29.0, 61.0, 95.0, 201.0, 450.0, 1144.0, 3398.0, 12396.0, 81496.0, 773289.0, 151702.0, 17176.0, 4550.0, 1506.0, 495.0, 248.0, 106.0, 64.0, 27.0, 18.0, 15.0, 7.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.52001953125, -0.5054168701171875, -0.490814208984375, -0.4762115478515625, -0.46160888671875, -0.4470062255859375, -0.432403564453125, -0.4178009033203125, -0.4031982421875, -0.3885955810546875, -0.373992919921875, -0.3593902587890625, -0.34478759765625, -0.3301849365234375, -0.315582275390625, -0.3009796142578125, -0.286376953125, -0.2717742919921875, -0.257171630859375, -0.2425689697265625, -0.22796630859375, -0.2133636474609375, -0.198760986328125, -0.1841583251953125, -0.1695556640625, -0.1549530029296875, -0.140350341796875, -0.1257476806640625, -0.11114501953125, -0.0965423583984375, -0.081939697265625, -0.0673370361328125, -0.052734375, -0.0381317138671875, -0.023529052734375, -0.0089263916015625, 0.00567626953125, 0.0202789306640625, 0.034881591796875, 0.0494842529296875, 0.0640869140625, 0.0786895751953125, 0.093292236328125, 0.1078948974609375, 0.12249755859375, 0.1371002197265625, 0.151702880859375, 0.1663055419921875, 0.180908203125, 0.1955108642578125, 0.210113525390625, 0.2247161865234375, 0.23931884765625, 0.2539215087890625, 0.268524169921875, 0.2831268310546875, 0.2977294921875, 0.3123321533203125, 0.326934814453125, 0.3415374755859375, 0.35614013671875, 0.3707427978515625, 0.385345458984375, 0.3999481201171875, 0.41455078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 10.0, 4.0, 11.0, 8.0, 17.0, 30.0, 34.0, 26.0, 45.0, 62.0, 60.0, 57.0, 79.0, 85.0, 74.0, 70.0, 65.0, 58.0, 47.0, 52.0, 32.0, 15.0, 19.0, 10.0, 9.0, 4.0, 9.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72509765625, -0.6944198608398438, -0.6637420654296875, -0.6330642700195312, -0.602386474609375, -0.5717086791992188, -0.5410308837890625, -0.5103530883789062, -0.47967529296875, -0.44899749755859375, -0.4183197021484375, -0.38764190673828125, -0.356964111328125, -0.32628631591796875, -0.2956085205078125, -0.26493072509765625, -0.2342529296875, -0.20357513427734375, -0.1728973388671875, -0.14221954345703125, -0.111541748046875, -0.08086395263671875, -0.0501861572265625, -0.01950836181640625, 0.01116943359375, 0.04184722900390625, 0.0725250244140625, 0.10320281982421875, 0.133880615234375, 0.16455841064453125, 0.1952362060546875, 0.22591400146484375, 0.256591796875, 0.28726959228515625, 0.3179473876953125, 0.34862518310546875, 0.379302978515625, 0.40998077392578125, 0.4406585693359375, 0.47133636474609375, 0.50201416015625, 0.5326919555664062, 0.5633697509765625, 0.5940475463867188, 0.624725341796875, 0.6554031372070312, 0.6860809326171875, 0.7167587280273438, 0.7474365234375, 0.7781143188476562, 0.8087921142578125, 0.8394699096679688, 0.870147705078125, 0.9008255004882812, 0.9315032958984375, 0.9621810913085938, 0.99285888671875, 1.0235366821289062, 1.0542144775390625, 1.0848922729492188, 1.115570068359375, 1.1462478637695312, 1.1769256591796875, 1.2076034545898438, 1.23828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 12.0, 8.0, 17.0, 12.0, 27.0, 29.0, 44.0, 61.0, 72.0, 118.0, 175.0, 300.0, 490.0, 851.0, 1549.0, 2903.0, 5812.0, 12100.0, 33684.0, 127768.0, 444419.0, 303418.0, 73994.0, 21954.0, 9034.0, 4320.0, 2203.0, 1252.0, 718.0, 401.0, 245.0, 177.0, 115.0, 69.0, 54.0, 42.0, 28.0, 18.0, 19.0, 11.0, 7.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1951904296875, -0.1892414093017578, -0.18329238891601562, -0.17734336853027344, -0.17139434814453125, -0.16544532775878906, -0.15949630737304688, -0.1535472869873047, -0.1475982666015625, -0.1416492462158203, -0.13570022583007812, -0.12975120544433594, -0.12380218505859375, -0.11785316467285156, -0.11190414428710938, -0.10595512390136719, -0.100006103515625, -0.09405708312988281, -0.08810806274414062, -0.08215904235839844, -0.07621002197265625, -0.07026100158691406, -0.06431198120117188, -0.05836296081542969, -0.0524139404296875, -0.04646492004394531, -0.040515899658203125, -0.03456687927246094, -0.02861785888671875, -0.022668838500976562, -0.016719818115234375, -0.010770797729492188, -0.00482177734375, 0.0011272430419921875, 0.007076263427734375, 0.013025283813476562, 0.01897430419921875, 0.024923324584960938, 0.030872344970703125, 0.03682136535644531, 0.0427703857421875, 0.04871940612792969, 0.054668426513671875, 0.06061744689941406, 0.06656646728515625, 0.07251548767089844, 0.07846450805664062, 0.08441352844238281, 0.090362548828125, 0.09631156921386719, 0.10226058959960938, 0.10820960998535156, 0.11415863037109375, 0.12010765075683594, 0.12605667114257812, 0.1320056915283203, 0.1379547119140625, 0.1439037322998047, 0.14985275268554688, 0.15580177307128906, 0.16175079345703125, 0.16769981384277344, 0.17364883422851562, 0.1795978546142578, 0.185546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 0.0, 4.0, 6.0, 15.0, 15.0, 22.0, 26.0, 40.0, 39.0, 36.0, 45.0, 36.0, 35.0, 52.0, 58.0, 60.0, 58.0, 68.0, 44.0, 62.0, 44.0, 41.0, 42.0, 24.0, 27.0, 23.0, 20.0, 14.0, 8.0, 5.0, 3.0, 7.0, 2.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.564453125, -1.5181884765625, -1.471923828125, -1.4256591796875, -1.37939453125, -1.3331298828125, -1.286865234375, -1.2406005859375, -1.1943359375, -1.1480712890625, -1.101806640625, -1.0555419921875, -1.00927734375, -0.9630126953125, -0.916748046875, -0.8704833984375, -0.82421875, -0.7779541015625, -0.731689453125, -0.6854248046875, -0.63916015625, -0.5928955078125, -0.546630859375, -0.5003662109375, -0.4541015625, -0.4078369140625, -0.361572265625, -0.3153076171875, -0.26904296875, -0.2227783203125, -0.176513671875, -0.1302490234375, -0.083984375, -0.0377197265625, 0.008544921875, 0.0548095703125, 0.10107421875, 0.1473388671875, 0.193603515625, 0.2398681640625, 0.2861328125, 0.3323974609375, 0.378662109375, 0.4249267578125, 0.47119140625, 0.5174560546875, 0.563720703125, 0.6099853515625, 0.65625, 0.7025146484375, 0.748779296875, 0.7950439453125, 0.84130859375, 0.8875732421875, 0.933837890625, 0.9801025390625, 1.0263671875, 1.0726318359375, 1.118896484375, 1.1651611328125, 1.21142578125, 1.2576904296875, 1.303955078125, 1.3502197265625, 1.396484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 9.0, 11.0, 26.0, 21.0, 33.0, 46.0, 61.0, 97.0, 163.0, 211.0, 300.0, 566.0, 900.0, 1583.0, 3310.0, 8402.0, 26753.0, 131765.0, 550185.0, 256901.0, 45408.0, 12214.0, 4520.0, 2075.0, 1132.0, 635.0, 408.0, 256.0, 169.0, 114.0, 73.0, 48.0, 33.0, 29.0, 19.0, 14.0, 12.0, 10.0, 9.0, 6.0, 6.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0787353515625, -0.07632637023925781, -0.07391738891601562, -0.07150840759277344, -0.06909942626953125, -0.06669044494628906, -0.06428146362304688, -0.06187248229980469, -0.0594635009765625, -0.05705451965332031, -0.054645538330078125, -0.05223655700683594, -0.04982757568359375, -0.04741859436035156, -0.045009613037109375, -0.04260063171386719, -0.040191650390625, -0.03778266906738281, -0.035373687744140625, -0.03296470642089844, -0.03055572509765625, -0.028146743774414062, -0.025737762451171875, -0.023328781127929688, -0.0209197998046875, -0.018510818481445312, -0.016101837158203125, -0.013692855834960938, -0.01128387451171875, -0.008874893188476562, -0.006465911865234375, -0.0040569305419921875, -0.00164794921875, 0.0007610321044921875, 0.003170013427734375, 0.0055789947509765625, 0.00798797607421875, 0.010396957397460938, 0.012805938720703125, 0.015214920043945312, 0.0176239013671875, 0.020032882690429688, 0.022441864013671875, 0.024850845336914062, 0.02725982666015625, 0.029668807983398438, 0.032077789306640625, 0.03448677062988281, 0.036895751953125, 0.03930473327636719, 0.041713714599609375, 0.04412269592285156, 0.04653167724609375, 0.04894065856933594, 0.051349639892578125, 0.05375862121582031, 0.0561676025390625, 0.05857658386230469, 0.060985565185546875, 0.06339454650878906, 0.06580352783203125, 0.06821250915527344, 0.07062149047851562, 0.07303047180175781, 0.075439453125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 12.0, 8.0, 36.0, 81.0, 232.0, 344.0, 185.0, 53.0, 19.0, 13.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011342763900756836, -0.00010955985635519028, -0.0001056920737028122, -0.00010182429105043411, -9.795650839805603e-05, -9.408872574567795e-05, -9.022094309329987e-05, -8.635316044092178e-05, -8.24853777885437e-05, -7.861759513616562e-05, -7.474981248378754e-05, -7.088202983140945e-05, -6.701424717903137e-05, -6.314646452665329e-05, -5.927868187427521e-05, -5.5410899221897125e-05, -5.154311656951904e-05, -4.767533391714096e-05, -4.380755126476288e-05, -3.9939768612384796e-05, -3.6071985960006714e-05, -3.220420330762863e-05, -2.833642065525055e-05, -2.4468638002872467e-05, -2.0600855350494385e-05, -1.6733072698116302e-05, -1.286529004573822e-05, -8.997507393360138e-06, -5.129724740982056e-06, -1.2619420886039734e-06, 2.605840563774109e-06, 6.473623216152191e-06, 1.0341405868530273e-05, 1.4209188520908356e-05, 1.8076971173286438e-05, 2.194475382566452e-05, 2.5812536478042603e-05, 2.9680319130420685e-05, 3.354810178279877e-05, 3.741588443517685e-05, 4.128366708755493e-05, 4.5151449739933014e-05, 4.9019232392311096e-05, 5.288701504468918e-05, 5.675479769706726e-05, 6.062258034944534e-05, 6.449036300182343e-05, 6.835814565420151e-05, 7.222592830657959e-05, 7.609371095895767e-05, 7.996149361133575e-05, 8.382927626371384e-05, 8.769705891609192e-05, 9.156484156847e-05, 9.543262422084808e-05, 9.930040687322617e-05, 0.00010316818952560425, 0.00010703597217798233, 0.00011090375483036041, 0.0001147715374827385, 0.00011863932013511658, 0.00012250710278749466, 0.00012637488543987274, 0.00013024266809225082, 0.0001341104507446289]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 5.0, 8.0, 14.0, 20.0, 20.0, 35.0, 39.0, 56.0, 99.0, 140.0, 239.0, 354.0, 609.0, 1105.0, 1972.0, 4210.0, 10882.0, 36743.0, 160811.0, 486709.0, 259887.0, 57461.0, 15729.0, 5710.0, 2420.0, 1331.0, 698.0, 427.0, 284.0, 170.0, 120.0, 74.0, 42.0, 38.0, 26.0, 23.0, 6.0, 10.0, 7.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0723876953125, -0.07017135620117188, -0.06795501708984375, -0.06573867797851562, -0.0635223388671875, -0.061305999755859375, -0.05908966064453125, -0.056873321533203125, -0.054656982421875, -0.052440643310546875, -0.05022430419921875, -0.048007965087890625, -0.0457916259765625, -0.043575286865234375, -0.04135894775390625, -0.039142608642578125, -0.03692626953125, -0.034709930419921875, -0.03249359130859375, -0.030277252197265625, -0.0280609130859375, -0.025844573974609375, -0.02362823486328125, -0.021411895751953125, -0.019195556640625, -0.016979217529296875, -0.01476287841796875, -0.012546539306640625, -0.0103302001953125, -0.008113861083984375, -0.00589752197265625, -0.003681182861328125, -0.00146484375, 0.000751495361328125, 0.00296783447265625, 0.005184173583984375, 0.0074005126953125, 0.009616851806640625, 0.01183319091796875, 0.014049530029296875, 0.016265869140625, 0.018482208251953125, 0.02069854736328125, 0.022914886474609375, 0.0251312255859375, 0.027347564697265625, 0.02956390380859375, 0.031780242919921875, 0.03399658203125, 0.036212921142578125, 0.03842926025390625, 0.040645599365234375, 0.0428619384765625, 0.045078277587890625, 0.04729461669921875, 0.049510955810546875, 0.051727294921875, 0.053943634033203125, 0.05615997314453125, 0.058376312255859375, 0.0605926513671875, 0.06280899047851562, 0.06502532958984375, 0.06724166870117188, 0.0694580078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 7.0, 4.0, 5.0, 9.0, 12.0, 12.0, 20.0, 29.0, 28.0, 36.0, 41.0, 63.0, 71.0, 75.0, 82.0, 77.0, 76.0, 67.0, 67.0, 46.0, 33.0, 27.0, 22.0, 14.0, 22.0, 13.0, 12.0, 9.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0175933837890625, -0.01701831817626953, -0.016443252563476562, -0.015868186950683594, -0.015293121337890625, -0.014718055725097656, -0.014142990112304688, -0.013567924499511719, -0.01299285888671875, -0.012417793273925781, -0.011842727661132812, -0.011267662048339844, -0.010692596435546875, -0.010117530822753906, -0.009542465209960938, -0.008967399597167969, -0.008392333984375, -0.007817268371582031, -0.0072422027587890625, -0.006667137145996094, -0.006092071533203125, -0.005517005920410156, -0.0049419403076171875, -0.004366874694824219, -0.00379180908203125, -0.0032167434692382812, -0.0026416778564453125, -0.0020666122436523438, -0.001491546630859375, -0.0009164810180664062, -0.0003414154052734375, 0.00023365020751953125, 0.0008087158203125, 0.0013837814331054688, 0.0019588470458984375, 0.0025339126586914062, 0.003108978271484375, 0.0036840438842773438, 0.0042591094970703125, 0.004834175109863281, 0.00540924072265625, 0.005984306335449219, 0.0065593719482421875, 0.007134437561035156, 0.007709503173828125, 0.008284568786621094, 0.008859634399414062, 0.009434700012207031, 0.010009765625, 0.010584831237792969, 0.011159896850585938, 0.011734962463378906, 0.012310028076171875, 0.012885093688964844, 0.013460159301757812, 0.014035224914550781, 0.01461029052734375, 0.015185356140136719, 0.015760421752929688, 0.016335487365722656, 0.016910552978515625, 0.017485618591308594, 0.018060684204101562, 0.01863574981689453, 0.0192108154296875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 13.0, 11.0, 25.0, 77.0, 170.0, 293.0, 228.0, 113.0, 37.0, 16.0, 8.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.750623941421509, -3.6717898845672607, -3.5929555892944336, -3.5141215324401855, -3.4352874755859375, -3.3564534187316895, -3.2776191234588623, -3.1987850666046143, -3.119950771331787, -3.041116714477539, -2.962282419204712, -2.883448362350464, -2.804614305496216, -2.7257800102233887, -2.6469459533691406, -2.5681118965148926, -2.4892778396606445, -2.4104437828063965, -2.3316094875335693, -2.2527754306793213, -2.1739413738250732, -2.095107078552246, -2.016273021697998, -1.93743896484375, -1.8586047887802124, -1.7797706127166748, -1.7009365558624268, -1.6221023797988892, -1.5432682037353516, -1.4644341468811035, -1.385599970817566, -1.3067657947540283, -1.2279317378997803, -1.1490975618362427, -1.0702635049819946, -0.991429328918457, -0.9125952124595642, -0.8337610960006714, -0.7549269199371338, -0.676092803478241, -0.5972586870193481, -0.5184245705604553, -0.4395904242992401, -0.3607562780380249, -0.2819221615791321, -0.20308804512023926, -0.12425389885902405, -0.04541975259780884, 0.033414363861083984, 0.112248495221138, 0.19108262658119202, 0.2699167728424072, 0.34875088930130005, 0.42758500576019287, 0.5064191818237305, 0.5852532982826233, 0.6640874147415161, 0.7429215312004089, 0.8217556476593018, 0.9005898237228394, 0.9794239401817322, 1.058258056640625, 1.1370922327041626, 1.2159264087677002, 1.2947604656219482]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 5.0, 7.0, 6.0, 12.0, 14.0, 18.0, 18.0, 26.0, 35.0, 31.0, 44.0, 56.0, 67.0, 64.0, 73.0, 79.0, 71.0, 76.0, 58.0, 52.0, 42.0, 45.0, 25.0, 24.0, 11.0, 7.0, 14.0, 8.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8210428357124329, -0.7928128838539124, -0.7645828723907471, -0.7363529205322266, -0.708122968673706, -0.6798929572105408, -0.6516630053520203, -0.623432993888855, -0.5952030420303345, -0.566973090171814, -0.5387430787086487, -0.5105131268501282, -0.4822831451892853, -0.4540531635284424, -0.4258232116699219, -0.397593230009079, -0.36936327815055847, -0.3411332964897156, -0.31290334463119507, -0.2846733629703522, -0.2564433813095093, -0.22821341454982758, -0.19998344779014587, -0.17175346612930298, -0.14352349936962128, -0.11529352515935898, -0.08706355094909668, -0.05883358418941498, -0.03060360997915268, -0.002373635768890381, 0.02585633099079132, 0.054086312651634216, 0.08231627941131592, 0.11054625362157822, 0.13877622783184052, 0.16700619459152222, 0.1952361762523651, 0.22346614301204681, 0.2516961097717285, 0.2799260914325714, 0.3081560730934143, 0.3363860547542572, 0.3646160066127777, 0.3928459882736206, 0.4210759699344635, 0.4493059515953064, 0.4775359034538269, 0.5057659149169922, 0.5339958667755127, 0.5622258186340332, 0.5904558300971985, 0.618685781955719, 0.6469157338142395, 0.6751457452774048, 0.7033756971359253, 0.7316056489944458, 0.7598356008529663, 0.7880655527114868, 0.8162955641746521, 0.8445255160331726, 0.8727554678916931, 0.9009854793548584, 0.9292154312133789, 0.9574453830718994, 0.9856753945350647]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 11.0, 17.0, 24.0, 25.0, 37.0, 45.0, 81.0, 144.0, 271.0, 446.0, 915.0, 2080.0, 5970.0, 23429.0, 157744.0, 742349.0, 91118.0, 15912.0, 4517.0, 1649.0, 764.0, 375.0, 218.0, 155.0, 65.0, 57.0, 44.0, 16.0, 14.0, 8.0, 13.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.99658203125, -0.9667205810546875, -0.936859130859375, -0.9069976806640625, -0.87713623046875, -0.8472747802734375, -0.817413330078125, -0.7875518798828125, -0.7576904296875, -0.7278289794921875, -0.697967529296875, -0.6681060791015625, -0.63824462890625, -0.6083831787109375, -0.578521728515625, -0.5486602783203125, -0.518798828125, -0.4889373779296875, -0.459075927734375, -0.4292144775390625, -0.39935302734375, -0.3694915771484375, -0.339630126953125, -0.3097686767578125, -0.2799072265625, -0.2500457763671875, -0.220184326171875, -0.1903228759765625, -0.16046142578125, -0.1305999755859375, -0.100738525390625, -0.0708770751953125, -0.041015625, -0.0111541748046875, 0.018707275390625, 0.0485687255859375, 0.07843017578125, 0.1082916259765625, 0.138153076171875, 0.1680145263671875, 0.1978759765625, 0.2277374267578125, 0.257598876953125, 0.2874603271484375, 0.31732177734375, 0.3471832275390625, 0.377044677734375, 0.4069061279296875, 0.436767578125, 0.4666290283203125, 0.496490478515625, 0.5263519287109375, 0.55621337890625, 0.5860748291015625, 0.615936279296875, 0.6457977294921875, 0.6756591796875, 0.7055206298828125, 0.735382080078125, 0.7652435302734375, 0.79510498046875, 0.8249664306640625, 0.854827880859375, 0.8846893310546875, 0.91455078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 7.0, 8.0, 6.0, 11.0, 8.0, 12.0, 17.0, 11.0, 32.0, 31.0, 40.0, 40.0, 52.0, 53.0, 60.0, 66.0, 79.0, 66.0, 64.0, 60.0, 59.0, 48.0, 28.0, 29.0, 28.0, 18.0, 17.0, 11.0, 12.0, 9.0, 8.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.736328125, -1.6845550537109375, -1.632781982421875, -1.5810089111328125, -1.52923583984375, -1.4774627685546875, -1.425689697265625, -1.3739166259765625, -1.3221435546875, -1.2703704833984375, -1.218597412109375, -1.1668243408203125, -1.11505126953125, -1.0632781982421875, -1.011505126953125, -0.9597320556640625, -0.907958984375, -0.8561859130859375, -0.804412841796875, -0.7526397705078125, -0.70086669921875, -0.6490936279296875, -0.597320556640625, -0.5455474853515625, -0.4937744140625, -0.4420013427734375, -0.390228271484375, -0.3384552001953125, -0.28668212890625, -0.2349090576171875, -0.183135986328125, -0.1313629150390625, -0.07958984375, -0.0278167724609375, 0.023956298828125, 0.0757293701171875, 0.12750244140625, 0.1792755126953125, 0.231048583984375, 0.2828216552734375, 0.3345947265625, 0.3863677978515625, 0.438140869140625, 0.4899139404296875, 0.54168701171875, 0.5934600830078125, 0.645233154296875, 0.6970062255859375, 0.748779296875, 0.8005523681640625, 0.852325439453125, 0.9040985107421875, 0.95587158203125, 1.0076446533203125, 1.059417724609375, 1.1111907958984375, 1.1629638671875, 1.2147369384765625, 1.266510009765625, 1.3182830810546875, 1.37005615234375, 1.4218292236328125, 1.473602294921875, 1.5253753662109375, 1.5771484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 10.0, 10.0, 7.0, 9.0, 11.0, 11.0, 19.0, 28.0, 31.0, 31.0, 28.0, 51.0, 73.0, 107.0, 174.0, 413.0, 1942.0, 19025.0, 942857.0, 78343.0, 4019.0, 685.0, 215.0, 136.0, 68.0, 54.0, 39.0, 26.0, 28.0, 19.0, 19.0, 13.0, 8.0, 8.0, 14.0, 4.0, 5.0, 3.0, 2.0, 0.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.453125, -2.386260986328125, -2.31939697265625, -2.252532958984375, -2.1856689453125, -2.118804931640625, -2.05194091796875, -1.985076904296875, -1.918212890625, -1.851348876953125, -1.78448486328125, -1.717620849609375, -1.6507568359375, -1.583892822265625, -1.51702880859375, -1.450164794921875, -1.38330078125, -1.316436767578125, -1.24957275390625, -1.182708740234375, -1.1158447265625, -1.048980712890625, -0.98211669921875, -0.915252685546875, -0.848388671875, -0.781524658203125, -0.71466064453125, -0.647796630859375, -0.5809326171875, -0.514068603515625, -0.44720458984375, -0.380340576171875, -0.3134765625, -0.246612548828125, -0.17974853515625, -0.112884521484375, -0.0460205078125, 0.020843505859375, 0.08770751953125, 0.154571533203125, 0.221435546875, 0.288299560546875, 0.35516357421875, 0.422027587890625, 0.4888916015625, 0.555755615234375, 0.62261962890625, 0.689483642578125, 0.75634765625, 0.823211669921875, 0.89007568359375, 0.956939697265625, 1.0238037109375, 1.090667724609375, 1.15753173828125, 1.224395751953125, 1.291259765625, 1.358123779296875, 1.42498779296875, 1.491851806640625, 1.5587158203125, 1.625579833984375, 1.69244384765625, 1.759307861328125, 1.826171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 6.0, 9.0, 13.0, 15.0, 20.0, 24.0, 33.0, 21.0, 36.0, 33.0, 42.0, 44.0, 44.0, 51.0, 56.0, 60.0, 58.0, 54.0, 45.0, 51.0, 40.0, 38.0, 32.0, 29.0, 17.0, 20.0, 17.0, 17.0, 5.0, 11.0, 11.0, 5.0, 6.0, 10.0, 2.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 3.0], "bins": [-1.9912109375, -1.938751220703125, -1.88629150390625, -1.833831787109375, -1.7813720703125, -1.728912353515625, -1.67645263671875, -1.623992919921875, -1.571533203125, -1.519073486328125, -1.46661376953125, -1.414154052734375, -1.3616943359375, -1.309234619140625, -1.25677490234375, -1.204315185546875, -1.15185546875, -1.099395751953125, -1.04693603515625, -0.994476318359375, -0.9420166015625, -0.889556884765625, -0.83709716796875, -0.784637451171875, -0.732177734375, -0.679718017578125, -0.62725830078125, -0.574798583984375, -0.5223388671875, -0.469879150390625, -0.41741943359375, -0.364959716796875, -0.3125, -0.260040283203125, -0.20758056640625, -0.155120849609375, -0.1026611328125, -0.050201416015625, 0.00225830078125, 0.054718017578125, 0.107177734375, 0.159637451171875, 0.21209716796875, 0.264556884765625, 0.3170166015625, 0.369476318359375, 0.42193603515625, 0.474395751953125, 0.52685546875, 0.579315185546875, 0.63177490234375, 0.684234619140625, 0.7366943359375, 0.789154052734375, 0.84161376953125, 0.894073486328125, 0.946533203125, 0.998992919921875, 1.05145263671875, 1.103912353515625, 1.1563720703125, 1.208831787109375, 1.26129150390625, 1.313751220703125, 1.3662109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 10.0, 10.0, 10.0, 23.0, 38.0, 80.0, 119.0, 254.0, 535.0, 1548.0, 7182.0, 175700.0, 842251.0, 16710.0, 2540.0, 812.0, 350.0, 145.0, 81.0, 50.0, 32.0, 16.0, 14.0, 6.0, 5.0, 9.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.845703125, -0.82232666015625, -0.7989501953125, -0.77557373046875, -0.752197265625, -0.72882080078125, -0.7054443359375, -0.68206787109375, -0.65869140625, -0.63531494140625, -0.6119384765625, -0.58856201171875, -0.565185546875, -0.54180908203125, -0.5184326171875, -0.49505615234375, -0.4716796875, -0.44830322265625, -0.4249267578125, -0.40155029296875, -0.378173828125, -0.35479736328125, -0.3314208984375, -0.30804443359375, -0.28466796875, -0.26129150390625, -0.2379150390625, -0.21453857421875, -0.191162109375, -0.16778564453125, -0.1444091796875, -0.12103271484375, -0.09765625, -0.07427978515625, -0.0509033203125, -0.02752685546875, -0.004150390625, 0.01922607421875, 0.0426025390625, 0.06597900390625, 0.08935546875, 0.11273193359375, 0.1361083984375, 0.15948486328125, 0.182861328125, 0.20623779296875, 0.2296142578125, 0.25299072265625, 0.2763671875, 0.29974365234375, 0.3231201171875, 0.34649658203125, 0.369873046875, 0.39324951171875, 0.4166259765625, 0.44000244140625, 0.46337890625, 0.48675537109375, 0.5101318359375, 0.53350830078125, 0.556884765625, 0.58026123046875, 0.6036376953125, 0.62701416015625, 0.650390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 8.0, 8.0, 7.0, 13.0, 20.0, 28.0, 50.0, 77.0, 116.0, 302.0, 151.0, 83.0, 56.0, 25.0, 22.0, 12.0, 10.0, 2.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.602836608886719e-05, -5.3301453590393066e-05, -5.0574541091918945e-05, -4.7847628593444824e-05, -4.51207160949707e-05, -4.239380359649658e-05, -3.966689109802246e-05, -3.693997859954834e-05, -3.421306610107422e-05, -3.14861536026001e-05, -2.8759241104125977e-05, -2.6032328605651855e-05, -2.3305416107177734e-05, -2.0578503608703613e-05, -1.7851591110229492e-05, -1.5124678611755371e-05, -1.239776611328125e-05, -9.670853614807129e-06, -6.943941116333008e-06, -4.217028617858887e-06, -1.4901161193847656e-06, 1.2367963790893555e-06, 3.9637088775634766e-06, 6.690621376037598e-06, 9.417533874511719e-06, 1.214444637298584e-05, 1.4871358871459961e-05, 1.7598271369934082e-05, 2.0325183868408203e-05, 2.3052096366882324e-05, 2.5779008865356445e-05, 2.8505921363830566e-05, 3.123283386230469e-05, 3.395974636077881e-05, 3.668665885925293e-05, 3.941357135772705e-05, 4.214048385620117e-05, 4.486739635467529e-05, 4.7594308853149414e-05, 5.0321221351623535e-05, 5.3048133850097656e-05, 5.577504634857178e-05, 5.85019588470459e-05, 6.122887134552002e-05, 6.395578384399414e-05, 6.668269634246826e-05, 6.940960884094238e-05, 7.21365213394165e-05, 7.486343383789062e-05, 7.759034633636475e-05, 8.031725883483887e-05, 8.304417133331299e-05, 8.577108383178711e-05, 8.849799633026123e-05, 9.122490882873535e-05, 9.395182132720947e-05, 9.66787338256836e-05, 9.940564632415771e-05, 0.00010213255882263184, 0.00010485947132110596, 0.00010758638381958008, 0.0001103132963180542, 0.00011304020881652832, 0.00011576712131500244, 0.00011849403381347656]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 4.0, 12.0, 5.0, 20.0, 19.0, 23.0, 25.0, 34.0, 47.0, 76.0, 100.0, 146.0, 186.0, 338.0, 694.0, 1539.0, 5548.0, 54366.0, 918792.0, 57556.0, 5675.0, 1526.0, 653.0, 389.0, 241.0, 150.0, 96.0, 64.0, 52.0, 34.0, 30.0, 14.0, 26.0, 20.0, 12.0, 14.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.74609375, -0.7208099365234375, -0.695526123046875, -0.6702423095703125, -0.64495849609375, -0.6196746826171875, -0.594390869140625, -0.5691070556640625, -0.5438232421875, -0.5185394287109375, -0.493255615234375, -0.4679718017578125, -0.44268798828125, -0.4174041748046875, -0.392120361328125, -0.3668365478515625, -0.341552734375, -0.3162689208984375, -0.290985107421875, -0.2657012939453125, -0.24041748046875, -0.2151336669921875, -0.189849853515625, -0.1645660400390625, -0.1392822265625, -0.1139984130859375, -0.088714599609375, -0.0634307861328125, -0.03814697265625, -0.0128631591796875, 0.012420654296875, 0.0377044677734375, 0.06298828125, 0.0882720947265625, 0.113555908203125, 0.1388397216796875, 0.16412353515625, 0.1894073486328125, 0.214691162109375, 0.2399749755859375, 0.2652587890625, 0.2905426025390625, 0.315826416015625, 0.3411102294921875, 0.36639404296875, 0.3916778564453125, 0.416961669921875, 0.4422454833984375, 0.467529296875, 0.4928131103515625, 0.518096923828125, 0.5433807373046875, 0.56866455078125, 0.5939483642578125, 0.619232177734375, 0.6445159912109375, 0.6697998046875, 0.6950836181640625, 0.720367431640625, 0.7456512451171875, 0.77093505859375, 0.7962188720703125, 0.821502685546875, 0.8467864990234375, 0.8720703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 15.0, 7.0, 12.0, 16.0, 20.0, 27.0, 40.0, 78.0, 115.0, 243.0, 155.0, 80.0, 46.0, 38.0, 33.0, 16.0, 16.0, 16.0, 7.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2015380859375, -0.19429588317871094, -0.18705368041992188, -0.1798114776611328, -0.17256927490234375, -0.1653270721435547, -0.15808486938476562, -0.15084266662597656, -0.1436004638671875, -0.13635826110839844, -0.12911605834960938, -0.12187385559082031, -0.11463165283203125, -0.10738945007324219, -0.10014724731445312, -0.09290504455566406, -0.085662841796875, -0.07842063903808594, -0.07117843627929688, -0.06393623352050781, -0.05669403076171875, -0.04945182800292969, -0.042209625244140625, -0.03496742248535156, -0.0277252197265625, -0.020483016967773438, -0.013240814208984375, -0.0059986114501953125, 0.00124359130859375, 0.008485794067382812, 0.015727996826171875, 0.022970199584960938, 0.03021240234375, 0.03745460510253906, 0.044696807861328125, 0.05193901062011719, 0.05918121337890625, 0.06642341613769531, 0.07366561889648438, 0.08090782165527344, 0.0881500244140625, 0.09539222717285156, 0.10263442993164062, 0.10987663269042969, 0.11711883544921875, 0.12436103820800781, 0.13160324096679688, 0.13884544372558594, 0.146087646484375, 0.15332984924316406, 0.16057205200195312, 0.1678142547607422, 0.17505645751953125, 0.1822986602783203, 0.18954086303710938, 0.19678306579589844, 0.2040252685546875, 0.21126747131347656, 0.21850967407226562, 0.2257518768310547, 0.23299407958984375, 0.2402362823486328, 0.24747848510742188, 0.25472068786621094, 0.261962890625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 21.0, 54.0, 158.0, 361.0, 254.0, 94.0, 33.0, 8.0, 8.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.069937705993652, -3.862356424331665, -3.6547751426696777, -3.4471936225891113, -3.239612340927124, -3.0320310592651367, -2.8244495391845703, -2.616868257522583, -2.4092869758605957, -2.2017056941986084, -1.9941242933273315, -1.7865428924560547, -1.5789616107940674, -1.37138032913208, -1.1637989282608032, -0.9562175273895264, -0.7486362457275391, -0.541054904460907, -0.3334735631942749, -0.12589222192764282, 0.08168911933898926, 0.28927040100097656, 0.4968518018722534, 0.7044332027435303, 0.9120144844055176, 1.1195957660675049, 1.3271771669387817, 1.5347585678100586, 1.742339849472046, 1.9499211311340332, 2.1575026512145996, 2.365083932876587, 2.572665214538574, 2.7802464962005615, 2.987827777862549, 3.1954092979431152, 3.4029905796051025, 3.61057186126709, 3.8181533813476562, 4.025734901428223, 4.233315944671631, 4.440897464752197, 4.6484785079956055, 4.856060028076172, 5.063641548156738, 5.2712225914001465, 5.478804111480713, 5.686385154724121, 5.8939666748046875, 6.101548194885254, 6.309129238128662, 6.5167107582092285, 6.724291801452637, 6.931873321533203, 7.1394548416137695, 7.347036361694336, 7.554617404937744, 7.7621989250183105, 7.969779968261719, 8.177361488342285, 8.384943008422852, 8.592523574829102, 8.800105094909668, 9.007686614990234, 9.2152681350708]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 2.0, 10.0, 6.0, 7.0, 6.0, 14.0, 9.0, 21.0, 27.0, 29.0, 39.0, 24.0, 37.0, 30.0, 54.0, 43.0, 54.0, 49.0, 49.0, 34.0, 45.0, 51.0, 50.0, 49.0, 37.0, 33.0, 32.0, 27.0, 20.0, 22.0, 11.0, 18.0, 20.0, 9.0, 8.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3316848278045654, -2.250019073486328, -2.16835355758667, -2.0866880416870117, -2.0050222873687744, -1.9233566522598267, -1.841691017150879, -1.7600253820419312, -1.6783597469329834, -1.5966941118240356, -1.515028476715088, -1.4333628416061401, -1.3516972064971924, -1.2700315713882446, -1.1883659362792969, -1.1067003011703491, -1.0250346660614014, -0.9433690309524536, -0.8617033958435059, -0.7800377607345581, -0.6983721256256104, -0.6167064905166626, -0.5350408554077148, -0.4533752202987671, -0.37170958518981934, -0.2900439500808716, -0.20837831497192383, -0.12671267986297607, -0.04504704475402832, 0.036618590354919434, 0.11828422546386719, 0.19994986057281494, 0.2816157341003418, 0.36328136920928955, 0.4449470043182373, 0.5266126394271851, 0.6082782745361328, 0.6899439096450806, 0.7716095447540283, 0.8532751798629761, 0.9349408149719238, 1.0166064500808716, 1.0982720851898193, 1.179937720298767, 1.2616033554077148, 1.3432689905166626, 1.4249346256256104, 1.506600260734558, 1.5882658958435059, 1.6699315309524536, 1.7515971660614014, 1.8332628011703491, 1.9149284362792969, 1.9965940713882446, 2.0782597064971924, 2.1599254608154297, 2.241590976715088, 2.323256492614746, 2.4049222469329834, 2.4865880012512207, 2.568253517150879, 2.649919033050537, 2.7315847873687744, 2.8132505416870117, 2.89491605758667]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 5.0, 11.0, 10.0, 17.0, 28.0, 34.0, 78.0, 111.0, 139.0, 250.0, 474.0, 891.0, 2099.0, 7984.0, 92449.0, 3778264.0, 295043.0, 11507.0, 2686.0, 1018.0, 491.0, 237.0, 154.0, 93.0, 57.0, 38.0, 38.0, 20.0, 16.0, 14.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83984375, -2.7528076171875, -2.665771484375, -2.5787353515625, -2.49169921875, -2.4046630859375, -2.317626953125, -2.2305908203125, -2.1435546875, -2.0565185546875, -1.969482421875, -1.8824462890625, -1.79541015625, -1.7083740234375, -1.621337890625, -1.5343017578125, -1.447265625, -1.3602294921875, -1.273193359375, -1.1861572265625, -1.09912109375, -1.0120849609375, -0.925048828125, -0.8380126953125, -0.7509765625, -0.6639404296875, -0.576904296875, -0.4898681640625, -0.40283203125, -0.3157958984375, -0.228759765625, -0.1417236328125, -0.0546875, 0.0323486328125, 0.119384765625, 0.2064208984375, 0.29345703125, 0.3804931640625, 0.467529296875, 0.5545654296875, 0.6416015625, 0.7286376953125, 0.815673828125, 0.9027099609375, 0.98974609375, 1.0767822265625, 1.163818359375, 1.2508544921875, 1.337890625, 1.4249267578125, 1.511962890625, 1.5989990234375, 1.68603515625, 1.7730712890625, 1.860107421875, 1.9471435546875, 2.0341796875, 2.1212158203125, 2.208251953125, 2.2952880859375, 2.38232421875, 2.4693603515625, 2.556396484375, 2.6434326171875, 2.73046875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 12.0, 12.0, 12.0, 19.0, 13.0, 31.0, 38.0, 32.0, 44.0, 59.0, 47.0, 59.0, 69.0, 66.0, 60.0, 61.0, 48.0, 56.0, 51.0, 38.0, 28.0, 36.0, 30.0, 16.0, 10.0, 10.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.83447265625, -0.8041000366210938, -0.7737274169921875, -0.7433547973632812, -0.712982177734375, -0.6826095581054688, -0.6522369384765625, -0.6218643188476562, -0.59149169921875, -0.5611190795898438, -0.5307464599609375, -0.5003738403320312, -0.470001220703125, -0.43962860107421875, -0.4092559814453125, -0.37888336181640625, -0.3485107421875, -0.31813812255859375, -0.2877655029296875, -0.25739288330078125, -0.227020263671875, -0.19664764404296875, -0.1662750244140625, -0.13590240478515625, -0.10552978515625, -0.07515716552734375, -0.0447845458984375, -0.01441192626953125, 0.015960693359375, 0.04633331298828125, 0.0767059326171875, 0.10707855224609375, 0.137451171875, 0.16782379150390625, 0.1981964111328125, 0.22856903076171875, 0.258941650390625, 0.28931427001953125, 0.3196868896484375, 0.35005950927734375, 0.38043212890625, 0.41080474853515625, 0.4411773681640625, 0.47154998779296875, 0.501922607421875, 0.5322952270507812, 0.5626678466796875, 0.5930404663085938, 0.6234130859375, 0.6537857055664062, 0.6841583251953125, 0.7145309448242188, 0.744903564453125, 0.7752761840820312, 0.8056488037109375, 0.8360214233398438, 0.86639404296875, 0.8967666625976562, 0.9271392822265625, 0.9575119018554688, 0.987884521484375, 1.0182571411132812, 1.0486297607421875, 1.0790023803710938, 1.109375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 12.0, 11.0, 24.0, 32.0, 75.0, 139.0, 316.0, 692.0, 1880.0, 6989.0, 45434.0, 3086619.0, 1016476.0, 27774.0, 5146.0, 1487.0, 586.0, 257.0, 138.0, 64.0, 48.0, 29.0, 13.0, 13.0, 7.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.90625, -1.835357666015625, -1.76446533203125, -1.693572998046875, -1.6226806640625, -1.551788330078125, -1.48089599609375, -1.410003662109375, -1.339111328125, -1.268218994140625, -1.19732666015625, -1.126434326171875, -1.0555419921875, -0.984649658203125, -0.91375732421875, -0.842864990234375, -0.77197265625, -0.701080322265625, -0.63018798828125, -0.559295654296875, -0.4884033203125, -0.417510986328125, -0.34661865234375, -0.275726318359375, -0.204833984375, -0.133941650390625, -0.06304931640625, 0.007843017578125, 0.0787353515625, 0.149627685546875, 0.22052001953125, 0.291412353515625, 0.3623046875, 0.433197021484375, 0.50408935546875, 0.574981689453125, 0.6458740234375, 0.716766357421875, 0.78765869140625, 0.858551025390625, 0.929443359375, 1.000335693359375, 1.07122802734375, 1.142120361328125, 1.2130126953125, 1.283905029296875, 1.35479736328125, 1.425689697265625, 1.49658203125, 1.567474365234375, 1.63836669921875, 1.709259033203125, 1.7801513671875, 1.851043701171875, 1.92193603515625, 1.992828369140625, 2.063720703125, 2.134613037109375, 2.20550537109375, 2.276397705078125, 2.3472900390625, 2.418182373046875, 2.48907470703125, 2.559967041015625, 2.630859375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 4.0, 6.0, 4.0, 15.0, 19.0, 25.0, 29.0, 57.0, 82.0, 149.0, 296.0, 584.0, 875.0, 798.0, 501.0, 270.0, 137.0, 77.0, 51.0, 27.0, 21.0, 11.0, 11.0, 5.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5662879943847656, -0.5500564575195312, -0.5338249206542969, -0.5175933837890625, -0.5013618469238281, -0.48513031005859375, -0.4688987731933594, -0.452667236328125, -0.4364356994628906, -0.42020416259765625, -0.4039726257324219, -0.3877410888671875, -0.3715095520019531, -0.35527801513671875, -0.3390464782714844, -0.32281494140625, -0.3065834045410156, -0.29035186767578125, -0.2741203308105469, -0.2578887939453125, -0.24165725708007812, -0.22542572021484375, -0.20919418334960938, -0.192962646484375, -0.17673110961914062, -0.16049957275390625, -0.14426803588867188, -0.1280364990234375, -0.11180496215820312, -0.09557342529296875, -0.07934188842773438, -0.0631103515625, -0.046878814697265625, -0.03064727783203125, -0.014415740966796875, 0.0018157958984375, 0.018047332763671875, 0.03427886962890625, 0.050510406494140625, 0.066741943359375, 0.08297348022460938, 0.09920501708984375, 0.11543655395507812, 0.1316680908203125, 0.14789962768554688, 0.16413116455078125, 0.18036270141601562, 0.19659423828125, 0.21282577514648438, 0.22905731201171875, 0.24528884887695312, 0.2615203857421875, 0.2777519226074219, 0.29398345947265625, 0.3102149963378906, 0.326446533203125, 0.3426780700683594, 0.35890960693359375, 0.3751411437988281, 0.3913726806640625, 0.4076042175292969, 0.42383575439453125, 0.4400672912597656, 0.456298828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 18.0, 25.0, 49.0, 52.0, 93.0, 137.0, 161.0, 161.0, 106.0, 67.0, 53.0, 30.0, 12.0, 9.0, 10.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4348981380462646, -2.364973306655884, -2.295048475265503, -2.225123643875122, -2.155198812484741, -2.0852739810943604, -2.0153491497039795, -1.9454243183135986, -1.8754994869232178, -1.805574655532837, -1.735649824142456, -1.6657249927520752, -1.5958001613616943, -1.5258753299713135, -1.4559504985809326, -1.3860256671905518, -1.316100835800171, -1.24617600440979, -1.1762511730194092, -1.1063263416290283, -1.0364015102386475, -0.9664766788482666, -0.8965518474578857, -0.8266270160675049, -0.756702184677124, -0.6867773532867432, -0.6168525218963623, -0.5469276905059814, -0.4770028591156006, -0.4070780277252197, -0.33715319633483887, -0.267228364944458, -0.19730353355407715, -0.1273787021636963, -0.05745387077331543, 0.01247096061706543, 0.08239579200744629, 0.15232062339782715, 0.222245454788208, 0.29217028617858887, 0.3620951175689697, 0.4320199489593506, 0.5019447803497314, 0.5718696117401123, 0.6417944431304932, 0.711719274520874, 0.7816441059112549, 0.8515689373016357, 0.9214937686920166, 0.9914186000823975, 1.0613434314727783, 1.1312682628631592, 1.20119309425354, 1.271117925643921, 1.3410427570343018, 1.4109675884246826, 1.4808924198150635, 1.5508172512054443, 1.6207420825958252, 1.690666913986206, 1.760591745376587, 1.8305165767669678, 1.9004414081573486, 1.9703662395477295, 2.0402910709381104]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 4.0, 5.0, 17.0, 13.0, 11.0, 14.0, 22.0, 25.0, 23.0, 27.0, 31.0, 33.0, 36.0, 47.0, 38.0, 44.0, 37.0, 37.0, 46.0, 35.0, 37.0, 46.0, 55.0, 44.0, 34.0, 32.0, 23.0, 27.0, 15.0, 20.0, 15.0, 18.0, 17.0, 12.0, 6.0, 8.0, 10.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7492051124572754, -0.7236148715019226, -0.6980246901512146, -0.6724344491958618, -0.6468442678451538, -0.621254026889801, -0.5956637859344482, -0.5700736045837402, -0.5444833636283875, -0.5188931226730347, -0.49330294132232666, -0.4677127003669739, -0.4421224892139435, -0.4165322780609131, -0.3909420669078827, -0.3653518557548523, -0.3397616446018219, -0.3141714334487915, -0.2885812222957611, -0.2629910111427307, -0.23740077018737793, -0.21181055903434753, -0.18622034788131714, -0.16063012182712555, -0.13503991067409515, -0.10944969207048416, -0.08385947346687317, -0.05826926231384277, -0.03267904371023178, -0.007088825106620789, 0.018501386046409607, 0.044091612100601196, 0.06968182325363159, 0.09527204185724258, 0.12086226046085358, 0.14645247161388397, 0.17204269766807556, 0.19763290882110596, 0.22322311997413635, 0.24881334602832794, 0.27440357208251953, 0.2999937832355499, 0.3255839943885803, 0.3511742353439331, 0.3767644464969635, 0.4023546576499939, 0.4279448688030243, 0.4535350799560547, 0.4791252911090851, 0.5047155022621155, 0.5303057432174683, 0.5558959245681763, 0.581486165523529, 0.6070764064788818, 0.6326665878295898, 0.6582568287849426, 0.6838470101356506, 0.7094372510910034, 0.7350274324417114, 0.7606176733970642, 0.7862078547477722, 0.811798095703125, 0.837388277053833, 0.8629785180091858, 0.8885687589645386]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 5.0, 4.0, 5.0, 13.0, 17.0, 22.0, 32.0, 41.0, 57.0, 117.0, 205.0, 362.0, 656.0, 1235.0, 2368.0, 4953.0, 11935.0, 41902.0, 333614.0, 555331.0, 67395.0, 15782.0, 6339.0, 2890.0, 1457.0, 760.0, 410.0, 257.0, 132.0, 81.0, 59.0, 38.0, 25.0, 14.0, 10.0, 11.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396484375, -0.38187408447265625, -0.3672637939453125, -0.35265350341796875, -0.338043212890625, -0.32343292236328125, -0.3088226318359375, -0.29421234130859375, -0.27960205078125, -0.26499176025390625, -0.2503814697265625, -0.23577117919921875, -0.221160888671875, -0.20655059814453125, -0.1919403076171875, -0.17733001708984375, -0.1627197265625, -0.14810943603515625, -0.1334991455078125, -0.11888885498046875, -0.104278564453125, -0.08966827392578125, -0.0750579833984375, -0.06044769287109375, -0.04583740234375, -0.03122711181640625, -0.0166168212890625, -0.00200653076171875, 0.012603759765625, 0.02721405029296875, 0.0418243408203125, 0.05643463134765625, 0.071044921875, 0.08565521240234375, 0.1002655029296875, 0.11487579345703125, 0.129486083984375, 0.14409637451171875, 0.1587066650390625, 0.17331695556640625, 0.18792724609375, 0.20253753662109375, 0.2171478271484375, 0.23175811767578125, 0.246368408203125, 0.26097869873046875, 0.2755889892578125, 0.29019927978515625, 0.3048095703125, 0.31941986083984375, 0.3340301513671875, 0.34864044189453125, 0.363250732421875, 0.37786102294921875, 0.3924713134765625, 0.40708160400390625, 0.42169189453125, 0.43630218505859375, 0.4509124755859375, 0.46552276611328125, 0.480133056640625, 0.49474334716796875, 0.5093536376953125, 0.5239639282226562, 0.53857421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 7.0, 5.0, 12.0, 10.0, 18.0, 14.0, 25.0, 20.0, 30.0, 28.0, 38.0, 28.0, 39.0, 53.0, 47.0, 43.0, 49.0, 50.0, 46.0, 48.0, 42.0, 40.0, 48.0, 45.0, 25.0, 26.0, 18.0, 21.0, 26.0, 12.0, 12.0, 10.0, 12.0, 8.0, 7.0, 11.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6533203125, -0.6338348388671875, -0.614349365234375, -0.5948638916015625, -0.57537841796875, -0.5558929443359375, -0.536407470703125, -0.5169219970703125, -0.4974365234375, -0.4779510498046875, -0.458465576171875, -0.4389801025390625, -0.41949462890625, -0.4000091552734375, -0.380523681640625, -0.3610382080078125, -0.341552734375, -0.3220672607421875, -0.302581787109375, -0.2830963134765625, -0.26361083984375, -0.2441253662109375, -0.224639892578125, -0.2051544189453125, -0.1856689453125, -0.1661834716796875, -0.146697998046875, -0.1272125244140625, -0.10772705078125, -0.0882415771484375, -0.068756103515625, -0.0492706298828125, -0.02978515625, -0.0102996826171875, 0.009185791015625, 0.0286712646484375, 0.04815673828125, 0.0676422119140625, 0.087127685546875, 0.1066131591796875, 0.1260986328125, 0.1455841064453125, 0.165069580078125, 0.1845550537109375, 0.20404052734375, 0.2235260009765625, 0.243011474609375, 0.2624969482421875, 0.281982421875, 0.3014678955078125, 0.320953369140625, 0.3404388427734375, 0.35992431640625, 0.3794097900390625, 0.398895263671875, 0.4183807373046875, 0.4378662109375, 0.4573516845703125, 0.476837158203125, 0.4963226318359375, 0.51580810546875, 0.5352935791015625, 0.554779052734375, 0.5742645263671875, 0.59375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 7.0, 9.0, 9.0, 14.0, 25.0, 28.0, 50.0, 73.0, 120.0, 192.0, 307.0, 496.0, 879.0, 1683.0, 3036.0, 5958.0, 13138.0, 33540.0, 110524.0, 397603.0, 340832.0, 89634.0, 28005.0, 11055.0, 5245.0, 2723.0, 1444.0, 783.0, 430.0, 251.0, 168.0, 106.0, 59.0, 41.0, 28.0, 19.0, 16.0, 9.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2489013671875, -0.2417736053466797, -0.23464584350585938, -0.22751808166503906, -0.22039031982421875, -0.21326255798339844, -0.20613479614257812, -0.1990070343017578, -0.1918792724609375, -0.1847515106201172, -0.17762374877929688, -0.17049598693847656, -0.16336822509765625, -0.15624046325683594, -0.14911270141601562, -0.1419849395751953, -0.134857177734375, -0.1277294158935547, -0.12060165405273438, -0.11347389221191406, -0.10634613037109375, -0.09921836853027344, -0.09209060668945312, -0.08496284484863281, -0.0778350830078125, -0.07070732116699219, -0.06357955932617188, -0.05645179748535156, -0.04932403564453125, -0.04219627380371094, -0.035068511962890625, -0.027940750122070312, -0.02081298828125, -0.013685226440429688, -0.006557464599609375, 0.0005702972412109375, 0.00769805908203125, 0.014825820922851562, 0.021953582763671875, 0.029081344604492188, 0.0362091064453125, 0.04333686828613281, 0.050464630126953125, 0.05759239196777344, 0.06472015380859375, 0.07184791564941406, 0.07897567749023438, 0.08610343933105469, 0.093231201171875, 0.10035896301269531, 0.10748672485351562, 0.11461448669433594, 0.12174224853515625, 0.12887001037597656, 0.13599777221679688, 0.1431255340576172, 0.1502532958984375, 0.1573810577392578, 0.16450881958007812, 0.17163658142089844, 0.17876434326171875, 0.18589210510253906, 0.19301986694335938, 0.2001476287841797, 0.207275390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 3.0, 6.0, 5.0, 11.0, 8.0, 13.0, 8.0, 20.0, 19.0, 25.0, 18.0, 26.0, 28.0, 26.0, 40.0, 38.0, 44.0, 38.0, 54.0, 38.0, 43.0, 44.0, 47.0, 57.0, 38.0, 40.0, 38.0, 33.0, 32.0, 26.0, 25.0, 18.0, 16.0, 11.0, 11.0, 11.0, 5.0, 10.0, 4.0, 5.0, 2.0, 5.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.166015625, -1.1275482177734375, -1.089080810546875, -1.0506134033203125, -1.01214599609375, -0.9736785888671875, -0.935211181640625, -0.8967437744140625, -0.8582763671875, -0.8198089599609375, -0.781341552734375, -0.7428741455078125, -0.70440673828125, -0.6659393310546875, -0.627471923828125, -0.5890045166015625, -0.550537109375, -0.5120697021484375, -0.473602294921875, -0.4351348876953125, -0.39666748046875, -0.3582000732421875, -0.319732666015625, -0.2812652587890625, -0.2427978515625, -0.2043304443359375, -0.165863037109375, -0.1273956298828125, -0.08892822265625, -0.0504608154296875, -0.011993408203125, 0.0264739990234375, 0.06494140625, 0.1034088134765625, 0.141876220703125, 0.1803436279296875, 0.21881103515625, 0.2572784423828125, 0.295745849609375, 0.3342132568359375, 0.3726806640625, 0.4111480712890625, 0.449615478515625, 0.4880828857421875, 0.52655029296875, 0.5650177001953125, 0.603485107421875, 0.6419525146484375, 0.680419921875, 0.7188873291015625, 0.757354736328125, 0.7958221435546875, 0.83428955078125, 0.8727569580078125, 0.911224365234375, 0.9496917724609375, 0.9881591796875, 1.0266265869140625, 1.065093994140625, 1.1035614013671875, 1.14202880859375, 1.1804962158203125, 1.218963623046875, 1.2574310302734375, 1.2958984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 17.0, 11.0, 10.0, 27.0, 28.0, 34.0, 64.0, 117.0, 182.0, 326.0, 517.0, 1057.0, 2036.0, 4688.0, 12753.0, 49454.0, 254611.0, 520341.0, 154109.0, 31658.0, 9341.0, 3603.0, 1605.0, 813.0, 441.0, 263.0, 176.0, 91.0, 55.0, 32.0, 23.0, 21.0, 7.0, 11.0, 10.0, 2.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08233642578125, -0.07979106903076172, -0.07724571228027344, -0.07470035552978516, -0.07215499877929688, -0.0696096420288086, -0.06706428527832031, -0.06451892852783203, -0.06197357177734375, -0.05942821502685547, -0.05688285827636719, -0.054337501525878906, -0.051792144775390625, -0.049246788024902344, -0.04670143127441406, -0.04415607452392578, -0.0416107177734375, -0.03906536102294922, -0.03652000427246094, -0.033974647521972656, -0.031429290771484375, -0.028883934020996094, -0.026338577270507812, -0.02379322052001953, -0.02124786376953125, -0.01870250701904297, -0.016157150268554688, -0.013611793518066406, -0.011066436767578125, -0.008521080017089844, -0.0059757232666015625, -0.0034303665161132812, -0.000885009765625, 0.0016603469848632812, 0.0042057037353515625, 0.006751060485839844, 0.009296417236328125, 0.011841773986816406, 0.014387130737304688, 0.01693248748779297, 0.01947784423828125, 0.02202320098876953, 0.024568557739257812, 0.027113914489746094, 0.029659271240234375, 0.032204627990722656, 0.03474998474121094, 0.03729534149169922, 0.0398406982421875, 0.04238605499267578, 0.04493141174316406, 0.047476768493652344, 0.050022125244140625, 0.052567481994628906, 0.05511283874511719, 0.05765819549560547, 0.06020355224609375, 0.06274890899658203, 0.06529426574707031, 0.0678396224975586, 0.07038497924804688, 0.07293033599853516, 0.07547569274902344, 0.07802104949951172, 0.08056640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 6.0, 10.0, 8.0, 14.0, 24.0, 22.0, 32.0, 45.0, 62.0, 90.0, 72.0, 91.0, 92.0, 91.0, 87.0, 65.0, 43.0, 33.0, 32.0, 15.0, 16.0, 9.0, 5.0, 6.0, 6.0, 6.0, 8.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.612041473388672e-05, -3.492925316095352e-05, -3.3738091588020325e-05, -3.254693001508713e-05, -3.135576844215393e-05, -3.0164606869220734e-05, -2.8973445296287537e-05, -2.778228372335434e-05, -2.6591122150421143e-05, -2.5399960577487946e-05, -2.420879900455475e-05, -2.301763743162155e-05, -2.1826475858688354e-05, -2.0635314285755157e-05, -1.944415271282196e-05, -1.8252991139888763e-05, -1.7061829566955566e-05, -1.587066799402237e-05, -1.4679506421089172e-05, -1.3488344848155975e-05, -1.2297183275222778e-05, -1.1106021702289581e-05, -9.914860129356384e-06, -8.723698556423187e-06, -7.53253698348999e-06, -6.341375410556793e-06, -5.150213837623596e-06, -3.959052264690399e-06, -2.767890691757202e-06, -1.5767291188240051e-06, -3.855675458908081e-07, 8.055940270423889e-07, 1.996755599975586e-06, 3.187917172908783e-06, 4.37907874584198e-06, 5.570240318775177e-06, 6.761401891708374e-06, 7.952563464641571e-06, 9.143725037574768e-06, 1.0334886610507965e-05, 1.1526048183441162e-05, 1.2717209756374359e-05, 1.3908371329307556e-05, 1.5099532902240753e-05, 1.629069447517395e-05, 1.7481856048107147e-05, 1.8673017621040344e-05, 1.986417919397354e-05, 2.1055340766906738e-05, 2.2246502339839935e-05, 2.3437663912773132e-05, 2.462882548570633e-05, 2.5819987058639526e-05, 2.7011148631572723e-05, 2.820231020450592e-05, 2.9393471777439117e-05, 3.0584633350372314e-05, 3.177579492330551e-05, 3.296695649623871e-05, 3.4158118069171906e-05, 3.53492796421051e-05, 3.65404412150383e-05, 3.7731602787971497e-05, 3.8922764360904694e-05, 4.011392593383789e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 4.0, 6.0, 8.0, 6.0, 11.0, 23.0, 31.0, 74.0, 117.0, 198.0, 375.0, 856.0, 2116.0, 6204.0, 24994.0, 143571.0, 565553.0, 249919.0, 40340.0, 9103.0, 2829.0, 1129.0, 501.0, 237.0, 139.0, 85.0, 34.0, 27.0, 13.0, 16.0, 5.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.104736328125, -0.10142707824707031, -0.09811782836914062, -0.09480857849121094, -0.09149932861328125, -0.08819007873535156, -0.08488082885742188, -0.08157157897949219, -0.0782623291015625, -0.07495307922363281, -0.07164382934570312, -0.06833457946777344, -0.06502532958984375, -0.06171607971191406, -0.058406829833984375, -0.05509757995605469, -0.051788330078125, -0.04847908020019531, -0.045169830322265625, -0.04186058044433594, -0.03855133056640625, -0.03524208068847656, -0.031932830810546875, -0.028623580932617188, -0.0253143310546875, -0.022005081176757812, -0.018695831298828125, -0.015386581420898438, -0.01207733154296875, -0.008768081665039062, -0.005458831787109375, -0.0021495819091796875, 0.00115966796875, 0.0044689178466796875, 0.007778167724609375, 0.011087417602539062, 0.01439666748046875, 0.017705917358398438, 0.021015167236328125, 0.024324417114257812, 0.0276336669921875, 0.030942916870117188, 0.034252166748046875, 0.03756141662597656, 0.04087066650390625, 0.04417991638183594, 0.047489166259765625, 0.05079841613769531, 0.054107666015625, 0.05741691589355469, 0.060726165771484375, 0.06403541564941406, 0.06734466552734375, 0.07065391540527344, 0.07396316528320312, 0.07727241516113281, 0.0805816650390625, 0.08389091491699219, 0.08720016479492188, 0.09050941467285156, 0.09381866455078125, 0.09712791442871094, 0.10043716430664062, 0.10374641418457031, 0.1070556640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 0.0, 10.0, 14.0, 15.0, 27.0, 38.0, 48.0, 83.0, 79.0, 108.0, 100.0, 115.0, 96.0, 70.0, 61.0, 42.0, 29.0, 24.0, 10.0, 8.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03045654296875, -0.02939748764038086, -0.02833843231201172, -0.027279376983642578, -0.026220321655273438, -0.025161266326904297, -0.024102210998535156, -0.023043155670166016, -0.021984100341796875, -0.020925045013427734, -0.019865989685058594, -0.018806934356689453, -0.017747879028320312, -0.016688823699951172, -0.01562976837158203, -0.01457071304321289, -0.01351165771484375, -0.01245260238647461, -0.011393547058105469, -0.010334491729736328, -0.009275436401367188, -0.008216381072998047, -0.007157325744628906, -0.006098270416259766, -0.005039215087890625, -0.003980159759521484, -0.0029211044311523438, -0.0018620491027832031, -0.0008029937744140625, 0.0002560615539550781, 0.0013151168823242188, 0.0023741722106933594, 0.0034332275390625, 0.004492282867431641, 0.005551338195800781, 0.006610393524169922, 0.0076694488525390625, 0.008728504180908203, 0.009787559509277344, 0.010846614837646484, 0.011905670166015625, 0.012964725494384766, 0.014023780822753906, 0.015082836151123047, 0.016141891479492188, 0.017200946807861328, 0.01826000213623047, 0.01931905746459961, 0.02037811279296875, 0.02143716812133789, 0.02249622344970703, 0.023555278778076172, 0.024614334106445312, 0.025673389434814453, 0.026732444763183594, 0.027791500091552734, 0.028850555419921875, 0.029909610748291016, 0.030968666076660156, 0.0320277214050293, 0.03308677673339844, 0.03414583206176758, 0.03520488739013672, 0.03626394271850586, 0.037322998046875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 6.0, 10.0, 24.0, 22.0, 43.0, 65.0, 77.0, 132.0, 154.0, 138.0, 124.0, 79.0, 54.0, 21.0, 22.0, 12.0, 5.0, 1.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.242753028869629, -1.199507474899292, -1.1562620401382446, -1.1130164861679077, -1.0697710514068604, -1.0265254974365234, -0.9832800030708313, -0.9400345087051392, -0.896789014339447, -0.8535435199737549, -0.8102980256080627, -0.7670525312423706, -0.7238069772720337, -0.6805615425109863, -0.6373159885406494, -0.5940704941749573, -0.5508249998092651, -0.507579505443573, -0.46433401107788086, -0.42108848690986633, -0.3778429925441742, -0.33459749817848206, -0.29135197401046753, -0.2481064796447754, -0.20486098527908325, -0.1616154909133911, -0.11836998164653778, -0.07512447237968445, -0.03187897801399231, 0.011366516351699829, 0.054612040519714355, 0.0978575348854065, 0.14110314846038818, 0.18434864282608032, 0.22759415209293365, 0.270839661359787, 0.3140851557254791, 0.35733065009117126, 0.4005761742591858, 0.44382166862487793, 0.48706716299057007, 0.5303126573562622, 0.5735581517219543, 0.6168036460876465, 0.6600492000579834, 0.7032946348190308, 0.7465401887893677, 0.7897856831550598, 0.833031177520752, 0.8762766718864441, 0.9195221662521362, 0.9627677202224731, 1.0060131549835205, 1.0492587089538574, 1.0925042629241943, 1.1357496976852417, 1.178995132446289, 1.222240686416626, 1.2654861211776733, 1.3087316751480103, 1.3519771099090576, 1.3952226638793945, 1.4384682178497314, 1.4817136526107788, 1.5249592065811157]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 8.0, 8.0, 13.0, 18.0, 12.0, 26.0, 26.0, 24.0, 35.0, 32.0, 46.0, 42.0, 47.0, 43.0, 42.0, 42.0, 53.0, 57.0, 47.0, 48.0, 54.0, 34.0, 48.0, 18.0, 22.0, 21.0, 19.0, 18.0, 19.0, 17.0, 11.0, 6.0, 10.0, 5.0, 5.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6448963284492493, -0.6255130767822266, -0.6061298251152039, -0.5867465734481812, -0.5673632621765137, -0.547980010509491, -0.5285967588424683, -0.5092135071754456, -0.48983025550842285, -0.47044700384140015, -0.45106372237205505, -0.43168047070503235, -0.41229721903800964, -0.39291393756866455, -0.37353068590164185, -0.35414743423461914, -0.33476415276527405, -0.31538090109825134, -0.29599761962890625, -0.27661436796188354, -0.25723111629486084, -0.23784784972667694, -0.21846458315849304, -0.19908133149147034, -0.17969806492328644, -0.16031479835510254, -0.14093154668807983, -0.12154828011989594, -0.10216502100229263, -0.08278176188468933, -0.06339849531650543, -0.04401524364948273, -0.024631977081298828, -0.005248716101050377, 0.014134544879198074, 0.033517807722091675, 0.05290106683969498, 0.07228432595729828, 0.09166759252548218, 0.11105084419250488, 0.13043411076068878, 0.14981737732887268, 0.16920062899589539, 0.18858389556407928, 0.20796716213226318, 0.2273504137992859, 0.2467336803674698, 0.2661169171333313, 0.2855001986026764, 0.3048834502696991, 0.3242667317390442, 0.3436499834060669, 0.3630332350730896, 0.3824164867401123, 0.4017997682094574, 0.4211830198764801, 0.4405663013458252, 0.4599495530128479, 0.479332834482193, 0.4987160861492157, 0.5180993676185608, 0.5374826192855835, 0.5568658709526062, 0.5762491226196289, 0.5956323742866516]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 10.0, 10.0, 14.0, 12.0, 29.0, 49.0, 53.0, 91.0, 165.0, 221.0, 403.0, 692.0, 1370.0, 2892.0, 6818.0, 19327.0, 65930.0, 279510.0, 507130.0, 114531.0, 31236.0, 10269.0, 3830.0, 1738.0, 881.0, 501.0, 293.0, 192.0, 104.0, 68.0, 66.0, 29.0, 23.0, 29.0, 11.0, 12.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.86181640625, -0.8392562866210938, -0.8166961669921875, -0.7941360473632812, -0.771575927734375, -0.7490158081054688, -0.7264556884765625, -0.7038955688476562, -0.68133544921875, -0.6587753295898438, -0.6362152099609375, -0.6136550903320312, -0.591094970703125, -0.5685348510742188, -0.5459747314453125, -0.5234146118164062, -0.5008544921875, -0.47829437255859375, -0.4557342529296875, -0.43317413330078125, -0.410614013671875, -0.38805389404296875, -0.3654937744140625, -0.34293365478515625, -0.32037353515625, -0.29781341552734375, -0.2752532958984375, -0.25269317626953125, -0.230133056640625, -0.20757293701171875, -0.1850128173828125, -0.16245269775390625, -0.139892578125, -0.11733245849609375, -0.0947723388671875, -0.07221221923828125, -0.049652099609375, -0.02709197998046875, -0.0045318603515625, 0.01802825927734375, 0.04058837890625, 0.06314849853515625, 0.0857086181640625, 0.10826873779296875, 0.130828857421875, 0.15338897705078125, 0.1759490966796875, 0.19850921630859375, 0.2210693359375, 0.24362945556640625, 0.2661895751953125, 0.28874969482421875, 0.311309814453125, 0.33386993408203125, 0.3564300537109375, 0.37899017333984375, 0.40155029296875, 0.42411041259765625, 0.4466705322265625, 0.46923065185546875, 0.491790771484375, 0.5143508911132812, 0.5369110107421875, 0.5594711303710938, 0.58203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 10.0, 14.0, 22.0, 16.0, 21.0, 21.0, 41.0, 35.0, 37.0, 51.0, 51.0, 58.0, 59.0, 65.0, 50.0, 45.0, 62.0, 46.0, 62.0, 42.0, 28.0, 27.0, 25.0, 29.0, 17.0, 10.0, 11.0, 16.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.470703125, -1.428741455078125, -1.38677978515625, -1.344818115234375, -1.3028564453125, -1.260894775390625, -1.21893310546875, -1.176971435546875, -1.135009765625, -1.093048095703125, -1.05108642578125, -1.009124755859375, -0.9671630859375, -0.925201416015625, -0.88323974609375, -0.841278076171875, -0.79931640625, -0.757354736328125, -0.71539306640625, -0.673431396484375, -0.6314697265625, -0.589508056640625, -0.54754638671875, -0.505584716796875, -0.463623046875, -0.421661376953125, -0.37969970703125, -0.337738037109375, -0.2957763671875, -0.253814697265625, -0.21185302734375, -0.169891357421875, -0.1279296875, -0.085968017578125, -0.04400634765625, -0.002044677734375, 0.0399169921875, 0.081878662109375, 0.12384033203125, 0.165802001953125, 0.207763671875, 0.249725341796875, 0.29168701171875, 0.333648681640625, 0.3756103515625, 0.417572021484375, 0.45953369140625, 0.501495361328125, 0.54345703125, 0.585418701171875, 0.62738037109375, 0.669342041015625, 0.7113037109375, 0.753265380859375, 0.79522705078125, 0.837188720703125, 0.879150390625, 0.921112060546875, 0.96307373046875, 1.005035400390625, 1.0469970703125, 1.088958740234375, 1.13092041015625, 1.172882080078125, 1.21484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 7.0, 8.0, 12.0, 21.0, 23.0, 22.0, 38.0, 52.0, 75.0, 132.0, 230.0, 622.0, 3085.0, 127030.0, 900817.0, 14366.0, 1115.0, 374.0, 184.0, 104.0, 62.0, 44.0, 34.0, 22.0, 24.0, 17.0, 10.0, 10.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.873046875, -2.793792724609375, -2.71453857421875, -2.635284423828125, -2.5560302734375, -2.476776123046875, -2.39752197265625, -2.318267822265625, -2.239013671875, -2.159759521484375, -2.08050537109375, -2.001251220703125, -1.9219970703125, -1.842742919921875, -1.76348876953125, -1.684234619140625, -1.60498046875, -1.525726318359375, -1.44647216796875, -1.367218017578125, -1.2879638671875, -1.208709716796875, -1.12945556640625, -1.050201416015625, -0.970947265625, -0.891693115234375, -0.81243896484375, -0.733184814453125, -0.6539306640625, -0.574676513671875, -0.49542236328125, -0.416168212890625, -0.3369140625, -0.257659912109375, -0.17840576171875, -0.099151611328125, -0.0198974609375, 0.059356689453125, 0.13861083984375, 0.217864990234375, 0.297119140625, 0.376373291015625, 0.45562744140625, 0.534881591796875, 0.6141357421875, 0.693389892578125, 0.77264404296875, 0.851898193359375, 0.93115234375, 1.010406494140625, 1.08966064453125, 1.168914794921875, 1.2481689453125, 1.327423095703125, 1.40667724609375, 1.485931396484375, 1.565185546875, 1.644439697265625, 1.72369384765625, 1.802947998046875, 1.8822021484375, 1.961456298828125, 2.04071044921875, 2.119964599609375, 2.19921875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 7.0, 6.0, 8.0, 14.0, 17.0, 14.0, 11.0, 33.0, 17.0, 21.0, 30.0, 34.0, 51.0, 39.0, 59.0, 42.0, 75.0, 44.0, 60.0, 57.0, 49.0, 46.0, 43.0, 32.0, 48.0, 29.0, 14.0, 23.0, 20.0, 11.0, 11.0, 11.0, 4.0, 9.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.63671875, -1.5918731689453125, -1.547027587890625, -1.5021820068359375, -1.45733642578125, -1.4124908447265625, -1.367645263671875, -1.3227996826171875, -1.2779541015625, -1.2331085205078125, -1.188262939453125, -1.1434173583984375, -1.09857177734375, -1.0537261962890625, -1.008880615234375, -0.9640350341796875, -0.919189453125, -0.8743438720703125, -0.829498291015625, -0.7846527099609375, -0.73980712890625, -0.6949615478515625, -0.650115966796875, -0.6052703857421875, -0.5604248046875, -0.5155792236328125, -0.470733642578125, -0.4258880615234375, -0.38104248046875, -0.3361968994140625, -0.291351318359375, -0.2465057373046875, -0.20166015625, -0.1568145751953125, -0.111968994140625, -0.0671234130859375, -0.02227783203125, 0.0225677490234375, 0.067413330078125, 0.1122589111328125, 0.1571044921875, 0.2019500732421875, 0.246795654296875, 0.2916412353515625, 0.33648681640625, 0.3813323974609375, 0.426177978515625, 0.4710235595703125, 0.515869140625, 0.5607147216796875, 0.605560302734375, 0.6504058837890625, 0.69525146484375, 0.7400970458984375, 0.784942626953125, 0.8297882080078125, 0.8746337890625, 0.9194793701171875, 0.964324951171875, 1.0091705322265625, 1.05401611328125, 1.0988616943359375, 1.143707275390625, 1.1885528564453125, 1.2333984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 7.0, 6.0, 11.0, 9.0, 21.0, 30.0, 43.0, 64.0, 123.0, 196.0, 338.0, 713.0, 1777.0, 6353.0, 34418.0, 372180.0, 572345.0, 48242.0, 7848.0, 2080.0, 772.0, 392.0, 195.0, 119.0, 77.0, 56.0, 30.0, 26.0, 15.0, 10.0, 16.0, 3.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.3439521789550781, -0.33170318603515625, -0.3194541931152344, -0.3072052001953125, -0.2949562072753906, -0.28270721435546875, -0.2704582214355469, -0.258209228515625, -0.24596023559570312, -0.23371124267578125, -0.22146224975585938, -0.2092132568359375, -0.19696426391601562, -0.18471527099609375, -0.17246627807617188, -0.16021728515625, -0.14796829223632812, -0.13571929931640625, -0.12347030639648438, -0.1112213134765625, -0.09897232055664062, -0.08672332763671875, -0.07447433471679688, -0.062225341796875, -0.049976348876953125, -0.03772735595703125, -0.025478363037109375, -0.0132293701171875, -0.000980377197265625, 0.01126861572265625, 0.023517608642578125, 0.0357666015625, 0.048015594482421875, 0.06026458740234375, 0.07251358032226562, 0.0847625732421875, 0.09701156616210938, 0.10926055908203125, 0.12150955200195312, 0.133758544921875, 0.14600753784179688, 0.15825653076171875, 0.17050552368164062, 0.1827545166015625, 0.19500350952148438, 0.20725250244140625, 0.21950149536132812, 0.23175048828125, 0.24399948120117188, 0.25624847412109375, 0.2684974670410156, 0.2807464599609375, 0.2929954528808594, 0.30524444580078125, 0.3174934387207031, 0.329742431640625, 0.3419914245605469, 0.35424041748046875, 0.3664894104003906, 0.3787384033203125, 0.3909873962402344, 0.40323638916015625, 0.4154853820800781, 0.427734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 8.0, 6.0, 5.0, 6.0, 22.0, 20.0, 38.0, 42.0, 77.0, 109.0, 185.0, 135.0, 101.0, 68.0, 55.0, 28.0, 32.0, 20.0, 10.0, 7.0, 6.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56382942199707e-05, -7.358472794294357e-05, -7.153116166591644e-05, -6.947759538888931e-05, -6.742402911186218e-05, -6.537046283483505e-05, -6.331689655780792e-05, -6.126333028078079e-05, -5.920976400375366e-05, -5.715619772672653e-05, -5.51026314496994e-05, -5.304906517267227e-05, -5.099549889564514e-05, -4.894193261861801e-05, -4.688836634159088e-05, -4.483480006456375e-05, -4.278123378753662e-05, -4.072766751050949e-05, -3.867410123348236e-05, -3.662053495645523e-05, -3.45669686794281e-05, -3.251340240240097e-05, -3.045983612537384e-05, -2.840626984834671e-05, -2.635270357131958e-05, -2.429913729429245e-05, -2.224557101726532e-05, -2.019200474023819e-05, -1.813843846321106e-05, -1.608487218618393e-05, -1.40313059091568e-05, -1.197773963212967e-05, -9.924173355102539e-06, -7.870607078075409e-06, -5.817040801048279e-06, -3.7634745240211487e-06, -1.7099082469940186e-06, 3.4365803003311157e-07, 2.3972243070602417e-06, 4.450790584087372e-06, 6.504356861114502e-06, 8.557923138141632e-06, 1.0611489415168762e-05, 1.2665055692195892e-05, 1.4718621969223022e-05, 1.6772188246250153e-05, 1.8825754523277283e-05, 2.0879320800304413e-05, 2.2932887077331543e-05, 2.4986453354358673e-05, 2.7040019631385803e-05, 2.9093585908412933e-05, 3.1147152185440063e-05, 3.3200718462467194e-05, 3.5254284739494324e-05, 3.7307851016521454e-05, 3.9361417293548584e-05, 4.1414983570575714e-05, 4.3468549847602844e-05, 4.5522116124629974e-05, 4.7575682401657104e-05, 4.9629248678684235e-05, 5.1682814955711365e-05, 5.3736381232738495e-05, 5.5789947509765625e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 10.0, 7.0, 12.0, 26.0, 35.0, 30.0, 77.0, 139.0, 267.0, 644.0, 1659.0, 4498.0, 21034.0, 235908.0, 714210.0, 56873.0, 8600.0, 2676.0, 967.0, 423.0, 217.0, 97.0, 64.0, 26.0, 16.0, 8.0, 12.0, 9.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.6796875, -0.6635932922363281, -0.6474990844726562, -0.6314048767089844, -0.6153106689453125, -0.5992164611816406, -0.5831222534179688, -0.5670280456542969, -0.550933837890625, -0.5348396301269531, -0.5187454223632812, -0.5026512145996094, -0.4865570068359375, -0.4704627990722656, -0.45436859130859375, -0.4382743835449219, -0.42218017578125, -0.4060859680175781, -0.38999176025390625, -0.3738975524902344, -0.3578033447265625, -0.3417091369628906, -0.32561492919921875, -0.3095207214355469, -0.293426513671875, -0.2773323059082031, -0.26123809814453125, -0.24514389038085938, -0.2290496826171875, -0.21295547485351562, -0.19686126708984375, -0.18076705932617188, -0.1646728515625, -0.14857864379882812, -0.13248443603515625, -0.11639022827148438, -0.1002960205078125, -0.08420181274414062, -0.06810760498046875, -0.052013397216796875, -0.035919189453125, -0.019824981689453125, -0.00373077392578125, 0.012363433837890625, 0.0284576416015625, 0.044551849365234375, 0.06064605712890625, 0.07674026489257812, 0.09283447265625, 0.10892868041992188, 0.12502288818359375, 0.14111709594726562, 0.1572113037109375, 0.17330551147460938, 0.18939971923828125, 0.20549392700195312, 0.221588134765625, 0.23768234252929688, 0.25377655029296875, 0.2698707580566406, 0.2859649658203125, 0.3020591735839844, 0.31815338134765625, 0.3342475891113281, 0.350341796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 9.0, 24.0, 21.0, 21.0, 45.0, 64.0, 77.0, 98.0, 191.0, 117.0, 91.0, 72.0, 58.0, 23.0, 26.0, 12.0, 12.0, 3.0, 6.0, 4.0, 3.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12446022033691406, -0.11842727661132812, -0.11239433288574219, -0.10636138916015625, -0.10032844543457031, -0.09429550170898438, -0.08826255798339844, -0.0822296142578125, -0.07619667053222656, -0.07016372680664062, -0.06413078308105469, -0.05809783935546875, -0.05206489562988281, -0.046031951904296875, -0.03999900817871094, -0.033966064453125, -0.027933120727539062, -0.021900177001953125, -0.015867233276367188, -0.00983428955078125, -0.0038013458251953125, 0.002231597900390625, 0.008264541625976562, 0.0142974853515625, 0.020330429077148438, 0.026363372802734375, 0.03239631652832031, 0.03842926025390625, 0.04446220397949219, 0.050495147705078125, 0.05652809143066406, 0.06256103515625, 0.06859397888183594, 0.07462692260742188, 0.08065986633300781, 0.08669281005859375, 0.09272575378417969, 0.09875869750976562, 0.10479164123535156, 0.1108245849609375, 0.11685752868652344, 0.12289047241210938, 0.1289234161376953, 0.13495635986328125, 0.1409893035888672, 0.14702224731445312, 0.15305519104003906, 0.159088134765625, 0.16512107849121094, 0.17115402221679688, 0.1771869659423828, 0.18321990966796875, 0.1892528533935547, 0.19528579711914062, 0.20131874084472656, 0.2073516845703125, 0.21338462829589844, 0.21941757202148438, 0.2254505157470703, 0.23148345947265625, 0.2375164031982422, 0.24354934692382812, 0.24958229064941406, 0.255615234375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 7.0, 18.0, 45.0, 61.0, 143.0, 177.0, 196.0, 155.0, 102.0, 44.0, 29.0, 11.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.593125581741333, -2.4704627990722656, -2.3478000164031982, -2.225137233734131, -2.1024744510650635, -1.979811668395996, -1.8571490049362183, -1.7344862222671509, -1.6118234395980835, -1.4891606569290161, -1.3664978742599487, -1.243835210800171, -1.1211724281311035, -0.9985095858573914, -0.8758468627929688, -0.7531840801239014, -0.630521297454834, -0.5078585147857666, -0.3851957619190216, -0.2625330090522766, -0.13987022638320923, -0.017207443714141846, 0.10545527935028076, 0.22811806201934814, 0.3507808446884155, 0.4734436273574829, 0.5961064100265503, 0.7187691330909729, 0.8414319157600403, 0.9640946984291077, 1.0867574214935303, 1.2094202041625977, 1.332082748413086, 1.4547455310821533, 1.5774083137512207, 1.700071096420288, 1.8227338790893555, 1.9453966617584229, 2.0680594444274902, 2.1907219886779785, 2.313385009765625, 2.4360477924346924, 2.5587105751037598, 2.681373357772827, 2.8040361404418945, 2.926698923110962, 3.0493617057800293, 3.1720242500305176, 3.294687032699585, 3.4173498153686523, 3.5400125980377197, 3.662675380706787, 3.7853381633758545, 3.908000946044922, 4.03066349029541, 4.153326511383057, 4.275989055633545, 4.398651599884033, 4.52131462097168, 4.643977165222168, 4.7666401863098145, 4.889302730560303, 5.011965751647949, 5.1346282958984375, 5.257291316986084]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 5.0, 15.0, 14.0, 20.0, 19.0, 26.0, 23.0, 23.0, 28.0, 30.0, 33.0, 41.0, 38.0, 50.0, 47.0, 38.0, 37.0, 48.0, 45.0, 35.0, 30.0, 33.0, 38.0, 34.0, 29.0, 34.0, 24.0, 26.0, 18.0, 23.0, 18.0, 15.0, 10.0, 12.0, 8.0, 4.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0123181343078613, -1.9492347240447998, -1.8861511945724487, -1.8230676651000977, -1.7599842548370361, -1.6969008445739746, -1.6338173151016235, -1.5707337856292725, -1.507650375366211, -1.4445669651031494, -1.3814834356307983, -1.3183999061584473, -1.2553164958953857, -1.1922330856323242, -1.1291495561599731, -1.066066026687622, -1.0029826164245605, -0.9398991465568542, -0.876815676689148, -0.8137322068214417, -0.7506487369537354, -0.687565267086029, -0.6244817972183228, -0.5613983273506165, -0.49831485748291016, -0.43523138761520386, -0.37214791774749756, -0.30906444787979126, -0.24598097801208496, -0.18289750814437866, -0.11981403827667236, -0.056730568408966064, 0.006352901458740234, 0.06943637132644653, 0.13251984119415283, 0.19560331106185913, 0.25868678092956543, 0.32177025079727173, 0.384853720664978, 0.4479371905326843, 0.5110206604003906, 0.5741041302680969, 0.6371876001358032, 0.7002710700035095, 0.7633545398712158, 0.8264380097389221, 0.8895214796066284, 0.9526049494743347, 1.015688419342041, 1.0787718296051025, 1.1418553590774536, 1.2049388885498047, 1.2680222988128662, 1.3311057090759277, 1.3941892385482788, 1.4572727680206299, 1.5203561782836914, 1.583439588546753, 1.646523118019104, 1.709606647491455, 1.7726900577545166, 1.8357734680175781, 1.8988569974899292, 1.9619405269622803, 2.025023937225342]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 4.0, 10.0, 10.0, 21.0, 24.0, 46.0, 52.0, 71.0, 123.0, 175.0, 241.0, 384.0, 654.0, 1002.0, 1757.0, 3533.0, 8381.0, 29531.0, 210290.0, 2300380.0, 1490467.0, 114513.0, 19160.0, 6414.0, 2911.0, 1518.0, 907.0, 557.0, 368.0, 211.0, 147.0, 129.0, 81.0, 64.0, 31.0, 26.0, 19.0, 14.0, 16.0, 4.0, 10.0, 6.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.048828125, -1.0112152099609375, -0.973602294921875, -0.9359893798828125, -0.89837646484375, -0.8607635498046875, -0.823150634765625, -0.7855377197265625, -0.7479248046875, -0.7103118896484375, -0.672698974609375, -0.6350860595703125, -0.59747314453125, -0.5598602294921875, -0.522247314453125, -0.4846343994140625, -0.447021484375, -0.4094085693359375, -0.371795654296875, -0.3341827392578125, -0.29656982421875, -0.2589569091796875, -0.221343994140625, -0.1837310791015625, -0.1461181640625, -0.1085052490234375, -0.070892333984375, -0.0332794189453125, 0.00433349609375, 0.0419464111328125, 0.079559326171875, 0.1171722412109375, 0.15478515625, 0.1923980712890625, 0.230010986328125, 0.2676239013671875, 0.30523681640625, 0.3428497314453125, 0.380462646484375, 0.4180755615234375, 0.4556884765625, 0.4933013916015625, 0.530914306640625, 0.5685272216796875, 0.60614013671875, 0.6437530517578125, 0.681365966796875, 0.7189788818359375, 0.756591796875, 0.7942047119140625, 0.831817626953125, 0.8694305419921875, 0.90704345703125, 0.9446563720703125, 0.982269287109375, 1.0198822021484375, 1.0574951171875, 1.0951080322265625, 1.132720947265625, 1.1703338623046875, 1.20794677734375, 1.2455596923828125, 1.283172607421875, 1.3207855224609375, 1.3583984375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 9.0, 8.0, 13.0, 17.0, 13.0, 18.0, 20.0, 32.0, 37.0, 33.0, 38.0, 28.0, 50.0, 53.0, 58.0, 52.0, 48.0, 37.0, 57.0, 60.0, 37.0, 42.0, 31.0, 30.0, 20.0, 22.0, 25.0, 16.0, 16.0, 12.0, 11.0, 9.0, 7.0, 8.0, 7.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.59814453125, -0.5762481689453125, -0.554351806640625, -0.5324554443359375, -0.51055908203125, -0.4886627197265625, -0.466766357421875, -0.4448699951171875, -0.4229736328125, -0.4010772705078125, -0.379180908203125, -0.3572845458984375, -0.33538818359375, -0.3134918212890625, -0.291595458984375, -0.2696990966796875, -0.247802734375, -0.2259063720703125, -0.204010009765625, -0.1821136474609375, -0.16021728515625, -0.1383209228515625, -0.116424560546875, -0.0945281982421875, -0.0726318359375, -0.0507354736328125, -0.028839111328125, -0.0069427490234375, 0.01495361328125, 0.0368499755859375, 0.058746337890625, 0.0806427001953125, 0.1025390625, 0.1244354248046875, 0.146331787109375, 0.1682281494140625, 0.19012451171875, 0.2120208740234375, 0.233917236328125, 0.2558135986328125, 0.2777099609375, 0.2996063232421875, 0.321502685546875, 0.3433990478515625, 0.36529541015625, 0.3871917724609375, 0.409088134765625, 0.4309844970703125, 0.452880859375, 0.4747772216796875, 0.496673583984375, 0.5185699462890625, 0.54046630859375, 0.5623626708984375, 0.584259033203125, 0.6061553955078125, 0.6280517578125, 0.6499481201171875, 0.671844482421875, 0.6937408447265625, 0.71563720703125, 0.7375335693359375, 0.759429931640625, 0.7813262939453125, 0.80322265625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 7.0, 9.0, 13.0, 19.0, 23.0, 33.0, 50.0, 75.0, 128.0, 209.0, 348.0, 745.0, 1801.0, 5216.0, 22520.0, 324694.0, 3718928.0, 99772.0, 13202.0, 3651.0, 1314.0, 648.0, 318.0, 182.0, 114.0, 74.0, 49.0, 40.0, 26.0, 18.0, 13.0, 11.0, 8.0, 5.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.455078125, -2.3910369873046875, -2.326995849609375, -2.2629547119140625, -2.19891357421875, -2.1348724365234375, -2.070831298828125, -2.0067901611328125, -1.9427490234375, -1.8787078857421875, -1.814666748046875, -1.7506256103515625, -1.68658447265625, -1.6225433349609375, -1.558502197265625, -1.4944610595703125, -1.430419921875, -1.3663787841796875, -1.302337646484375, -1.2382965087890625, -1.17425537109375, -1.1102142333984375, -1.046173095703125, -0.9821319580078125, -0.9180908203125, -0.8540496826171875, -0.790008544921875, -0.7259674072265625, -0.66192626953125, -0.5978851318359375, -0.533843994140625, -0.4698028564453125, -0.40576171875, -0.3417205810546875, -0.277679443359375, -0.2136383056640625, -0.14959716796875, -0.0855560302734375, -0.021514892578125, 0.0425262451171875, 0.1065673828125, 0.1706085205078125, 0.234649658203125, 0.2986907958984375, 0.36273193359375, 0.4267730712890625, 0.490814208984375, 0.5548553466796875, 0.618896484375, 0.6829376220703125, 0.746978759765625, 0.8110198974609375, 0.87506103515625, 0.9391021728515625, 1.003143310546875, 1.0671844482421875, 1.1312255859375, 1.1952667236328125, 1.259307861328125, 1.3233489990234375, 1.38739013671875, 1.4514312744140625, 1.515472412109375, 1.5795135498046875, 1.6435546875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 2.0, 4.0, 6.0, 15.0, 12.0, 28.0, 23.0, 57.0, 100.0, 228.0, 559.0, 1029.0, 1063.0, 529.0, 211.0, 83.0, 48.0, 21.0, 16.0, 9.0, 6.0, 8.0, 7.0, 3.0, 5.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54541015625, -0.5243911743164062, -0.5033721923828125, -0.48235321044921875, -0.461334228515625, -0.44031524658203125, -0.4192962646484375, -0.39827728271484375, -0.37725830078125, -0.35623931884765625, -0.3352203369140625, -0.31420135498046875, -0.293182373046875, -0.27216339111328125, -0.2511444091796875, -0.23012542724609375, -0.2091064453125, -0.18808746337890625, -0.1670684814453125, -0.14604949951171875, -0.125030517578125, -0.10401153564453125, -0.0829925537109375, -0.06197357177734375, -0.04095458984375, -0.01993560791015625, 0.0010833740234375, 0.02210235595703125, 0.043121337890625, 0.06414031982421875, 0.0851593017578125, 0.10617828369140625, 0.127197265625, 0.14821624755859375, 0.1692352294921875, 0.19025421142578125, 0.211273193359375, 0.23229217529296875, 0.2533111572265625, 0.27433013916015625, 0.29534912109375, 0.31636810302734375, 0.3373870849609375, 0.35840606689453125, 0.379425048828125, 0.40044403076171875, 0.4214630126953125, 0.44248199462890625, 0.4635009765625, 0.48451995849609375, 0.5055389404296875, 0.5265579223632812, 0.547576904296875, 0.5685958862304688, 0.5896148681640625, 0.6106338500976562, 0.63165283203125, 0.6526718139648438, 0.6736907958984375, 0.6947097778320312, 0.715728759765625, 0.7367477416992188, 0.7577667236328125, 0.7787857055664062, 0.7998046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 10.0, 21.0, 30.0, 55.0, 113.0, 145.0, 172.0, 177.0, 111.0, 72.0, 45.0, 22.0, 11.0, 10.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.555267333984375, -3.479269504547119, -3.4032719135284424, -3.3272740840911865, -3.2512762546539307, -3.175278425216675, -3.099280834197998, -3.023283004760742, -2.9472851753234863, -2.8712873458862305, -2.7952897548675537, -2.719291925430298, -2.643294095993042, -2.567296266555786, -2.4912986755371094, -2.4153008460998535, -2.3393030166625977, -2.263305187225342, -2.187307596206665, -2.111309766769409, -2.0353119373321533, -1.959314227104187, -1.8833165168762207, -1.8073186874389648, -1.731321096420288, -1.6553233861923218, -1.579325556755066, -1.5033278465270996, -1.4273300170898438, -1.3513323068618774, -1.2753345966339111, -1.1993367671966553, -1.123339056968689, -1.0473413467407227, -0.9713435173034668, -0.8953458070755005, -0.8193479776382446, -0.7433502674102783, -0.6673524975776672, -0.5913547277450562, -0.5153569579124451, -0.439359188079834, -0.3633614182472229, -0.2873636782169342, -0.21136590838432312, -0.13536813855171204, -0.05937039852142334, 0.016627371311187744, 0.09262514114379883, 0.1686229109764099, 0.2446206659078598, 0.3206184208393097, 0.3966161906719208, 0.47261396050453186, 0.5486117005348206, 0.6246094703674316, 0.7006072402000427, 0.7766050100326538, 0.8526027798652649, 0.928600549697876, 1.0045982599258423, 1.0805960893630981, 1.1565937995910645, 1.2325916290283203, 1.3085893392562866]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 5.0, 4.0, 2.0, 7.0, 11.0, 10.0, 14.0, 20.0, 13.0, 13.0, 28.0, 20.0, 22.0, 38.0, 46.0, 45.0, 49.0, 52.0, 56.0, 51.0, 36.0, 41.0, 40.0, 44.0, 45.0, 44.0, 35.0, 40.0, 22.0, 27.0, 23.0, 14.0, 19.0, 18.0, 14.0, 10.0, 5.0, 4.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.9607695937156677, -0.9340108036994934, -0.9072520732879639, -0.8804932832717896, -0.8537344932556152, -0.8269757032394409, -0.8002169728279114, -0.7734581828117371, -0.7466993927955627, -0.7199406027793884, -0.6931818723678589, -0.6664230823516846, -0.6396642923355103, -0.6129055023193359, -0.5861467719078064, -0.5593879818916321, -0.5326292514801025, -0.5058704614639282, -0.4791117012500763, -0.45235294103622437, -0.42559415102005005, -0.3988353908061981, -0.3720766305923462, -0.3453178405761719, -0.31855905055999756, -0.29180029034614563, -0.2650415003299713, -0.23828274011611938, -0.21152395009994507, -0.18476518988609314, -0.15800641477108002, -0.1312476396560669, -0.10448884963989258, -0.07773007452487946, -0.05097130313515663, -0.024212531745433807, 0.002546243369579315, 0.02930501103401184, 0.05606378614902496, 0.08282256126403809, 0.10958133637905121, 0.13634011149406433, 0.16309888660907745, 0.18985766172409058, 0.2166164219379425, 0.24337519705295563, 0.27013397216796875, 0.29689276218414307, 0.323651522397995, 0.3504102826118469, 0.37716907262802124, 0.40392783284187317, 0.4306866228580475, 0.4574453830718994, 0.48420417308807373, 0.510962963104248, 0.5377216935157776, 0.5644804835319519, 0.5912392139434814, 0.6179980039596558, 0.6447567939758301, 0.6715155839920044, 0.6982743144035339, 0.7250331044197083, 0.7517918944358826]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 0.0, 3.0, 7.0, 6.0, 13.0, 13.0, 34.0, 35.0, 64.0, 108.0, 222.0, 436.0, 931.0, 1925.0, 4449.0, 11608.0, 50814.0, 578495.0, 350101.0, 33243.0, 9163.0, 3667.0, 1647.0, 734.0, 352.0, 202.0, 127.0, 53.0, 33.0, 22.0, 12.0, 17.0, 8.0, 4.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4052734375, -0.389617919921875, -0.37396240234375, -0.358306884765625, -0.3426513671875, -0.326995849609375, -0.31134033203125, -0.295684814453125, -0.280029296875, -0.264373779296875, -0.24871826171875, -0.233062744140625, -0.2174072265625, -0.201751708984375, -0.18609619140625, -0.170440673828125, -0.15478515625, -0.139129638671875, -0.12347412109375, -0.107818603515625, -0.0921630859375, -0.076507568359375, -0.06085205078125, -0.045196533203125, -0.029541015625, -0.013885498046875, 0.00177001953125, 0.017425537109375, 0.0330810546875, 0.048736572265625, 0.06439208984375, 0.080047607421875, 0.095703125, 0.111358642578125, 0.12701416015625, 0.142669677734375, 0.1583251953125, 0.173980712890625, 0.18963623046875, 0.205291748046875, 0.220947265625, 0.236602783203125, 0.25225830078125, 0.267913818359375, 0.2835693359375, 0.299224853515625, 0.31488037109375, 0.330535888671875, 0.34619140625, 0.361846923828125, 0.37750244140625, 0.393157958984375, 0.4088134765625, 0.424468994140625, 0.44012451171875, 0.455780029296875, 0.471435546875, 0.487091064453125, 0.50274658203125, 0.518402099609375, 0.5340576171875, 0.549713134765625, 0.56536865234375, 0.581024169921875, 0.5966796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 0.0, 4.0, 3.0, 8.0, 4.0, 16.0, 14.0, 16.0, 22.0, 22.0, 28.0, 33.0, 40.0, 47.0, 55.0, 64.0, 44.0, 48.0, 53.0, 52.0, 62.0, 53.0, 57.0, 48.0, 36.0, 31.0, 23.0, 22.0, 21.0, 14.0, 18.0, 11.0, 5.0, 12.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.68310546875, -0.6649665832519531, -0.6468276977539062, -0.6286888122558594, -0.6105499267578125, -0.5924110412597656, -0.5742721557617188, -0.5561332702636719, -0.537994384765625, -0.5198554992675781, -0.5017166137695312, -0.4835777282714844, -0.4654388427734375, -0.4472999572753906, -0.42916107177734375, -0.4110221862792969, -0.39288330078125, -0.3747444152832031, -0.35660552978515625, -0.3384666442871094, -0.3203277587890625, -0.3021888732910156, -0.28404998779296875, -0.2659111022949219, -0.247772216796875, -0.22963333129882812, -0.21149444580078125, -0.19335556030273438, -0.1752166748046875, -0.15707778930664062, -0.13893890380859375, -0.12080001831054688, -0.1026611328125, -0.08452224731445312, -0.06638336181640625, -0.048244476318359375, -0.0301055908203125, -0.011966705322265625, 0.00617218017578125, 0.024311065673828125, 0.042449951171875, 0.060588836669921875, 0.07872772216796875, 0.09686660766601562, 0.1150054931640625, 0.13314437866210938, 0.15128326416015625, 0.16942214965820312, 0.18756103515625, 0.20569992065429688, 0.22383880615234375, 0.24197769165039062, 0.2601165771484375, 0.2782554626464844, 0.29639434814453125, 0.3145332336425781, 0.332672119140625, 0.3508110046386719, 0.36894989013671875, 0.3870887756347656, 0.4052276611328125, 0.4233665466308594, 0.44150543212890625, 0.4596443176269531, 0.477783203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 20.0, 23.0, 17.0, 30.0, 39.0, 67.0, 116.0, 155.0, 225.0, 415.0, 654.0, 1108.0, 1925.0, 3547.0, 6771.0, 14688.0, 40185.0, 139074.0, 411374.0, 296270.0, 82834.0, 26318.0, 10687.0, 5323.0, 2692.0, 1526.0, 907.0, 518.0, 350.0, 221.0, 153.0, 89.0, 70.0, 48.0, 34.0, 15.0, 16.0, 10.0, 3.0, 7.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0], "bins": [-0.1866455078125, -0.18143272399902344, -0.17621994018554688, -0.1710071563720703, -0.16579437255859375, -0.1605815887451172, -0.15536880493164062, -0.15015602111816406, -0.1449432373046875, -0.13973045349121094, -0.13451766967773438, -0.1293048858642578, -0.12409210205078125, -0.11887931823730469, -0.11366653442382812, -0.10845375061035156, -0.103240966796875, -0.09802818298339844, -0.09281539916992188, -0.08760261535644531, -0.08238983154296875, -0.07717704772949219, -0.07196426391601562, -0.06675148010253906, -0.0615386962890625, -0.05632591247558594, -0.051113128662109375, -0.04590034484863281, -0.04068756103515625, -0.03547477722167969, -0.030261993408203125, -0.025049209594726562, -0.01983642578125, -0.014623641967773438, -0.009410858154296875, -0.0041980743408203125, 0.00101470947265625, 0.0062274932861328125, 0.011440277099609375, 0.016653060913085938, 0.0218658447265625, 0.027078628540039062, 0.032291412353515625, 0.03750419616699219, 0.04271697998046875, 0.04792976379394531, 0.053142547607421875, 0.05835533142089844, 0.063568115234375, 0.06878089904785156, 0.07399368286132812, 0.07920646667480469, 0.08441925048828125, 0.08963203430175781, 0.09484481811523438, 0.10005760192871094, 0.1052703857421875, 0.11048316955566406, 0.11569595336914062, 0.12090873718261719, 0.12612152099609375, 0.1313343048095703, 0.13654708862304688, 0.14175987243652344, 0.14697265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 8.0, 15.0, 21.0, 20.0, 18.0, 18.0, 21.0, 30.0, 35.0, 33.0, 53.0, 55.0, 49.0, 45.0, 53.0, 54.0, 46.0, 41.0, 42.0, 41.0, 29.0, 29.0, 34.0, 29.0, 24.0, 26.0, 15.0, 18.0, 11.0, 12.0, 7.0, 10.0, 9.0, 7.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8232421875, -0.79400634765625, -0.7647705078125, -0.73553466796875, -0.706298828125, -0.67706298828125, -0.6478271484375, -0.61859130859375, -0.58935546875, -0.56011962890625, -0.5308837890625, -0.50164794921875, -0.472412109375, -0.44317626953125, -0.4139404296875, -0.38470458984375, -0.35546875, -0.32623291015625, -0.2969970703125, -0.26776123046875, -0.238525390625, -0.20928955078125, -0.1800537109375, -0.15081787109375, -0.12158203125, -0.09234619140625, -0.0631103515625, -0.03387451171875, -0.004638671875, 0.02459716796875, 0.0538330078125, 0.08306884765625, 0.1123046875, 0.14154052734375, 0.1707763671875, 0.20001220703125, 0.229248046875, 0.25848388671875, 0.2877197265625, 0.31695556640625, 0.34619140625, 0.37542724609375, 0.4046630859375, 0.43389892578125, 0.463134765625, 0.49237060546875, 0.5216064453125, 0.55084228515625, 0.580078125, 0.60931396484375, 0.6385498046875, 0.66778564453125, 0.697021484375, 0.72625732421875, 0.7554931640625, 0.78472900390625, 0.81396484375, 0.84320068359375, 0.8724365234375, 0.90167236328125, 0.930908203125, 0.96014404296875, 0.9893798828125, 1.01861572265625, 1.0478515625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 10.0, 12.0, 24.0, 47.0, 94.0, 171.0, 395.0, 891.0, 2400.0, 7796.0, 38238.0, 383037.0, 545593.0, 55090.0, 9898.0, 2934.0, 1036.0, 444.0, 220.0, 93.0, 59.0, 22.0, 24.0, 12.0, 5.0, 2.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09906005859375, -0.09526348114013672, -0.09146690368652344, -0.08767032623291016, -0.08387374877929688, -0.0800771713256836, -0.07628059387207031, -0.07248401641845703, -0.06868743896484375, -0.06489086151123047, -0.06109428405761719, -0.057297706604003906, -0.053501129150390625, -0.049704551696777344, -0.04590797424316406, -0.04211139678955078, -0.0383148193359375, -0.03451824188232422, -0.030721664428710938, -0.026925086975097656, -0.023128509521484375, -0.019331932067871094, -0.015535354614257812, -0.011738777160644531, -0.00794219970703125, -0.004145622253417969, -0.0003490447998046875, 0.0034475326538085938, 0.007244110107421875, 0.011040687561035156, 0.014837265014648438, 0.01863384246826172, 0.022430419921875, 0.02622699737548828, 0.030023574829101562, 0.033820152282714844, 0.037616729736328125, 0.041413307189941406, 0.04520988464355469, 0.04900646209716797, 0.05280303955078125, 0.05659961700439453, 0.06039619445800781, 0.0641927719116211, 0.06798934936523438, 0.07178592681884766, 0.07558250427246094, 0.07937908172607422, 0.0831756591796875, 0.08697223663330078, 0.09076881408691406, 0.09456539154052734, 0.09836196899414062, 0.1021585464477539, 0.10595512390136719, 0.10975170135498047, 0.11354827880859375, 0.11734485626220703, 0.12114143371582031, 0.1249380111694336, 0.12873458862304688, 0.13253116607666016, 0.13632774353027344, 0.14012432098388672, 0.1439208984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 9.0, 6.0, 18.0, 17.0, 46.0, 69.0, 166.0, 222.0, 203.0, 103.0, 55.0, 33.0, 24.0, 12.0, 2.0, 4.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.936094284057617e-05, -9.67998057603836e-05, -9.423866868019104e-05, -9.167753159999847e-05, -8.911639451980591e-05, -8.655525743961334e-05, -8.399412035942078e-05, -8.143298327922821e-05, -7.887184619903564e-05, -7.631070911884308e-05, -7.374957203865051e-05, -7.118843495845795e-05, -6.862729787826538e-05, -6.606616079807281e-05, -6.350502371788025e-05, -6.094388663768768e-05, -5.838274955749512e-05, -5.582161247730255e-05, -5.3260475397109985e-05, -5.069933831691742e-05, -4.8138201236724854e-05, -4.557706415653229e-05, -4.301592707633972e-05, -4.0454789996147156e-05, -3.789365291595459e-05, -3.5332515835762024e-05, -3.277137875556946e-05, -3.0210241675376892e-05, -2.7649104595184326e-05, -2.508796751499176e-05, -2.2526830434799194e-05, -1.996569335460663e-05, -1.7404556274414062e-05, -1.4843419194221497e-05, -1.228228211402893e-05, -9.721145033836365e-06, -7.160007953643799e-06, -4.598870873451233e-06, -2.037733793258667e-06, 5.234032869338989e-07, 3.084540367126465e-06, 5.645677447319031e-06, 8.206814527511597e-06, 1.0767951607704163e-05, 1.3329088687896729e-05, 1.5890225768089294e-05, 1.845136284828186e-05, 2.1012499928474426e-05, 2.3573637008666992e-05, 2.6134774088859558e-05, 2.8695911169052124e-05, 3.125704824924469e-05, 3.3818185329437256e-05, 3.637932240962982e-05, 3.894045948982239e-05, 4.1501596570014954e-05, 4.406273365020752e-05, 4.6623870730400085e-05, 4.918500781059265e-05, 5.174614489078522e-05, 5.430728197097778e-05, 5.686841905117035e-05, 5.9429556131362915e-05, 6.199069321155548e-05, 6.455183029174805e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 9.0, 6.0, 16.0, 35.0, 44.0, 76.0, 151.0, 255.0, 530.0, 1037.0, 2539.0, 6975.0, 22303.0, 94417.0, 476392.0, 352882.0, 64707.0, 16814.0, 5426.0, 2060.0, 893.0, 444.0, 236.0, 137.0, 59.0, 36.0, 23.0, 17.0, 14.0, 7.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.128173828125, -0.12469863891601562, -0.12122344970703125, -0.11774826049804688, -0.1142730712890625, -0.11079788208007812, -0.10732269287109375, -0.10384750366210938, -0.100372314453125, -0.09689712524414062, -0.09342193603515625, -0.08994674682617188, -0.0864715576171875, -0.08299636840820312, -0.07952117919921875, -0.07604598999023438, -0.07257080078125, -0.06909561157226562, -0.06562042236328125, -0.062145233154296875, -0.0586700439453125, -0.055194854736328125, -0.05171966552734375, -0.048244476318359375, -0.044769287109375, -0.041294097900390625, -0.03781890869140625, -0.034343719482421875, -0.0308685302734375, -0.027393341064453125, -0.02391815185546875, -0.020442962646484375, -0.0169677734375, -0.013492584228515625, -0.01001739501953125, -0.006542205810546875, -0.0030670166015625, 0.000408172607421875, 0.00388336181640625, 0.007358551025390625, 0.010833740234375, 0.014308929443359375, 0.01778411865234375, 0.021259307861328125, 0.0247344970703125, 0.028209686279296875, 0.03168487548828125, 0.035160064697265625, 0.03863525390625, 0.042110443115234375, 0.04558563232421875, 0.049060821533203125, 0.0525360107421875, 0.056011199951171875, 0.05948638916015625, 0.06296157836914062, 0.066436767578125, 0.06991195678710938, 0.07338714599609375, 0.07686233520507812, 0.0803375244140625, 0.08381271362304688, 0.08728790283203125, 0.09076309204101562, 0.09423828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 8.0, 5.0, 8.0, 9.0, 18.0, 18.0, 27.0, 49.0, 51.0, 90.0, 82.0, 115.0, 98.0, 117.0, 75.0, 59.0, 43.0, 37.0, 28.0, 11.0, 9.0, 12.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0244598388671875, -0.023560762405395508, -0.022661685943603516, -0.021762609481811523, -0.02086353302001953, -0.01996445655822754, -0.019065380096435547, -0.018166303634643555, -0.017267227172851562, -0.01636815071105957, -0.015469074249267578, -0.014569997787475586, -0.013670921325683594, -0.012771844863891602, -0.01187276840209961, -0.010973691940307617, -0.010074615478515625, -0.009175539016723633, -0.00827646255493164, -0.0073773860931396484, -0.006478309631347656, -0.005579233169555664, -0.004680156707763672, -0.0037810802459716797, -0.0028820037841796875, -0.0019829273223876953, -0.0010838508605957031, -0.00018477439880371094, 0.0007143020629882812, 0.0016133785247802734, 0.0025124549865722656, 0.003411531448364258, 0.00431060791015625, 0.005209684371948242, 0.006108760833740234, 0.0070078372955322266, 0.007906913757324219, 0.008805990219116211, 0.009705066680908203, 0.010604143142700195, 0.011503219604492188, 0.01240229606628418, 0.013301372528076172, 0.014200448989868164, 0.015099525451660156, 0.01599860191345215, 0.01689767837524414, 0.017796754837036133, 0.018695831298828125, 0.019594907760620117, 0.02049398422241211, 0.0213930606842041, 0.022292137145996094, 0.023191213607788086, 0.024090290069580078, 0.02498936653137207, 0.025888442993164062, 0.026787519454956055, 0.027686595916748047, 0.02858567237854004, 0.02948474884033203, 0.030383825302124023, 0.031282901763916016, 0.03218197822570801, 0.0330810546875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 14.0, 19.0, 28.0, 60.0, 94.0, 130.0, 158.0, 168.0, 126.0, 73.0, 56.0, 28.0, 17.0, 9.0, 5.0, 3.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6006691455841064, -1.5624265670776367, -1.5241841077804565, -1.4859415292739868, -1.447698950767517, -1.4094563722610474, -1.3712139129638672, -1.3329713344573975, -1.2947287559509277, -1.256486177444458, -1.2182437181472778, -1.180001139640808, -1.1417585611343384, -1.1035159826278687, -1.0652735233306885, -1.0270309448242188, -0.9887884259223938, -0.9505459070205688, -0.9123033285140991, -0.8740608096122742, -0.8358182311058044, -0.7975757122039795, -0.7593331336975098, -0.7210906147956848, -0.6828480958938599, -0.6446055769920349, -0.6063629984855652, -0.5681204795837402, -0.5298779010772705, -0.49163538217544556, -0.4533928334712982, -0.4151502847671509, -0.3769076466560364, -0.33866509795188904, -0.3004225492477417, -0.26218003034591675, -0.22393746674060822, -0.18569491803646088, -0.14745238423347473, -0.10920983552932739, -0.07096728682518005, -0.03272474184632301, 0.005517803132534027, 0.04376034438610077, 0.08200289309024811, 0.12024544179439545, 0.1584879755973816, 0.19673052430152893, 0.23497307300567627, 0.2732156217098236, 0.31145817041397095, 0.3497006893157959, 0.3879432678222656, 0.4261857867240906, 0.4644283354282379, 0.5026708841323853, 0.540913462638855, 0.5791559815406799, 0.6173985600471497, 0.6556410789489746, 0.6938836574554443, 0.7321261763572693, 0.7703686952590942, 0.808611273765564, 0.8468537926673889]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 8.0, 8.0, 6.0, 19.0, 13.0, 17.0, 19.0, 17.0, 34.0, 30.0, 42.0, 48.0, 49.0, 54.0, 61.0, 51.0, 41.0, 52.0, 44.0, 54.0, 51.0, 39.0, 42.0, 34.0, 35.0, 23.0, 19.0, 21.0, 19.0, 9.0, 6.0, 5.0, 5.0, 4.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6077475547790527, -0.5911387801170349, -0.5745299458503723, -0.5579211711883545, -0.5413123369216919, -0.5247035622596741, -0.5080947875976562, -0.49148598313331604, -0.47487717866897583, -0.4582683742046356, -0.4416595697402954, -0.4250507950782776, -0.4084419906139374, -0.39183318614959717, -0.37522441148757935, -0.35861560702323914, -0.3420068025588989, -0.3253979980945587, -0.3087891936302185, -0.2921804189682007, -0.2755716145038605, -0.25896281003952026, -0.24235402047634125, -0.22574523091316223, -0.20913642644882202, -0.1925276219844818, -0.1759188324213028, -0.15931004285812378, -0.14270123839378357, -0.12609243392944336, -0.10948364436626434, -0.09287484735250473, -0.07626610994338989, -0.05965731292963028, -0.043048515915870667, -0.026439718902111053, -0.00983092188835144, 0.006777875125408173, 0.023386672139167786, 0.0399954691529274, 0.05660426616668701, 0.07321306318044662, 0.08982186019420624, 0.10643065720796585, 0.12303945422172546, 0.13964825868606567, 0.1562570482492447, 0.1728658378124237, 0.18947464227676392, 0.20608344674110413, 0.22269223630428314, 0.23930102586746216, 0.25590983033180237, 0.2725186347961426, 0.2891274094581604, 0.3057362139225006, 0.3223450183868408, 0.33895382285118103, 0.35556262731552124, 0.37217140197753906, 0.3887802064418793, 0.4053890109062195, 0.4219977855682373, 0.4386065900325775, 0.4552153944969177]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 21.0, 26.0, 41.0, 80.0, 161.0, 270.0, 565.0, 1143.0, 2494.0, 6392.0, 20757.0, 103645.0, 589174.0, 264020.0, 41895.0, 10759.0, 3826.0, 1621.0, 781.0, 408.0, 179.0, 102.0, 66.0, 45.0, 23.0, 16.0, 9.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7534408569335938, -0.7241668701171875, -0.6948928833007812, -0.665618896484375, -0.6363449096679688, -0.6070709228515625, -0.5777969360351562, -0.54852294921875, -0.5192489624023438, -0.4899749755859375, -0.46070098876953125, -0.431427001953125, -0.40215301513671875, -0.3728790283203125, -0.34360504150390625, -0.3143310546875, -0.28505706787109375, -0.2557830810546875, -0.22650909423828125, -0.197235107421875, -0.16796112060546875, -0.1386871337890625, -0.10941314697265625, -0.08013916015625, -0.05086517333984375, -0.0215911865234375, 0.00768280029296875, 0.036956787109375, 0.06623077392578125, 0.0955047607421875, 0.12477874755859375, 0.154052734375, 0.18332672119140625, 0.2126007080078125, 0.24187469482421875, 0.271148681640625, 0.30042266845703125, 0.3296966552734375, 0.35897064208984375, 0.38824462890625, 0.41751861572265625, 0.4467926025390625, 0.47606658935546875, 0.505340576171875, 0.5346145629882812, 0.5638885498046875, 0.5931625366210938, 0.6224365234375, 0.6517105102539062, 0.6809844970703125, 0.7102584838867188, 0.739532470703125, 0.7688064575195312, 0.7980804443359375, 0.8273544311523438, 0.85662841796875, 0.8859024047851562, 0.9151763916015625, 0.9444503784179688, 0.973724365234375, 1.0029983520507812, 1.0322723388671875, 1.0615463256835938, 1.0908203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 13.0, 10.0, 25.0, 22.0, 25.0, 41.0, 27.0, 52.0, 59.0, 76.0, 72.0, 65.0, 78.0, 64.0, 67.0, 60.0, 43.0, 41.0, 44.0, 27.0, 21.0, 21.0, 14.0, 8.0, 5.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7900390625, -1.7443389892578125, -1.698638916015625, -1.6529388427734375, -1.60723876953125, -1.5615386962890625, -1.515838623046875, -1.4701385498046875, -1.4244384765625, -1.3787384033203125, -1.333038330078125, -1.2873382568359375, -1.24163818359375, -1.1959381103515625, -1.150238037109375, -1.1045379638671875, -1.058837890625, -1.0131378173828125, -0.967437744140625, -0.9217376708984375, -0.87603759765625, -0.8303375244140625, -0.784637451171875, -0.7389373779296875, -0.6932373046875, -0.6475372314453125, -0.601837158203125, -0.5561370849609375, -0.51043701171875, -0.4647369384765625, -0.419036865234375, -0.3733367919921875, -0.32763671875, -0.2819366455078125, -0.236236572265625, -0.1905364990234375, -0.14483642578125, -0.0991363525390625, -0.053436279296875, -0.0077362060546875, 0.0379638671875, 0.0836639404296875, 0.129364013671875, 0.1750640869140625, 0.22076416015625, 0.2664642333984375, 0.312164306640625, 0.3578643798828125, 0.403564453125, 0.4492645263671875, 0.494964599609375, 0.5406646728515625, 0.58636474609375, 0.6320648193359375, 0.677764892578125, 0.7234649658203125, 0.7691650390625, 0.8148651123046875, 0.860565185546875, 0.9062652587890625, 0.95196533203125, 0.9976654052734375, 1.043365478515625, 1.0890655517578125, 1.134765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 11.0, 5.0, 11.0, 7.0, 15.0, 14.0, 30.0, 24.0, 33.0, 48.0, 79.0, 90.0, 136.0, 236.0, 448.0, 993.0, 2216.0, 6943.0, 29488.0, 250370.0, 659935.0, 76861.0, 13644.0, 3863.0, 1455.0, 633.0, 344.0, 187.0, 126.0, 76.0, 60.0, 49.0, 38.0, 28.0, 17.0, 17.0, 10.0, 6.0, 5.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88623046875, -0.8524703979492188, -0.8187103271484375, -0.7849502563476562, -0.751190185546875, -0.7174301147460938, -0.6836700439453125, -0.6499099731445312, -0.61614990234375, -0.5823898315429688, -0.5486297607421875, -0.5148696899414062, -0.481109619140625, -0.44734954833984375, -0.4135894775390625, -0.37982940673828125, -0.3460693359375, -0.31230926513671875, -0.2785491943359375, -0.24478912353515625, -0.211029052734375, -0.17726898193359375, -0.1435089111328125, -0.10974884033203125, -0.07598876953125, -0.04222869873046875, -0.0084686279296875, 0.02529144287109375, 0.059051513671875, 0.09281158447265625, 0.1265716552734375, 0.16033172607421875, 0.194091796875, 0.22785186767578125, 0.2616119384765625, 0.29537200927734375, 0.329132080078125, 0.36289215087890625, 0.3966522216796875, 0.43041229248046875, 0.46417236328125, 0.49793243408203125, 0.5316925048828125, 0.5654525756835938, 0.599212646484375, 0.6329727172851562, 0.6667327880859375, 0.7004928588867188, 0.7342529296875, 0.7680130004882812, 0.8017730712890625, 0.8355331420898438, 0.869293212890625, 0.9030532836914062, 0.9368133544921875, 0.9705734252929688, 1.00433349609375, 1.0380935668945312, 1.0718536376953125, 1.1056137084960938, 1.139373779296875, 1.1731338500976562, 1.2068939208984375, 1.2406539916992188, 1.2744140625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 8.0, 7.0, 17.0, 9.0, 16.0, 13.0, 15.0, 29.0, 14.0, 30.0, 33.0, 32.0, 54.0, 52.0, 53.0, 66.0, 61.0, 56.0, 58.0, 52.0, 50.0, 41.0, 34.0, 32.0, 18.0, 29.0, 19.0, 17.0, 23.0, 12.0, 12.0, 5.0, 7.0, 1.0, 3.0, 7.0, 4.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.30078125, -1.262359619140625, -1.22393798828125, -1.185516357421875, -1.1470947265625, -1.108673095703125, -1.07025146484375, -1.031829833984375, -0.993408203125, -0.954986572265625, -0.91656494140625, -0.878143310546875, -0.8397216796875, -0.801300048828125, -0.76287841796875, -0.724456787109375, -0.68603515625, -0.647613525390625, -0.60919189453125, -0.570770263671875, -0.5323486328125, -0.493927001953125, -0.45550537109375, -0.417083740234375, -0.378662109375, -0.340240478515625, -0.30181884765625, -0.263397216796875, -0.2249755859375, -0.186553955078125, -0.14813232421875, -0.109710693359375, -0.0712890625, -0.032867431640625, 0.00555419921875, 0.043975830078125, 0.0823974609375, 0.120819091796875, 0.15924072265625, 0.197662353515625, 0.236083984375, 0.274505615234375, 0.31292724609375, 0.351348876953125, 0.3897705078125, 0.428192138671875, 0.46661376953125, 0.505035400390625, 0.54345703125, 0.581878662109375, 0.62030029296875, 0.658721923828125, 0.6971435546875, 0.735565185546875, 0.77398681640625, 0.812408447265625, 0.850830078125, 0.889251708984375, 0.92767333984375, 0.966094970703125, 1.0045166015625, 1.042938232421875, 1.08135986328125, 1.119781494140625, 1.158203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 8.0, 9.0, 10.0, 17.0, 31.0, 36.0, 46.0, 103.0, 233.0, 493.0, 1425.0, 5066.0, 28683.0, 321141.0, 617878.0, 61596.0, 8382.0, 2055.0, 682.0, 317.0, 133.0, 76.0, 49.0, 28.0, 19.0, 8.0, 7.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.33349609375, -0.324981689453125, -0.31646728515625, -0.307952880859375, -0.2994384765625, -0.290924072265625, -0.28240966796875, -0.273895263671875, -0.265380859375, -0.256866455078125, -0.24835205078125, -0.239837646484375, -0.2313232421875, -0.222808837890625, -0.21429443359375, -0.205780029296875, -0.197265625, -0.188751220703125, -0.18023681640625, -0.171722412109375, -0.1632080078125, -0.154693603515625, -0.14617919921875, -0.137664794921875, -0.129150390625, -0.120635986328125, -0.11212158203125, -0.103607177734375, -0.0950927734375, -0.086578369140625, -0.07806396484375, -0.069549560546875, -0.06103515625, -0.052520751953125, -0.04400634765625, -0.035491943359375, -0.0269775390625, -0.018463134765625, -0.00994873046875, -0.001434326171875, 0.007080078125, 0.015594482421875, 0.02410888671875, 0.032623291015625, 0.0411376953125, 0.049652099609375, 0.05816650390625, 0.066680908203125, 0.0751953125, 0.083709716796875, 0.09222412109375, 0.100738525390625, 0.1092529296875, 0.117767333984375, 0.12628173828125, 0.134796142578125, 0.143310546875, 0.151824951171875, 0.16033935546875, 0.168853759765625, 0.1773681640625, 0.185882568359375, 0.19439697265625, 0.202911376953125, 0.21142578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 6.0, 12.0, 7.0, 20.0, 23.0, 30.0, 50.0, 38.0, 44.0, 72.0, 72.0, 78.0, 78.0, 77.0, 71.0, 48.0, 46.0, 43.0, 29.0, 20.0, 27.0, 18.0, 15.0, 16.0, 12.0, 8.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.7239322662353516e-05, -2.6467256247997284e-05, -2.5695189833641052e-05, -2.492312341928482e-05, -2.415105700492859e-05, -2.3378990590572357e-05, -2.2606924176216125e-05, -2.1834857761859894e-05, -2.1062791347503662e-05, -2.029072493314743e-05, -1.95186585187912e-05, -1.8746592104434967e-05, -1.7974525690078735e-05, -1.7202459275722504e-05, -1.6430392861366272e-05, -1.565832644701004e-05, -1.4886260032653809e-05, -1.4114193618297577e-05, -1.3342127203941345e-05, -1.2570060789585114e-05, -1.1797994375228882e-05, -1.102592796087265e-05, -1.0253861546516418e-05, -9.481795132160187e-06, -8.709728717803955e-06, -7.937662303447723e-06, -7.165595889091492e-06, -6.39352947473526e-06, -5.621463060379028e-06, -4.849396646022797e-06, -4.077330231666565e-06, -3.3052638173103333e-06, -2.5331974029541016e-06, -1.7611309885978699e-06, -9.890645742416382e-07, -2.169981598854065e-07, 5.550682544708252e-07, 1.3271346688270569e-06, 2.0992010831832886e-06, 2.8712674975395203e-06, 3.643333911895752e-06, 4.415400326251984e-06, 5.187466740608215e-06, 5.959533154964447e-06, 6.731599569320679e-06, 7.50366598367691e-06, 8.275732398033142e-06, 9.047798812389374e-06, 9.819865226745605e-06, 1.0591931641101837e-05, 1.1363998055458069e-05, 1.21360644698143e-05, 1.2908130884170532e-05, 1.3680197298526764e-05, 1.4452263712882996e-05, 1.5224330127239227e-05, 1.599639654159546e-05, 1.676846295595169e-05, 1.7540529370307922e-05, 1.8312595784664154e-05, 1.9084662199020386e-05, 1.9856728613376617e-05, 2.062879502773285e-05, 2.140086144208908e-05, 2.2172927856445312e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 4.0, 7.0, 13.0, 17.0, 40.0, 49.0, 65.0, 96.0, 166.0, 284.0, 396.0, 711.0, 1226.0, 2207.0, 4652.0, 11770.0, 39644.0, 172976.0, 518579.0, 220557.0, 49509.0, 14335.0, 5312.0, 2650.0, 1300.0, 754.0, 459.0, 288.0, 167.0, 109.0, 72.0, 44.0, 33.0, 20.0, 10.0, 8.0, 2.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.181396484375, -0.1752643585205078, -0.16913223266601562, -0.16300010681152344, -0.15686798095703125, -0.15073585510253906, -0.14460372924804688, -0.1384716033935547, -0.1323394775390625, -0.1262073516845703, -0.12007522583007812, -0.11394309997558594, -0.10781097412109375, -0.10167884826660156, -0.09554672241210938, -0.08941459655761719, -0.083282470703125, -0.07715034484863281, -0.07101821899414062, -0.06488609313964844, -0.05875396728515625, -0.05262184143066406, -0.046489715576171875, -0.04035758972167969, -0.0342254638671875, -0.028093338012695312, -0.021961212158203125, -0.015829086303710938, -0.00969696044921875, -0.0035648345947265625, 0.002567291259765625, 0.008699417114257812, 0.01483154296875, 0.020963668823242188, 0.027095794677734375, 0.03322792053222656, 0.03936004638671875, 0.04549217224121094, 0.051624298095703125, 0.05775642395019531, 0.0638885498046875, 0.07002067565917969, 0.07615280151367188, 0.08228492736816406, 0.08841705322265625, 0.09454917907714844, 0.10068130493164062, 0.10681343078613281, 0.112945556640625, 0.11907768249511719, 0.12520980834960938, 0.13134193420410156, 0.13747406005859375, 0.14360618591308594, 0.14973831176757812, 0.1558704376220703, 0.1620025634765625, 0.1681346893310547, 0.17426681518554688, 0.18039894104003906, 0.18653106689453125, 0.19266319274902344, 0.19879531860351562, 0.2049274444580078, 0.2110595703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 9.0, 10.0, 7.0, 15.0, 15.0, 16.0, 23.0, 28.0, 45.0, 40.0, 61.0, 74.0, 73.0, 78.0, 94.0, 68.0, 57.0, 38.0, 53.0, 38.0, 24.0, 20.0, 26.0, 15.0, 16.0, 17.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08807373046875, -0.08568096160888672, -0.08328819274902344, -0.08089542388916016, -0.07850265502929688, -0.0761098861694336, -0.07371711730957031, -0.07132434844970703, -0.06893157958984375, -0.06653881072998047, -0.06414604187011719, -0.061753273010253906, -0.059360504150390625, -0.056967735290527344, -0.05457496643066406, -0.05218219757080078, -0.0497894287109375, -0.04739665985107422, -0.04500389099121094, -0.042611122131347656, -0.040218353271484375, -0.037825584411621094, -0.03543281555175781, -0.03304004669189453, -0.03064727783203125, -0.02825450897216797, -0.025861740112304688, -0.023468971252441406, -0.021076202392578125, -0.018683433532714844, -0.016290664672851562, -0.013897895812988281, -0.011505126953125, -0.009112358093261719, -0.0067195892333984375, -0.004326820373535156, -0.001934051513671875, 0.00045871734619140625, 0.0028514862060546875, 0.005244255065917969, 0.00763702392578125, 0.010029792785644531, 0.012422561645507812, 0.014815330505371094, 0.017208099365234375, 0.019600868225097656, 0.021993637084960938, 0.02438640594482422, 0.0267791748046875, 0.02917194366455078, 0.03156471252441406, 0.033957481384277344, 0.036350250244140625, 0.038743019104003906, 0.04113578796386719, 0.04352855682373047, 0.04592132568359375, 0.04831409454345703, 0.05070686340332031, 0.053099632263183594, 0.055492401123046875, 0.057885169982910156, 0.06027793884277344, 0.06267070770263672, 0.0650634765625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 11.0, 33.0, 112.0, 261.0, 330.0, 195.0, 47.0, 14.0, 5.0, 6.0], "bins": [-10.385149955749512, -10.206710815429688, -10.028271675109863, -9.849832534790039, -9.671394348144531, -9.492955207824707, -9.314516067504883, -9.136076927185059, -8.957637786865234, -8.77919864654541, -8.600759506225586, -8.422320365905762, -8.243882179260254, -8.06544303894043, -7.8870038986206055, -7.708564758300781, -7.530125617980957, -7.351686477661133, -7.173247814178467, -6.994808673858643, -6.816369533538818, -6.637930393218994, -6.459491729736328, -6.281052589416504, -6.102613925933838, -5.924174785614014, -5.745736122131348, -5.567296981811523, -5.388857841491699, -5.210418701171875, -5.031980037689209, -4.853540897369385, -4.6751017570495605, -4.496662616729736, -4.31822395324707, -4.139784812927246, -3.961345672607422, -3.7829067707061768, -3.6044678688049316, -3.4260287284851074, -3.247589588165283, -3.069150686264038, -2.890711545944214, -2.7122726440429688, -2.5338335037231445, -2.3553946018218994, -2.1769556999206543, -1.99851655960083, -1.8200775384902954, -1.6416385173797607, -1.463199496269226, -1.2847604751586914, -1.1063215732574463, -0.9278824925422668, -0.749443531036377, -0.5710045099258423, -0.3925654888153076, -0.21412648260593414, -0.03568747639656067, 0.1427515149116516, 0.3211905360221863, 0.49962955713272095, 0.6780685186386108, 0.8565075397491455, 1.0349465608596802]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 8.0, 9.0, 10.0, 16.0, 24.0, 12.0, 26.0, 27.0, 22.0, 16.0, 37.0, 33.0, 24.0, 46.0, 33.0, 47.0, 54.0, 35.0, 50.0, 38.0, 29.0, 35.0, 41.0, 49.0, 23.0, 27.0, 31.0, 23.0, 21.0, 29.0, 14.0, 17.0, 13.0, 10.0, 10.0, 8.0, 7.0, 8.0, 10.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7313416004180908, -1.680737853050232, -1.6301339864730835, -1.5795302391052246, -1.5289264917373657, -1.4783227443695068, -1.4277188777923584, -1.3771151304244995, -1.3265113830566406, -1.2759076356887817, -1.2253037691116333, -1.1747000217437744, -1.1240962743759155, -1.0734925270080566, -1.0228886604309082, -0.9722849130630493, -0.9216810464859009, -0.8710772395133972, -0.8204734921455383, -0.7698696851730347, -0.7192659378051758, -0.6686621308326721, -0.6180583238601685, -0.5674545764923096, -0.5168507695198059, -0.46624699234962463, -0.41564321517944336, -0.3650394082069397, -0.3144356310367584, -0.26383185386657715, -0.2132280468940735, -0.1626242697238922, -0.11202049255371094, -0.061416707932949066, -0.010812923312187195, 0.03979086875915527, 0.09039464592933655, 0.14099842309951782, 0.19160223007202148, 0.24220600724220276, 0.29280978441238403, 0.3434135615825653, 0.3940173387527466, 0.44462114572525024, 0.4952249228954315, 0.5458287000656128, 0.5964325070381165, 0.6470363140106201, 0.697640061378479, 0.7482438683509827, 0.7988476157188416, 0.8494514226913452, 0.9000551700592041, 0.9506589770317078, 1.0012627840042114, 1.0518665313720703, 1.1024703979492188, 1.1530741453170776, 1.203678011894226, 1.254281759262085, 1.3048855066299438, 1.3554892539978027, 1.4060931205749512, 1.45669686794281, 1.507300615310669]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 8.0, 11.0, 13.0, 18.0, 24.0, 32.0, 48.0, 91.0, 137.0, 211.0, 417.0, 849.0, 1644.0, 3578.0, 10609.0, 70164.0, 2287188.0, 1748843.0, 52943.0, 9908.0, 3959.0, 1741.0, 762.0, 457.0, 224.0, 155.0, 82.0, 48.0, 37.0, 20.0, 8.0, 10.0, 10.0, 6.0, 2.0, 0.0, 5.0], "bins": [-2.150390625, -2.1014633178710938, -2.0525360107421875, -2.0036087036132812, -1.954681396484375, -1.9057540893554688, -1.8568267822265625, -1.8078994750976562, -1.75897216796875, -1.7100448608398438, -1.6611175537109375, -1.6121902465820312, -1.563262939453125, -1.5143356323242188, -1.4654083251953125, -1.4164810180664062, -1.3675537109375, -1.3186264038085938, -1.2696990966796875, -1.2207717895507812, -1.171844482421875, -1.1229171752929688, -1.0739898681640625, -1.0250625610351562, -0.97613525390625, -0.9272079467773438, -0.8782806396484375, -0.8293533325195312, -0.780426025390625, -0.7314987182617188, -0.6825714111328125, -0.6336441040039062, -0.584716796875, -0.5357894897460938, -0.4868621826171875, -0.43793487548828125, -0.389007568359375, -0.34008026123046875, -0.2911529541015625, -0.24222564697265625, -0.19329833984375, -0.14437103271484375, -0.0954437255859375, -0.04651641845703125, 0.002410888671875, 0.05133819580078125, 0.1002655029296875, 0.14919281005859375, 0.1981201171875, 0.24704742431640625, 0.2959747314453125, 0.34490203857421875, 0.393829345703125, 0.44275665283203125, 0.4916839599609375, 0.5406112670898438, 0.58953857421875, 0.6384658813476562, 0.6873931884765625, 0.7363204956054688, 0.785247802734375, 0.8341751098632812, 0.8831024169921875, 0.9320297241210938, 0.98095703125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 17.0, 22.0, 24.0, 42.0, 47.0, 68.0, 58.0, 71.0, 79.0, 91.0, 72.0, 71.0, 76.0, 53.0, 41.0, 48.0, 30.0, 27.0, 19.0, 14.0, 11.0, 7.0, 4.0, 6.0, 2.0, 0.0, 1.0], "bins": [-1.3115234375, -1.2834930419921875, -1.255462646484375, -1.2274322509765625, -1.19940185546875, -1.1713714599609375, -1.143341064453125, -1.1153106689453125, -1.0872802734375, -1.0592498779296875, -1.031219482421875, -1.0031890869140625, -0.97515869140625, -0.9471282958984375, -0.919097900390625, -0.8910675048828125, -0.863037109375, -0.8350067138671875, -0.806976318359375, -0.7789459228515625, -0.75091552734375, -0.7228851318359375, -0.694854736328125, -0.6668243408203125, -0.6387939453125, -0.6107635498046875, -0.582733154296875, -0.5547027587890625, -0.52667236328125, -0.4986419677734375, -0.470611572265625, -0.4425811767578125, -0.41455078125, -0.3865203857421875, -0.358489990234375, -0.3304595947265625, -0.30242919921875, -0.2743988037109375, -0.246368408203125, -0.2183380126953125, -0.1903076171875, -0.1622772216796875, -0.134246826171875, -0.1062164306640625, -0.07818603515625, -0.0501556396484375, -0.022125244140625, 0.0059051513671875, 0.033935546875, 0.0619659423828125, 0.089996337890625, 0.1180267333984375, 0.14605712890625, 0.1740875244140625, 0.202117919921875, 0.2301483154296875, 0.2581787109375, 0.2862091064453125, 0.314239501953125, 0.3422698974609375, 0.37030029296875, 0.3983306884765625, 0.426361083984375, 0.4543914794921875, 0.482421875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 8.0, 10.0, 23.0, 35.0, 44.0, 69.0, 160.0, 335.0, 752.0, 2673.0, 16870.0, 1680109.0, 2469099.0, 19446.0, 3005.0, 917.0, 385.0, 159.0, 79.0, 44.0, 20.0, 10.0, 8.0, 6.0, 4.0, 4.0, 7.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.96875, -2.8863525390625, -2.803955078125, -2.7215576171875, -2.63916015625, -2.5567626953125, -2.474365234375, -2.3919677734375, -2.3095703125, -2.2271728515625, -2.144775390625, -2.0623779296875, -1.97998046875, -1.8975830078125, -1.815185546875, -1.7327880859375, -1.650390625, -1.5679931640625, -1.485595703125, -1.4031982421875, -1.32080078125, -1.2384033203125, -1.156005859375, -1.0736083984375, -0.9912109375, -0.9088134765625, -0.826416015625, -0.7440185546875, -0.66162109375, -0.5792236328125, -0.496826171875, -0.4144287109375, -0.33203125, -0.2496337890625, -0.167236328125, -0.0848388671875, -0.00244140625, 0.0799560546875, 0.162353515625, 0.2447509765625, 0.3271484375, 0.4095458984375, 0.491943359375, 0.5743408203125, 0.65673828125, 0.7391357421875, 0.821533203125, 0.9039306640625, 0.986328125, 1.0687255859375, 1.151123046875, 1.2335205078125, 1.31591796875, 1.3983154296875, 1.480712890625, 1.5631103515625, 1.6455078125, 1.7279052734375, 1.810302734375, 1.8927001953125, 1.97509765625, 2.0574951171875, 2.139892578125, 2.2222900390625, 2.3046875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 1.0, 8.0, 9.0, 16.0, 21.0, 43.0, 74.0, 130.0, 258.0, 532.0, 855.0, 938.0, 597.0, 274.0, 123.0, 74.0, 44.0, 23.0, 20.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4546318054199219, -0.43782806396484375, -0.4210243225097656, -0.4042205810546875, -0.3874168395996094, -0.37061309814453125, -0.3538093566894531, -0.337005615234375, -0.3202018737792969, -0.30339813232421875, -0.2865943908691406, -0.2697906494140625, -0.2529869079589844, -0.23618316650390625, -0.21937942504882812, -0.20257568359375, -0.18577194213867188, -0.16896820068359375, -0.15216445922851562, -0.1353607177734375, -0.11855697631835938, -0.10175323486328125, -0.08494949340820312, -0.068145751953125, -0.051342010498046875, -0.03453826904296875, -0.017734527587890625, -0.0009307861328125, 0.015872955322265625, 0.03267669677734375, 0.049480438232421875, 0.0662841796875, 0.08308792114257812, 0.09989166259765625, 0.11669540405273438, 0.1334991455078125, 0.15030288696289062, 0.16710662841796875, 0.18391036987304688, 0.200714111328125, 0.21751785278320312, 0.23432159423828125, 0.2511253356933594, 0.2679290771484375, 0.2847328186035156, 0.30153656005859375, 0.3183403015136719, 0.33514404296875, 0.3519477844238281, 0.36875152587890625, 0.3855552673339844, 0.4023590087890625, 0.4191627502441406, 0.43596649169921875, 0.4527702331542969, 0.469573974609375, 0.4863777160644531, 0.5031814575195312, 0.5199851989746094, 0.5367889404296875, 0.5535926818847656, 0.5703964233398438, 0.5872001647949219, 0.60400390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 6.0, 4.0, 12.0, 18.0, 25.0, 30.0, 36.0, 47.0, 40.0, 46.0, 51.0, 60.0, 65.0, 50.0, 71.0, 57.0, 69.0, 53.0, 57.0, 42.0, 33.0, 28.0, 22.0, 17.0, 5.0, 10.0, 6.0, 12.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9081579446792603, -0.8820516467094421, -0.8559452891349792, -0.8298389911651611, -0.8037326335906982, -0.7776263356208801, -0.751520037651062, -0.7254136800765991, -0.699307382106781, -0.6732010841369629, -0.6470947265625, -0.6209884285926819, -0.594882071018219, -0.5687757730484009, -0.542669415473938, -0.5165631175041199, -0.49045678973197937, -0.46435046195983887, -0.43824413418769836, -0.41213780641555786, -0.38603150844573975, -0.35992518067359924, -0.33381885290145874, -0.3077125549316406, -0.28160619735717773, -0.25549986958503723, -0.22939355671405792, -0.20328722894191742, -0.1771809160709381, -0.1510745882987976, -0.1249682605266571, -0.0988619476556778, -0.07275563478469849, -0.04664931446313858, -0.020542990416288376, 0.005563333630561829, 0.031669653952121735, 0.05777597427368164, 0.08388230204582214, 0.10998861491680145, 0.13609494268894196, 0.16220127046108246, 0.18830758333206177, 0.21441391110420227, 0.24052023887634277, 0.2666265368461609, 0.2927328944206238, 0.3188391923904419, 0.3449455201625824, 0.3710518479347229, 0.3971581757068634, 0.4232645034790039, 0.449370801448822, 0.4754771292209625, 0.501583456993103, 0.5276897549629211, 0.553796112537384, 0.5799024105072021, 0.606008768081665, 0.6321150660514832, 0.658221423625946, 0.6843277215957642, 0.710434079170227, 0.7365403771400452, 0.7626466751098633]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 7.0, 6.0, 10.0, 12.0, 13.0, 11.0, 19.0, 15.0, 20.0, 29.0, 16.0, 24.0, 23.0, 39.0, 32.0, 44.0, 29.0, 43.0, 41.0, 51.0, 40.0, 36.0, 38.0, 36.0, 38.0, 28.0, 30.0, 33.0, 28.0, 22.0, 24.0, 22.0, 29.0, 12.0, 18.0, 15.0, 10.0, 8.0, 11.0, 11.0, 3.0, 6.0, 3.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5380727648735046, -0.5195364952087402, -0.5010002851486206, -0.4824640452861786, -0.4639278054237366, -0.44539153575897217, -0.42685529589653015, -0.40831905603408813, -0.3897828161716461, -0.3712465763092041, -0.3527103364467621, -0.33417409658432007, -0.31563782691955566, -0.29710161685943604, -0.27856534719467163, -0.2600291073322296, -0.2414928674697876, -0.22295662760734558, -0.20442038774490356, -0.18588413298130035, -0.16734789311885834, -0.14881165325641632, -0.1302753984928131, -0.1117391586303711, -0.09320291876792908, -0.07466667890548706, -0.05613043159246445, -0.03759418800473213, -0.019057944416999817, -0.0005217045545578003, 0.018014542758464813, 0.03655079007148743, 0.05508708953857422, 0.07362332940101624, 0.09215957671403885, 0.11069582402706146, 0.12923206388950348, 0.1477683037519455, 0.1663045585155487, 0.18484079837799072, 0.20337703824043274, 0.22191327810287476, 0.24044951796531677, 0.2589857578277588, 0.2775220274925232, 0.2960582375526428, 0.3145945072174072, 0.33313074707984924, 0.35166698694229126, 0.3702032268047333, 0.3887394666671753, 0.4072757065296173, 0.4258119463920593, 0.44434821605682373, 0.46288445591926575, 0.48142069578170776, 0.4999569356441498, 0.5184931755065918, 0.5370294451713562, 0.5555656552314758, 0.5741019248962402, 0.5926381349563599, 0.6111744046211243, 0.6297106742858887, 0.6482468843460083]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 10.0, 14.0, 17.0, 24.0, 34.0, 41.0, 43.0, 79.0, 110.0, 132.0, 173.0, 238.0, 383.0, 490.0, 764.0, 1232.0, 1968.0, 3618.0, 6829.0, 14772.0, 38835.0, 167058.0, 536770.0, 197954.0, 43645.0, 15947.0, 7439.0, 3904.0, 2202.0, 1260.0, 767.0, 524.0, 351.0, 254.0, 182.0, 127.0, 94.0, 72.0, 51.0, 29.0, 24.0, 18.0, 16.0, 15.0, 9.0, 5.0, 4.0, 3.0, 2.0, 8.0, 3.0, 1.0, 4.0], "bins": [-0.22216796875, -0.215545654296875, -0.20892333984375, -0.202301025390625, -0.1956787109375, -0.189056396484375, -0.18243408203125, -0.175811767578125, -0.169189453125, -0.162567138671875, -0.15594482421875, -0.149322509765625, -0.1427001953125, -0.136077880859375, -0.12945556640625, -0.122833251953125, -0.1162109375, -0.109588623046875, -0.10296630859375, -0.096343994140625, -0.0897216796875, -0.083099365234375, -0.07647705078125, -0.069854736328125, -0.063232421875, -0.056610107421875, -0.04998779296875, -0.043365478515625, -0.0367431640625, -0.030120849609375, -0.02349853515625, -0.016876220703125, -0.01025390625, -0.003631591796875, 0.00299072265625, 0.009613037109375, 0.0162353515625, 0.022857666015625, 0.02947998046875, 0.036102294921875, 0.042724609375, 0.049346923828125, 0.05596923828125, 0.062591552734375, 0.0692138671875, 0.075836181640625, 0.08245849609375, 0.089080810546875, 0.095703125, 0.102325439453125, 0.10894775390625, 0.115570068359375, 0.1221923828125, 0.128814697265625, 0.13543701171875, 0.142059326171875, 0.148681640625, 0.155303955078125, 0.16192626953125, 0.168548583984375, 0.1751708984375, 0.181793212890625, 0.18841552734375, 0.195037841796875, 0.20166015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 11.0, 13.0, 12.0, 8.0, 11.0, 20.0, 21.0, 17.0, 29.0, 26.0, 22.0, 24.0, 37.0, 38.0, 39.0, 34.0, 47.0, 44.0, 54.0, 40.0, 35.0, 40.0, 35.0, 40.0, 29.0, 29.0, 24.0, 29.0, 31.0, 28.0, 14.0, 22.0, 14.0, 16.0, 8.0, 11.0, 8.0, 6.0, 8.0, 4.0, 9.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.369140625, -0.3572273254394531, -0.34531402587890625, -0.3334007263183594, -0.3214874267578125, -0.3095741271972656, -0.29766082763671875, -0.2857475280761719, -0.273834228515625, -0.2619209289550781, -0.25000762939453125, -0.23809432983398438, -0.2261810302734375, -0.21426773071289062, -0.20235443115234375, -0.19044113159179688, -0.17852783203125, -0.16661453247070312, -0.15470123291015625, -0.14278793334960938, -0.1308746337890625, -0.11896133422851562, -0.10704803466796875, -0.09513473510742188, -0.083221435546875, -0.07130813598632812, -0.05939483642578125, -0.047481536865234375, -0.0355682373046875, -0.023654937744140625, -0.01174163818359375, 0.000171661376953125, 0.0120849609375, 0.023998260498046875, 0.03591156005859375, 0.047824859619140625, 0.0597381591796875, 0.07165145874023438, 0.08356475830078125, 0.09547805786132812, 0.107391357421875, 0.11930465698242188, 0.13121795654296875, 0.14313125610351562, 0.1550445556640625, 0.16695785522460938, 0.17887115478515625, 0.19078445434570312, 0.20269775390625, 0.21461105346679688, 0.22652435302734375, 0.23843765258789062, 0.2503509521484375, 0.2622642517089844, 0.27417755126953125, 0.2860908508300781, 0.298004150390625, 0.3099174499511719, 0.32183074951171875, 0.3337440490722656, 0.3456573486328125, 0.3575706481933594, 0.36948394775390625, 0.3813972473144531, 0.393310546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 5.0, 14.0, 12.0, 23.0, 33.0, 44.0, 56.0, 105.0, 126.0, 176.0, 246.0, 381.0, 638.0, 1037.0, 1656.0, 2764.0, 4873.0, 9424.0, 19402.0, 46043.0, 132112.0, 356005.0, 299072.0, 101660.0, 37235.0, 16474.0, 8215.0, 4440.0, 2389.0, 1362.0, 877.0, 534.0, 322.0, 251.0, 167.0, 104.0, 87.0, 56.0, 44.0, 17.0, 25.0, 11.0, 14.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11309814453125, -0.10904216766357422, -0.10498619079589844, -0.10093021392822266, -0.09687423706054688, -0.0928182601928711, -0.08876228332519531, -0.08470630645751953, -0.08065032958984375, -0.07659435272216797, -0.07253837585449219, -0.0684823989868164, -0.06442642211914062, -0.060370445251464844, -0.05631446838378906, -0.05225849151611328, -0.0482025146484375, -0.04414653778076172, -0.04009056091308594, -0.036034584045410156, -0.031978607177734375, -0.027922630310058594, -0.023866653442382812, -0.01981067657470703, -0.01575469970703125, -0.011698722839355469, -0.0076427459716796875, -0.0035867691040039062, 0.000469207763671875, 0.004525184631347656, 0.008581161499023438, 0.012637138366699219, 0.016693115234375, 0.02074909210205078, 0.024805068969726562, 0.028861045837402344, 0.032917022705078125, 0.036972999572753906, 0.04102897644042969, 0.04508495330810547, 0.04914093017578125, 0.05319690704345703, 0.05725288391113281, 0.061308860778808594, 0.06536483764648438, 0.06942081451416016, 0.07347679138183594, 0.07753276824951172, 0.0815887451171875, 0.08564472198486328, 0.08970069885253906, 0.09375667572021484, 0.09781265258789062, 0.1018686294555664, 0.10592460632324219, 0.10998058319091797, 0.11403656005859375, 0.11809253692626953, 0.12214851379394531, 0.1262044906616211, 0.13026046752929688, 0.13431644439697266, 0.13837242126464844, 0.14242839813232422, 0.146484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 10.0, 3.0, 6.0, 7.0, 16.0, 17.0, 12.0, 22.0, 16.0, 21.0, 32.0, 30.0, 38.0, 36.0, 40.0, 48.0, 39.0, 37.0, 40.0, 35.0, 55.0, 41.0, 34.0, 45.0, 34.0, 30.0, 34.0, 28.0, 29.0, 24.0, 24.0, 23.0, 24.0, 11.0, 14.0, 16.0, 4.0, 4.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.0390625, -1.009063720703125, -0.97906494140625, -0.949066162109375, -0.9190673828125, -0.889068603515625, -0.85906982421875, -0.829071044921875, -0.799072265625, -0.769073486328125, -0.73907470703125, -0.709075927734375, -0.6790771484375, -0.649078369140625, -0.61907958984375, -0.589080810546875, -0.55908203125, -0.529083251953125, -0.49908447265625, -0.469085693359375, -0.4390869140625, -0.409088134765625, -0.37908935546875, -0.349090576171875, -0.319091796875, -0.289093017578125, -0.25909423828125, -0.229095458984375, -0.1990966796875, -0.169097900390625, -0.13909912109375, -0.109100341796875, -0.0791015625, -0.049102783203125, -0.01910400390625, 0.010894775390625, 0.0408935546875, 0.070892333984375, 0.10089111328125, 0.130889892578125, 0.160888671875, 0.190887451171875, 0.22088623046875, 0.250885009765625, 0.2808837890625, 0.310882568359375, 0.34088134765625, 0.370880126953125, 0.40087890625, 0.430877685546875, 0.46087646484375, 0.490875244140625, 0.5208740234375, 0.550872802734375, 0.58087158203125, 0.610870361328125, 0.640869140625, 0.670867919921875, 0.70086669921875, 0.730865478515625, 0.7608642578125, 0.790863037109375, 0.82086181640625, 0.850860595703125, 0.880859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 11.0, 26.0, 34.0, 58.0, 101.0, 198.0, 360.0, 766.0, 1639.0, 3747.0, 11103.0, 51442.0, 401430.0, 490133.0, 66628.0, 13164.0, 4231.0, 1765.0, 756.0, 408.0, 238.0, 109.0, 75.0, 50.0, 33.0, 14.0, 9.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07635498046875, -0.0730447769165039, -0.06973457336425781, -0.06642436981201172, -0.06311416625976562, -0.05980396270751953, -0.05649375915527344, -0.053183555603027344, -0.04987335205078125, -0.046563148498535156, -0.04325294494628906, -0.03994274139404297, -0.036632537841796875, -0.03332233428955078, -0.030012130737304688, -0.026701927185058594, -0.0233917236328125, -0.020081520080566406, -0.016771316528320312, -0.013461112976074219, -0.010150909423828125, -0.006840705871582031, -0.0035305023193359375, -0.00022029876708984375, 0.00308990478515625, 0.006400108337402344, 0.009710311889648438, 0.013020515441894531, 0.016330718994140625, 0.01964092254638672, 0.022951126098632812, 0.026261329650878906, 0.029571533203125, 0.032881736755371094, 0.03619194030761719, 0.03950214385986328, 0.042812347412109375, 0.04612255096435547, 0.04943275451660156, 0.052742958068847656, 0.05605316162109375, 0.059363365173339844, 0.06267356872558594, 0.06598377227783203, 0.06929397583007812, 0.07260417938232422, 0.07591438293457031, 0.0792245864868164, 0.0825347900390625, 0.0858449935913086, 0.08915519714355469, 0.09246540069580078, 0.09577560424804688, 0.09908580780029297, 0.10239601135253906, 0.10570621490478516, 0.10901641845703125, 0.11232662200927734, 0.11563682556152344, 0.11894702911376953, 0.12225723266601562, 0.12556743621826172, 0.1288776397705078, 0.1321878433227539, 0.135498046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 8.0, 7.0, 13.0, 19.0, 21.0, 31.0, 42.0, 81.0, 96.0, 140.0, 90.0, 116.0, 93.0, 70.0, 60.0, 27.0, 27.0, 15.0, 10.0, 3.0, 6.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.054473876953125e-05, -4.915613681077957e-05, -4.776753485202789e-05, -4.6378932893276215e-05, -4.4990330934524536e-05, -4.360172897577286e-05, -4.221312701702118e-05, -4.08245250582695e-05, -3.943592309951782e-05, -3.8047321140766144e-05, -3.6658719182014465e-05, -3.527011722326279e-05, -3.388151526451111e-05, -3.249291330575943e-05, -3.110431134700775e-05, -2.9715709388256073e-05, -2.8327107429504395e-05, -2.6938505470752716e-05, -2.5549903512001038e-05, -2.416130155324936e-05, -2.277269959449768e-05, -2.1384097635746002e-05, -1.9995495676994324e-05, -1.8606893718242645e-05, -1.7218291759490967e-05, -1.582968980073929e-05, -1.444108784198761e-05, -1.3052485883235931e-05, -1.1663883924484253e-05, -1.0275281965732574e-05, -8.886680006980896e-06, -7.4980780482292175e-06, -6.109476089477539e-06, -4.720874130725861e-06, -3.332272171974182e-06, -1.9436702132225037e-06, -5.550682544708252e-07, 8.335337042808533e-07, 2.2221356630325317e-06, 3.61073762178421e-06, 4.999339580535889e-06, 6.387941539287567e-06, 7.776543498039246e-06, 9.165145456790924e-06, 1.0553747415542603e-05, 1.1942349374294281e-05, 1.333095133304596e-05, 1.4719553291797638e-05, 1.6108155250549316e-05, 1.7496757209300995e-05, 1.8885359168052673e-05, 2.0273961126804352e-05, 2.166256308555603e-05, 2.305116504430771e-05, 2.4439767003059387e-05, 2.5828368961811066e-05, 2.7216970920562744e-05, 2.8605572879314423e-05, 2.99941748380661e-05, 3.138277679681778e-05, 3.277137875556946e-05, 3.4159980714321136e-05, 3.5548582673072815e-05, 3.6937184631824493e-05, 3.832578659057617e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 11.0, 1.0, 12.0, 14.0, 10.0, 20.0, 26.0, 51.0, 67.0, 110.0, 136.0, 228.0, 348.0, 619.0, 1067.0, 2063.0, 3955.0, 8755.0, 21627.0, 58307.0, 170260.0, 359548.0, 266352.0, 96740.0, 33740.0, 12894.0, 5646.0, 2679.0, 1336.0, 754.0, 420.0, 239.0, 176.0, 103.0, 71.0, 52.0, 37.0, 27.0, 13.0, 14.0, 10.0, 5.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06231689453125, -0.06035327911376953, -0.05838966369628906, -0.056426048278808594, -0.054462432861328125, -0.052498817443847656, -0.05053520202636719, -0.04857158660888672, -0.04660797119140625, -0.04464435577392578, -0.04268074035644531, -0.040717124938964844, -0.038753509521484375, -0.036789894104003906, -0.03482627868652344, -0.03286266326904297, -0.0308990478515625, -0.02893543243408203, -0.026971817016601562, -0.025008201599121094, -0.023044586181640625, -0.021080970764160156, -0.019117355346679688, -0.01715373992919922, -0.01519012451171875, -0.013226509094238281, -0.011262893676757812, -0.009299278259277344, -0.007335662841796875, -0.005372047424316406, -0.0034084320068359375, -0.0014448165893554688, 0.000518798828125, 0.0024824142456054688, 0.0044460296630859375, 0.006409645080566406, 0.008373260498046875, 0.010336875915527344, 0.012300491333007812, 0.014264106750488281, 0.01622772216796875, 0.01819133758544922, 0.020154953002929688, 0.022118568420410156, 0.024082183837890625, 0.026045799255371094, 0.028009414672851562, 0.02997303009033203, 0.0319366455078125, 0.03390026092529297, 0.03586387634277344, 0.037827491760253906, 0.039791107177734375, 0.041754722595214844, 0.04371833801269531, 0.04568195343017578, 0.04764556884765625, 0.04960918426513672, 0.05157279968261719, 0.053536415100097656, 0.055500030517578125, 0.057463645935058594, 0.05942726135253906, 0.06139087677001953, 0.0633544921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 1.0, 7.0, 5.0, 7.0, 11.0, 3.0, 13.0, 16.0, 15.0, 23.0, 36.0, 43.0, 53.0, 57.0, 58.0, 87.0, 72.0, 78.0, 72.0, 52.0, 61.0, 43.0, 38.0, 36.0, 24.0, 24.0, 17.0, 10.0, 7.0, 6.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.023773193359375, -0.02312636375427246, -0.022479534149169922, -0.021832704544067383, -0.021185874938964844, -0.020539045333862305, -0.019892215728759766, -0.019245386123657227, -0.018598556518554688, -0.01795172691345215, -0.01730489730834961, -0.01665806770324707, -0.01601123809814453, -0.015364408493041992, -0.014717578887939453, -0.014070749282836914, -0.013423919677734375, -0.012777090072631836, -0.012130260467529297, -0.011483430862426758, -0.010836601257324219, -0.01018977165222168, -0.00954294204711914, -0.008896112442016602, -0.008249282836914062, -0.0076024532318115234, -0.006955623626708984, -0.006308794021606445, -0.005661964416503906, -0.005015134811401367, -0.004368305206298828, -0.003721475601196289, -0.00307464599609375, -0.002427816390991211, -0.0017809867858886719, -0.0011341571807861328, -0.00048732757568359375, 0.0001595020294189453, 0.0008063316345214844, 0.0014531612396240234, 0.0020999908447265625, 0.0027468204498291016, 0.0033936500549316406, 0.00404047966003418, 0.004687309265136719, 0.005334138870239258, 0.005980968475341797, 0.006627798080444336, 0.007274627685546875, 0.007921457290649414, 0.008568286895751953, 0.009215116500854492, 0.009861946105957031, 0.01050877571105957, 0.01115560531616211, 0.011802434921264648, 0.012449264526367188, 0.013096094131469727, 0.013742923736572266, 0.014389753341674805, 0.015036582946777344, 0.015683412551879883, 0.016330242156982422, 0.01697707176208496, 0.0176239013671875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 4.0, 12.0, 17.0, 15.0, 19.0, 34.0, 25.0, 34.0, 37.0, 52.0, 41.0, 63.0, 61.0, 64.0, 57.0, 51.0, 63.0, 62.0, 48.0, 53.0, 36.0, 36.0, 19.0, 16.0, 13.0, 16.0, 8.0, 11.0, 6.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5047309398651123, -0.4899222254753113, -0.47511351108551025, -0.46030479669570923, -0.4454961121082306, -0.43068739771842957, -0.41587868332862854, -0.4010699689388275, -0.3862612843513489, -0.37145256996154785, -0.3566438555717468, -0.3418351411819458, -0.32702645659446716, -0.31221774220466614, -0.2974090278148651, -0.2826003134250641, -0.26779159903526306, -0.25298288464546204, -0.2381741851568222, -0.22336547076702118, -0.20855677127838135, -0.19374805688858032, -0.1789393424987793, -0.16413062810897827, -0.14932192862033844, -0.13451321423053741, -0.11970451474189758, -0.10489580035209656, -0.09008709341287613, -0.0752783864736557, -0.060469672083854675, -0.04566096514463425, -0.03085225820541382, -0.01604354940354824, -0.001234840601682663, 0.013573870062828064, 0.028382577002048492, 0.04319128394126892, 0.057999998331069946, 0.07280870527029037, 0.0876174122095108, 0.10242611914873123, 0.11723482608795166, 0.13204354047775269, 0.1468522548675537, 0.16166095435619354, 0.17646966874599457, 0.1912783682346344, 0.20608708262443542, 0.22089579701423645, 0.23570449650287628, 0.2505131959915161, 0.26532191038131714, 0.28013062477111816, 0.2949393391609192, 0.3097480535507202, 0.32455676794052124, 0.33936548233032227, 0.3541741967201233, 0.3689829111099243, 0.38379159569740295, 0.398600310087204, 0.413409024477005, 0.42821773886680603, 0.44302642345428467]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 11.0, 5.0, 8.0, 11.0, 16.0, 16.0, 13.0, 24.0, 17.0, 16.0, 25.0, 24.0, 30.0, 25.0, 37.0, 37.0, 37.0, 50.0, 43.0, 39.0, 42.0, 46.0, 36.0, 41.0, 27.0, 36.0, 34.0, 27.0, 19.0, 27.0, 25.0, 28.0, 21.0, 14.0, 13.0, 12.0, 18.0, 9.0, 6.0, 10.0, 7.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.35974112153053284, -0.34840232133865356, -0.3370634913444519, -0.32572469115257263, -0.31438586115837097, -0.3030470609664917, -0.29170823097229004, -0.28036943078041077, -0.2690306007862091, -0.25769180059432983, -0.24635297060012817, -0.2350141555070877, -0.22367534041404724, -0.21233652532100677, -0.2009977102279663, -0.18965891003608704, -0.17832009494304657, -0.1669812798500061, -0.15564246475696564, -0.14430364966392517, -0.1329648345708847, -0.12162601947784424, -0.11028721183538437, -0.0989483967423439, -0.08760958164930344, -0.07627076655626297, -0.0649319514632225, -0.053593140095472336, -0.04225432500243187, -0.030915509909391403, -0.019576698541641235, -0.008237883448600769, 0.0031009316444396973, 0.014439745806157589, 0.02577855996787548, 0.0371173731982708, 0.048456188291311264, 0.05979500338435173, 0.0711338147521019, 0.08247262984514236, 0.09381144493818283, 0.1051502600312233, 0.11648907512426376, 0.12782788276672363, 0.1391666978597641, 0.15050551295280457, 0.16184432804584503, 0.1731831431388855, 0.18452195823192596, 0.19586077332496643, 0.2071995884180069, 0.21853840351104736, 0.22987721860408783, 0.2412160336971283, 0.25255483388900757, 0.26389366388320923, 0.2752324640750885, 0.2865712642669678, 0.29791009426116943, 0.3092488944530487, 0.32058772444725037, 0.33192652463912964, 0.3432653546333313, 0.35460415482521057, 0.36594298481941223]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 12.0, 22.0, 37.0, 51.0, 94.0, 168.0, 322.0, 507.0, 1003.0, 2147.0, 4441.0, 10508.0, 28622.0, 94114.0, 342733.0, 393104.0, 115104.0, 33433.0, 12242.0, 5086.0, 2340.0, 1115.0, 583.0, 327.0, 189.0, 90.0, 42.0, 42.0, 16.0, 19.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84228515625, -0.8160247802734375, -0.789764404296875, -0.7635040283203125, -0.73724365234375, -0.7109832763671875, -0.684722900390625, -0.6584625244140625, -0.6322021484375, -0.6059417724609375, -0.579681396484375, -0.5534210205078125, -0.52716064453125, -0.5009002685546875, -0.474639892578125, -0.4483795166015625, -0.422119140625, -0.3958587646484375, -0.369598388671875, -0.3433380126953125, -0.31707763671875, -0.2908172607421875, -0.264556884765625, -0.2382965087890625, -0.2120361328125, -0.1857757568359375, -0.159515380859375, -0.1332550048828125, -0.10699462890625, -0.0807342529296875, -0.054473876953125, -0.0282135009765625, -0.001953125, 0.0243072509765625, 0.050567626953125, 0.0768280029296875, 0.10308837890625, 0.1293487548828125, 0.155609130859375, 0.1818695068359375, 0.2081298828125, 0.2343902587890625, 0.260650634765625, 0.2869110107421875, 0.31317138671875, 0.3394317626953125, 0.365692138671875, 0.3919525146484375, 0.418212890625, 0.4444732666015625, 0.470733642578125, 0.4969940185546875, 0.52325439453125, 0.5495147705078125, 0.575775146484375, 0.6020355224609375, 0.6282958984375, 0.6545562744140625, 0.680816650390625, 0.7070770263671875, 0.73333740234375, 0.7595977783203125, 0.785858154296875, 0.8121185302734375, 0.83837890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 4.0, 5.0, 4.0, 8.0, 22.0, 10.0, 23.0, 16.0, 17.0, 14.0, 17.0, 36.0, 30.0, 45.0, 42.0, 49.0, 54.0, 59.0, 38.0, 65.0, 48.0, 44.0, 45.0, 34.0, 45.0, 31.0, 36.0, 27.0, 25.0, 26.0, 20.0, 10.0, 10.0, 7.0, 10.0, 13.0, 7.0, 3.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63134765625, -0.6061172485351562, -0.5808868408203125, -0.5556564331054688, -0.530426025390625, -0.5051956176757812, -0.4799652099609375, -0.45473480224609375, -0.42950439453125, -0.40427398681640625, -0.3790435791015625, -0.35381317138671875, -0.328582763671875, -0.30335235595703125, -0.2781219482421875, -0.25289154052734375, -0.2276611328125, -0.20243072509765625, -0.1772003173828125, -0.15196990966796875, -0.126739501953125, -0.10150909423828125, -0.0762786865234375, -0.05104827880859375, -0.02581787109375, -0.00058746337890625, 0.0246429443359375, 0.04987335205078125, 0.075103759765625, 0.10033416748046875, 0.1255645751953125, 0.15079498291015625, 0.176025390625, 0.20125579833984375, 0.2264862060546875, 0.25171661376953125, 0.276947021484375, 0.30217742919921875, 0.3274078369140625, 0.35263824462890625, 0.37786865234375, 0.40309906005859375, 0.4283294677734375, 0.45355987548828125, 0.478790283203125, 0.5040206909179688, 0.5292510986328125, 0.5544815063476562, 0.5797119140625, 0.6049423217773438, 0.6301727294921875, 0.6554031372070312, 0.680633544921875, 0.7058639526367188, 0.7310943603515625, 0.7563247680664062, 0.78155517578125, 0.8067855834960938, 0.8320159912109375, 0.8572463989257812, 0.882476806640625, 0.9077072143554688, 0.9329376220703125, 0.9581680297851562, 0.9833984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 10.0, 9.0, 11.0, 6.0, 18.0, 18.0, 36.0, 56.0, 65.0, 94.0, 153.0, 251.0, 397.0, 756.0, 1402.0, 3297.0, 8570.0, 25908.0, 97204.0, 398488.0, 380667.0, 91633.0, 25190.0, 8020.0, 3084.0, 1411.0, 682.0, 407.0, 240.0, 151.0, 85.0, 68.0, 53.0, 33.0, 16.0, 16.0, 9.0, 11.0, 12.0, 9.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1650390625, -1.1307525634765625, -1.096466064453125, -1.0621795654296875, -1.02789306640625, -0.9936065673828125, -0.959320068359375, -0.9250335693359375, -0.8907470703125, -0.8564605712890625, -0.822174072265625, -0.7878875732421875, -0.75360107421875, -0.7193145751953125, -0.685028076171875, -0.6507415771484375, -0.616455078125, -0.5821685791015625, -0.547882080078125, -0.5135955810546875, -0.47930908203125, -0.4450225830078125, -0.410736083984375, -0.3764495849609375, -0.3421630859375, -0.3078765869140625, -0.273590087890625, -0.2393035888671875, -0.20501708984375, -0.1707305908203125, -0.136444091796875, -0.1021575927734375, -0.06787109375, -0.0335845947265625, 0.000701904296875, 0.0349884033203125, 0.06927490234375, 0.1035614013671875, 0.137847900390625, 0.1721343994140625, 0.2064208984375, 0.2407073974609375, 0.274993896484375, 0.3092803955078125, 0.34356689453125, 0.3778533935546875, 0.412139892578125, 0.4464263916015625, 0.480712890625, 0.5149993896484375, 0.549285888671875, 0.5835723876953125, 0.61785888671875, 0.6521453857421875, 0.686431884765625, 0.7207183837890625, 0.7550048828125, 0.7892913818359375, 0.823577880859375, 0.8578643798828125, 0.89215087890625, 0.9264373779296875, 0.960723876953125, 0.9950103759765625, 1.029296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 7.0, 5.0, 8.0, 15.0, 15.0, 16.0, 21.0, 23.0, 17.0, 27.0, 28.0, 25.0, 36.0, 38.0, 35.0, 42.0, 47.0, 53.0, 47.0, 49.0, 37.0, 49.0, 49.0, 38.0, 35.0, 32.0, 27.0, 27.0, 26.0, 17.0, 16.0, 14.0, 10.0, 8.0, 14.0, 8.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.73486328125, -0.7114181518554688, -0.6879730224609375, -0.6645278930664062, -0.641082763671875, -0.6176376342773438, -0.5941925048828125, -0.5707473754882812, -0.54730224609375, -0.5238571166992188, -0.5004119873046875, -0.47696685791015625, -0.453521728515625, -0.43007659912109375, -0.4066314697265625, -0.38318634033203125, -0.3597412109375, -0.33629608154296875, -0.3128509521484375, -0.28940582275390625, -0.265960693359375, -0.24251556396484375, -0.2190704345703125, -0.19562530517578125, -0.17218017578125, -0.14873504638671875, -0.1252899169921875, -0.10184478759765625, -0.078399658203125, -0.05495452880859375, -0.0315093994140625, -0.00806427001953125, 0.015380859375, 0.03882598876953125, 0.0622711181640625, 0.08571624755859375, 0.109161376953125, 0.13260650634765625, 0.1560516357421875, 0.17949676513671875, 0.20294189453125, 0.22638702392578125, 0.2498321533203125, 0.27327728271484375, 0.296722412109375, 0.32016754150390625, 0.3436126708984375, 0.36705780029296875, 0.3905029296875, 0.41394805908203125, 0.4373931884765625, 0.46083831787109375, 0.484283447265625, 0.5077285766601562, 0.5311737060546875, 0.5546188354492188, 0.57806396484375, 0.6015090942382812, 0.6249542236328125, 0.6483993530273438, 0.671844482421875, 0.6952896118164062, 0.7187347412109375, 0.7421798706054688, 0.765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 9.0, 5.0, 5.0, 7.0, 7.0, 25.0, 28.0, 34.0, 83.0, 94.0, 163.0, 247.0, 464.0, 883.0, 1671.0, 3846.0, 9619.0, 26978.0, 79703.0, 220315.0, 414998.0, 186967.0, 65242.0, 22313.0, 8210.0, 3353.0, 1447.0, 773.0, 417.0, 233.0, 120.0, 100.0, 61.0, 49.0, 29.0, 17.0, 13.0, 9.0, 7.0, 4.0, 8.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11505126953125, -0.1112680435180664, -0.10748481750488281, -0.10370159149169922, -0.09991836547851562, -0.09613513946533203, -0.09235191345214844, -0.08856868743896484, -0.08478546142578125, -0.08100223541259766, -0.07721900939941406, -0.07343578338623047, -0.06965255737304688, -0.06586933135986328, -0.06208610534667969, -0.058302879333496094, -0.0545196533203125, -0.050736427307128906, -0.04695320129394531, -0.04316997528076172, -0.039386749267578125, -0.03560352325439453, -0.03182029724121094, -0.028037071228027344, -0.02425384521484375, -0.020470619201660156, -0.016687393188476562, -0.012904167175292969, -0.009120941162109375, -0.005337715148925781, -0.0015544891357421875, 0.0022287368774414062, 0.006011962890625, 0.009795188903808594, 0.013578414916992188, 0.01736164093017578, 0.021144866943359375, 0.02492809295654297, 0.028711318969726562, 0.032494544982910156, 0.03627777099609375, 0.040060997009277344, 0.04384422302246094, 0.04762744903564453, 0.051410675048828125, 0.05519390106201172, 0.05897712707519531, 0.0627603530883789, 0.0665435791015625, 0.0703268051147461, 0.07411003112792969, 0.07789325714111328, 0.08167648315429688, 0.08545970916748047, 0.08924293518066406, 0.09302616119384766, 0.09680938720703125, 0.10059261322021484, 0.10437583923339844, 0.10815906524658203, 0.11194229125976562, 0.11572551727294922, 0.11950874328613281, 0.1232919692993164, 0.1270751953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 8.0, 13.0, 12.0, 20.0, 23.0, 28.0, 32.0, 30.0, 58.0, 55.0, 64.0, 102.0, 124.0, 80.0, 76.0, 52.0, 50.0, 38.0, 27.0, 20.0, 25.0, 12.0, 11.0, 11.0, 2.0, 7.0, 7.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9265880584716797e-05, -2.8411857783794403e-05, -2.755783498287201e-05, -2.6703812181949615e-05, -2.584978938102722e-05, -2.4995766580104828e-05, -2.4141743779182434e-05, -2.328772097826004e-05, -2.2433698177337646e-05, -2.1579675376415253e-05, -2.072565257549286e-05, -1.9871629774570465e-05, -1.901760697364807e-05, -1.8163584172725677e-05, -1.7309561371803284e-05, -1.645553857088089e-05, -1.5601515769958496e-05, -1.4747492969036102e-05, -1.3893470168113708e-05, -1.3039447367191315e-05, -1.2185424566268921e-05, -1.1331401765346527e-05, -1.0477378964424133e-05, -9.62335616350174e-06, -8.769333362579346e-06, -7.915310561656952e-06, -7.061287760734558e-06, -6.207264959812164e-06, -5.3532421588897705e-06, -4.499219357967377e-06, -3.645196557044983e-06, -2.791173756122589e-06, -1.9371509552001953e-06, -1.0831281542778015e-06, -2.2910535335540771e-07, 6.249174475669861e-07, 1.4789402484893799e-06, 2.3329630494117737e-06, 3.1869858503341675e-06, 4.041008651256561e-06, 4.895031452178955e-06, 5.749054253101349e-06, 6.603077054023743e-06, 7.4570998549461365e-06, 8.31112265586853e-06, 9.165145456790924e-06, 1.0019168257713318e-05, 1.0873191058635712e-05, 1.1727213859558105e-05, 1.25812366604805e-05, 1.3435259461402893e-05, 1.4289282262325287e-05, 1.514330506324768e-05, 1.5997327864170074e-05, 1.6851350665092468e-05, 1.7705373466014862e-05, 1.8559396266937256e-05, 1.941341906785965e-05, 2.0267441868782043e-05, 2.1121464669704437e-05, 2.197548747062683e-05, 2.2829510271549225e-05, 2.368353307247162e-05, 2.4537555873394012e-05, 2.5391578674316406e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 8.0, 13.0, 13.0, 23.0, 24.0, 45.0, 51.0, 73.0, 101.0, 118.0, 169.0, 250.0, 391.0, 551.0, 888.0, 1505.0, 2554.0, 5523.0, 13613.0, 41016.0, 136053.0, 435163.0, 278178.0, 86187.0, 26800.0, 9545.0, 4057.0, 2098.0, 1220.0, 747.0, 466.0, 289.0, 224.0, 163.0, 110.0, 96.0, 77.0, 49.0, 28.0, 35.0, 11.0, 10.0, 12.0, 2.0, 8.0, 0.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16015625, -0.1552753448486328, -0.15039443969726562, -0.14551353454589844, -0.14063262939453125, -0.13575172424316406, -0.13087081909179688, -0.1259899139404297, -0.1211090087890625, -0.11622810363769531, -0.11134719848632812, -0.10646629333496094, -0.10158538818359375, -0.09670448303222656, -0.09182357788085938, -0.08694267272949219, -0.082061767578125, -0.07718086242675781, -0.07229995727539062, -0.06741905212402344, -0.06253814697265625, -0.05765724182128906, -0.052776336669921875, -0.04789543151855469, -0.0430145263671875, -0.03813362121582031, -0.033252716064453125, -0.028371810913085938, -0.02349090576171875, -0.018610000610351562, -0.013729095458984375, -0.008848190307617188, -0.00396728515625, 0.0009136199951171875, 0.005794525146484375, 0.010675430297851562, 0.01555633544921875, 0.020437240600585938, 0.025318145751953125, 0.030199050903320312, 0.0350799560546875, 0.03996086120605469, 0.044841766357421875, 0.04972267150878906, 0.05460357666015625, 0.05948448181152344, 0.06436538696289062, 0.06924629211425781, 0.074127197265625, 0.07900810241699219, 0.08388900756835938, 0.08876991271972656, 0.09365081787109375, 0.09853172302246094, 0.10341262817382812, 0.10829353332519531, 0.1131744384765625, 0.11805534362792969, 0.12293624877929688, 0.12781715393066406, 0.13269805908203125, 0.13757896423339844, 0.14245986938476562, 0.1473407745361328, 0.1522216796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 9.0, 16.0, 16.0, 33.0, 40.0, 65.0, 77.0, 95.0, 179.0, 114.0, 110.0, 75.0, 54.0, 47.0, 29.0, 10.0, 10.0, 7.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1370849609375, -0.13301849365234375, -0.1289520263671875, -0.12488555908203125, -0.120819091796875, -0.11675262451171875, -0.1126861572265625, -0.10861968994140625, -0.10455322265625, -0.10048675537109375, -0.0964202880859375, -0.09235382080078125, -0.088287353515625, -0.08422088623046875, -0.0801544189453125, -0.07608795166015625, -0.072021484375, -0.06795501708984375, -0.0638885498046875, -0.05982208251953125, -0.055755615234375, -0.05168914794921875, -0.0476226806640625, -0.04355621337890625, -0.03948974609375, -0.03542327880859375, -0.0313568115234375, -0.02729034423828125, -0.023223876953125, -0.01915740966796875, -0.0150909423828125, -0.01102447509765625, -0.0069580078125, -0.00289154052734375, 0.0011749267578125, 0.00524139404296875, 0.009307861328125, 0.01337432861328125, 0.0174407958984375, 0.02150726318359375, 0.02557373046875, 0.02964019775390625, 0.0337066650390625, 0.03777313232421875, 0.041839599609375, 0.04590606689453125, 0.0499725341796875, 0.05403900146484375, 0.05810546875, 0.06217193603515625, 0.0662384033203125, 0.07030487060546875, 0.074371337890625, 0.07843780517578125, 0.0825042724609375, 0.08657073974609375, 0.09063720703125, 0.09470367431640625, 0.0987701416015625, 0.10283660888671875, 0.106903076171875, 0.11096954345703125, 0.1150360107421875, 0.11910247802734375, 0.1231689453125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 12.0, 38.0, 97.0, 200.0, 263.0, 190.0, 119.0, 49.0, 19.0, 9.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1071416139602661, -0.9914671778678894, -0.8757927417755127, -0.7601182460784912, -0.6444438695907593, -0.5287693738937378, -0.4130949378013611, -0.2974205017089844, -0.18174606561660767, -0.06607162207365036, 0.049602821469306946, 0.16527727246284485, 0.28095170855522156, 0.39662617444992065, 0.5123006105422974, 0.6279750466346741, 0.7436494827270508, 0.8593239188194275, 0.9749983549118042, 1.0906728506088257, 1.2063472270965576, 1.322021722793579, 1.4376962184906006, 1.5533705949783325, 1.6690449714660645, 1.784719467163086, 1.9003938436508179, 2.01606822013855, 2.1317427158355713, 2.2474172115325928, 2.3630917072296143, 2.4787659645080566, 2.5944406986236572, 2.7101151943206787, 2.8257896900177, 2.9414639472961426, 3.057138442993164, 3.1728129386901855, 3.288487434387207, 3.4041619300842285, 3.519836187362671, 3.6355106830596924, 3.751185178756714, 3.8668594360351562, 3.9825339317321777, 4.098208427429199, 4.213882923126221, 4.329557418823242, 4.445231914520264, 4.560906410217285, 4.676580905914307, 4.792255401611328, 4.90792989730835, 5.023604393005371, 5.139278411865234, 5.254952907562256, 5.370627403259277, 5.486301898956299, 5.60197639465332, 5.717650890350342, 5.833325386047363, 5.948999404907227, 6.064673900604248, 6.1803483963012695, 6.296022891998291]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 11.0, 7.0, 13.0, 10.0, 20.0, 17.0, 21.0, 29.0, 25.0, 22.0, 25.0, 37.0, 32.0, 34.0, 47.0, 42.0, 46.0, 42.0, 38.0, 40.0, 41.0, 53.0, 26.0, 45.0, 33.0, 39.0, 35.0, 26.0, 18.0, 17.0, 25.0, 15.0, 21.0, 17.0, 9.0, 2.0, 5.0, 10.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.5122652053833008, -1.4709608554840088, -1.4296565055847168, -1.3883522748947144, -1.3470479249954224, -1.3057435750961304, -1.2644392251968384, -1.2231348752975464, -1.181830644607544, -1.140526294708252, -1.09922194480896, -1.0579177141189575, -1.0166133642196655, -0.9753090143203735, -0.9340046644210815, -0.8927003145217896, -0.8513959646224976, -0.8100916147232056, -0.7687873244285583, -0.7274829745292664, -0.6861786842346191, -0.6448743343353271, -0.6035699844360352, -0.5622656345367432, -0.520961344242096, -0.47965702414512634, -0.43835270404815674, -0.39704835414886475, -0.35574403405189514, -0.31443971395492554, -0.27313536405563354, -0.23183104395866394, -0.19052660465240479, -0.14922228455543518, -0.10791794955730438, -0.06661362200975418, -0.02530929446220398, 0.015995025634765625, 0.05729936063289642, 0.09860369563102722, 0.13990801572799683, 0.18121233582496643, 0.22251667082309723, 0.263821005821228, 0.30512532591819763, 0.34642964601516724, 0.38773399591445923, 0.42903831601142883, 0.47034263610839844, 0.5116469860076904, 0.5529512763023376, 0.5942556262016296, 0.6355599164962769, 0.6768642663955688, 0.7181686162948608, 0.7594729661941528, 0.8007772564888, 0.842081606388092, 0.8833858966827393, 0.9246902465820312, 0.9659945964813232, 1.0072989463806152, 1.0486031770706177, 1.0899075269699097, 1.1312118768692017]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 15.0, 16.0, 16.0, 27.0, 31.0, 50.0, 62.0, 119.0, 224.0, 357.0, 631.0, 1460.0, 4112.0, 13847.0, 1021078.0, 5064.0, 1687.0, 751.0, 430.0, 225.0, 123.0, 87.0, 49.0, 39.0, 23.0, 16.0, 11.0, 10.0, 6.0, 6.0, 6.0, 2.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4936835765838623, -2.4205307960510254, -2.3473782539367676, -2.2742257118225098, -2.201072931289673, -2.127920150756836, -2.054767608642578, -1.9816149473190308, -1.9084622859954834, -1.835309624671936, -1.7621569633483887, -1.6890043020248413, -1.615851640701294, -1.5426989793777466, -1.4695463180541992, -1.3963936567306519, -1.3232409954071045, -1.2500883340835571, -1.1769356727600098, -1.1037830114364624, -1.030630350112915, -0.9574776887893677, -0.8843250274658203, -0.811172366142273, -0.7380197048187256, -0.6648670434951782, -0.5917143821716309, -0.5185617208480835, -0.44540905952453613, -0.37225639820098877, -0.2991037368774414, -0.22595107555389404, -0.15279841423034668, -0.07964575290679932, -0.006493091583251953, 0.06665956974029541, 0.13981223106384277, 0.21296489238739014, 0.2861175537109375, 0.35927021503448486, 0.4324228763580322, 0.5055755376815796, 0.578728199005127, 0.6518808603286743, 0.7250335216522217, 0.798186182975769, 0.8713388442993164, 0.9444915056228638, 1.0176441669464111, 1.0907968282699585, 1.1639494895935059, 1.2371021509170532, 1.3102548122406006, 1.383407473564148, 1.4565601348876953, 1.5297127962112427, 1.60286545753479, 1.6760181188583374, 1.7491707801818848, 1.8223234415054321, 1.8954761028289795, 1.9686287641525269, 2.041781425476074, 2.114933967590332, 2.188086748123169]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 15.0, 26.0, 31.0, 50.0, 88.0, 153.0, 239.0, 337.0, 532.0, 957.0, 1885.0, 4371.0, 51436176.0, 18969.0, 3005.0, 1434.0, 764.0, 447.0, 293.0, 182.0, 123.0, 74.0, 58.0, 32.0, 20.0, 14.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.352810859680176, -10.995879173278809, -10.638947486877441, -10.282015800476074, -9.925085067749023, -9.568153381347656, -9.211221694946289, -8.854290008544922, -8.497358322143555, -8.140426635742188, -7.78349494934082, -7.426563739776611, -7.069632053375244, -6.712700366973877, -6.355769157409668, -5.998837471008301, -5.641905784606934, -5.284974098205566, -4.928042411804199, -4.57111120223999, -4.214179515838623, -3.857247829437256, -3.5003163814544678, -3.1433849334716797, -2.7864532470703125, -2.4295215606689453, -2.0725901126861572, -1.7156585454940796, -1.358726978302002, -1.0017954111099243, -0.6448638439178467, -0.2879323959350586, 0.069000244140625, 0.42593181133270264, 0.7828633785247803, 1.139794945716858, 1.4967265129089355, 1.8536580801010132, 2.210589647293091, 2.567521095275879, 2.924452781677246, 3.2813844680786133, 3.6383159160614014, 3.9952473640441895, 4.352179050445557, 4.709110736846924, 5.066041946411133, 5.4229736328125, 5.779905319213867, 6.136837005615234, 6.493768692016602, 6.8506999015808105, 7.207631587982178, 7.564563274383545, 7.921494483947754, 8.278426170349121, 8.635357856750488, 8.992289543151855, 9.349221229553223, 9.70615291595459, 10.06308364868164, 10.420015335083008, 10.776947021484375, 11.133878707885742, 11.49081039428711]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 8.0, 3.0, 12.0, 10.0, 27.0, 38.0, 67.0, 108.0, 210.0, 344.0, 480.0, 852.0, 1513.0, 2668.0, 4711.0, 8792.0, 16680.0, 32671.0, 64602.0, 125280.0, 232551.0, 387165.0, 748690.0, 3455405.0, 505303.0, 319696.0, 183115.0, 96828.0, 49413.0, 25049.0, 13124.0, 7046.0, 3950.0, 2031.0, 1212.0, 731.0, 439.0, 249.0, 146.0, 80.0, 54.0, 36.0, 19.0, 8.0, 13.0, 10.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.99169921875, -0.9600143432617188, -0.9283294677734375, -0.8966445922851562, -0.864959716796875, -0.8332748413085938, -0.8015899658203125, -0.7699050903320312, -0.73822021484375, -0.7065353393554688, -0.6748504638671875, -0.6431655883789062, -0.611480712890625, -0.5797958374023438, -0.5481109619140625, -0.5164260864257812, -0.4847412109375, -0.45305633544921875, -0.4213714599609375, -0.38968658447265625, -0.358001708984375, -0.32631683349609375, -0.2946319580078125, -0.26294708251953125, -0.23126220703125, -0.19957733154296875, -0.1678924560546875, -0.13620758056640625, -0.104522705078125, -0.07283782958984375, -0.0411529541015625, -0.00946807861328125, 0.022216796875, 0.05390167236328125, 0.0855865478515625, 0.11727142333984375, 0.148956298828125, 0.18064117431640625, 0.2123260498046875, 0.24401092529296875, 0.27569580078125, 0.30738067626953125, 0.3390655517578125, 0.37075042724609375, 0.402435302734375, 0.43412017822265625, 0.4658050537109375, 0.49748992919921875, 0.5291748046875, 0.5608596801757812, 0.5925445556640625, 0.6242294311523438, 0.655914306640625, 0.6875991821289062, 0.7192840576171875, 0.7509689331054688, 0.78265380859375, 0.8143386840820312, 0.8460235595703125, 0.8777084350585938, 0.909393310546875, 0.9410781860351562, 0.9727630615234375, 1.0044479370117188, 1.0361328125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 6.0, 4.0, 8.0, 11.0, 15.0, 18.0, 16.0, 13.0, 20.0, 23.0, 36.0, 39.0, 31.0, 29.0, 37.0, 38.0, 31.0, 62.0, 200.0, 871.0, 100.0, 46.0, 43.0, 36.0, 31.0, 39.0, 31.0, 28.0, 28.0, 27.0, 19.0, 19.0, 14.0, 9.0, 7.0, 7.0, 10.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.13671875, -6.9013671875, -6.666015625, -6.4306640625, -6.1953125, -5.9599609375, -5.724609375, -5.4892578125, -5.25390625, -5.0185546875, -4.783203125, -4.5478515625, -4.3125, -4.0771484375, -3.841796875, -3.6064453125, -3.37109375, -3.1357421875, -2.900390625, -2.6650390625, -2.4296875, -2.1943359375, -1.958984375, -1.7236328125, -1.48828125, -1.2529296875, -1.017578125, -0.7822265625, -0.546875, -0.3115234375, -0.076171875, 0.1591796875, 0.39453125, 0.6298828125, 0.865234375, 1.1005859375, 1.3359375, 1.5712890625, 1.806640625, 2.0419921875, 2.27734375, 2.5126953125, 2.748046875, 2.9833984375, 3.21875, 3.4541015625, 3.689453125, 3.9248046875, 4.16015625, 4.3955078125, 4.630859375, 4.8662109375, 5.1015625, 5.3369140625, 5.572265625, 5.8076171875, 6.04296875, 6.2783203125, 6.513671875, 6.7490234375, 6.984375, 7.2197265625, 7.455078125, 7.6904296875, 7.92578125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 10.0, 5.0, 13.0, 25.0, 46.0, 44.0, 101.0, 138.0, 204.0, 329.0, 517.0, 828.0, 1280.0, 1871.0, 2976.0, 4693.0, 7404.0, 11253.0, 17983.0, 28303.0, 43888.0, 66366.0, 99190.0, 141712.0, 193871.0, 249595.0, 307774.0, 1071633.0, 2705785.0, 350135.0, 271931.0, 215431.0, 160706.0, 113821.0, 77652.0, 51324.0, 33133.0, 21346.0, 13609.0, 8942.0, 5483.0, 3567.0, 2268.0, 1441.0, 1017.0, 687.0, 380.0, 263.0, 183.0, 112.0, 72.0, 37.0, 23.0, 19.0, 13.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.468505859375, -0.4534873962402344, -0.43846893310546875, -0.4234504699707031, -0.4084320068359375, -0.3934135437011719, -0.37839508056640625, -0.3633766174316406, -0.348358154296875, -0.3333396911621094, -0.31832122802734375, -0.3033027648925781, -0.2882843017578125, -0.2732658386230469, -0.25824737548828125, -0.24322891235351562, -0.22821044921875, -0.21319198608398438, -0.19817352294921875, -0.18315505981445312, -0.1681365966796875, -0.15311813354492188, -0.13809967041015625, -0.12308120727539062, -0.108062744140625, -0.09304428100585938, -0.07802581787109375, -0.06300735473632812, -0.0479888916015625, -0.032970428466796875, -0.01795196533203125, -0.002933502197265625, 0.0120849609375, 0.027103424072265625, 0.04212188720703125, 0.057140350341796875, 0.0721588134765625, 0.08717727661132812, 0.10219573974609375, 0.11721420288085938, 0.132232666015625, 0.14725112915039062, 0.16226959228515625, 0.17728805541992188, 0.1923065185546875, 0.20732498168945312, 0.22234344482421875, 0.23736190795898438, 0.25238037109375, 0.2673988342285156, 0.28241729736328125, 0.2974357604980469, 0.3124542236328125, 0.3274726867675781, 0.34249114990234375, 0.3575096130371094, 0.372528076171875, 0.3875465393066406, 0.40256500244140625, 0.4175834655761719, 0.4326019287109375, 0.4476203918457031, 0.46263885498046875, 0.4776573181152344, 0.49267578125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 8.0, 17.0, 5.0, 11.0, 13.0, 13.0, 18.0, 19.0, 28.0, 24.0, 16.0, 30.0, 45.0, 35.0, 45.0, 47.0, 61.0, 635.0, 465.0, 46.0, 42.0, 45.0, 35.0, 35.0, 30.0, 29.0, 40.0, 18.0, 24.0, 27.0, 20.0, 18.0, 11.0, 12.0, 16.0, 7.0, 4.0, 4.0, 9.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.328125, -6.14666748046875, -5.9652099609375, -5.78375244140625, -5.602294921875, -5.42083740234375, -5.2393798828125, -5.05792236328125, -4.87646484375, -4.69500732421875, -4.5135498046875, -4.33209228515625, -4.150634765625, -3.96917724609375, -3.7877197265625, -3.60626220703125, -3.4248046875, -3.24334716796875, -3.0618896484375, -2.88043212890625, -2.698974609375, -2.51751708984375, -2.3360595703125, -2.15460205078125, -1.97314453125, -1.79168701171875, -1.6102294921875, -1.42877197265625, -1.247314453125, -1.06585693359375, -0.8843994140625, -0.70294189453125, -0.521484375, -0.34002685546875, -0.1585693359375, 0.02288818359375, 0.204345703125, 0.38580322265625, 0.5672607421875, 0.74871826171875, 0.93017578125, 1.11163330078125, 1.2930908203125, 1.47454833984375, 1.656005859375, 1.83746337890625, 2.0189208984375, 2.20037841796875, 2.3818359375, 2.56329345703125, 2.7447509765625, 2.92620849609375, 3.107666015625, 3.28912353515625, 3.4705810546875, 3.65203857421875, 3.83349609375, 4.01495361328125, 4.1964111328125, 4.37786865234375, 4.559326171875, 4.74078369140625, 4.9222412109375, 5.10369873046875, 5.28515625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 8.0, 17.0, 11.0, 28.0, 28.0, 45.0, 52.0, 81.0, 110.0, 135.0, 156.0, 214.0, 328.0, 423.0, 589.0, 841.0, 1318.0, 1902.0, 3015.0, 5546.0, 10888.0, 23024.0, 51172.0, 108644.0, 965297.0, 4893232.0, 116614.0, 55231.0, 25013.0, 11674.0, 5889.0, 3298.0, 1995.0, 1339.0, 947.0, 621.0, 458.0, 341.0, 226.0, 155.0, 124.0, 81.0, 81.0, 52.0, 52.0, 38.0, 27.0, 18.0, 14.0, 13.0, 6.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0], "bins": [-1.6728515625, -1.62066650390625, -1.5684814453125, -1.51629638671875, -1.464111328125, -1.41192626953125, -1.3597412109375, -1.30755615234375, -1.25537109375, -1.20318603515625, -1.1510009765625, -1.09881591796875, -1.046630859375, -0.99444580078125, -0.9422607421875, -0.89007568359375, -0.837890625, -0.78570556640625, -0.7335205078125, -0.68133544921875, -0.629150390625, -0.57696533203125, -0.5247802734375, -0.47259521484375, -0.42041015625, -0.36822509765625, -0.3160400390625, -0.26385498046875, -0.211669921875, -0.15948486328125, -0.1072998046875, -0.05511474609375, -0.0029296875, 0.04925537109375, 0.1014404296875, 0.15362548828125, 0.205810546875, 0.25799560546875, 0.3101806640625, 0.36236572265625, 0.41455078125, 0.46673583984375, 0.5189208984375, 0.57110595703125, 0.623291015625, 0.67547607421875, 0.7276611328125, 0.77984619140625, 0.83203125, 0.88421630859375, 0.9364013671875, 0.98858642578125, 1.040771484375, 1.09295654296875, 1.1451416015625, 1.19732666015625, 1.24951171875, 1.30169677734375, 1.3538818359375, 1.40606689453125, 1.458251953125, 1.51043701171875, 1.5626220703125, 1.61480712890625, 1.6669921875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 6.0, 8.0, 8.0, 5.0, 14.0, 17.0, 14.0, 22.0, 33.0, 29.0, 21.0, 42.0, 36.0, 28.0, 35.0, 41.0, 50.0, 113.0, 884.0, 160.0, 48.0, 34.0, 40.0, 30.0, 33.0, 32.0, 39.0, 25.0, 27.0, 24.0, 15.0, 10.0, 17.0, 14.0, 15.0, 4.0, 4.0, 6.0, 2.0, 11.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.69140625, -5.52655029296875, -5.3616943359375, -5.19683837890625, -5.031982421875, -4.86712646484375, -4.7022705078125, -4.53741455078125, -4.37255859375, -4.20770263671875, -4.0428466796875, -3.87799072265625, -3.713134765625, -3.54827880859375, -3.3834228515625, -3.21856689453125, -3.0537109375, -2.88885498046875, -2.7239990234375, -2.55914306640625, -2.394287109375, -2.22943115234375, -2.0645751953125, -1.89971923828125, -1.73486328125, -1.57000732421875, -1.4051513671875, -1.24029541015625, -1.075439453125, -0.91058349609375, -0.7457275390625, -0.58087158203125, -0.416015625, -0.25115966796875, -0.0863037109375, 0.07855224609375, 0.243408203125, 0.40826416015625, 0.5731201171875, 0.73797607421875, 0.90283203125, 1.06768798828125, 1.2325439453125, 1.39739990234375, 1.562255859375, 1.72711181640625, 1.8919677734375, 2.05682373046875, 2.2216796875, 2.38653564453125, 2.5513916015625, 2.71624755859375, 2.881103515625, 3.04595947265625, 3.2108154296875, 3.37567138671875, 3.54052734375, 3.70538330078125, 3.8702392578125, 4.03509521484375, 4.199951171875, 4.36480712890625, 4.5296630859375, 4.69451904296875, 4.859375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 13.0, 20.0, 15.0, 23.0, 32.0, 43.0, 48.0, 58.0, 123.0, 183.0, 111.0, 66.0, 58.0, 46.0, 34.0, 28.0, 11.0, 20.0, 13.0, 13.0, 3.0, 6.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.38465881347656, -37.480552673339844, -36.57645034790039, -35.67234420776367, -34.76824188232422, -33.8641357421875, -32.96003341674805, -32.05592727661133, -31.151823043823242, -30.247718811035156, -29.34361457824707, -28.439510345458984, -27.535404205322266, -26.631301879882812, -25.727195739746094, -24.823091506958008, -23.918987274169922, -23.014883041381836, -22.11077880859375, -21.206674575805664, -20.302570343017578, -19.39846420288086, -18.494359970092773, -17.590255737304688, -16.6861515045166, -15.782047271728516, -14.87794303894043, -13.973837852478027, -13.069733619689941, -12.165629386901855, -11.261524200439453, -10.357419967651367, -9.453313827514648, -8.549209594726562, -7.645104885101318, -6.741000175476074, -5.836895942687988, -4.932791709899902, -4.028687000274658, -3.124582290649414, -2.220478057861328, -1.316373586654663, -0.41226911544799805, 0.491835355758667, 1.395939826965332, 2.300044059753418, 3.204148769378662, 4.108253479003906, 5.012357711791992, 5.916461944580078, 6.820566654205322, 7.724671363830566, 8.628775596618652, 9.532879829406738, 10.43698501586914, 11.341089248657227, 12.245193481445312, 13.149297714233398, 14.053401947021484, 14.957507133483887, 15.861611366271973, 16.765716552734375, 17.66982078552246, 18.573925018310547, 19.478029251098633]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 7.0, 5.0, 5.0, 4.0, 10.0, 15.0, 11.0, 22.0, 19.0, 17.0, 19.0, 31.0, 31.0, 34.0, 48.0, 73.0, 88.0, 115.0, 92.0, 51.0, 48.0, 41.0, 36.0, 26.0, 24.0, 22.0, 14.0, 14.0, 7.0, 13.0, 10.0, 4.0, 9.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.30535125732422, -64.30560302734375, -62.30585861206055, -60.306114196777344, -58.306365966796875, -56.30662155151367, -54.30687713623047, -52.30712890625, -50.3073844909668, -48.307640075683594, -46.307891845703125, -44.30814743041992, -42.30840301513672, -40.30865478515625, -38.30891036987305, -36.309165954589844, -34.309417724609375, -32.30967330932617, -30.309925079345703, -28.3101806640625, -26.310434341430664, -24.310688018798828, -22.310943603515625, -20.31119728088379, -18.311450958251953, -16.311704635620117, -14.311959266662598, -12.312213897705078, -10.312467575073242, -8.312721252441406, -6.312975883483887, -4.313230514526367, -2.313488006591797, -0.31374216079711914, 1.6860036849975586, 3.6857495307922363, 5.685495376586914, 7.68524169921875, 9.68498706817627, 11.684732437133789, 13.684478759765625, 15.684225082397461, 17.683971405029297, 19.6837158203125, 21.683462142944336, 23.683208465576172, 25.682952880859375, 27.68269920349121, 29.682445526123047, 31.682191848754883, 33.68193817138672, 35.68168258666992, 37.681427001953125, 39.681175231933594, 41.6809196472168, 43.6806640625, 45.68041229248047, 47.68015670776367, 49.67990493774414, 51.679649353027344, 53.67939758300781, 55.679141998291016, 57.67888641357422, 59.67863464355469, 61.67837905883789]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 1.0, 5.0, 9.0, 17.0, 14.0, 21.0, 34.0, 61.0, 95.0, 115.0, 168.0, 245.0, 406.0, 694.0, 1116.0, 1969.0, 3681.0, 7889.0, 19253.0, 68017.0, 3066853.0, 931969.0, 57839.0, 17726.0, 7268.0, 3715.0, 1980.0, 1141.0, 665.0, 443.0, 273.0, 196.0, 116.0, 86.0, 64.0, 39.0, 24.0, 20.0, 24.0, 8.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11614990234375, -0.11227130889892578, -0.10839271545410156, -0.10451412200927734, -0.10063552856445312, -0.0967569351196289, -0.09287834167480469, -0.08899974822998047, -0.08512115478515625, -0.08124256134033203, -0.07736396789550781, -0.0734853744506836, -0.06960678100585938, -0.06572818756103516, -0.06184959411621094, -0.05797100067138672, -0.0540924072265625, -0.05021381378173828, -0.04633522033691406, -0.042456626892089844, -0.038578033447265625, -0.034699440002441406, -0.030820846557617188, -0.02694225311279297, -0.02306365966796875, -0.01918506622314453, -0.015306472778320312, -0.011427879333496094, -0.007549285888671875, -0.0036706924438476562, 0.0002079010009765625, 0.004086494445800781, 0.007965087890625, 0.011843681335449219, 0.015722274780273438, 0.019600868225097656, 0.023479461669921875, 0.027358055114746094, 0.031236648559570312, 0.03511524200439453, 0.03899383544921875, 0.04287242889404297, 0.04675102233886719, 0.050629615783691406, 0.054508209228515625, 0.058386802673339844, 0.06226539611816406, 0.06614398956298828, 0.0700225830078125, 0.07390117645263672, 0.07777976989746094, 0.08165836334228516, 0.08553695678710938, 0.0894155502319336, 0.09329414367675781, 0.09717273712158203, 0.10105133056640625, 0.10492992401123047, 0.10880851745605469, 0.1126871109008789, 0.11656570434570312, 0.12044429779052734, 0.12432289123535156, 0.12820148468017578, 0.132080078125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 1.0, 3.0, 9.0, 8.0, 9.0, 15.0, 20.0, 8.0, 28.0, 35.0, 35.0, 64.0, 110.0, 288.0, 92.0, 69.0, 49.0, 37.0, 23.0, 18.0, 17.0, 10.0, 12.0, 6.0, 8.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056488037109375, -0.054802894592285156, -0.05311775207519531, -0.05143260955810547, -0.049747467041015625, -0.04806232452392578, -0.04637718200683594, -0.044692039489746094, -0.04300689697265625, -0.041321754455566406, -0.03963661193847656, -0.03795146942138672, -0.036266326904296875, -0.03458118438720703, -0.03289604187011719, -0.031210899353027344, -0.0295257568359375, -0.027840614318847656, -0.026155471801757812, -0.02447032928466797, -0.022785186767578125, -0.02110004425048828, -0.019414901733398438, -0.017729759216308594, -0.01604461669921875, -0.014359474182128906, -0.012674331665039062, -0.010989189147949219, -0.009304046630859375, -0.007618904113769531, -0.0059337615966796875, -0.004248619079589844, -0.0025634765625, -0.0008783340454101562, 0.0008068084716796875, 0.0024919509887695312, 0.004177093505859375, 0.005862236022949219, 0.0075473785400390625, 0.009232521057128906, 0.01091766357421875, 0.012602806091308594, 0.014287948608398438, 0.01597309112548828, 0.017658233642578125, 0.01934337615966797, 0.021028518676757812, 0.022713661193847656, 0.0243988037109375, 0.026083946228027344, 0.027769088745117188, 0.02945423126220703, 0.031139373779296875, 0.03282451629638672, 0.03450965881347656, 0.036194801330566406, 0.03787994384765625, 0.039565086364746094, 0.04125022888183594, 0.04293537139892578, 0.044620513916015625, 0.04630565643310547, 0.04799079895019531, 0.049675941467285156, 0.051361083984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 11.0, 25.0, 22.0, 32.0, 47.0, 88.0, 163.0, 265.0, 564.0, 1149.0, 2682.0, 6895.0, 21692.0, 100490.0, 1060386.0, 2768791.0, 183269.0, 32539.0, 9163.0, 3313.0, 1350.0, 629.0, 336.0, 156.0, 77.0, 44.0, 33.0, 18.0, 14.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12371826171875, -0.11998748779296875, -0.1162567138671875, -0.11252593994140625, -0.108795166015625, -0.10506439208984375, -0.1013336181640625, -0.09760284423828125, -0.0938720703125, -0.09014129638671875, -0.0864105224609375, -0.08267974853515625, -0.078948974609375, -0.07521820068359375, -0.0714874267578125, -0.06775665283203125, -0.06402587890625, -0.06029510498046875, -0.0565643310546875, -0.05283355712890625, -0.049102783203125, -0.04537200927734375, -0.0416412353515625, -0.03791046142578125, -0.0341796875, -0.03044891357421875, -0.0267181396484375, -0.02298736572265625, -0.019256591796875, -0.01552581787109375, -0.0117950439453125, -0.00806427001953125, -0.00433349609375, -0.00060272216796875, 0.0031280517578125, 0.00685882568359375, 0.010589599609375, 0.01432037353515625, 0.0180511474609375, 0.02178192138671875, 0.0255126953125, 0.02924346923828125, 0.0329742431640625, 0.03670501708984375, 0.040435791015625, 0.04416656494140625, 0.0478973388671875, 0.05162811279296875, 0.05535888671875, 0.05908966064453125, 0.0628204345703125, 0.06655120849609375, 0.070281982421875, 0.07401275634765625, 0.0777435302734375, 0.08147430419921875, 0.085205078125, 0.08893585205078125, 0.0926666259765625, 0.09639739990234375, 0.100128173828125, 0.10385894775390625, 0.1075897216796875, 0.11132049560546875, 0.11505126953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 9.0, 3.0, 9.0, 6.0, 7.0, 18.0, 11.0, 21.0, 37.0, 50.0, 65.0, 101.0, 154.0, 302.0, 619.0, 1113.0, 714.0, 307.0, 198.0, 120.0, 66.0, 48.0, 32.0, 22.0, 12.0, 8.0, 3.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050994873046875, -0.04938220977783203, -0.04776954650878906, -0.046156883239746094, -0.044544219970703125, -0.042931556701660156, -0.04131889343261719, -0.03970623016357422, -0.03809356689453125, -0.03648090362548828, -0.03486824035644531, -0.033255577087402344, -0.031642913818359375, -0.030030250549316406, -0.028417587280273438, -0.02680492401123047, -0.0251922607421875, -0.02357959747314453, -0.021966934204101562, -0.020354270935058594, -0.018741607666015625, -0.017128944396972656, -0.015516281127929688, -0.013903617858886719, -0.01229095458984375, -0.010678291320800781, -0.009065628051757812, -0.007452964782714844, -0.005840301513671875, -0.004227638244628906, -0.0026149749755859375, -0.0010023117065429688, 0.0006103515625, 0.0022230148315429688, 0.0038356781005859375, 0.005448341369628906, 0.007061004638671875, 0.008673667907714844, 0.010286331176757812, 0.011898994445800781, 0.01351165771484375, 0.015124320983886719, 0.016736984252929688, 0.018349647521972656, 0.019962310791015625, 0.021574974060058594, 0.023187637329101562, 0.02480030059814453, 0.0264129638671875, 0.02802562713623047, 0.029638290405273438, 0.031250953674316406, 0.032863616943359375, 0.034476280212402344, 0.03608894348144531, 0.03770160675048828, 0.03931427001953125, 0.04092693328857422, 0.04253959655761719, 0.044152259826660156, 0.045764923095703125, 0.047377586364746094, 0.04899024963378906, 0.05060291290283203, 0.052215576171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 12.0, 36.0, 186.0, 506.0, 224.0, 26.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5204178690910339, -0.4938589632511139, -0.46730005741119385, -0.4407411217689514, -0.41418221592903137, -0.38762331008911133, -0.3610643744468689, -0.33450546860694885, -0.3079465627670288, -0.28138765692710876, -0.2548287510871887, -0.2282698154449463, -0.20171090960502625, -0.1751520037651062, -0.14859308302402496, -0.12203416228294373, -0.09547525644302368, -0.06891634315252304, -0.0423574298620224, -0.01579851657152176, 0.010760396718978882, 0.037319302558898926, 0.06387822329998016, 0.0904371440410614, 0.11699604988098145, 0.1435549557209015, 0.17011387646198273, 0.19667279720306396, 0.223231703042984, 0.24979060888290405, 0.2763495445251465, 0.30290845036506653, 0.3294672966003418, 0.35602620244026184, 0.3825851082801819, 0.4091440439224243, 0.43570294976234436, 0.4622618556022644, 0.48882079124450684, 0.5153796672821045, 0.5419386029243469, 0.5684975385665894, 0.595056414604187, 0.6216153502464294, 0.6481742858886719, 0.6747331619262695, 0.701292097568512, 0.7278510332107544, 0.754409909248352, 0.7809688448905945, 0.8075277209281921, 0.8340866565704346, 0.8606455326080322, 0.8872044682502747, 0.9137634038925171, 0.9403222799301147, 0.9668812155723572, 0.9934401512145996, 1.0199990272521973, 1.046557903289795, 1.0731168985366821, 1.0996757745742798, 1.1262346506118774, 1.1527936458587646, 1.1793525218963623]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 8.0, 5.0, 8.0, 8.0, 7.0, 12.0, 14.0, 30.0, 37.0, 45.0, 50.0, 73.0, 65.0, 56.0, 82.0, 67.0, 79.0, 67.0, 54.0, 47.0, 47.0, 49.0, 21.0, 10.0, 15.0, 11.0, 5.0, 8.0, 1.0, 4.0, 3.0, 2.0, 7.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.27869975566864014, -0.2711939811706543, -0.26368820667266846, -0.2561824321746826, -0.24867665767669678, -0.24117088317871094, -0.2336651086807251, -0.22615933418273926, -0.21865355968475342, -0.21114778518676758, -0.20364201068878174, -0.1961362361907959, -0.18863046169281006, -0.18112468719482422, -0.17361891269683838, -0.16611313819885254, -0.1586073487997055, -0.15110157430171967, -0.14359579980373383, -0.13609002530574799, -0.12858425080776215, -0.1210784763097763, -0.11357269436120987, -0.10606691986322403, -0.09856114536523819, -0.09105537086725235, -0.08354959636926651, -0.07604381442070007, -0.06853803992271423, -0.06103226915001869, -0.053526490926742554, -0.046020716428756714, -0.038514941930770874, -0.031009167432785034, -0.023503391072154045, -0.015997614711523056, -0.008491840213537216, -0.0009860657155513763, 0.006519712507724762, 0.014025487005710602, 0.02153126150369644, 0.02903703600168228, 0.03654281049966812, 0.04404858872294426, 0.0515543632209301, 0.05906013771891594, 0.06656591594219208, 0.07407169044017792, 0.08157746493816376, 0.0890832394361496, 0.09658901393413544, 0.10409478843212128, 0.11160056293010712, 0.11910633742809296, 0.12661212682724, 0.13411790132522583, 0.14162367582321167, 0.1491294503211975, 0.15663522481918335, 0.1641409993171692, 0.17164677381515503, 0.17915254831314087, 0.1866583228111267, 0.19416409730911255, 0.2016698718070984]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 16.0, 16.0, 14.0, 26.0, 34.0, 43.0, 62.0, 103.0, 102.0, 156.0, 232.0, 323.0, 455.0, 686.0, 969.0, 1596.0, 2574.0, 4154.0, 7147.0, 12799.0, 24611.0, 55024.0, 172675.0, 568454.0, 108857.0, 41049.0, 19929.0, 10488.0, 5894.0, 3507.0, 2183.0, 1448.0, 903.0, 597.0, 442.0, 288.0, 185.0, 159.0, 96.0, 68.0, 49.0, 36.0, 35.0, 15.0, 18.0, 11.0, 3.0, 11.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0], "bins": [-0.143310546875, -0.13901138305664062, -0.13471221923828125, -0.13041305541992188, -0.1261138916015625, -0.12181472778320312, -0.11751556396484375, -0.11321640014648438, -0.108917236328125, -0.10461807250976562, -0.10031890869140625, -0.09601974487304688, -0.0917205810546875, -0.08742141723632812, -0.08312225341796875, -0.07882308959960938, -0.07452392578125, -0.07022476196289062, -0.06592559814453125, -0.061626434326171875, -0.0573272705078125, -0.053028106689453125, -0.04872894287109375, -0.044429779052734375, -0.040130615234375, -0.035831451416015625, -0.03153228759765625, -0.027233123779296875, -0.0229339599609375, -0.018634796142578125, -0.01433563232421875, -0.010036468505859375, -0.0057373046875, -0.001438140869140625, 0.00286102294921875, 0.007160186767578125, 0.0114593505859375, 0.015758514404296875, 0.02005767822265625, 0.024356842041015625, 0.028656005859375, 0.032955169677734375, 0.03725433349609375, 0.041553497314453125, 0.0458526611328125, 0.050151824951171875, 0.05445098876953125, 0.058750152587890625, 0.06304931640625, 0.06734848022460938, 0.07164764404296875, 0.07594680786132812, 0.0802459716796875, 0.08454513549804688, 0.08884429931640625, 0.09314346313476562, 0.097442626953125, 0.10174179077148438, 0.10604095458984375, 0.11034011840820312, 0.1146392822265625, 0.11893844604492188, 0.12323760986328125, 0.12753677368164062, 0.1318359375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 6.0, 3.0, 3.0, 5.0, 9.0, 14.0, 10.0, 16.0, 18.0, 20.0, 21.0, 34.0, 47.0, 66.0, 177.0, 217.0, 79.0, 61.0, 41.0, 39.0, 17.0, 20.0, 17.0, 12.0, 11.0, 11.0, 8.0, 2.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0523681640625, -0.05079507827758789, -0.04922199249267578, -0.04764890670776367, -0.04607582092285156, -0.04450273513793945, -0.042929649353027344, -0.041356563568115234, -0.039783477783203125, -0.038210391998291016, -0.036637306213378906, -0.0350642204284668, -0.03349113464355469, -0.03191804885864258, -0.03034496307373047, -0.02877187728881836, -0.02719879150390625, -0.02562570571899414, -0.02405261993408203, -0.022479534149169922, -0.020906448364257812, -0.019333362579345703, -0.017760276794433594, -0.016187191009521484, -0.014614105224609375, -0.013041019439697266, -0.011467933654785156, -0.009894847869873047, -0.008321762084960938, -0.006748676300048828, -0.005175590515136719, -0.0036025047302246094, -0.0020294189453125, -0.0004563331604003906, 0.0011167526245117188, 0.002689838409423828, 0.0042629241943359375, 0.005836009979248047, 0.007409095764160156, 0.008982181549072266, 0.010555267333984375, 0.012128353118896484, 0.013701438903808594, 0.015274524688720703, 0.016847610473632812, 0.018420696258544922, 0.01999378204345703, 0.02156686782836914, 0.02313995361328125, 0.02471303939819336, 0.02628612518310547, 0.027859210968017578, 0.029432296752929688, 0.031005382537841797, 0.032578468322753906, 0.034151554107666016, 0.035724639892578125, 0.037297725677490234, 0.038870811462402344, 0.04044389724731445, 0.04201698303222656, 0.04359006881713867, 0.04516315460205078, 0.04673624038696289, 0.048309326171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 10.0, 11.0, 16.0, 16.0, 29.0, 39.0, 48.0, 90.0, 109.0, 172.0, 327.0, 543.0, 1085.0, 2373.0, 6085.0, 16793.0, 57394.0, 247730.0, 508974.0, 149356.0, 37186.0, 11804.0, 4484.0, 1799.0, 897.0, 433.0, 278.0, 141.0, 102.0, 45.0, 48.0, 29.0, 25.0, 27.0, 14.0, 10.0, 5.0, 8.0, 4.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11474609375, -0.111083984375, -0.107421875, -0.103759765625, -0.10009765625, -0.096435546875, -0.0927734375, -0.089111328125, -0.08544921875, -0.081787109375, -0.078125, -0.074462890625, -0.07080078125, -0.067138671875, -0.0634765625, -0.059814453125, -0.05615234375, -0.052490234375, -0.048828125, -0.045166015625, -0.04150390625, -0.037841796875, -0.0341796875, -0.030517578125, -0.02685546875, -0.023193359375, -0.01953125, -0.015869140625, -0.01220703125, -0.008544921875, -0.0048828125, -0.001220703125, 0.00244140625, 0.006103515625, 0.009765625, 0.013427734375, 0.01708984375, 0.020751953125, 0.0244140625, 0.028076171875, 0.03173828125, 0.035400390625, 0.0390625, 0.042724609375, 0.04638671875, 0.050048828125, 0.0537109375, 0.057373046875, 0.06103515625, 0.064697265625, 0.068359375, 0.072021484375, 0.07568359375, 0.079345703125, 0.0830078125, 0.086669921875, 0.09033203125, 0.093994140625, 0.09765625, 0.101318359375, 0.10498046875, 0.108642578125, 0.1123046875, 0.115966796875, 0.11962890625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 9.0, 13.0, 8.0, 19.0, 19.0, 24.0, 30.0, 31.0, 33.0, 27.0, 38.0, 30.0, 28.0, 48.0, 39.0, 47.0, 37.0, 36.0, 52.0, 33.0, 36.0, 30.0, 30.0, 44.0, 44.0, 28.0, 30.0, 18.0, 20.0, 21.0, 17.0, 18.0, 13.0, 6.0, 9.0, 5.0, 6.0, 6.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15869140625, -0.15356826782226562, -0.14844512939453125, -0.14332199096679688, -0.1381988525390625, -0.13307571411132812, -0.12795257568359375, -0.12282943725585938, -0.117706298828125, -0.11258316040039062, -0.10746002197265625, -0.10233688354492188, -0.0972137451171875, -0.09209060668945312, -0.08696746826171875, -0.08184432983398438, -0.07672119140625, -0.07159805297851562, -0.06647491455078125, -0.061351776123046875, -0.0562286376953125, -0.051105499267578125, -0.04598236083984375, -0.040859222412109375, -0.035736083984375, -0.030612945556640625, -0.02548980712890625, -0.020366668701171875, -0.0152435302734375, -0.010120391845703125, -0.00499725341796875, 0.000125885009765625, 0.0052490234375, 0.010372161865234375, 0.01549530029296875, 0.020618438720703125, 0.0257415771484375, 0.030864715576171875, 0.03598785400390625, 0.041110992431640625, 0.046234130859375, 0.051357269287109375, 0.05648040771484375, 0.061603546142578125, 0.0667266845703125, 0.07184982299804688, 0.07697296142578125, 0.08209609985351562, 0.08721923828125, 0.09234237670898438, 0.09746551513671875, 0.10258865356445312, 0.1077117919921875, 0.11283493041992188, 0.11795806884765625, 0.12308120727539062, 0.128204345703125, 0.13332748413085938, 0.13845062255859375, 0.14357376098632812, 0.1486968994140625, 0.15382003784179688, 0.15894317626953125, 0.16406631469726562, 0.169189453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 13.0, 18.0, 26.0, 45.0, 60.0, 92.0, 176.0, 278.0, 524.0, 1031.0, 2368.0, 6036.0, 20288.0, 121087.0, 670870.0, 186366.0, 26567.0, 7341.0, 2769.0, 1215.0, 570.0, 308.0, 182.0, 100.0, 65.0, 37.0, 30.0, 26.0, 11.0, 10.0, 9.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10418701171875, -0.10117530822753906, -0.09816360473632812, -0.09515190124511719, -0.09214019775390625, -0.08912849426269531, -0.08611679077148438, -0.08310508728027344, -0.0800933837890625, -0.07708168029785156, -0.07406997680664062, -0.07105827331542969, -0.06804656982421875, -0.06503486633300781, -0.062023162841796875, -0.05901145935058594, -0.055999755859375, -0.05298805236816406, -0.049976348876953125, -0.04696464538574219, -0.04395294189453125, -0.04094123840332031, -0.037929534912109375, -0.03491783142089844, -0.0319061279296875, -0.028894424438476562, -0.025882720947265625, -0.022871017456054688, -0.01985931396484375, -0.016847610473632812, -0.013835906982421875, -0.010824203491210938, -0.0078125, -0.0048007965087890625, -0.001789093017578125, 0.0012226104736328125, 0.00423431396484375, 0.0072460174560546875, 0.010257720947265625, 0.013269424438476562, 0.0162811279296875, 0.019292831420898438, 0.022304534912109375, 0.025316238403320312, 0.02832794189453125, 0.03133964538574219, 0.034351348876953125, 0.03736305236816406, 0.040374755859375, 0.04338645935058594, 0.046398162841796875, 0.04940986633300781, 0.05242156982421875, 0.05543327331542969, 0.058444976806640625, 0.06145668029785156, 0.0644683837890625, 0.06748008728027344, 0.07049179077148438, 0.07350349426269531, 0.07651519775390625, 0.07952690124511719, 0.08253860473632812, 0.08555030822753906, 0.08856201171875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 7.0, 5.0, 8.0, 18.0, 23.0, 37.0, 41.0, 42.0, 57.0, 73.0, 92.0, 94.0, 63.0, 91.0, 68.0, 64.0, 65.0, 40.0, 31.0, 18.0, 18.0, 12.0, 10.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6193599700927734e-05, -4.4547952711582184e-05, -4.290230572223663e-05, -4.125665873289108e-05, -3.961101174354553e-05, -3.796536475419998e-05, -3.631971776485443e-05, -3.467407077550888e-05, -3.302842378616333e-05, -3.138277679681778e-05, -2.973712980747223e-05, -2.809148281812668e-05, -2.6445835828781128e-05, -2.4800188839435577e-05, -2.3154541850090027e-05, -2.1508894860744476e-05, -1.9863247871398926e-05, -1.8217600882053375e-05, -1.6571953892707825e-05, -1.4926306903362274e-05, -1.3280659914016724e-05, -1.1635012924671173e-05, -9.989365935325623e-06, -8.343718945980072e-06, -6.6980719566345215e-06, -5.052424967288971e-06, -3.4067779779434204e-06, -1.7611309885978699e-06, -1.1548399925231934e-07, 1.5301629900932312e-06, 3.1758099794387817e-06, 4.821456968784332e-06, 6.467103958129883e-06, 8.112750947475433e-06, 9.758397936820984e-06, 1.1404044926166534e-05, 1.3049691915512085e-05, 1.4695338904857635e-05, 1.6340985894203186e-05, 1.7986632883548737e-05, 1.9632279872894287e-05, 2.1277926862239838e-05, 2.2923573851585388e-05, 2.456922084093094e-05, 2.621486783027649e-05, 2.786051481962204e-05, 2.950616180896759e-05, 3.115180879831314e-05, 3.279745578765869e-05, 3.444310277700424e-05, 3.608874976634979e-05, 3.773439675569534e-05, 3.9380043745040894e-05, 4.1025690734386444e-05, 4.2671337723731995e-05, 4.4316984713077545e-05, 4.5962631702423096e-05, 4.7608278691768646e-05, 4.92539256811142e-05, 5.089957267045975e-05, 5.25452196598053e-05, 5.419086664915085e-05, 5.58365136384964e-05, 5.748216062784195e-05, 5.91278076171875e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 7.0, 7.0, 7.0, 30.0, 14.0, 35.0, 42.0, 67.0, 100.0, 143.0, 239.0, 396.0, 784.0, 1393.0, 3005.0, 7153.0, 19552.0, 67939.0, 306136.0, 468567.0, 123479.0, 30644.0, 10244.0, 4262.0, 1939.0, 985.0, 517.0, 353.0, 180.0, 112.0, 77.0, 35.0, 30.0, 26.0, 18.0, 10.0, 9.0, 5.0, 8.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06182861328125, -0.05963611602783203, -0.05744361877441406, -0.055251121520996094, -0.053058624267578125, -0.050866127014160156, -0.04867362976074219, -0.04648113250732422, -0.04428863525390625, -0.04209613800048828, -0.03990364074707031, -0.037711143493652344, -0.035518646240234375, -0.033326148986816406, -0.031133651733398438, -0.02894115447998047, -0.0267486572265625, -0.02455615997314453, -0.022363662719726562, -0.020171165466308594, -0.017978668212890625, -0.015786170959472656, -0.013593673706054688, -0.011401176452636719, -0.00920867919921875, -0.007016181945800781, -0.0048236846923828125, -0.0026311874389648438, -0.000438690185546875, 0.0017538070678710938, 0.0039463043212890625, 0.006138801574707031, 0.008331298828125, 0.010523796081542969, 0.012716293334960938, 0.014908790588378906, 0.017101287841796875, 0.019293785095214844, 0.021486282348632812, 0.02367877960205078, 0.02587127685546875, 0.02806377410888672, 0.030256271362304688, 0.032448768615722656, 0.034641265869140625, 0.036833763122558594, 0.03902626037597656, 0.04121875762939453, 0.0434112548828125, 0.04560375213623047, 0.04779624938964844, 0.049988746643066406, 0.052181243896484375, 0.054373741149902344, 0.05656623840332031, 0.05875873565673828, 0.06095123291015625, 0.06314373016357422, 0.06533622741699219, 0.06752872467041016, 0.06972122192382812, 0.0719137191772461, 0.07410621643066406, 0.07629871368408203, 0.0784912109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 7.0, 10.0, 10.0, 20.0, 24.0, 39.0, 44.0, 51.0, 65.0, 84.0, 81.0, 63.0, 99.0, 73.0, 75.0, 58.0, 44.0, 25.0, 31.0, 18.0, 15.0, 13.0, 9.0, 7.0, 10.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1080322265625, -0.10537195205688477, -0.10271167755126953, -0.1000514030456543, -0.09739112854003906, -0.09473085403442383, -0.0920705795288086, -0.08941030502319336, -0.08675003051757812, -0.08408975601196289, -0.08142948150634766, -0.07876920700073242, -0.07610893249511719, -0.07344865798950195, -0.07078838348388672, -0.06812810897827148, -0.06546783447265625, -0.06280755996704102, -0.06014728546142578, -0.05748701095581055, -0.05482673645019531, -0.05216646194458008, -0.049506187438964844, -0.04684591293334961, -0.044185638427734375, -0.04152536392211914, -0.038865089416503906, -0.03620481491088867, -0.03354454040527344, -0.030884265899658203, -0.02822399139404297, -0.025563716888427734, -0.0229034423828125, -0.020243167877197266, -0.01758289337158203, -0.014922618865966797, -0.012262344360351562, -0.009602069854736328, -0.006941795349121094, -0.004281520843505859, -0.001621246337890625, 0.0010390281677246094, 0.0036993026733398438, 0.006359577178955078, 0.009019851684570312, 0.011680126190185547, 0.014340400695800781, 0.017000675201416016, 0.01966094970703125, 0.022321224212646484, 0.02498149871826172, 0.027641773223876953, 0.030302047729492188, 0.03296232223510742, 0.035622596740722656, 0.03828287124633789, 0.040943145751953125, 0.04360342025756836, 0.046263694763183594, 0.04892396926879883, 0.05158424377441406, 0.0542445182800293, 0.05690479278564453, 0.059565067291259766, 0.062225341796875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 8.0, 29.0, 75.0, 422.0, 380.0, 65.0, 17.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7165491580963135, -1.6089847087860107, -1.501420259475708, -1.3938559293746948, -1.286291480064392, -1.1787270307540894, -1.0711627006530762, -0.9635982513427734, -0.8560338020324707, -0.748469352722168, -0.64090496301651, -0.533340573310852, -0.4257761240005493, -0.3182116746902466, -0.21064728498458862, -0.10308289527893066, 0.00448155403137207, 0.11204597353935242, 0.21961039304733276, 0.3271748125553131, 0.43473923206329346, 0.5423036813735962, 0.6498680710792542, 0.7574324607849121, 0.8649969100952148, 0.9725613594055176, 1.0801258087158203, 1.1876901388168335, 1.2952545881271362, 1.402819037437439, 1.5103833675384521, 1.6179478168487549, 1.7255125045776367, 1.8330769538879395, 1.9406414031982422, 2.048205852508545, 2.1557703018188477, 2.2633347511291504, 2.370898962020874, 2.4784634113311768, 2.5860278606414795, 2.6935923099517822, 2.801156759262085, 2.9087212085723877, 3.0162854194641113, 3.123849868774414, 3.231414318084717, 3.3389787673950195, 3.4465432167053223, 3.554107666015625, 3.6616721153259277, 3.7692365646362305, 3.876801013946533, 3.984365463256836, 4.091929912567139, 4.199494361877441, 4.307058334350586, 4.414622783660889, 4.522187232971191, 4.629751682281494, 4.737316131591797, 4.8448805809021, 4.952445030212402, 5.060009002685547, 5.167573928833008]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 6.0, 5.0, 8.0, 4.0, 13.0, 18.0, 30.0, 62.0, 106.0, 143.0, 163.0, 145.0, 106.0, 69.0, 32.0, 19.0, 9.0, 13.0, 4.0, 6.0, 6.0, 7.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9579219818115234, -2.851120710372925, -2.744319438934326, -2.6375181674957275, -2.530716896057129, -2.4239156246185303, -2.3171143531799316, -2.210313320159912, -2.1035118103027344, -1.9967105388641357, -1.889909267425537, -1.7831079959869385, -1.6763067245483398, -1.5695054531097412, -1.4627043008804321, -1.3559030294418335, -1.2491018772125244, -1.1423006057739258, -1.0354993343353271, -0.9286981225013733, -0.8218968510627747, -0.715095579624176, -0.6082943677902222, -0.5014930963516235, -0.3946918249130249, -0.28789055347442627, -0.18108931183815002, -0.07428807020187378, 0.032513201236724854, 0.1393144726753235, 0.24611568450927734, 0.352916955947876, 0.4597184658050537, 0.5665197372436523, 0.673321008682251, 0.7801222205162048, 0.8869234919548035, 0.9937247633934021, 1.100525975227356, 1.2073272466659546, 1.3141285181045532, 1.4209297895431519, 1.5277310609817505, 1.6345322132110596, 1.7413334846496582, 1.8481347560882568, 1.9549360275268555, 2.061737298965454, 2.1685385704040527, 2.2753398418426514, 2.38214111328125, 2.4889423847198486, 2.5957436561584473, 2.702544927597046, 2.8093461990356445, 2.916147232055664, 3.022948741912842, 3.1297500133514404, 3.236551284790039, 3.3433525562286377, 3.4501538276672363, 3.556955099105835, 3.6637563705444336, 3.770557403564453, 3.8773586750030518]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 13.0, 25.0, 11.0, 27.0, 44.0, 75.0, 131.0, 210.0, 348.0, 630.0, 1148.0, 2108.0, 4630.0, 11633.0, 36517.0, 237185.0, 3702418.0, 147026.0, 30372.0, 10406.0, 4423.0, 2157.0, 1123.0, 673.0, 388.0, 204.0, 111.0, 88.0, 45.0, 27.0, 32.0, 12.0, 10.0, 7.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.383544921875, -0.37133026123046875, -0.3591156005859375, -0.34690093994140625, -0.334686279296875, -0.32247161865234375, -0.3102569580078125, -0.29804229736328125, -0.28582763671875, -0.27361297607421875, -0.2613983154296875, -0.24918365478515625, -0.236968994140625, -0.22475433349609375, -0.2125396728515625, -0.20032501220703125, -0.1881103515625, -0.17589569091796875, -0.1636810302734375, -0.15146636962890625, -0.139251708984375, -0.12703704833984375, -0.1148223876953125, -0.10260772705078125, -0.09039306640625, -0.07817840576171875, -0.0659637451171875, -0.05374908447265625, -0.041534423828125, -0.02931976318359375, -0.0171051025390625, -0.00489044189453125, 0.00732421875, 0.01953887939453125, 0.0317535400390625, 0.04396820068359375, 0.056182861328125, 0.06839752197265625, 0.0806121826171875, 0.09282684326171875, 0.10504150390625, 0.11725616455078125, 0.1294708251953125, 0.14168548583984375, 0.153900146484375, 0.16611480712890625, 0.1783294677734375, 0.19054412841796875, 0.2027587890625, 0.21497344970703125, 0.2271881103515625, 0.23940277099609375, 0.251617431640625, 0.26383209228515625, 0.2760467529296875, 0.28826141357421875, 0.30047607421875, 0.31269073486328125, 0.3249053955078125, 0.33712005615234375, 0.349334716796875, 0.36154937744140625, 0.3737640380859375, 0.38597869873046875, 0.398193359375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 8.0, 11.0, 7.0, 13.0, 12.0, 17.0, 19.0, 23.0, 31.0, 45.0, 73.0, 89.0, 181.0, 138.0, 75.0, 54.0, 36.0, 26.0, 32.0, 14.0, 16.0, 15.0, 16.0, 5.0, 8.0, 10.0, 5.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.045745849609375, -0.04431343078613281, -0.042881011962890625, -0.04144859313964844, -0.04001617431640625, -0.03858375549316406, -0.037151336669921875, -0.03571891784667969, -0.0342864990234375, -0.03285408020019531, -0.031421661376953125, -0.029989242553710938, -0.02855682373046875, -0.027124404907226562, -0.025691986083984375, -0.024259567260742188, -0.0228271484375, -0.021394729614257812, -0.019962310791015625, -0.018529891967773438, -0.01709747314453125, -0.015665054321289062, -0.014232635498046875, -0.012800216674804688, -0.0113677978515625, -0.009935379028320312, -0.008502960205078125, -0.0070705413818359375, -0.00563812255859375, -0.0042057037353515625, -0.002773284912109375, -0.0013408660888671875, 9.1552734375e-05, 0.0015239715576171875, 0.002956390380859375, 0.0043888092041015625, 0.00582122802734375, 0.0072536468505859375, 0.008686065673828125, 0.010118484497070312, 0.0115509033203125, 0.012983322143554688, 0.014415740966796875, 0.015848159790039062, 0.01728057861328125, 0.018712997436523438, 0.020145416259765625, 0.021577835083007812, 0.02301025390625, 0.024442672729492188, 0.025875091552734375, 0.027307510375976562, 0.02873992919921875, 0.030172348022460938, 0.031604766845703125, 0.03303718566894531, 0.0344696044921875, 0.03590202331542969, 0.037334442138671875, 0.03876686096191406, 0.04019927978515625, 0.04163169860839844, 0.043064117431640625, 0.04449653625488281, 0.045928955078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 9.0, 11.0, 15.0, 17.0, 24.0, 36.0, 51.0, 72.0, 121.0, 231.0, 441.0, 909.0, 2056.0, 5031.0, 15985.0, 66275.0, 556714.0, 3249499.0, 240684.0, 38746.0, 10647.0, 3668.0, 1553.0, 677.0, 345.0, 155.0, 114.0, 68.0, 39.0, 21.0, 19.0, 18.0, 8.0, 10.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.27099609375, -0.2626152038574219, -0.25423431396484375, -0.24585342407226562, -0.2374725341796875, -0.22909164428710938, -0.22071075439453125, -0.21232986450195312, -0.203948974609375, -0.19556808471679688, -0.18718719482421875, -0.17880630493164062, -0.1704254150390625, -0.16204452514648438, -0.15366363525390625, -0.14528274536132812, -0.13690185546875, -0.12852096557617188, -0.12014007568359375, -0.11175918579101562, -0.1033782958984375, -0.09499740600585938, -0.08661651611328125, -0.07823562622070312, -0.069854736328125, -0.061473846435546875, -0.05309295654296875, -0.044712066650390625, -0.0363311767578125, -0.027950286865234375, -0.01956939697265625, -0.011188507080078125, -0.0028076171875, 0.005573272705078125, 0.01395416259765625, 0.022335052490234375, 0.0307159423828125, 0.039096832275390625, 0.04747772216796875, 0.055858612060546875, 0.064239501953125, 0.07262039184570312, 0.08100128173828125, 0.08938217163085938, 0.0977630615234375, 0.10614395141601562, 0.11452484130859375, 0.12290573120117188, 0.13128662109375, 0.13966751098632812, 0.14804840087890625, 0.15642929077148438, 0.1648101806640625, 0.17319107055664062, 0.18157196044921875, 0.18995285034179688, 0.198333740234375, 0.20671463012695312, 0.21509552001953125, 0.22347640991210938, 0.2318572998046875, 0.24023818969726562, 0.24861907958984375, 0.2569999694824219, 0.265380859375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 10.0, 5.0, 6.0, 11.0, 10.0, 18.0, 31.0, 56.0, 84.0, 109.0, 193.0, 368.0, 773.0, 1320.0, 481.0, 237.0, 118.0, 74.0, 46.0, 26.0, 18.0, 20.0, 12.0, 13.0, 2.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.057159423828125, -0.05538225173950195, -0.053605079650878906, -0.05182790756225586, -0.05005073547363281, -0.048273563385009766, -0.04649639129638672, -0.04471921920776367, -0.042942047119140625, -0.04116487503051758, -0.03938770294189453, -0.037610530853271484, -0.03583335876464844, -0.03405618667602539, -0.032279014587402344, -0.030501842498779297, -0.02872467041015625, -0.026947498321533203, -0.025170326232910156, -0.02339315414428711, -0.021615982055664062, -0.019838809967041016, -0.01806163787841797, -0.016284465789794922, -0.014507293701171875, -0.012730121612548828, -0.010952949523925781, -0.009175777435302734, -0.0073986053466796875, -0.005621433258056641, -0.0038442611694335938, -0.002067089080810547, -0.0002899169921875, 0.0014872550964355469, 0.0032644271850585938, 0.005041599273681641, 0.0068187713623046875, 0.008595943450927734, 0.010373115539550781, 0.012150287628173828, 0.013927459716796875, 0.015704631805419922, 0.01748180389404297, 0.019258975982666016, 0.021036148071289062, 0.02281332015991211, 0.024590492248535156, 0.026367664337158203, 0.02814483642578125, 0.029922008514404297, 0.031699180603027344, 0.03347635269165039, 0.03525352478027344, 0.037030696868896484, 0.03880786895751953, 0.04058504104614258, 0.042362213134765625, 0.04413938522338867, 0.04591655731201172, 0.047693729400634766, 0.04947090148925781, 0.05124807357788086, 0.053025245666503906, 0.05480241775512695, 0.05657958984375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 9.0, 9.0, 22.0, 70.0, 187.0, 332.0, 258.0, 76.0, 29.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2700851559638977, -0.25392162799835205, -0.2377581149339676, -0.22159460186958313, -0.20543107390403748, -0.18926754593849182, -0.17310403287410736, -0.1569405198097229, -0.14077699184417725, -0.12461347132921219, -0.10844995081424713, -0.09228643029928207, -0.07612290978431702, -0.05995938926935196, -0.0437958687543869, -0.027632348239421844, -0.011468827724456787, 0.00469469279050827, 0.020858213305473328, 0.037021733820438385, 0.05318525433540344, 0.0693487748503685, 0.08551229536533356, 0.10167581588029861, 0.11783933639526367, 0.13400286436080933, 0.1501663774251938, 0.16632989048957825, 0.1824934184551239, 0.19865694642066956, 0.21482045948505402, 0.23098397254943848, 0.2471475601196289, 0.26331108808517456, 0.2794746160507202, 0.2956381142139435, 0.31180164217948914, 0.3279651701450348, 0.34412866830825806, 0.3602921962738037, 0.37645572423934937, 0.392619252204895, 0.4087827801704407, 0.42494627833366394, 0.4411098062992096, 0.45727333426475525, 0.4734368324279785, 0.48960036039352417, 0.5057638883590698, 0.5219274163246155, 0.5380909442901611, 0.5542544722557068, 0.5704180002212524, 0.5865814685821533, 0.602744996547699, 0.6189085245132446, 0.6350720524787903, 0.6512355804443359, 0.6673991084098816, 0.6835626363754272, 0.6997261047363281, 0.7158896327018738, 0.7320531606674194, 0.7482166886329651, 0.7643802165985107]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 12.0, 7.0, 16.0, 22.0, 25.0, 20.0, 58.0, 66.0, 69.0, 70.0, 73.0, 104.0, 79.0, 74.0, 70.0, 57.0, 33.0, 33.0, 21.0, 13.0, 11.0, 15.0, 3.0, 6.0, 7.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.30907267332077026, -0.30069243907928467, -0.2923122048377991, -0.2839319407939911, -0.2755517065525055, -0.2671714723110199, -0.2587912380695343, -0.2504109740257263, -0.24203073978424072, -0.23365050554275513, -0.22527025640010834, -0.21689002215862274, -0.20850977301597595, -0.20012953877449036, -0.19174930453300476, -0.18336905539035797, -0.17498882114887238, -0.16660858690738678, -0.15822833776474, -0.1498481035232544, -0.1414678543806076, -0.133087620139122, -0.12470737844705582, -0.11632713675498962, -0.10794689506292343, -0.09956665337085724, -0.09118641167879105, -0.08280616998672485, -0.07442593574523926, -0.06604568660259247, -0.05766545236110687, -0.04928521066904068, -0.04090496897697449, -0.032524727284908295, -0.02414448745548725, -0.015764247626066208, -0.007384005934000015, 0.0009962357580661774, 0.009376473724842072, 0.017756715416908264, 0.026136957108974457, 0.03451719880104065, 0.04289744049310684, 0.051277678459882736, 0.05965792015194893, 0.06803816556930542, 0.07641839981079102, 0.08479864150285721, 0.0931788831949234, 0.1015591248869896, 0.10993936657905579, 0.11831960082054138, 0.12669984996318817, 0.13508008420467377, 0.14346033334732056, 0.15184056758880615, 0.16022080183029175, 0.16860103607177734, 0.17698128521442413, 0.18536151945590973, 0.19374176859855652, 0.20212200284004211, 0.2105022370815277, 0.2188824862241745, 0.2272627353668213]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 1.0, 3.0, 1.0, 5.0, 8.0, 23.0, 17.0, 24.0, 39.0, 55.0, 78.0, 149.0, 219.0, 305.0, 511.0, 895.0, 1635.0, 3045.0, 6174.0, 13751.0, 34325.0, 108008.0, 545376.0, 237159.0, 57266.0, 21087.0, 8982.0, 4302.0, 2155.0, 1122.0, 677.0, 425.0, 269.0, 154.0, 98.0, 74.0, 46.0, 29.0, 18.0, 11.0, 14.0, 6.0, 9.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.218017578125, -0.21135902404785156, -0.20470046997070312, -0.1980419158935547, -0.19138336181640625, -0.1847248077392578, -0.17806625366210938, -0.17140769958496094, -0.1647491455078125, -0.15809059143066406, -0.15143203735351562, -0.1447734832763672, -0.13811492919921875, -0.1314563751220703, -0.12479782104492188, -0.11813926696777344, -0.111480712890625, -0.10482215881347656, -0.09816360473632812, -0.09150505065917969, -0.08484649658203125, -0.07818794250488281, -0.07152938842773438, -0.06487083435058594, -0.0582122802734375, -0.05155372619628906, -0.044895172119140625, -0.03823661804199219, -0.03157806396484375, -0.024919509887695312, -0.018260955810546875, -0.011602401733398438, -0.00494384765625, 0.0017147064208984375, 0.008373260498046875, 0.015031814575195312, 0.02169036865234375, 0.028348922729492188, 0.035007476806640625, 0.04166603088378906, 0.0483245849609375, 0.05498313903808594, 0.061641693115234375, 0.06830024719238281, 0.07495880126953125, 0.08161735534667969, 0.08827590942382812, 0.09493446350097656, 0.101593017578125, 0.10825157165527344, 0.11491012573242188, 0.12156867980957031, 0.12822723388671875, 0.1348857879638672, 0.14154434204101562, 0.14820289611816406, 0.1548614501953125, 0.16152000427246094, 0.16817855834960938, 0.1748371124267578, 0.18149566650390625, 0.1881542205810547, 0.19481277465820312, 0.20147132873535156, 0.2081298828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 3.0, 10.0, 8.0, 14.0, 13.0, 19.0, 24.0, 27.0, 36.0, 34.0, 66.0, 125.0, 136.0, 132.0, 79.0, 62.0, 47.0, 29.0, 27.0, 19.0, 19.0, 14.0, 9.0, 13.0, 10.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.046875, -0.045491695404052734, -0.04410839080810547, -0.0427250862121582, -0.04134178161621094, -0.03995847702026367, -0.038575172424316406, -0.03719186782836914, -0.035808563232421875, -0.03442525863647461, -0.033041954040527344, -0.03165864944458008, -0.030275344848632812, -0.028892040252685547, -0.02750873565673828, -0.026125431060791016, -0.02474212646484375, -0.023358821868896484, -0.02197551727294922, -0.020592212677001953, -0.019208908081054688, -0.017825603485107422, -0.016442298889160156, -0.01505899429321289, -0.013675689697265625, -0.01229238510131836, -0.010909080505371094, -0.009525775909423828, -0.008142471313476562, -0.006759166717529297, -0.005375862121582031, -0.003992557525634766, -0.0026092529296875, -0.0012259483337402344, 0.00015735626220703125, 0.0015406608581542969, 0.0029239654541015625, 0.004307270050048828, 0.005690574645996094, 0.007073879241943359, 0.008457183837890625, 0.00984048843383789, 0.011223793029785156, 0.012607097625732422, 0.013990402221679688, 0.015373706817626953, 0.01675701141357422, 0.018140316009521484, 0.01952362060546875, 0.020906925201416016, 0.02229022979736328, 0.023673534393310547, 0.025056838989257812, 0.026440143585205078, 0.027823448181152344, 0.02920675277709961, 0.030590057373046875, 0.03197336196899414, 0.033356666564941406, 0.03473997116088867, 0.03612327575683594, 0.0375065803527832, 0.03888988494873047, 0.040273189544677734, 0.041656494140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 6.0, 5.0, 4.0, 10.0, 19.0, 15.0, 20.0, 36.0, 42.0, 52.0, 74.0, 99.0, 146.0, 228.0, 405.0, 665.0, 1351.0, 2605.0, 5702.0, 13291.0, 39251.0, 159457.0, 523136.0, 219890.0, 51979.0, 16821.0, 6748.0, 2927.0, 1469.0, 769.0, 485.0, 278.0, 173.0, 124.0, 72.0, 51.0, 35.0, 33.0, 15.0, 23.0, 13.0, 7.0, 7.0, 7.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1353759765625, -0.1312236785888672, -0.12707138061523438, -0.12291908264160156, -0.11876678466796875, -0.11461448669433594, -0.11046218872070312, -0.10630989074707031, -0.1021575927734375, -0.09800529479980469, -0.09385299682617188, -0.08970069885253906, -0.08554840087890625, -0.08139610290527344, -0.07724380493164062, -0.07309150695800781, -0.068939208984375, -0.06478691101074219, -0.060634613037109375, -0.05648231506347656, -0.05233001708984375, -0.04817771911621094, -0.044025421142578125, -0.03987312316894531, -0.0357208251953125, -0.03156852722167969, -0.027416229248046875, -0.023263931274414062, -0.01911163330078125, -0.014959335327148438, -0.010807037353515625, -0.0066547393798828125, -0.00250244140625, 0.0016498565673828125, 0.005802154541015625, 0.009954452514648438, 0.01410675048828125, 0.018259048461914062, 0.022411346435546875, 0.026563644409179688, 0.0307159423828125, 0.03486824035644531, 0.039020538330078125, 0.04317283630371094, 0.04732513427734375, 0.05147743225097656, 0.055629730224609375, 0.05978202819824219, 0.063934326171875, 0.06808662414550781, 0.07223892211914062, 0.07639122009277344, 0.08054351806640625, 0.08469581604003906, 0.08884811401367188, 0.09300041198730469, 0.0971527099609375, 0.10130500793457031, 0.10545730590820312, 0.10960960388183594, 0.11376190185546875, 0.11791419982910156, 0.12206649780273438, 0.1262187957763672, 0.13037109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 7.0, 7.0, 8.0, 11.0, 7.0, 16.0, 15.0, 12.0, 18.0, 20.0, 38.0, 30.0, 26.0, 51.0, 34.0, 43.0, 45.0, 55.0, 39.0, 56.0, 43.0, 34.0, 49.0, 41.0, 46.0, 23.0, 31.0, 29.0, 26.0, 20.0, 21.0, 26.0, 15.0, 12.0, 12.0, 5.0, 11.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1298828125, -0.12584877014160156, -0.12181472778320312, -0.11778068542480469, -0.11374664306640625, -0.10971260070800781, -0.10567855834960938, -0.10164451599121094, -0.0976104736328125, -0.09357643127441406, -0.08954238891601562, -0.08550834655761719, -0.08147430419921875, -0.07744026184082031, -0.07340621948242188, -0.06937217712402344, -0.065338134765625, -0.06130409240722656, -0.057270050048828125, -0.05323600769042969, -0.04920196533203125, -0.04516792297363281, -0.041133880615234375, -0.03709983825683594, -0.0330657958984375, -0.029031753540039062, -0.024997711181640625, -0.020963668823242188, -0.01692962646484375, -0.012895584106445312, -0.008861541748046875, -0.0048274993896484375, -0.00079345703125, 0.0032405853271484375, 0.007274627685546875, 0.011308670043945312, 0.01534271240234375, 0.019376754760742188, 0.023410797119140625, 0.027444839477539062, 0.0314788818359375, 0.03551292419433594, 0.039546966552734375, 0.04358100891113281, 0.04761505126953125, 0.05164909362792969, 0.055683135986328125, 0.05971717834472656, 0.063751220703125, 0.06778526306152344, 0.07181930541992188, 0.07585334777832031, 0.07988739013671875, 0.08392143249511719, 0.08795547485351562, 0.09198951721191406, 0.0960235595703125, 0.10005760192871094, 0.10409164428710938, 0.10812568664550781, 0.11215972900390625, 0.11619377136230469, 0.12022781372070312, 0.12426185607910156, 0.1282958984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 13.0, 12.0, 27.0, 32.0, 65.0, 96.0, 157.0, 286.0, 512.0, 1155.0, 2701.0, 8122.0, 34641.0, 273251.0, 615854.0, 87862.0, 15842.0, 4549.0, 1627.0, 792.0, 396.0, 210.0, 120.0, 67.0, 44.0, 26.0, 28.0, 19.0, 10.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.205078125, -0.19890975952148438, -0.19274139404296875, -0.18657302856445312, -0.1804046630859375, -0.17423629760742188, -0.16806793212890625, -0.16189956665039062, -0.155731201171875, -0.14956283569335938, -0.14339447021484375, -0.13722610473632812, -0.1310577392578125, -0.12488937377929688, -0.11872100830078125, -0.11255264282226562, -0.10638427734375, -0.10021591186523438, -0.09404754638671875, -0.08787918090820312, -0.0817108154296875, -0.07554244995117188, -0.06937408447265625, -0.06320571899414062, -0.057037353515625, -0.050868988037109375, -0.04470062255859375, -0.038532257080078125, -0.0323638916015625, -0.026195526123046875, -0.02002716064453125, -0.013858795166015625, -0.0076904296875, -0.001522064208984375, 0.00464630126953125, 0.010814666748046875, 0.0169830322265625, 0.023151397705078125, 0.02931976318359375, 0.035488128662109375, 0.041656494140625, 0.047824859619140625, 0.05399322509765625, 0.060161590576171875, 0.0663299560546875, 0.07249832153320312, 0.07866668701171875, 0.08483505249023438, 0.09100341796875, 0.09717178344726562, 0.10334014892578125, 0.10950851440429688, 0.1156768798828125, 0.12184524536132812, 0.12801361083984375, 0.13418197631835938, 0.140350341796875, 0.14651870727539062, 0.15268707275390625, 0.15885543823242188, 0.1650238037109375, 0.17119216918945312, 0.17736053466796875, 0.18352890014648438, 0.189697265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 4.0, 12.0, 13.0, 19.0, 27.0, 30.0, 35.0, 60.0, 80.0, 127.0, 100.0, 102.0, 108.0, 86.0, 56.0, 43.0, 30.0, 23.0, 9.0, 12.0, 7.0, 6.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013375282287597656, -0.00013048294931650162, -0.00012721307575702667, -0.00012394320219755173, -0.00012067332863807678, -0.00011740345507860184, -0.00011413358151912689, -0.00011086370795965195, -0.000107593834400177, -0.00010432396084070206, -0.00010105408728122711, -9.778421372175217e-05, -9.451434016227722e-05, -9.124446660280228e-05, -8.797459304332733e-05, -8.470471948385239e-05, -8.143484592437744e-05, -7.81649723649025e-05, -7.489509880542755e-05, -7.16252252459526e-05, -6.835535168647766e-05, -6.508547812700272e-05, -6.181560456752777e-05, -5.8545731008052826e-05, -5.527585744857788e-05, -5.2005983889102936e-05, -4.873611032962799e-05, -4.5466236770153046e-05, -4.21963632106781e-05, -3.8926489651203156e-05, -3.565661609172821e-05, -3.2386742532253265e-05, -2.911686897277832e-05, -2.5846995413303375e-05, -2.257712185382843e-05, -1.9307248294353485e-05, -1.603737473487854e-05, -1.2767501175403595e-05, -9.49762761592865e-06, -6.227754056453705e-06, -2.9578804969787598e-06, 3.119930624961853e-07, 3.5818666219711304e-06, 6.8517401814460754e-06, 1.012161374092102e-05, 1.3391487300395966e-05, 1.666136085987091e-05, 1.9931234419345856e-05, 2.32011079788208e-05, 2.6470981538295746e-05, 2.974085509777069e-05, 3.3010728657245636e-05, 3.628060221672058e-05, 3.9550475776195526e-05, 4.282034933567047e-05, 4.6090222895145416e-05, 4.936009645462036e-05, 5.2629970014095306e-05, 5.589984357357025e-05, 5.9169717133045197e-05, 6.243959069252014e-05, 6.570946425199509e-05, 6.897933781147003e-05, 7.224921137094498e-05, 7.551908493041992e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 13.0, 12.0, 19.0, 27.0, 38.0, 73.0, 91.0, 158.0, 228.0, 465.0, 734.0, 1498.0, 3050.0, 6882.0, 18062.0, 58498.0, 226616.0, 459290.0, 192940.0, 51433.0, 16265.0, 6285.0, 2783.0, 1339.0, 722.0, 390.0, 216.0, 136.0, 69.0, 67.0, 36.0, 32.0, 17.0, 11.0, 11.0, 7.0, 9.0, 2.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.131103515625, -0.12750530242919922, -0.12390708923339844, -0.12030887603759766, -0.11671066284179688, -0.1131124496459961, -0.10951423645019531, -0.10591602325439453, -0.10231781005859375, -0.09871959686279297, -0.09512138366699219, -0.0915231704711914, -0.08792495727539062, -0.08432674407958984, -0.08072853088378906, -0.07713031768798828, -0.0735321044921875, -0.06993389129638672, -0.06633567810058594, -0.06273746490478516, -0.059139251708984375, -0.055541038513183594, -0.05194282531738281, -0.04834461212158203, -0.04474639892578125, -0.04114818572998047, -0.03754997253417969, -0.033951759338378906, -0.030353546142578125, -0.026755332946777344, -0.023157119750976562, -0.01955890655517578, -0.015960693359375, -0.012362480163574219, -0.008764266967773438, -0.005166053771972656, -0.001567840576171875, 0.0020303726196289062, 0.0056285858154296875, 0.009226799011230469, 0.01282501220703125, 0.01642322540283203, 0.020021438598632812, 0.023619651794433594, 0.027217864990234375, 0.030816078186035156, 0.03441429138183594, 0.03801250457763672, 0.0416107177734375, 0.04520893096923828, 0.04880714416503906, 0.052405357360839844, 0.056003570556640625, 0.059601783752441406, 0.06319999694824219, 0.06679821014404297, 0.07039642333984375, 0.07399463653564453, 0.07759284973144531, 0.0811910629272461, 0.08478927612304688, 0.08838748931884766, 0.09198570251464844, 0.09558391571044922, 0.09918212890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 3.0, 7.0, 8.0, 9.0, 18.0, 15.0, 12.0, 19.0, 29.0, 29.0, 62.0, 56.0, 68.0, 59.0, 69.0, 80.0, 72.0, 69.0, 57.0, 42.0, 39.0, 30.0, 34.0, 20.0, 20.0, 16.0, 8.0, 15.0, 6.0, 4.0, 8.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1004638671875, -0.09743309020996094, -0.09440231323242188, -0.09137153625488281, -0.08834075927734375, -0.08530998229980469, -0.08227920532226562, -0.07924842834472656, -0.0762176513671875, -0.07318687438964844, -0.07015609741210938, -0.06712532043457031, -0.06409454345703125, -0.06106376647949219, -0.058032989501953125, -0.05500221252441406, -0.051971435546875, -0.04894065856933594, -0.045909881591796875, -0.04287910461425781, -0.03984832763671875, -0.03681755065917969, -0.033786773681640625, -0.030755996704101562, -0.0277252197265625, -0.024694442749023438, -0.021663665771484375, -0.018632888793945312, -0.01560211181640625, -0.012571334838867188, -0.009540557861328125, -0.0065097808837890625, -0.00347900390625, -0.0004482269287109375, 0.002582550048828125, 0.0056133270263671875, 0.00864410400390625, 0.011674880981445312, 0.014705657958984375, 0.017736434936523438, 0.0207672119140625, 0.023797988891601562, 0.026828765869140625, 0.029859542846679688, 0.03289031982421875, 0.03592109680175781, 0.038951873779296875, 0.04198265075683594, 0.045013427734375, 0.04804420471191406, 0.051074981689453125, 0.05410575866699219, 0.05713653564453125, 0.06016731262207031, 0.06319808959960938, 0.06622886657714844, 0.0692596435546875, 0.07229042053222656, 0.07532119750976562, 0.07835197448730469, 0.08138275146484375, 0.08441352844238281, 0.08744430541992188, 0.09047508239746094, 0.093505859375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 9.0, 28.0, 57.0, 146.0, 232.0, 251.0, 145.0, 65.0, 29.0, 16.0, 8.0, 3.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.541589379310608, -1.4990280866622925, -1.4564666748046875, -1.413905382156372, -1.3713440895080566, -1.3287826776504517, -1.2862213850021362, -1.2436599731445312, -1.2010986804962158, -1.1585373878479004, -1.1159759759902954, -1.07341468334198, -1.030853271484375, -0.9882919788360596, -0.9457306861877441, -0.9031693339347839, -0.8606079816818237, -0.8180466294288635, -0.7754852771759033, -0.7329239845275879, -0.6903626322746277, -0.6478012800216675, -0.605239987373352, -0.5626786351203918, -0.5201172828674316, -0.47755593061447144, -0.4349946081638336, -0.3924332857131958, -0.3498719334602356, -0.3073105812072754, -0.2647492587566376, -0.22218793630599976, -0.17962646484375, -0.137065127491951, -0.09450379014015198, -0.051942452788352966, -0.009381115436553955, 0.033180221915245056, 0.07574155926704407, 0.11830288171768188, 0.1608642339706421, 0.2034255713224411, 0.2459869086742401, 0.28854823112487793, 0.33110958337783813, 0.37367093563079834, 0.41623225808143616, 0.458793580532074, 0.5013549327850342, 0.5439162850379944, 0.5864776372909546, 0.62903892993927, 0.6716002821922302, 0.7141616344451904, 0.7567229270935059, 0.7992842793464661, 0.8418456315994263, 0.8844069838523865, 0.9269683361053467, 0.9695296287536621, 1.0120909214019775, 1.0546523332595825, 1.097213625907898, 1.139775037765503, 1.1823363304138184]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 1.0, 9.0, 4.0, 9.0, 20.0, 20.0, 28.0, 37.0, 48.0, 53.0, 51.0, 76.0, 74.0, 73.0, 87.0, 67.0, 65.0, 52.0, 40.0, 38.0, 34.0, 28.0, 20.0, 8.0, 12.0, 6.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-1.2606399059295654, -1.2212210893630981, -1.1818022727966309, -1.1423835754394531, -1.1029647588729858, -1.0635459423065186, -1.0241272449493408, -0.9847084283828735, -0.9452896118164062, -0.905870795249939, -0.8664520382881165, -0.827033281326294, -0.7876144647598267, -0.7481956481933594, -0.7087768912315369, -0.6693581342697144, -0.6299393177032471, -0.5905205011367798, -0.5511017441749573, -0.5116829872131348, -0.4722641706466675, -0.4328453838825226, -0.3934265971183777, -0.3540078103542328, -0.3145890235900879, -0.275170236825943, -0.2357514500617981, -0.1963326632976532, -0.1569138765335083, -0.1174950897693634, -0.0780763030052185, -0.03865751624107361, 0.0007613897323608398, 0.04018017649650574, 0.07959896326065063, 0.11901775002479553, 0.15843653678894043, 0.19785532355308533, 0.23727411031723022, 0.2766928970813751, 0.31611168384552, 0.3555304706096649, 0.3949492573738098, 0.4343680441379547, 0.4737868309020996, 0.5132056474685669, 0.5526244044303894, 0.5920431613922119, 0.6314619779586792, 0.6708807945251465, 0.710299551486969, 0.7497183084487915, 0.7891371250152588, 0.8285559415817261, 0.8679746985435486, 0.9073934555053711, 0.9468122720718384, 0.9862310886383057, 1.0256497859954834, 1.0650686025619507, 1.104487419128418, 1.1439062356948853, 1.1833250522613525, 1.2227437496185303, 1.2621625661849976]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 9.0, 15.0, 15.0, 16.0, 16.0, 36.0, 46.0, 77.0, 98.0, 156.0, 217.0, 343.0, 527.0, 839.0, 1242.0, 2037.0, 3509.0, 7633.0, 19028.0, 79393.0, 3409459.0, 591113.0, 48762.0, 14605.0, 6300.0, 3376.0, 2002.0, 1198.0, 743.0, 440.0, 298.0, 219.0, 160.0, 93.0, 67.0, 45.0, 31.0, 21.0, 18.0, 12.0, 20.0, 5.0, 11.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.416259765625, -0.4023170471191406, -0.38837432861328125, -0.3744316101074219, -0.3604888916015625, -0.3465461730957031, -0.33260345458984375, -0.3186607360839844, -0.304718017578125, -0.2907752990722656, -0.27683258056640625, -0.2628898620605469, -0.2489471435546875, -0.23500442504882812, -0.22106170654296875, -0.20711898803710938, -0.19317626953125, -0.17923355102539062, -0.16529083251953125, -0.15134811401367188, -0.1374053955078125, -0.12346267700195312, -0.10951995849609375, -0.09557723999023438, -0.081634521484375, -0.06769180297851562, -0.05374908447265625, -0.039806365966796875, -0.0258636474609375, -0.011920928955078125, 0.00202178955078125, 0.015964508056640625, 0.0299072265625, 0.043849945068359375, 0.05779266357421875, 0.07173538208007812, 0.0856781005859375, 0.09962081909179688, 0.11356353759765625, 0.12750625610351562, 0.141448974609375, 0.15539169311523438, 0.16933441162109375, 0.18327713012695312, 0.1972198486328125, 0.21116256713867188, 0.22510528564453125, 0.23904800415039062, 0.25299072265625, 0.2669334411621094, 0.28087615966796875, 0.2948188781738281, 0.3087615966796875, 0.3227043151855469, 0.33664703369140625, 0.3505897521972656, 0.364532470703125, 0.3784751892089844, 0.39241790771484375, 0.4063606262207031, 0.4203033447265625, 0.4342460632324219, 0.44818878173828125, 0.4621315002441406, 0.47607421875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 9.0, 3.0, 8.0, 11.0, 9.0, 16.0, 23.0, 17.0, 51.0, 37.0, 71.0, 86.0, 127.0, 136.0, 101.0, 69.0, 38.0, 42.0, 29.0, 22.0, 22.0, 16.0, 19.0, 8.0, 10.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04510498046875, -0.04370594024658203, -0.04230690002441406, -0.040907859802246094, -0.039508819580078125, -0.038109779357910156, -0.03671073913574219, -0.03531169891357422, -0.03391265869140625, -0.03251361846923828, -0.031114578247070312, -0.029715538024902344, -0.028316497802734375, -0.026917457580566406, -0.025518417358398438, -0.02411937713623047, -0.0227203369140625, -0.02132129669189453, -0.019922256469726562, -0.018523216247558594, -0.017124176025390625, -0.015725135803222656, -0.014326095581054688, -0.012927055358886719, -0.01152801513671875, -0.010128974914550781, -0.008729934692382812, -0.007330894470214844, -0.005931854248046875, -0.004532814025878906, -0.0031337738037109375, -0.0017347335815429688, -0.000335693359375, 0.0010633468627929688, 0.0024623870849609375, 0.0038614273071289062, 0.005260467529296875, 0.006659507751464844, 0.008058547973632812, 0.009457588195800781, 0.01085662841796875, 0.012255668640136719, 0.013654708862304688, 0.015053749084472656, 0.016452789306640625, 0.017851829528808594, 0.019250869750976562, 0.02064990997314453, 0.0220489501953125, 0.02344799041748047, 0.024847030639648438, 0.026246070861816406, 0.027645111083984375, 0.029044151306152344, 0.030443191528320312, 0.03184223175048828, 0.03324127197265625, 0.03464031219482422, 0.03603935241699219, 0.037438392639160156, 0.038837432861328125, 0.040236473083496094, 0.04163551330566406, 0.04303455352783203, 0.04443359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 8.0, 15.0, 12.0, 21.0, 26.0, 41.0, 77.0, 157.0, 309.0, 708.0, 1876.0, 5614.0, 20312.0, 131433.0, 3366189.0, 604485.0, 47084.0, 10480.0, 3243.0, 1179.0, 458.0, 209.0, 116.0, 67.0, 38.0, 26.0, 23.0, 11.0, 8.0, 7.0, 7.0, 8.0, 6.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.367919921875, -0.3555564880371094, -0.34319305419921875, -0.3308296203613281, -0.3184661865234375, -0.3061027526855469, -0.29373931884765625, -0.2813758850097656, -0.269012451171875, -0.2566490173339844, -0.24428558349609375, -0.23192214965820312, -0.2195587158203125, -0.20719528198242188, -0.19483184814453125, -0.18246841430664062, -0.17010498046875, -0.15774154663085938, -0.14537811279296875, -0.13301467895507812, -0.1206512451171875, -0.10828781127929688, -0.09592437744140625, -0.08356094360351562, -0.071197509765625, -0.058834075927734375, -0.04647064208984375, -0.034107208251953125, -0.0217437744140625, -0.009380340576171875, 0.00298309326171875, 0.015346527099609375, 0.0277099609375, 0.040073394775390625, 0.05243682861328125, 0.06480026245117188, 0.0771636962890625, 0.08952713012695312, 0.10189056396484375, 0.11425399780273438, 0.126617431640625, 0.13898086547851562, 0.15134429931640625, 0.16370773315429688, 0.1760711669921875, 0.18843460083007812, 0.20079803466796875, 0.21316146850585938, 0.22552490234375, 0.23788833618164062, 0.25025177001953125, 0.2626152038574219, 0.2749786376953125, 0.2873420715332031, 0.29970550537109375, 0.3120689392089844, 0.324432373046875, 0.3367958068847656, 0.34915924072265625, 0.3615226745605469, 0.3738861083984375, 0.3862495422363281, 0.39861297607421875, 0.4109764099121094, 0.42333984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 5.0, 5.0, 6.0, 6.0, 15.0, 19.0, 17.0, 27.0, 47.0, 61.0, 101.0, 163.0, 300.0, 732.0, 1424.0, 502.0, 264.0, 110.0, 79.0, 68.0, 28.0, 18.0, 13.0, 12.0, 7.0, 8.0, 4.0, 8.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.068603515625, -0.0666036605834961, -0.06460380554199219, -0.06260395050048828, -0.060604095458984375, -0.05860424041748047, -0.05660438537597656, -0.054604530334472656, -0.05260467529296875, -0.050604820251464844, -0.04860496520996094, -0.04660511016845703, -0.044605255126953125, -0.04260540008544922, -0.04060554504394531, -0.038605690002441406, -0.0366058349609375, -0.034605979919433594, -0.03260612487792969, -0.03060626983642578, -0.028606414794921875, -0.02660655975341797, -0.024606704711914062, -0.022606849670410156, -0.02060699462890625, -0.018607139587402344, -0.016607284545898438, -0.014607429504394531, -0.012607574462890625, -0.010607719421386719, -0.008607864379882812, -0.006608009338378906, -0.004608154296875, -0.0026082992553710938, -0.0006084442138671875, 0.0013914108276367188, 0.003391265869140625, 0.005391120910644531, 0.0073909759521484375, 0.009390830993652344, 0.01139068603515625, 0.013390541076660156, 0.015390396118164062, 0.01739025115966797, 0.019390106201171875, 0.02138996124267578, 0.023389816284179688, 0.025389671325683594, 0.0273895263671875, 0.029389381408691406, 0.03138923645019531, 0.03338909149169922, 0.035388946533203125, 0.03738880157470703, 0.03938865661621094, 0.041388511657714844, 0.04338836669921875, 0.045388221740722656, 0.04738807678222656, 0.04938793182373047, 0.051387786865234375, 0.05338764190673828, 0.05538749694824219, 0.057387351989746094, 0.05938720703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 11.0, 57.0, 175.0, 318.0, 278.0, 112.0, 32.0, 10.0, 7.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43601012229919434, -0.4150972366333008, -0.3941843807697296, -0.37327152490615845, -0.3523586392402649, -0.33144575357437134, -0.31053289771080017, -0.289620041847229, -0.26870715618133545, -0.2477942854166031, -0.22688141465187073, -0.20596854388713837, -0.185055673122406, -0.16414280235767365, -0.14322993159294128, -0.12231706082820892, -0.10140419006347656, -0.0804913192987442, -0.05957844853401184, -0.03866557776927948, -0.01775270700454712, 0.0031601637601852417, 0.024073034524917603, 0.04498590528964996, 0.06589877605438232, 0.08681164681911469, 0.10772451758384705, 0.1286373883485794, 0.14955025911331177, 0.17046312987804413, 0.1913760006427765, 0.21228887140750885, 0.2332017421722412, 0.25411462783813477, 0.27502748370170593, 0.2959403395652771, 0.31685322523117065, 0.3377661108970642, 0.3586789667606354, 0.37959182262420654, 0.4005047082901001, 0.42141759395599365, 0.4423304498195648, 0.463243305683136, 0.48415619134902954, 0.5050690770149231, 0.5259819030761719, 0.5468947887420654, 0.567807674407959, 0.5887205600738525, 0.6096334457397461, 0.6305462718009949, 0.6514591574668884, 0.672372043132782, 0.6932848691940308, 0.7141977548599243, 0.7351106405258179, 0.7560235261917114, 0.776936411857605, 0.7978492379188538, 0.8187621235847473, 0.8396750092506409, 0.8605878353118896, 0.8815007209777832, 0.9024136066436768]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 9.0, 4.0, 6.0, 8.0, 12.0, 11.0, 17.0, 23.0, 31.0, 29.0, 38.0, 45.0, 49.0, 61.0, 64.0, 70.0, 64.0, 60.0, 61.0, 55.0, 52.0, 39.0, 39.0, 24.0, 27.0, 19.0, 22.0, 21.0, 12.0, 5.0, 3.0, 7.0, 4.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2592061758041382, -0.251478374004364, -0.24375058710575104, -0.23602278530597687, -0.2282949984073639, -0.22056719660758972, -0.21283939480781555, -0.20511159300804138, -0.1973838061094284, -0.18965600430965424, -0.18192821741104126, -0.1742004156112671, -0.16647261381149292, -0.15874482691287994, -0.15101702511310577, -0.1432892382144928, -0.13556143641471863, -0.12783363461494446, -0.12010584771633148, -0.11237804591655731, -0.10465025156736374, -0.09692245721817017, -0.089194655418396, -0.08146686106920242, -0.07373906672000885, -0.06601127237081528, -0.058283474296331406, -0.050555676221847534, -0.04282788187265396, -0.03510008752346039, -0.027372289448976517, -0.019644491374492645, -0.011916697025299072, -0.00418890081346035, 0.003538895398378372, 0.011266691610217094, 0.018994487822055817, 0.02672228217124939, 0.03445008024573326, 0.04217787832021713, 0.049905672669410706, 0.05763346701860428, 0.06536126136779785, 0.07308906316757202, 0.0808168575167656, 0.08854465186595917, 0.09627245366573334, 0.10400024801492691, 0.11172804236412048, 0.11945583671331406, 0.12718363106250763, 0.1349114328622818, 0.14263921976089478, 0.15036702156066895, 0.15809482336044312, 0.16582262516021729, 0.17355041205883026, 0.18127821385860443, 0.1890060007572174, 0.19673380255699158, 0.20446160435676575, 0.21218939125537872, 0.2199171930551529, 0.22764497995376587, 0.23537278175354004]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 3.0, 7.0, 10.0, 12.0, 14.0, 18.0, 28.0, 31.0, 41.0, 72.0, 108.0, 154.0, 243.0, 376.0, 579.0, 905.0, 1666.0, 3057.0, 6111.0, 13383.0, 33300.0, 101944.0, 397524.0, 345858.0, 88691.0, 29747.0, 12230.0, 5635.0, 2819.0, 1496.0, 881.0, 549.0, 339.0, 223.0, 133.0, 110.0, 81.0, 49.0, 35.0, 19.0, 16.0, 10.0, 7.0, 12.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.218505859375, -0.21120834350585938, -0.20391082763671875, -0.19661331176757812, -0.1893157958984375, -0.18201828002929688, -0.17472076416015625, -0.16742324829101562, -0.160125732421875, -0.15282821655273438, -0.14553070068359375, -0.13823318481445312, -0.1309356689453125, -0.12363815307617188, -0.11634063720703125, -0.10904312133789062, -0.10174560546875, -0.09444808959960938, -0.08715057373046875, -0.07985305786132812, -0.0725555419921875, -0.06525802612304688, -0.05796051025390625, -0.050662994384765625, -0.043365478515625, -0.036067962646484375, -0.02877044677734375, -0.021472930908203125, -0.0141754150390625, -0.006877899169921875, 0.00041961669921875, 0.007717132568359375, 0.0150146484375, 0.022312164306640625, 0.02960968017578125, 0.036907196044921875, 0.0442047119140625, 0.051502227783203125, 0.05879974365234375, 0.06609725952148438, 0.073394775390625, 0.08069229125976562, 0.08798980712890625, 0.09528732299804688, 0.1025848388671875, 0.10988235473632812, 0.11717987060546875, 0.12447738647460938, 0.13177490234375, 0.13907241821289062, 0.14636993408203125, 0.15366744995117188, 0.1609649658203125, 0.16826248168945312, 0.17555999755859375, 0.18285751342773438, 0.190155029296875, 0.19745254516601562, 0.20475006103515625, 0.21204757690429688, 0.2193450927734375, 0.22664260864257812, 0.23394012451171875, 0.24123764038085938, 0.24853515625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 5.0, 12.0, 10.0, 13.0, 17.0, 20.0, 28.0, 29.0, 42.0, 57.0, 91.0, 95.0, 127.0, 101.0, 71.0, 65.0, 41.0, 44.0, 30.0, 21.0, 17.0, 13.0, 10.0, 11.0, 9.0, 4.0, 0.0, 7.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0361328125, -0.03486919403076172, -0.03360557556152344, -0.032341957092285156, -0.031078338623046875, -0.029814720153808594, -0.028551101684570312, -0.02728748321533203, -0.02602386474609375, -0.02476024627685547, -0.023496627807617188, -0.022233009338378906, -0.020969390869140625, -0.019705772399902344, -0.018442153930664062, -0.01717853546142578, -0.0159149169921875, -0.014651298522949219, -0.013387680053710938, -0.012124061584472656, -0.010860443115234375, -0.009596824645996094, -0.008333206176757812, -0.007069587707519531, -0.00580596923828125, -0.004542350769042969, -0.0032787322998046875, -0.0020151138305664062, -0.000751495361328125, 0.0005121231079101562, 0.0017757415771484375, 0.0030393600463867188, 0.004302978515625, 0.005566596984863281, 0.0068302154541015625, 0.008093833923339844, 0.009357452392578125, 0.010621070861816406, 0.011884689331054688, 0.013148307800292969, 0.01441192626953125, 0.01567554473876953, 0.016939163208007812, 0.018202781677246094, 0.019466400146484375, 0.020730018615722656, 0.021993637084960938, 0.02325725555419922, 0.0245208740234375, 0.02578449249267578, 0.027048110961914062, 0.028311729431152344, 0.029575347900390625, 0.030838966369628906, 0.03210258483886719, 0.03336620330810547, 0.03462982177734375, 0.03589344024658203, 0.03715705871582031, 0.038420677185058594, 0.039684295654296875, 0.040947914123535156, 0.04221153259277344, 0.04347515106201172, 0.04473876953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 5.0, 3.0, 7.0, 7.0, 11.0, 8.0, 18.0, 22.0, 35.0, 42.0, 52.0, 86.0, 109.0, 178.0, 296.0, 406.0, 732.0, 1465.0, 3851.0, 13555.0, 60782.0, 313426.0, 502657.0, 116425.0, 23787.0, 6025.0, 2141.0, 917.0, 537.0, 345.0, 190.0, 127.0, 88.0, 60.0, 39.0, 32.0, 25.0, 20.0, 10.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.276123046875, -0.26727294921875, -0.2584228515625, -0.24957275390625, -0.24072265625, -0.23187255859375, -0.2230224609375, -0.21417236328125, -0.205322265625, -0.19647216796875, -0.1876220703125, -0.17877197265625, -0.169921875, -0.16107177734375, -0.1522216796875, -0.14337158203125, -0.134521484375, -0.12567138671875, -0.1168212890625, -0.10797119140625, -0.09912109375, -0.09027099609375, -0.0814208984375, -0.07257080078125, -0.063720703125, -0.05487060546875, -0.0460205078125, -0.03717041015625, -0.0283203125, -0.01947021484375, -0.0106201171875, -0.00177001953125, 0.007080078125, 0.01593017578125, 0.0247802734375, 0.03363037109375, 0.04248046875, 0.05133056640625, 0.0601806640625, 0.06903076171875, 0.077880859375, 0.08673095703125, 0.0955810546875, 0.10443115234375, 0.11328125, 0.12213134765625, 0.1309814453125, 0.13983154296875, 0.148681640625, 0.15753173828125, 0.1663818359375, 0.17523193359375, 0.18408203125, 0.19293212890625, 0.2017822265625, 0.21063232421875, 0.219482421875, 0.22833251953125, 0.2371826171875, 0.24603271484375, 0.2548828125, 0.26373291015625, 0.2725830078125, 0.28143310546875, 0.290283203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 3.0, 4.0, 6.0, 9.0, 8.0, 10.0, 8.0, 18.0, 15.0, 14.0, 22.0, 28.0, 24.0, 23.0, 31.0, 34.0, 34.0, 49.0, 32.0, 33.0, 37.0, 41.0, 46.0, 47.0, 54.0, 46.0, 48.0, 48.0, 41.0, 28.0, 22.0, 19.0, 17.0, 25.0, 11.0, 11.0, 16.0, 7.0, 13.0, 9.0, 4.0, 4.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.149169921875, -0.14434814453125, -0.1395263671875, -0.13470458984375, -0.1298828125, -0.12506103515625, -0.1202392578125, -0.11541748046875, -0.110595703125, -0.10577392578125, -0.1009521484375, -0.09613037109375, -0.09130859375, -0.08648681640625, -0.0816650390625, -0.07684326171875, -0.072021484375, -0.06719970703125, -0.0623779296875, -0.05755615234375, -0.052734375, -0.04791259765625, -0.0430908203125, -0.03826904296875, -0.033447265625, -0.02862548828125, -0.0238037109375, -0.01898193359375, -0.01416015625, -0.00933837890625, -0.0045166015625, 0.00030517578125, 0.005126953125, 0.00994873046875, 0.0147705078125, 0.01959228515625, 0.0244140625, 0.02923583984375, 0.0340576171875, 0.03887939453125, 0.043701171875, 0.04852294921875, 0.0533447265625, 0.05816650390625, 0.06298828125, 0.06781005859375, 0.0726318359375, 0.07745361328125, 0.082275390625, 0.08709716796875, 0.0919189453125, 0.09674072265625, 0.1015625, 0.10638427734375, 0.1112060546875, 0.11602783203125, 0.120849609375, 0.12567138671875, 0.1304931640625, 0.13531494140625, 0.14013671875, 0.14495849609375, 0.1497802734375, 0.15460205078125, 0.159423828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 5.0, 10.0, 10.0, 20.0, 20.0, 30.0, 45.0, 79.0, 148.0, 212.0, 406.0, 787.0, 1517.0, 3633.0, 8838.0, 25182.0, 85201.0, 305035.0, 415140.0, 140361.0, 39441.0, 13031.0, 4951.0, 2238.0, 969.0, 506.0, 279.0, 170.0, 92.0, 56.0, 41.0, 29.0, 25.0, 12.0, 10.0, 6.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1419677734375, -0.1378154754638672, -0.13366317749023438, -0.12951087951660156, -0.12535858154296875, -0.12120628356933594, -0.11705398559570312, -0.11290168762207031, -0.1087493896484375, -0.10459709167480469, -0.10044479370117188, -0.09629249572753906, -0.09214019775390625, -0.08798789978027344, -0.08383560180664062, -0.07968330383300781, -0.075531005859375, -0.07137870788574219, -0.06722640991210938, -0.06307411193847656, -0.05892181396484375, -0.05476951599121094, -0.050617218017578125, -0.04646492004394531, -0.0423126220703125, -0.03816032409667969, -0.034008026123046875, -0.029855728149414062, -0.02570343017578125, -0.021551132202148438, -0.017398834228515625, -0.013246536254882812, -0.00909423828125, -0.0049419403076171875, -0.000789642333984375, 0.0033626556396484375, 0.00751495361328125, 0.011667251586914062, 0.015819549560546875, 0.019971847534179688, 0.0241241455078125, 0.028276443481445312, 0.032428741455078125, 0.03658103942871094, 0.04073333740234375, 0.04488563537597656, 0.049037933349609375, 0.05319023132324219, 0.057342529296875, 0.06149482727050781, 0.06564712524414062, 0.06979942321777344, 0.07395172119140625, 0.07810401916503906, 0.08225631713867188, 0.08640861511230469, 0.0905609130859375, 0.09471321105957031, 0.09886550903320312, 0.10301780700683594, 0.10717010498046875, 0.11132240295410156, 0.11547470092773438, 0.11962699890136719, 0.123779296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 3.0, 4.0, 11.0, 33.0, 31.0, 42.0, 50.0, 49.0, 73.0, 106.0, 88.0, 85.0, 70.0, 73.0, 65.0, 66.0, 37.0, 28.0, 23.0, 16.0, 11.0, 8.0, 11.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00012218952178955078, -0.00011922325938940048, -0.00011625699698925018, -0.00011329073458909988, -0.00011032447218894958, -0.00010735820978879929, -0.00010439194738864899, -0.00010142568498849869, -9.845942258834839e-05, -9.549316018819809e-05, -9.252689778804779e-05, -8.956063538789749e-05, -8.659437298774719e-05, -8.36281105875969e-05, -8.06618481874466e-05, -7.76955857872963e-05, -7.4729323387146e-05, -7.17630609869957e-05, -6.87967985868454e-05, -6.58305361866951e-05, -6.28642737865448e-05, -5.98980113863945e-05, -5.69317489862442e-05, -5.39654865860939e-05, -5.0999224185943604e-05, -4.8032961785793304e-05, -4.5066699385643005e-05, -4.2100436985492706e-05, -3.913417458534241e-05, -3.616791218519211e-05, -3.320164978504181e-05, -3.023538738489151e-05, -2.726912498474121e-05, -2.4302862584590912e-05, -2.1336600184440613e-05, -1.8370337784290314e-05, -1.5404075384140015e-05, -1.2437812983989716e-05, -9.471550583839417e-06, -6.5052881836891174e-06, -3.5390257835388184e-06, -5.727633833885193e-07, 2.3934990167617798e-06, 5.359761416912079e-06, 8.326023817062378e-06, 1.1292286217212677e-05, 1.4258548617362976e-05, 1.7224811017513275e-05, 2.0191073417663574e-05, 2.3157335817813873e-05, 2.6123598217964172e-05, 2.908986061811447e-05, 3.205612301826477e-05, 3.502238541841507e-05, 3.798864781856537e-05, 4.095491021871567e-05, 4.392117261886597e-05, 4.6887435019016266e-05, 4.9853697419166565e-05, 5.2819959819316864e-05, 5.578622221946716e-05, 5.875248461961746e-05, 6.171874701976776e-05, 6.468500941991806e-05, 6.765127182006836e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 6.0, 7.0, 15.0, 10.0, 33.0, 56.0, 67.0, 120.0, 266.0, 432.0, 1054.0, 2957.0, 11421.0, 71307.0, 608955.0, 309265.0, 32699.0, 6485.0, 1897.0, 740.0, 332.0, 181.0, 90.0, 53.0, 40.0, 18.0, 18.0, 11.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2352294921875, -0.2280597686767578, -0.22089004516601562, -0.21372032165527344, -0.20655059814453125, -0.19938087463378906, -0.19221115112304688, -0.1850414276123047, -0.1778717041015625, -0.1707019805908203, -0.16353225708007812, -0.15636253356933594, -0.14919281005859375, -0.14202308654785156, -0.13485336303710938, -0.1276836395263672, -0.120513916015625, -0.11334419250488281, -0.10617446899414062, -0.09900474548339844, -0.09183502197265625, -0.08466529846191406, -0.07749557495117188, -0.07032585144042969, -0.0631561279296875, -0.05598640441894531, -0.048816680908203125, -0.04164695739746094, -0.03447723388671875, -0.027307510375976562, -0.020137786865234375, -0.012968063354492188, -0.00579833984375, 0.0013713836669921875, 0.008541107177734375, 0.015710830688476562, 0.02288055419921875, 0.030050277709960938, 0.037220001220703125, 0.04438972473144531, 0.0515594482421875, 0.05872917175292969, 0.06589889526367188, 0.07306861877441406, 0.08023834228515625, 0.08740806579589844, 0.09457778930664062, 0.10174751281738281, 0.108917236328125, 0.11608695983886719, 0.12325668334960938, 0.13042640686035156, 0.13759613037109375, 0.14476585388183594, 0.15193557739257812, 0.1591053009033203, 0.1662750244140625, 0.1734447479248047, 0.18061447143554688, 0.18778419494628906, 0.19495391845703125, 0.20212364196777344, 0.20929336547851562, 0.2164630889892578, 0.2236328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 8.0, 15.0, 9.0, 15.0, 25.0, 34.0, 41.0, 53.0, 61.0, 85.0, 99.0, 113.0, 89.0, 93.0, 63.0, 39.0, 39.0, 26.0, 15.0, 14.0, 14.0, 11.0, 9.0, 5.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.1273193359375, -0.12417125701904297, -0.12102317810058594, -0.1178750991821289, -0.11472702026367188, -0.11157894134521484, -0.10843086242675781, -0.10528278350830078, -0.10213470458984375, -0.09898662567138672, -0.09583854675292969, -0.09269046783447266, -0.08954238891601562, -0.0863943099975586, -0.08324623107910156, -0.08009815216064453, -0.0769500732421875, -0.07380199432373047, -0.07065391540527344, -0.0675058364868164, -0.06435775756835938, -0.061209678649902344, -0.05806159973144531, -0.05491352081298828, -0.05176544189453125, -0.04861736297607422, -0.04546928405761719, -0.042321205139160156, -0.039173126220703125, -0.036025047302246094, -0.03287696838378906, -0.02972888946533203, -0.026580810546875, -0.02343273162841797, -0.020284652709960938, -0.017136573791503906, -0.013988494873046875, -0.010840415954589844, -0.0076923370361328125, -0.004544258117675781, -0.00139617919921875, 0.0017518997192382812, 0.0048999786376953125, 0.008048057556152344, 0.011196136474609375, 0.014344215393066406, 0.017492294311523438, 0.02064037322998047, 0.0237884521484375, 0.02693653106689453, 0.030084609985351562, 0.033232688903808594, 0.036380767822265625, 0.039528846740722656, 0.04267692565917969, 0.04582500457763672, 0.04897308349609375, 0.05212116241455078, 0.05526924133300781, 0.058417320251464844, 0.061565399169921875, 0.0647134780883789, 0.06786155700683594, 0.07100963592529297, 0.07415771484375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 10.0, 18.0, 32.0, 57.0, 146.0, 224.0, 230.0, 141.0, 71.0, 38.0, 12.0, 14.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.209059953689575, -3.1378350257873535, -3.066610097885132, -2.99538516998291, -2.9241602420806885, -2.852935314178467, -2.781710386276245, -2.7104854583740234, -2.6392602920532227, -2.568035364151001, -2.4968104362487793, -2.4255855083465576, -2.354360580444336, -2.2831356525421143, -2.2119107246398926, -2.140685558319092, -2.069460868835449, -1.9982359409332275, -1.9270110130310059, -1.8557860851287842, -1.7845611572265625, -1.7133362293243408, -1.6421111822128296, -1.570886254310608, -1.4996613264083862, -1.4284363985061646, -1.3572114706039429, -1.2859865427017212, -1.21476149559021, -1.1435365676879883, -1.0723116397857666, -1.001086711883545, -0.9298619031906128, -0.8586369752883911, -0.7874120473861694, -0.716187059879303, -0.6449621319770813, -0.5737372040748596, -0.5025122165679932, -0.4312872886657715, -0.3600623607635498, -0.2888374328613281, -0.21761247515678406, -0.14638753235340118, -0.07516258955001831, -0.003937661647796631, 0.06728729605674744, 0.1385122537612915, 0.20973718166351318, 0.28096210956573486, 0.35218706727027893, 0.423412024974823, 0.4946369528770447, 0.5658618807792664, 0.6370868682861328, 0.7083117961883545, 0.7795367240905762, 0.8507616519927979, 0.9219865798950195, 0.993211567401886, 1.064436435699463, 1.1356613636016846, 1.2068864107131958, 1.2781113386154175, 1.3493362665176392]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 4.0, 11.0, 7.0, 18.0, 13.0, 20.0, 28.0, 31.0, 38.0, 31.0, 44.0, 50.0, 57.0, 61.0, 65.0, 72.0, 78.0, 58.0, 48.0, 43.0, 44.0, 35.0, 32.0, 32.0, 23.0, 17.0, 11.0, 10.0, 3.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.0063319206237793, -1.957811713218689, -1.9092915058135986, -1.8607712984085083, -1.812251091003418, -1.763730764389038, -1.7152105569839478, -1.6666903495788574, -1.618170142173767, -1.5696499347686768, -1.5211297273635864, -1.472609519958496, -1.4240891933441162, -1.3755689859390259, -1.3270487785339355, -1.2785285711288452, -1.2300083637237549, -1.1814881563186646, -1.1329679489135742, -1.0844477415084839, -1.0359275341033936, -0.9874072670936584, -0.9388870000839233, -0.890366792678833, -0.8418465852737427, -0.7933263778686523, -0.744806170463562, -0.6962859034538269, -0.6477656960487366, -0.5992454886436462, -0.5507252216339111, -0.5022050142288208, -0.4536846876144409, -0.4051644802093506, -0.35664424300193787, -0.30812400579452515, -0.2596037983894348, -0.2110835760831833, -0.16256335377693176, -0.11404311656951904, -0.06552290916442871, -0.017002686858177185, 0.03151753544807434, 0.08003775775432587, 0.1285579800605774, 0.17707820236682892, 0.22559842467308044, 0.27411866188049316, 0.3226388692855835, 0.37115907669067383, 0.41967931389808655, 0.46819955110549927, 0.5167197585105896, 0.5652399659156799, 0.613760232925415, 0.6622804403305054, 0.7108006477355957, 0.759320855140686, 0.8078410625457764, 0.8563613295555115, 0.9048815369606018, 0.9534017443656921, 1.0019220113754272, 1.0504422187805176, 1.098962426185608]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 7.0, 10.0, 14.0, 23.0, 35.0, 66.0, 80.0, 195.0, 331.0, 724.0, 1892.0, 6817.0, 53784.0, 3943837.0, 169734.0, 12035.0, 2717.0, 957.0, 459.0, 214.0, 123.0, 74.0, 41.0, 34.0, 17.0, 10.0, 8.0, 15.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77685546875, -0.75067138671875, -0.7244873046875, -0.69830322265625, -0.672119140625, -0.64593505859375, -0.6197509765625, -0.59356689453125, -0.5673828125, -0.54119873046875, -0.5150146484375, -0.48883056640625, -0.462646484375, -0.43646240234375, -0.4102783203125, -0.38409423828125, -0.35791015625, -0.33172607421875, -0.3055419921875, -0.27935791015625, -0.253173828125, -0.22698974609375, -0.2008056640625, -0.17462158203125, -0.1484375, -0.12225341796875, -0.0960693359375, -0.06988525390625, -0.043701171875, -0.01751708984375, 0.0086669921875, 0.03485107421875, 0.06103515625, 0.08721923828125, 0.1134033203125, 0.13958740234375, 0.165771484375, 0.19195556640625, 0.2181396484375, 0.24432373046875, 0.2705078125, 0.29669189453125, 0.3228759765625, 0.34906005859375, 0.375244140625, 0.40142822265625, 0.4276123046875, 0.45379638671875, 0.47998046875, 0.50616455078125, 0.5323486328125, 0.55853271484375, 0.584716796875, 0.61090087890625, 0.6370849609375, 0.66326904296875, 0.689453125, 0.71563720703125, 0.7418212890625, 0.76800537109375, 0.794189453125, 0.82037353515625, 0.8465576171875, 0.87274169921875, 0.89892578125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 7.0, 2.0, 4.0, 4.0, 10.0, 8.0, 11.0, 26.0, 20.0, 21.0, 33.0, 43.0, 41.0, 54.0, 64.0, 71.0, 84.0, 79.0, 70.0, 79.0, 53.0, 43.0, 38.0, 27.0, 28.0, 12.0, 21.0, 9.0, 6.0, 6.0, 5.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04052734375, -0.03921318054199219, -0.037899017333984375, -0.03658485412597656, -0.03527069091796875, -0.03395652770996094, -0.032642364501953125, -0.03132820129394531, -0.0300140380859375, -0.028699874877929688, -0.027385711669921875, -0.026071548461914062, -0.02475738525390625, -0.023443222045898438, -0.022129058837890625, -0.020814895629882812, -0.019500732421875, -0.018186569213867188, -0.016872406005859375, -0.015558242797851562, -0.01424407958984375, -0.012929916381835938, -0.011615753173828125, -0.010301589965820312, -0.0089874267578125, -0.0076732635498046875, -0.006359100341796875, -0.0050449371337890625, -0.00373077392578125, -0.0024166107177734375, -0.001102447509765625, 0.0002117156982421875, 0.00152587890625, 0.0028400421142578125, 0.004154205322265625, 0.0054683685302734375, 0.00678253173828125, 0.008096694946289062, 0.009410858154296875, 0.010725021362304688, 0.0120391845703125, 0.013353347778320312, 0.014667510986328125, 0.015981674194335938, 0.01729583740234375, 0.018610000610351562, 0.019924163818359375, 0.021238327026367188, 0.022552490234375, 0.023866653442382812, 0.025180816650390625, 0.026494979858398438, 0.02780914306640625, 0.029123306274414062, 0.030437469482421875, 0.03175163269042969, 0.0330657958984375, 0.03437995910644531, 0.035694122314453125, 0.03700828552246094, 0.03832244873046875, 0.03963661193847656, 0.040950775146484375, 0.04226493835449219, 0.0435791015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 12.0, 15.0, 29.0, 54.0, 112.0, 222.0, 510.0, 1617.0, 5566.0, 26021.0, 216274.0, 3611162.0, 292262.0, 30764.0, 6482.0, 1920.0, 659.0, 275.0, 134.0, 74.0, 45.0, 26.0, 19.0, 16.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.344970703125, -0.3314704895019531, -0.31797027587890625, -0.3044700622558594, -0.2909698486328125, -0.2774696350097656, -0.26396942138671875, -0.2504692077636719, -0.236968994140625, -0.22346878051757812, -0.20996856689453125, -0.19646835327148438, -0.1829681396484375, -0.16946792602539062, -0.15596771240234375, -0.14246749877929688, -0.12896728515625, -0.11546707153320312, -0.10196685791015625, -0.08846664428710938, -0.0749664306640625, -0.061466217041015625, -0.04796600341796875, -0.034465789794921875, -0.020965576171875, -0.007465362548828125, 0.00603485107421875, 0.019535064697265625, 0.0330352783203125, 0.046535491943359375, 0.06003570556640625, 0.07353591918945312, 0.0870361328125, 0.10053634643554688, 0.11403656005859375, 0.12753677368164062, 0.1410369873046875, 0.15453720092773438, 0.16803741455078125, 0.18153762817382812, 0.195037841796875, 0.20853805541992188, 0.22203826904296875, 0.23553848266601562, 0.2490386962890625, 0.2625389099121094, 0.27603912353515625, 0.2895393371582031, 0.30303955078125, 0.3165397644042969, 0.33003997802734375, 0.3435401916503906, 0.3570404052734375, 0.3705406188964844, 0.38404083251953125, 0.3975410461425781, 0.411041259765625, 0.4245414733886719, 0.43804168701171875, 0.4515419006347656, 0.4650421142578125, 0.4785423278808594, 0.49204254150390625, 0.5055427551269531, 0.51904296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 13.0, 17.0, 20.0, 27.0, 45.0, 89.0, 147.0, 224.0, 576.0, 1771.0, 570.0, 238.0, 130.0, 80.0, 39.0, 27.0, 23.0, 20.0, 9.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06072998046875, -0.05761241912841797, -0.05449485778808594, -0.051377296447753906, -0.048259735107421875, -0.045142173767089844, -0.04202461242675781, -0.03890705108642578, -0.03578948974609375, -0.03267192840576172, -0.029554367065429688, -0.026436805725097656, -0.023319244384765625, -0.020201683044433594, -0.017084121704101562, -0.013966560363769531, -0.0108489990234375, -0.007731437683105469, -0.0046138763427734375, -0.0014963150024414062, 0.001621246337890625, 0.004738807678222656, 0.007856369018554688, 0.010973930358886719, 0.01409149169921875, 0.01720905303955078, 0.020326614379882812, 0.023444175720214844, 0.026561737060546875, 0.029679298400878906, 0.03279685974121094, 0.03591442108154297, 0.039031982421875, 0.04214954376220703, 0.04526710510253906, 0.048384666442871094, 0.051502227783203125, 0.054619789123535156, 0.05773735046386719, 0.06085491180419922, 0.06397247314453125, 0.06709003448486328, 0.07020759582519531, 0.07332515716552734, 0.07644271850585938, 0.0795602798461914, 0.08267784118652344, 0.08579540252685547, 0.0889129638671875, 0.09203052520751953, 0.09514808654785156, 0.0982656478881836, 0.10138320922851562, 0.10450077056884766, 0.10761833190917969, 0.11073589324951172, 0.11385345458984375, 0.11697101593017578, 0.12008857727050781, 0.12320613861083984, 0.12632369995117188, 0.1294412612915039, 0.13255882263183594, 0.13567638397216797, 0.1387939453125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 18.0, 33.0, 82.0, 183.0, 302.0, 233.0, 92.0, 43.0, 12.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2170950323343277, -0.19176141917705536, -0.16642779111862183, -0.1410941779613495, -0.11576056480407715, -0.09042695164680481, -0.06509332358837128, -0.03975971043109894, -0.014426097273826599, 0.010907519608736038, 0.036241136491298676, 0.06157475709915161, 0.08690837025642395, 0.11224198341369629, 0.13757561147212982, 0.16290922462940216, 0.1882428377866745, 0.21357645094394684, 0.23891007900238037, 0.2642436921596527, 0.28957730531692505, 0.3149109184741974, 0.3402445316314697, 0.36557817459106445, 0.3909117579460144, 0.41624537110328674, 0.4415789842605591, 0.4669126272201538, 0.49224621057510376, 0.5175798535346985, 0.5429134368896484, 0.5682470798492432, 0.5935807228088379, 0.6189143657684326, 0.6442479491233826, 0.6695815920829773, 0.6949151754379272, 0.720248818397522, 0.7455824613571167, 0.7709160447120667, 0.7962496280670166, 0.8215832710266113, 0.8469168543815613, 0.872250497341156, 0.897584080696106, 0.9229177236557007, 0.9482513666152954, 0.9735849499702454, 0.9989185929298401, 1.02425217628479, 1.0495858192443848, 1.0749194622039795, 1.1002531051635742, 1.1255866289138794, 1.1509202718734741, 1.1762539148330688, 1.2015875577926636, 1.2269212007522583, 1.252254843711853, 1.2775883674621582, 1.302922010421753, 1.3282556533813477, 1.3535892963409424, 1.378922939300537, 1.4042564630508423]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 9.0, 7.0, 14.0, 11.0, 9.0, 15.0, 16.0, 13.0, 14.0, 24.0, 40.0, 31.0, 24.0, 40.0, 44.0, 52.0, 38.0, 45.0, 48.0, 36.0, 46.0, 62.0, 37.0, 45.0, 43.0, 32.0, 33.0, 31.0, 20.0, 16.0, 17.0, 16.0, 6.0, 10.0, 12.0, 10.0, 8.0, 7.0, 9.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2006056308746338, -0.1934179812669754, -0.1862303465604782, -0.17904269695281982, -0.17185504734516144, -0.16466739773750305, -0.15747976303100586, -0.15029211342334747, -0.1431044638156891, -0.1359168142080307, -0.1287291795015335, -0.12154152989387512, -0.11435388028621674, -0.10716623812913895, -0.09997859597206116, -0.09279094636440277, -0.08560331165790558, -0.07841566950082779, -0.0712280198931694, -0.06404037773609161, -0.056852731853723526, -0.04966508597135544, -0.04247744381427765, -0.03528979793190956, -0.028102152049541473, -0.020914506167173386, -0.013726862147450447, -0.0065392181277275085, 0.0006484277546405792, 0.007836073637008667, 0.015023715794086456, 0.022211361676454544, 0.029399007558822632, 0.03658665344119072, 0.04377429932355881, 0.0509619414806366, 0.058149587363004684, 0.06533723324537277, 0.07252487540245056, 0.07971252501010895, 0.08690016716718674, 0.09408780932426453, 0.10127545893192291, 0.1084631010890007, 0.11565074324607849, 0.12283839285373688, 0.13002604246139526, 0.13721367716789246, 0.14440132677555084, 0.15158897638320923, 0.15877661108970642, 0.1659642606973648, 0.1731519103050232, 0.18033954501152039, 0.18752719461917877, 0.19471484422683716, 0.20190247893333435, 0.20909012854099274, 0.21627776324748993, 0.22346541285514832, 0.2306530624628067, 0.2378407120704651, 0.24502834677696228, 0.2522159814834595, 0.25940364599227905]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 9.0, 9.0, 15.0, 28.0, 25.0, 34.0, 66.0, 109.0, 160.0, 269.0, 456.0, 849.0, 1660.0, 3403.0, 8192.0, 24305.0, 88347.0, 347761.0, 413087.0, 111932.0, 30023.0, 9744.0, 3993.0, 1823.0, 963.0, 508.0, 269.0, 185.0, 106.0, 73.0, 44.0, 38.0, 16.0, 11.0, 11.0, 8.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2406005859375, -0.2323284149169922, -0.22405624389648438, -0.21578407287597656, -0.20751190185546875, -0.19923973083496094, -0.19096755981445312, -0.1826953887939453, -0.1744232177734375, -0.1661510467529297, -0.15787887573242188, -0.14960670471191406, -0.14133453369140625, -0.13306236267089844, -0.12479019165039062, -0.11651802062988281, -0.108245849609375, -0.09997367858886719, -0.09170150756835938, -0.08342933654785156, -0.07515716552734375, -0.06688499450683594, -0.058612823486328125, -0.05034065246582031, -0.0420684814453125, -0.03379631042480469, -0.025524139404296875, -0.017251968383789062, -0.00897979736328125, -0.0007076263427734375, 0.007564544677734375, 0.015836715698242188, 0.02410888671875, 0.03238105773925781, 0.040653228759765625, 0.04892539978027344, 0.05719757080078125, 0.06546974182128906, 0.07374191284179688, 0.08201408386230469, 0.0902862548828125, 0.09855842590332031, 0.10683059692382812, 0.11510276794433594, 0.12337493896484375, 0.13164710998535156, 0.13991928100585938, 0.1481914520263672, 0.156463623046875, 0.1647357940673828, 0.17300796508789062, 0.18128013610839844, 0.18955230712890625, 0.19782447814941406, 0.20609664916992188, 0.2143688201904297, 0.2226409912109375, 0.2309131622314453, 0.23918533325195312, 0.24745750427246094, 0.25572967529296875, 0.26400184631347656, 0.2722740173339844, 0.2805461883544922, 0.288818359375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 11.0, 9.0, 20.0, 30.0, 25.0, 36.0, 39.0, 44.0, 61.0, 71.0, 86.0, 82.0, 71.0, 81.0, 68.0, 50.0, 41.0, 34.0, 33.0, 13.0, 17.0, 16.0, 12.0, 4.0, 8.0, 10.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0382080078125, -0.03683042526245117, -0.035452842712402344, -0.034075260162353516, -0.03269767761230469, -0.03132009506225586, -0.02994251251220703, -0.028564929962158203, -0.027187347412109375, -0.025809764862060547, -0.02443218231201172, -0.02305459976196289, -0.021677017211914062, -0.020299434661865234, -0.018921852111816406, -0.017544269561767578, -0.01616668701171875, -0.014789104461669922, -0.013411521911621094, -0.012033939361572266, -0.010656356811523438, -0.00927877426147461, -0.007901191711425781, -0.006523609161376953, -0.005146026611328125, -0.003768444061279297, -0.0023908615112304688, -0.0010132789611816406, 0.0003643035888671875, 0.0017418861389160156, 0.0031194686889648438, 0.004497051239013672, 0.0058746337890625, 0.007252216339111328, 0.008629798889160156, 0.010007381439208984, 0.011384963989257812, 0.01276254653930664, 0.014140129089355469, 0.015517711639404297, 0.016895294189453125, 0.018272876739501953, 0.01965045928955078, 0.02102804183959961, 0.022405624389648438, 0.023783206939697266, 0.025160789489746094, 0.026538372039794922, 0.02791595458984375, 0.029293537139892578, 0.030671119689941406, 0.032048702239990234, 0.03342628479003906, 0.03480386734008789, 0.03618144989013672, 0.03755903244018555, 0.038936614990234375, 0.0403141975402832, 0.04169178009033203, 0.04306936264038086, 0.04444694519042969, 0.045824527740478516, 0.047202110290527344, 0.04857969284057617, 0.049957275390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 10.0, 15.0, 13.0, 19.0, 20.0, 39.0, 54.0, 88.0, 103.0, 138.0, 224.0, 350.0, 637.0, 1127.0, 2496.0, 6776.0, 21462.0, 79860.0, 304304.0, 440910.0, 136737.0, 35495.0, 10425.0, 3650.0, 1527.0, 770.0, 417.0, 282.0, 172.0, 122.0, 88.0, 56.0, 44.0, 23.0, 16.0, 19.0, 16.0, 8.0, 10.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.278076171875, -0.2696990966796875, -0.261322021484375, -0.2529449462890625, -0.24456787109375, -0.2361907958984375, -0.227813720703125, -0.2194366455078125, -0.2110595703125, -0.2026824951171875, -0.194305419921875, -0.1859283447265625, -0.17755126953125, -0.1691741943359375, -0.160797119140625, -0.1524200439453125, -0.14404296875, -0.1356658935546875, -0.127288818359375, -0.1189117431640625, -0.11053466796875, -0.1021575927734375, -0.093780517578125, -0.0854034423828125, -0.0770263671875, -0.0686492919921875, -0.060272216796875, -0.0518951416015625, -0.04351806640625, -0.0351409912109375, -0.026763916015625, -0.0183868408203125, -0.010009765625, -0.0016326904296875, 0.006744384765625, 0.0151214599609375, 0.02349853515625, 0.0318756103515625, 0.040252685546875, 0.0486297607421875, 0.0570068359375, 0.0653839111328125, 0.073760986328125, 0.0821380615234375, 0.09051513671875, 0.0988922119140625, 0.107269287109375, 0.1156463623046875, 0.1240234375, 0.1324005126953125, 0.140777587890625, 0.1491546630859375, 0.15753173828125, 0.1659088134765625, 0.174285888671875, 0.1826629638671875, 0.1910400390625, 0.1994171142578125, 0.207794189453125, 0.2161712646484375, 0.22454833984375, 0.2329254150390625, 0.241302490234375, 0.2496795654296875, 0.258056640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 9.0, 8.0, 8.0, 12.0, 8.0, 14.0, 16.0, 18.0, 23.0, 23.0, 33.0, 20.0, 39.0, 30.0, 32.0, 35.0, 56.0, 51.0, 35.0, 39.0, 57.0, 47.0, 30.0, 41.0, 49.0, 34.0, 28.0, 30.0, 21.0, 16.0, 18.0, 23.0, 20.0, 11.0, 13.0, 14.0, 8.0, 6.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.20263671875, -0.19637489318847656, -0.19011306762695312, -0.1838512420654297, -0.17758941650390625, -0.1713275909423828, -0.16506576538085938, -0.15880393981933594, -0.1525421142578125, -0.14628028869628906, -0.14001846313476562, -0.1337566375732422, -0.12749481201171875, -0.12123298645019531, -0.11497116088867188, -0.10870933532714844, -0.102447509765625, -0.09618568420410156, -0.08992385864257812, -0.08366203308105469, -0.07740020751953125, -0.07113838195800781, -0.06487655639648438, -0.05861473083496094, -0.0523529052734375, -0.04609107971191406, -0.039829254150390625, -0.03356742858886719, -0.02730560302734375, -0.021043777465820312, -0.014781951904296875, -0.008520126342773438, -0.00225830078125, 0.0040035247802734375, 0.010265350341796875, 0.016527175903320312, 0.02278900146484375, 0.029050827026367188, 0.035312652587890625, 0.04157447814941406, 0.0478363037109375, 0.05409812927246094, 0.060359954833984375, 0.06662178039550781, 0.07288360595703125, 0.07914543151855469, 0.08540725708007812, 0.09166908264160156, 0.097930908203125, 0.10419273376464844, 0.11045455932617188, 0.11671638488769531, 0.12297821044921875, 0.1292400360107422, 0.13550186157226562, 0.14176368713378906, 0.1480255126953125, 0.15428733825683594, 0.16054916381835938, 0.1668109893798828, 0.17307281494140625, 0.1793346405029297, 0.18559646606445312, 0.19185829162597656, 0.1981201171875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 10.0, 18.0, 45.0, 62.0, 115.0, 210.0, 440.0, 1042.0, 2387.0, 6565.0, 19922.0, 67071.0, 259503.0, 478583.0, 151099.0, 41298.0, 12717.0, 4306.0, 1679.0, 711.0, 332.0, 193.0, 105.0, 52.0, 30.0, 22.0, 13.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10748291015625, -0.10306072235107422, -0.09863853454589844, -0.09421634674072266, -0.08979415893554688, -0.0853719711303711, -0.08094978332519531, -0.07652759552001953, -0.07210540771484375, -0.06768321990966797, -0.06326103210449219, -0.058838844299316406, -0.054416656494140625, -0.049994468688964844, -0.04557228088378906, -0.04115009307861328, -0.0367279052734375, -0.03230571746826172, -0.027883529663085938, -0.023461341857910156, -0.019039154052734375, -0.014616966247558594, -0.010194778442382812, -0.005772590637207031, -0.00135040283203125, 0.0030717849731445312, 0.0074939727783203125, 0.011916160583496094, 0.016338348388671875, 0.020760536193847656, 0.025182723999023438, 0.02960491180419922, 0.034027099609375, 0.03844928741455078, 0.04287147521972656, 0.047293663024902344, 0.051715850830078125, 0.056138038635253906, 0.06056022644042969, 0.06498241424560547, 0.06940460205078125, 0.07382678985595703, 0.07824897766113281, 0.0826711654663086, 0.08709335327148438, 0.09151554107666016, 0.09593772888183594, 0.10035991668701172, 0.1047821044921875, 0.10920429229736328, 0.11362648010253906, 0.11804866790771484, 0.12247085571289062, 0.1268930435180664, 0.1313152313232422, 0.13573741912841797, 0.14015960693359375, 0.14458179473876953, 0.1490039825439453, 0.1534261703491211, 0.15784835815429688, 0.16227054595947266, 0.16669273376464844, 0.17111492156982422, 0.175537109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 5.0, 1.0, 7.0, 9.0, 15.0, 24.0, 47.0, 50.0, 54.0, 87.0, 106.0, 90.0, 109.0, 104.0, 75.0, 53.0, 46.0, 36.0, 30.0, 20.0, 12.0, 10.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013554096221923828, -0.00013245176523923874, -0.0001293625682592392, -0.00012627337127923965, -0.0001231841742992401, -0.00012009497731924057, -0.00011700578033924103, -0.00011391658335924149, -0.00011082738637924194, -0.0001077381893992424, -0.00010464899241924286, -0.00010155979543924332, -9.847059845924377e-05, -9.538140147924423e-05, -9.229220449924469e-05, -8.920300751924515e-05, -8.61138105392456e-05, -8.302461355924606e-05, -7.993541657924652e-05, -7.684621959924698e-05, -7.375702261924744e-05, -7.06678256392479e-05, -6.757862865924835e-05, -6.448943167924881e-05, -6.140023469924927e-05, -5.8311037719249725e-05, -5.522184073925018e-05, -5.213264375925064e-05, -4.90434467792511e-05, -4.5954249799251556e-05, -4.2865052819252014e-05, -3.977585583925247e-05, -3.668665885925293e-05, -3.359746187925339e-05, -3.0508264899253845e-05, -2.7419067919254303e-05, -2.432987093925476e-05, -2.124067395925522e-05, -1.8151476979255676e-05, -1.5062279999256134e-05, -1.1973083019256592e-05, -8.88388603925705e-06, -5.794689059257507e-06, -2.705492079257965e-06, 3.8370490074157715e-07, 3.4729018807411194e-06, 6.562098860740662e-06, 9.651295840740204e-06, 1.2740492820739746e-05, 1.582968980073929e-05, 1.891888678073883e-05, 2.2008083760738373e-05, 2.5097280740737915e-05, 2.8186477720737457e-05, 3.1275674700737e-05, 3.436487168073654e-05, 3.7454068660736084e-05, 4.0543265640735626e-05, 4.363246262073517e-05, 4.672165960073471e-05, 4.981085658073425e-05, 5.2900053560733795e-05, 5.598925054073334e-05, 5.907844752073288e-05, 6.216764450073242e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 8.0, 2.0, 7.0, 8.0, 14.0, 17.0, 26.0, 46.0, 60.0, 63.0, 103.0, 149.0, 201.0, 331.0, 560.0, 1126.0, 2495.0, 6127.0, 18143.0, 59884.0, 233389.0, 518073.0, 145504.0, 40525.0, 12924.0, 4621.0, 1858.0, 933.0, 465.0, 265.0, 175.0, 115.0, 85.0, 77.0, 44.0, 33.0, 26.0, 23.0, 16.0, 12.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1396484375, -0.13519287109375, -0.1307373046875, -0.12628173828125, -0.121826171875, -0.11737060546875, -0.1129150390625, -0.10845947265625, -0.10400390625, -0.09954833984375, -0.0950927734375, -0.09063720703125, -0.086181640625, -0.08172607421875, -0.0772705078125, -0.07281494140625, -0.068359375, -0.06390380859375, -0.0594482421875, -0.05499267578125, -0.050537109375, -0.04608154296875, -0.0416259765625, -0.03717041015625, -0.03271484375, -0.02825927734375, -0.0238037109375, -0.01934814453125, -0.014892578125, -0.01043701171875, -0.0059814453125, -0.00152587890625, 0.0029296875, 0.00738525390625, 0.0118408203125, 0.01629638671875, 0.020751953125, 0.02520751953125, 0.0296630859375, 0.03411865234375, 0.03857421875, 0.04302978515625, 0.0474853515625, 0.05194091796875, 0.056396484375, 0.06085205078125, 0.0653076171875, 0.06976318359375, 0.07421875, 0.07867431640625, 0.0831298828125, 0.08758544921875, 0.092041015625, 0.09649658203125, 0.1009521484375, 0.10540771484375, 0.10986328125, 0.11431884765625, 0.1187744140625, 0.12322998046875, 0.127685546875, 0.13214111328125, 0.1365966796875, 0.14105224609375, 0.1455078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 1.0, 3.0, 9.0, 9.0, 6.0, 8.0, 15.0, 21.0, 13.0, 24.0, 32.0, 35.0, 46.0, 50.0, 73.0, 78.0, 102.0, 75.0, 63.0, 54.0, 54.0, 45.0, 40.0, 34.0, 19.0, 15.0, 12.0, 12.0, 12.0, 8.0, 7.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-0.09893798828125, -0.09633350372314453, -0.09372901916503906, -0.0911245346069336, -0.08852005004882812, -0.08591556549072266, -0.08331108093261719, -0.08070659637451172, -0.07810211181640625, -0.07549762725830078, -0.07289314270019531, -0.07028865814208984, -0.06768417358398438, -0.0650796890258789, -0.06247520446777344, -0.05987071990966797, -0.0572662353515625, -0.05466175079345703, -0.05205726623535156, -0.049452781677246094, -0.046848297119140625, -0.044243812561035156, -0.04163932800292969, -0.03903484344482422, -0.03643035888671875, -0.03382587432861328, -0.031221389770507812, -0.028616905212402344, -0.026012420654296875, -0.023407936096191406, -0.020803451538085938, -0.01819896697998047, -0.015594482421875, -0.012989997863769531, -0.010385513305664062, -0.007781028747558594, -0.005176544189453125, -0.0025720596313476562, 3.24249267578125e-05, 0.0026369094848632812, 0.00524139404296875, 0.007845878601074219, 0.010450363159179688, 0.013054847717285156, 0.015659332275390625, 0.018263816833496094, 0.020868301391601562, 0.02347278594970703, 0.0260772705078125, 0.02868175506591797, 0.03128623962402344, 0.033890724182128906, 0.036495208740234375, 0.039099693298339844, 0.04170417785644531, 0.04430866241455078, 0.04691314697265625, 0.04951763153076172, 0.05212211608886719, 0.054726600646972656, 0.057331085205078125, 0.059935569763183594, 0.06254005432128906, 0.06514453887939453, 0.0677490234375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 11.0, 8.0, 31.0, 55.0, 105.0, 193.0, 210.0, 170.0, 99.0, 58.0, 24.0, 13.0, 12.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1753957271575928, -1.099431037902832, -1.0234663486480713, -0.9475017189979553, -0.8715370893478394, -0.7955724000930786, -0.7196077108383179, -0.6436430811882019, -0.5676783919334412, -0.4917137324810028, -0.41574907302856445, -0.3397843837738037, -0.26381972432136536, -0.187855064868927, -0.11189037561416626, -0.03592574596405029, 0.04003894329071045, 0.1160036101937294, 0.19196827709674835, 0.2679329514503479, 0.34389761090278625, 0.4198622703552246, 0.49582695960998535, 0.5717915892601013, 0.6477562785148621, 0.7237209677696228, 0.7996855974197388, 0.8756502866744995, 0.9516149759292603, 1.0275795459747314, 1.1035442352294922, 1.179508924484253, 1.2554736137390137, 1.3314383029937744, 1.4074029922485352, 1.483367681503296, 1.559332251548767, 1.6352969408035278, 1.7112616300582886, 1.7872262001037598, 1.8631908893585205, 1.9391555786132812, 2.015120267868042, 2.0910849571228027, 2.1670496463775635, 2.243014335632324, 2.318978786468506, 2.3949434757232666, 2.4709081649780273, 2.546872854232788, 2.622837543487549, 2.6988022327423096, 2.7747669219970703, 2.850731372833252, 2.926696300506592, 3.0026607513427734, 3.0786256790161133, 3.154590368270874, 3.2305550575256348, 3.3065197467803955, 3.3824844360351562, 3.458448886871338, 3.5344138145446777, 3.6103782653808594, 3.68634295463562]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 11.0, 11.0, 10.0, 13.0, 23.0, 14.0, 20.0, 31.0, 26.0, 28.0, 31.0, 30.0, 51.0, 45.0, 41.0, 43.0, 48.0, 45.0, 42.0, 49.0, 45.0, 46.0, 41.0, 40.0, 23.0, 35.0, 18.0, 28.0, 22.0, 8.0, 14.0, 10.0, 16.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4971299171447754, -1.451413869857788, -1.4056979417800903, -1.359981894493103, -1.3142659664154053, -1.268549919128418, -1.2228338718414307, -1.177117943763733, -1.1314020156860352, -1.0856859683990479, -1.03997004032135, -0.9942539930343628, -0.948538064956665, -0.9028220176696777, -0.8571060299873352, -0.8113900423049927, -0.7656739950180054, -0.7199580073356628, -0.6742420196533203, -0.628525972366333, -0.5828100442886353, -0.537093997001648, -0.4913780093193054, -0.4456620216369629, -0.39994603395462036, -0.35423004627227783, -0.3085140585899353, -0.2627980411052704, -0.21708205342292786, -0.17136606574058533, -0.1256500482559204, -0.07993406057357788, -0.03421807289123535, 0.011497922241687775, 0.0572139173746109, 0.10292991995811462, 0.14864590764045715, 0.19436189532279968, 0.2400779128074646, 0.28579390048980713, 0.33150988817214966, 0.3772258758544922, 0.4229418635368347, 0.46865788102149963, 0.5143738985061646, 0.5600898265838623, 0.6058058738708496, 0.6515218615531921, 0.6972378492355347, 0.7429538369178772, 0.7886698246002197, 0.834385871887207, 0.8801017999649048, 0.9258178472518921, 0.9715338349342346, 1.0172498226165771, 1.0629658699035645, 1.1086819171905518, 1.1543978452682495, 1.2001138925552368, 1.2458298206329346, 1.2915458679199219, 1.3372619152069092, 1.382977843284607, 1.4286937713623047]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 7.0, 8.0, 12.0, 5.0, 23.0, 30.0, 39.0, 66.0, 98.0, 158.0, 253.0, 446.0, 710.0, 1336.0, 2904.0, 7868.0, 27157.0, 149589.0, 3602473.0, 337017.0, 44224.0, 11450.0, 4181.0, 1844.0, 911.0, 513.0, 293.0, 210.0, 165.0, 75.0, 59.0, 51.0, 23.0, 23.0, 15.0, 10.0, 5.0, 10.0, 2.0, 6.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33544921875, -0.3248558044433594, -0.31426239013671875, -0.3036689758300781, -0.2930755615234375, -0.2824821472167969, -0.27188873291015625, -0.2612953186035156, -0.250701904296875, -0.24010848999023438, -0.22951507568359375, -0.21892166137695312, -0.2083282470703125, -0.19773483276367188, -0.18714141845703125, -0.17654800415039062, -0.16595458984375, -0.15536117553710938, -0.14476776123046875, -0.13417434692382812, -0.1235809326171875, -0.11298751831054688, -0.10239410400390625, -0.09180068969726562, -0.081207275390625, -0.07061386108398438, -0.06002044677734375, -0.049427032470703125, -0.0388336181640625, -0.028240203857421875, -0.01764678955078125, -0.007053375244140625, 0.0035400390625, 0.014133453369140625, 0.02472686767578125, 0.035320281982421875, 0.0459136962890625, 0.056507110595703125, 0.06710052490234375, 0.07769393920898438, 0.088287353515625, 0.09888076782226562, 0.10947418212890625, 0.12006759643554688, 0.1306610107421875, 0.14125442504882812, 0.15184783935546875, 0.16244125366210938, 0.17303466796875, 0.18362808227539062, 0.19422149658203125, 0.20481491088867188, 0.2154083251953125, 0.22600173950195312, 0.23659515380859375, 0.24718856811523438, 0.257781982421875, 0.2683753967285156, 0.27896881103515625, 0.2895622253417969, 0.3001556396484375, 0.3107490539550781, 0.32134246826171875, 0.3319358825683594, 0.342529296875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 12.0, 10.0, 14.0, 16.0, 24.0, 29.0, 29.0, 40.0, 46.0, 49.0, 72.0, 77.0, 67.0, 80.0, 81.0, 66.0, 51.0, 45.0, 37.0, 41.0, 22.0, 20.0, 22.0, 10.0, 12.0, 6.0, 3.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.059112548828125, -0.057383060455322266, -0.05565357208251953, -0.0539240837097168, -0.05219459533691406, -0.05046510696411133, -0.048735618591308594, -0.04700613021850586, -0.045276641845703125, -0.04354715347290039, -0.041817665100097656, -0.04008817672729492, -0.03835868835449219, -0.03662919998168945, -0.03489971160888672, -0.033170223236083984, -0.03144073486328125, -0.029711246490478516, -0.02798175811767578, -0.026252269744873047, -0.024522781372070312, -0.022793292999267578, -0.021063804626464844, -0.01933431625366211, -0.017604827880859375, -0.01587533950805664, -0.014145851135253906, -0.012416362762451172, -0.010686874389648438, -0.008957386016845703, -0.007227897644042969, -0.005498409271240234, -0.0037689208984375, -0.0020394325256347656, -0.00030994415283203125, 0.0014195442199707031, 0.0031490325927734375, 0.004878520965576172, 0.006608009338378906, 0.00833749771118164, 0.010066986083984375, 0.01179647445678711, 0.013525962829589844, 0.015255451202392578, 0.016984939575195312, 0.018714427947998047, 0.02044391632080078, 0.022173404693603516, 0.02390289306640625, 0.025632381439208984, 0.02736186981201172, 0.029091358184814453, 0.030820846557617188, 0.03255033493041992, 0.034279823303222656, 0.03600931167602539, 0.037738800048828125, 0.03946828842163086, 0.041197776794433594, 0.04292726516723633, 0.04465675354003906, 0.0463862419128418, 0.04811573028564453, 0.049845218658447266, 0.05157470703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 11.0, 7.0, 20.0, 19.0, 23.0, 45.0, 47.0, 71.0, 137.0, 183.0, 252.0, 380.0, 686.0, 1247.0, 2430.0, 5224.0, 13005.0, 36606.0, 136006.0, 1163850.0, 2581756.0, 180167.0, 44583.0, 15191.0, 6228.0, 2714.0, 1384.0, 787.0, 432.0, 259.0, 183.0, 119.0, 85.0, 46.0, 25.0, 18.0, 17.0, 8.0, 5.0, 9.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2115478515625, -0.2047443389892578, -0.19794082641601562, -0.19113731384277344, -0.18433380126953125, -0.17753028869628906, -0.17072677612304688, -0.1639232635498047, -0.1571197509765625, -0.1503162384033203, -0.14351272583007812, -0.13670921325683594, -0.12990570068359375, -0.12310218811035156, -0.11629867553710938, -0.10949516296386719, -0.102691650390625, -0.09588813781738281, -0.08908462524414062, -0.08228111267089844, -0.07547760009765625, -0.06867408752441406, -0.061870574951171875, -0.05506706237792969, -0.0482635498046875, -0.04146003723144531, -0.034656524658203125, -0.027853012084960938, -0.02104949951171875, -0.014245986938476562, -0.007442474365234375, -0.0006389617919921875, 0.00616455078125, 0.012968063354492188, 0.019771575927734375, 0.026575088500976562, 0.03337860107421875, 0.04018211364746094, 0.046985626220703125, 0.05378913879394531, 0.0605926513671875, 0.06739616394042969, 0.07419967651367188, 0.08100318908691406, 0.08780670166015625, 0.09461021423339844, 0.10141372680664062, 0.10821723937988281, 0.115020751953125, 0.12182426452636719, 0.12862777709960938, 0.13543128967285156, 0.14223480224609375, 0.14903831481933594, 0.15584182739257812, 0.1626453399658203, 0.1694488525390625, 0.1762523651123047, 0.18305587768554688, 0.18985939025878906, 0.19666290283203125, 0.20346641540527344, 0.21026992797851562, 0.2170734405517578, 0.223876953125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 7.0, 17.0, 12.0, 17.0, 23.0, 28.0, 50.0, 84.0, 94.0, 194.0, 351.0, 1122.0, 1235.0, 349.0, 162.0, 92.0, 79.0, 39.0, 24.0, 29.0, 19.0, 13.0, 10.0, 6.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.10089111328125, -0.09837007522583008, -0.09584903717041016, -0.09332799911499023, -0.09080696105957031, -0.08828592300415039, -0.08576488494873047, -0.08324384689331055, -0.08072280883789062, -0.0782017707824707, -0.07568073272705078, -0.07315969467163086, -0.07063865661621094, -0.06811761856079102, -0.0655965805053711, -0.06307554244995117, -0.06055450439453125, -0.05803346633911133, -0.055512428283691406, -0.052991390228271484, -0.05047035217285156, -0.04794931411743164, -0.04542827606201172, -0.0429072380065918, -0.040386199951171875, -0.03786516189575195, -0.03534412384033203, -0.03282308578491211, -0.030302047729492188, -0.027781009674072266, -0.025259971618652344, -0.022738933563232422, -0.0202178955078125, -0.017696857452392578, -0.015175819396972656, -0.012654781341552734, -0.010133743286132812, -0.007612705230712891, -0.005091667175292969, -0.002570629119873047, -4.9591064453125e-05, 0.002471446990966797, 0.004992485046386719, 0.007513523101806641, 0.010034561157226562, 0.012555599212646484, 0.015076637268066406, 0.017597675323486328, 0.02011871337890625, 0.022639751434326172, 0.025160789489746094, 0.027681827545166016, 0.030202865600585938, 0.03272390365600586, 0.03524494171142578, 0.0377659797668457, 0.040287017822265625, 0.04280805587768555, 0.04532909393310547, 0.04785013198852539, 0.05037117004394531, 0.052892208099365234, 0.055413246154785156, 0.05793428421020508, 0.060455322265625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 7.0, 19.0, 47.0, 66.0, 166.0, 246.0, 216.0, 130.0, 57.0, 31.0, 17.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3823726177215576, -0.3583725094795227, -0.3343724012374878, -0.3103722929954529, -0.28637218475341797, -0.26237207651138306, -0.23837193846702576, -0.21437183022499084, -0.19037172198295593, -0.16637161374092102, -0.1423715054988861, -0.11837138235569, -0.09437127411365509, -0.07037116587162018, -0.04637104272842407, -0.02237093448638916, 0.001629173755645752, 0.025629285722970963, 0.04962939769029617, 0.07362951338291168, 0.0976296216249466, 0.1216297298669815, 0.1456298530101776, 0.16962996125221252, 0.19363006949424744, 0.21763017773628235, 0.24163028597831726, 0.26563042402267456, 0.2896305322647095, 0.3136306405067444, 0.3376307487487793, 0.3616308569908142, 0.3856309652328491, 0.40963107347488403, 0.43363118171691895, 0.45763128995895386, 0.48163139820098877, 0.5056315064430237, 0.5296316146850586, 0.5536317825317383, 0.5776318311691284, 0.6016319394111633, 0.6256320476531982, 0.6496321558952332, 0.6736322641372681, 0.697632372379303, 0.7216324806213379, 0.7456326484680176, 0.7696327567100525, 0.7936328649520874, 0.8176329731941223, 0.8416330814361572, 0.8656331896781921, 0.889633297920227, 0.9136334657669067, 0.9376335144042969, 0.9616336822509766, 0.9856337904930115, 1.0096338987350464, 1.033634066581726, 1.0576341152191162, 1.081634283065796, 1.105634331703186, 1.1296344995498657, 1.1536345481872559]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 6.0, 5.0, 3.0, 11.0, 5.0, 10.0, 10.0, 14.0, 16.0, 14.0, 27.0, 19.0, 25.0, 29.0, 31.0, 32.0, 36.0, 47.0, 42.0, 48.0, 46.0, 40.0, 37.0, 37.0, 36.0, 29.0, 40.0, 37.0, 36.0, 27.0, 37.0, 21.0, 22.0, 30.0, 16.0, 9.0, 13.0, 14.0, 8.0, 9.0, 6.0, 4.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.21842819452285767, -0.2109563797712326, -0.20348455011844635, -0.1960127353668213, -0.18854090571403503, -0.18106909096240997, -0.1735972762107849, -0.16612544655799866, -0.1586536318063736, -0.15118181705474854, -0.14370998740196228, -0.13623817265033722, -0.12876635789871216, -0.1212945282459259, -0.11382271349430084, -0.10635089129209518, -0.09887906908988953, -0.09140724688768387, -0.08393542468547821, -0.07646360993385315, -0.06899178773164749, -0.061519965529441833, -0.054048147052526474, -0.046576328575611115, -0.03910450637340546, -0.0316326841711998, -0.02416086569428444, -0.01668904535472393, -0.009217225015163422, -0.0017454028129577637, 0.005726415663957596, 0.013198234140872955, 0.020670056343078613, 0.028141876682639122, 0.03561369702219963, 0.04308551549911499, 0.05055733770132065, 0.058029159903526306, 0.06550097465515137, 0.07297279685735703, 0.08044461905956268, 0.08791644126176834, 0.095388263463974, 0.10286007821559906, 0.11033190041780472, 0.11780372262001038, 0.12527553737163544, 0.1327473521232605, 0.14021918177604675, 0.14769099652767181, 0.15516282618045807, 0.16263464093208313, 0.17010647058486938, 0.17757828533649445, 0.1850501000881195, 0.19252192974090576, 0.19999374449253082, 0.20746555924415588, 0.21493738889694214, 0.2224092036485672, 0.22988101840019226, 0.23735284805297852, 0.24482466280460358, 0.25229647755622864, 0.2597683072090149]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 9.0, 3.0, 5.0, 9.0, 17.0, 17.0, 37.0, 36.0, 59.0, 81.0, 111.0, 224.0, 321.0, 480.0, 760.0, 1418.0, 2469.0, 4906.0, 9686.0, 19605.0, 42483.0, 94913.0, 208869.0, 316479.0, 186725.0, 84713.0, 37987.0, 17558.0, 8442.0, 4380.0, 2359.0, 1278.0, 775.0, 480.0, 281.0, 202.0, 126.0, 82.0, 59.0, 44.0, 25.0, 17.0, 10.0, 7.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.1641845703125, -0.15979766845703125, -0.1554107666015625, -0.15102386474609375, -0.146636962890625, -0.14225006103515625, -0.1378631591796875, -0.13347625732421875, -0.12908935546875, -0.12470245361328125, -0.1203155517578125, -0.11592864990234375, -0.111541748046875, -0.10715484619140625, -0.1027679443359375, -0.09838104248046875, -0.093994140625, -0.08960723876953125, -0.0852203369140625, -0.08083343505859375, -0.076446533203125, -0.07205963134765625, -0.0676727294921875, -0.06328582763671875, -0.05889892578125, -0.05451202392578125, -0.0501251220703125, -0.04573822021484375, -0.041351318359375, -0.03696441650390625, -0.0325775146484375, -0.02819061279296875, -0.0238037109375, -0.01941680908203125, -0.0150299072265625, -0.01064300537109375, -0.006256103515625, -0.00186920166015625, 0.0025177001953125, 0.00690460205078125, 0.01129150390625, 0.01567840576171875, 0.0200653076171875, 0.02445220947265625, 0.028839111328125, 0.03322601318359375, 0.0376129150390625, 0.04199981689453125, 0.04638671875, 0.05077362060546875, 0.0551605224609375, 0.05954742431640625, 0.063934326171875, 0.06832122802734375, 0.0727081298828125, 0.07709503173828125, 0.08148193359375, 0.08586883544921875, 0.0902557373046875, 0.09464263916015625, 0.099029541015625, 0.10341644287109375, 0.1078033447265625, 0.11219024658203125, 0.1165771484375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 11.0, 11.0, 19.0, 26.0, 30.0, 32.0, 52.0, 48.0, 40.0, 60.0, 93.0, 68.0, 77.0, 74.0, 64.0, 50.0, 48.0, 41.0, 29.0, 33.0, 18.0, 17.0, 11.0, 10.0, 4.0, 7.0, 7.0, 1.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06231689453125, -0.06062889099121094, -0.058940887451171875, -0.05725288391113281, -0.05556488037109375, -0.05387687683105469, -0.052188873291015625, -0.05050086975097656, -0.0488128662109375, -0.04712486267089844, -0.045436859130859375, -0.04374885559082031, -0.04206085205078125, -0.04037284851074219, -0.038684844970703125, -0.03699684143066406, -0.035308837890625, -0.03362083435058594, -0.031932830810546875, -0.030244827270507812, -0.02855682373046875, -0.026868820190429688, -0.025180816650390625, -0.023492813110351562, -0.0218048095703125, -0.020116806030273438, -0.018428802490234375, -0.016740798950195312, -0.01505279541015625, -0.013364791870117188, -0.011676788330078125, -0.009988784790039062, -0.00830078125, -0.0066127777099609375, -0.004924774169921875, -0.0032367706298828125, -0.00154876708984375, 0.0001392364501953125, 0.001827239990234375, 0.0035152435302734375, 0.0052032470703125, 0.0068912506103515625, 0.008579254150390625, 0.010267257690429688, 0.01195526123046875, 0.013643264770507812, 0.015331268310546875, 0.017019271850585938, 0.018707275390625, 0.020395278930664062, 0.022083282470703125, 0.023771286010742188, 0.02545928955078125, 0.027147293090820312, 0.028835296630859375, 0.030523300170898438, 0.0322113037109375, 0.03389930725097656, 0.035587310791015625, 0.03727531433105469, 0.03896331787109375, 0.04065132141113281, 0.042339324951171875, 0.04402732849121094, 0.04571533203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 9.0, 7.0, 8.0, 20.0, 32.0, 35.0, 63.0, 68.0, 93.0, 159.0, 227.0, 393.0, 630.0, 1229.0, 2419.0, 5650.0, 15875.0, 54567.0, 192746.0, 433521.0, 238765.0, 69242.0, 19978.0, 6825.0, 2781.0, 1302.0, 701.0, 396.0, 272.0, 150.0, 114.0, 74.0, 52.0, 43.0, 30.0, 23.0, 13.0, 12.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.228515625, -0.22243690490722656, -0.21635818481445312, -0.2102794647216797, -0.20420074462890625, -0.1981220245361328, -0.19204330444335938, -0.18596458435058594, -0.1798858642578125, -0.17380714416503906, -0.16772842407226562, -0.1616497039794922, -0.15557098388671875, -0.1494922637939453, -0.14341354370117188, -0.13733482360839844, -0.131256103515625, -0.12517738342285156, -0.11909866333007812, -0.11301994323730469, -0.10694122314453125, -0.10086250305175781, -0.09478378295898438, -0.08870506286621094, -0.0826263427734375, -0.07654762268066406, -0.07046890258789062, -0.06439018249511719, -0.05831146240234375, -0.05223274230957031, -0.046154022216796875, -0.04007530212402344, -0.03399658203125, -0.027917861938476562, -0.021839141845703125, -0.015760421752929688, -0.00968170166015625, -0.0036029815673828125, 0.002475738525390625, 0.008554458618164062, 0.0146331787109375, 0.020711898803710938, 0.026790618896484375, 0.03286933898925781, 0.03894805908203125, 0.04502677917480469, 0.051105499267578125, 0.05718421936035156, 0.063262939453125, 0.06934165954589844, 0.07542037963867188, 0.08149909973144531, 0.08757781982421875, 0.09365653991699219, 0.09973526000976562, 0.10581398010253906, 0.1118927001953125, 0.11797142028808594, 0.12405014038085938, 0.1301288604736328, 0.13620758056640625, 0.1422863006591797, 0.14836502075195312, 0.15444374084472656, 0.1605224609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 13.0, 8.0, 5.0, 16.0, 16.0, 17.0, 23.0, 37.0, 36.0, 33.0, 47.0, 49.0, 51.0, 61.0, 58.0, 56.0, 59.0, 47.0, 57.0, 44.0, 49.0, 42.0, 42.0, 21.0, 20.0, 23.0, 17.0, 13.0, 6.0, 6.0, 10.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.315185546875, -0.3072471618652344, -0.29930877685546875, -0.2913703918457031, -0.2834320068359375, -0.2754936218261719, -0.26755523681640625, -0.2596168518066406, -0.251678466796875, -0.24374008178710938, -0.23580169677734375, -0.22786331176757812, -0.2199249267578125, -0.21198654174804688, -0.20404815673828125, -0.19610977172851562, -0.18817138671875, -0.18023300170898438, -0.17229461669921875, -0.16435623168945312, -0.1564178466796875, -0.14847946166992188, -0.14054107666015625, -0.13260269165039062, -0.124664306640625, -0.11672592163085938, -0.10878753662109375, -0.10084915161132812, -0.0929107666015625, -0.08497238159179688, -0.07703399658203125, -0.06909561157226562, -0.0611572265625, -0.053218841552734375, -0.04528045654296875, -0.037342071533203125, -0.0294036865234375, -0.021465301513671875, -0.01352691650390625, -0.005588531494140625, 0.002349853515625, 0.010288238525390625, 0.01822662353515625, 0.026165008544921875, 0.0341033935546875, 0.042041778564453125, 0.04998016357421875, 0.057918548583984375, 0.06585693359375, 0.07379531860351562, 0.08173370361328125, 0.08967208862304688, 0.0976104736328125, 0.10554885864257812, 0.11348724365234375, 0.12142562866210938, 0.129364013671875, 0.13730239868164062, 0.14524078369140625, 0.15317916870117188, 0.1611175537109375, 0.16905593872070312, 0.17699432373046875, 0.18493270874023438, 0.19287109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 16.0, 13.0, 16.0, 27.0, 38.0, 65.0, 88.0, 158.0, 201.0, 374.0, 649.0, 1150.0, 2540.0, 5550.0, 13831.0, 38678.0, 125935.0, 401739.0, 317508.0, 90954.0, 29132.0, 10856.0, 4415.0, 2090.0, 1066.0, 586.0, 293.0, 200.0, 120.0, 84.0, 53.0, 37.0, 26.0, 18.0, 16.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0712890625, -0.06863594055175781, -0.06598281860351562, -0.06332969665527344, -0.06067657470703125, -0.05802345275878906, -0.055370330810546875, -0.05271720886230469, -0.0500640869140625, -0.04741096496582031, -0.044757843017578125, -0.04210472106933594, -0.03945159912109375, -0.03679847717285156, -0.034145355224609375, -0.03149223327636719, -0.028839111328125, -0.026185989379882812, -0.023532867431640625, -0.020879745483398438, -0.01822662353515625, -0.015573501586914062, -0.012920379638671875, -0.010267257690429688, -0.0076141357421875, -0.0049610137939453125, -0.002307891845703125, 0.0003452301025390625, 0.00299835205078125, 0.0056514739990234375, 0.008304595947265625, 0.010957717895507812, 0.01361083984375, 0.016263961791992188, 0.018917083740234375, 0.021570205688476562, 0.02422332763671875, 0.026876449584960938, 0.029529571533203125, 0.03218269348144531, 0.0348358154296875, 0.03748893737792969, 0.040142059326171875, 0.04279518127441406, 0.04544830322265625, 0.04810142517089844, 0.050754547119140625, 0.05340766906738281, 0.056060791015625, 0.05871391296386719, 0.061367034912109375, 0.06402015686035156, 0.06667327880859375, 0.06932640075683594, 0.07197952270507812, 0.07463264465332031, 0.0772857666015625, 0.07993888854980469, 0.08259201049804688, 0.08524513244628906, 0.08789825439453125, 0.09055137634277344, 0.09320449829101562, 0.09585762023925781, 0.0985107421875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 8.0, 17.0, 17.0, 19.0, 22.0, 36.0, 41.0, 43.0, 54.0, 54.0, 65.0, 68.0, 68.0, 68.0, 58.0, 62.0, 52.0, 51.0, 56.0, 29.0, 25.0, 15.0, 13.0, 13.0, 10.0, 2.0, 8.0, 7.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7578086853027344e-05, -5.5806711316108704e-05, -5.4035335779190063e-05, -5.226396024227142e-05, -5.049258470535278e-05, -4.872120916843414e-05, -4.69498336315155e-05, -4.517845809459686e-05, -4.340708255767822e-05, -4.163570702075958e-05, -3.986433148384094e-05, -3.80929559469223e-05, -3.632158041000366e-05, -3.455020487308502e-05, -3.277882933616638e-05, -3.100745379924774e-05, -2.92360782623291e-05, -2.746470272541046e-05, -2.569332718849182e-05, -2.392195165157318e-05, -2.215057611465454e-05, -2.03792005777359e-05, -1.860782504081726e-05, -1.683644950389862e-05, -1.506507396697998e-05, -1.329369843006134e-05, -1.15223228931427e-05, -9.75094735622406e-06, -7.97957181930542e-06, -6.20819628238678e-06, -4.43682074546814e-06, -2.6654452085494995e-06, -8.940696716308594e-07, 8.773058652877808e-07, 2.648681402206421e-06, 4.420056939125061e-06, 6.191432476043701e-06, 7.962808012962341e-06, 9.734183549880981e-06, 1.1505559086799622e-05, 1.3276934623718262e-05, 1.5048310160636902e-05, 1.6819685697555542e-05, 1.8591061234474182e-05, 2.0362436771392822e-05, 2.2133812308311462e-05, 2.3905187845230103e-05, 2.5676563382148743e-05, 2.7447938919067383e-05, 2.9219314455986023e-05, 3.099068999290466e-05, 3.27620655298233e-05, 3.453344106674194e-05, 3.6304816603660583e-05, 3.8076192140579224e-05, 3.9847567677497864e-05, 4.1618943214416504e-05, 4.3390318751335144e-05, 4.5161694288253784e-05, 4.6933069825172424e-05, 4.8704445362091064e-05, 5.0475820899009705e-05, 5.2247196435928345e-05, 5.4018571972846985e-05, 5.5789947509765625e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 9.0, 9.0, 14.0, 29.0, 24.0, 43.0, 58.0, 107.0, 121.0, 238.0, 422.0, 735.0, 1563.0, 3191.0, 7762.0, 22279.0, 74866.0, 300314.0, 453042.0, 127706.0, 35368.0, 11663.0, 4616.0, 1968.0, 1001.0, 527.0, 288.0, 196.0, 115.0, 74.0, 63.0, 36.0, 22.0, 20.0, 9.0, 9.0, 6.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0819091796875, -0.07919692993164062, -0.07648468017578125, -0.07377243041992188, -0.0710601806640625, -0.06834793090820312, -0.06563568115234375, -0.06292343139648438, -0.060211181640625, -0.057498931884765625, -0.05478668212890625, -0.052074432373046875, -0.0493621826171875, -0.046649932861328125, -0.04393768310546875, -0.041225433349609375, -0.03851318359375, -0.035800933837890625, -0.03308868408203125, -0.030376434326171875, -0.0276641845703125, -0.024951934814453125, -0.02223968505859375, -0.019527435302734375, -0.016815185546875, -0.014102935791015625, -0.01139068603515625, -0.008678436279296875, -0.0059661865234375, -0.003253936767578125, -0.00054168701171875, 0.002170562744140625, 0.0048828125, 0.007595062255859375, 0.01030731201171875, 0.013019561767578125, 0.0157318115234375, 0.018444061279296875, 0.02115631103515625, 0.023868560791015625, 0.026580810546875, 0.029293060302734375, 0.03200531005859375, 0.034717559814453125, 0.0374298095703125, 0.040142059326171875, 0.04285430908203125, 0.045566558837890625, 0.04827880859375, 0.050991058349609375, 0.05370330810546875, 0.056415557861328125, 0.0591278076171875, 0.061840057373046875, 0.06455230712890625, 0.06726455688476562, 0.069976806640625, 0.07268905639648438, 0.07540130615234375, 0.07811355590820312, 0.0808258056640625, 0.08353805541992188, 0.08625030517578125, 0.08896255493164062, 0.0916748046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 4.0, 1.0, 3.0, 8.0, 8.0, 11.0, 13.0, 21.0, 23.0, 20.0, 30.0, 26.0, 52.0, 55.0, 49.0, 61.0, 83.0, 64.0, 59.0, 79.0, 48.0, 55.0, 41.0, 33.0, 32.0, 28.0, 23.0, 21.0, 16.0, 7.0, 8.0, 7.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0517578125, -0.049953460693359375, -0.04814910888671875, -0.046344757080078125, -0.0445404052734375, -0.042736053466796875, -0.04093170166015625, -0.039127349853515625, -0.037322998046875, -0.035518646240234375, -0.03371429443359375, -0.031909942626953125, -0.0301055908203125, -0.028301239013671875, -0.02649688720703125, -0.024692535400390625, -0.02288818359375, -0.021083831787109375, -0.01927947998046875, -0.017475128173828125, -0.0156707763671875, -0.013866424560546875, -0.01206207275390625, -0.010257720947265625, -0.008453369140625, -0.006649017333984375, -0.00484466552734375, -0.003040313720703125, -0.0012359619140625, 0.000568389892578125, 0.00237274169921875, 0.004177093505859375, 0.0059814453125, 0.007785797119140625, 0.00959014892578125, 0.011394500732421875, 0.0131988525390625, 0.015003204345703125, 0.01680755615234375, 0.018611907958984375, 0.020416259765625, 0.022220611572265625, 0.02402496337890625, 0.025829315185546875, 0.0276336669921875, 0.029438018798828125, 0.03124237060546875, 0.033046722412109375, 0.03485107421875, 0.036655426025390625, 0.03845977783203125, 0.040264129638671875, 0.0420684814453125, 0.043872833251953125, 0.04567718505859375, 0.047481536865234375, 0.049285888671875, 0.051090240478515625, 0.05289459228515625, 0.054698944091796875, 0.0565032958984375, 0.058307647705078125, 0.06011199951171875, 0.061916351318359375, 0.063720703125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 9.0, 16.0, 29.0, 46.0, 60.0, 94.0, 117.0, 151.0, 144.0, 103.0, 93.0, 55.0, 36.0, 18.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5754654407501221, -0.5339462757110596, -0.4924270808696747, -0.4509079158306122, -0.4093887209892273, -0.3678695559501648, -0.3263503909111023, -0.2848311960697174, -0.2433120310306549, -0.2017928510904312, -0.16027367115020752, -0.11875450611114502, -0.07723532617092133, -0.03571614623069763, 0.005803018808364868, 0.047322213649749756, 0.08884137868881226, 0.13036055862903595, 0.17187973856925964, 0.21339890360832214, 0.25491809844970703, 0.29643726348876953, 0.33795642852783203, 0.3794756233692169, 0.4209947884082794, 0.4625139534473419, 0.5040331482887268, 0.5455523133277893, 0.5870714783668518, 0.6285907030105591, 0.6701098680496216, 0.7116290330886841, 0.7531481981277466, 0.7946673631668091, 0.8361865282058716, 0.8777056932449341, 0.9192249178886414, 0.9607440829277039, 1.0022633075714111, 1.0437824726104736, 1.0853016376495361, 1.1268208026885986, 1.1683399677276611, 1.2098591327667236, 1.2513782978057861, 1.2928974628448486, 1.3344166278839111, 1.3759359121322632, 1.4174549579620361, 1.4589741230010986, 1.5004932880401611, 1.5420124530792236, 1.5835316181182861, 1.6250507831573486, 1.6665699481964111, 1.7080892324447632, 1.7496083974838257, 1.7911275625228882, 1.8326467275619507, 1.8741658926010132, 1.9156850576400757, 1.9572043418884277, 1.9987235069274902, 2.0402426719665527, 2.0817618370056152]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 1.0, 2.0, 7.0, 2.0, 4.0, 10.0, 10.0, 18.0, 17.0, 18.0, 25.0, 27.0, 21.0, 27.0, 32.0, 36.0, 32.0, 35.0, 41.0, 30.0, 45.0, 45.0, 59.0, 53.0, 37.0, 43.0, 32.0, 33.0, 30.0, 25.0, 28.0, 28.0, 14.0, 26.0, 19.0, 15.0, 16.0, 7.0, 13.0, 8.0, 3.0, 7.0, 7.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.980883002281189, -0.9472073316574097, -0.9135316610336304, -0.8798559904098511, -0.846180260181427, -0.8125045895576477, -0.7788289189338684, -0.7451532483100891, -0.711477518081665, -0.6778018474578857, -0.6441261768341064, -0.6104505062103271, -0.5767747759819031, -0.5430991053581238, -0.5094234347343445, -0.4757477641105652, -0.4420720934867859, -0.4083964228630066, -0.3747207224369049, -0.3410450518131256, -0.3073693513870239, -0.27369368076324463, -0.24001801013946533, -0.20634232461452484, -0.17266663908958435, -0.13899095356464386, -0.10531527549028397, -0.07163959741592407, -0.03796391189098358, -0.004288226366043091, 0.029387444257736206, 0.0630631297826767, 0.09673881530761719, 0.13041450083255768, 0.16409018635749817, 0.19776585698127747, 0.23144154250621796, 0.26511722803115845, 0.29879289865493774, 0.33246856927871704, 0.3661442697048187, 0.399819940328598, 0.4334956407546997, 0.467171311378479, 0.5008469820022583, 0.5345226526260376, 0.5681983232498169, 0.601874053478241, 0.6355497241020203, 0.6692253947257996, 0.7029010653495789, 0.7365767955780029, 0.7702524662017822, 0.8039281368255615, 0.8376038074493408, 0.8712794780731201, 0.9049551486968994, 0.9386308193206787, 0.972306489944458, 1.0059821605682373, 1.0396578311920166, 1.073333501815796, 1.1070091724395752, 1.140684962272644, 1.1743606328964233]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 9.0, 12.0, 25.0, 34.0, 46.0, 69.0, 101.0, 160.0, 261.0, 429.0, 729.0, 1259.0, 2512.0, 5346.0, 12686.0, 36858.0, 158277.0, 3417267.0, 456218.0, 66198.0, 20082.0, 7807.0, 3561.0, 1800.0, 976.0, 539.0, 329.0, 209.0, 137.0, 95.0, 71.0, 36.0, 31.0, 26.0, 15.0, 15.0, 13.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18262290954589844, -0.17603683471679688, -0.1694507598876953, -0.16286468505859375, -0.1562786102294922, -0.14969253540039062, -0.14310646057128906, -0.1365203857421875, -0.12993431091308594, -0.12334823608398438, -0.11676216125488281, -0.11017608642578125, -0.10359001159667969, -0.09700393676757812, -0.09041786193847656, -0.083831787109375, -0.07724571228027344, -0.07065963745117188, -0.06407356262207031, -0.05748748779296875, -0.05090141296386719, -0.044315338134765625, -0.03772926330566406, -0.0311431884765625, -0.024557113647460938, -0.017971038818359375, -0.011384963989257812, -0.00479888916015625, 0.0017871856689453125, 0.008373260498046875, 0.014959335327148438, 0.02154541015625, 0.028131484985351562, 0.034717559814453125, 0.04130363464355469, 0.04788970947265625, 0.05447578430175781, 0.061061859130859375, 0.06764793395996094, 0.0742340087890625, 0.08082008361816406, 0.08740615844726562, 0.09399223327636719, 0.10057830810546875, 0.10716438293457031, 0.11375045776367188, 0.12033653259277344, 0.126922607421875, 0.13350868225097656, 0.14009475708007812, 0.1466808319091797, 0.15326690673828125, 0.1598529815673828, 0.16643905639648438, 0.17302513122558594, 0.1796112060546875, 0.18619728088378906, 0.19278335571289062, 0.1993694305419922, 0.20595550537109375, 0.2125415802001953, 0.21912765502929688, 0.22571372985839844, 0.2322998046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 17.0, 24.0, 22.0, 26.0, 29.0, 37.0, 21.0, 37.0, 42.0, 48.0, 59.0, 62.0, 67.0, 51.0, 55.0, 49.0, 54.0, 40.0, 37.0, 42.0, 28.0, 26.0, 22.0, 16.0, 14.0, 13.0, 11.0, 6.0, 7.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041259765625, -0.039888858795166016, -0.03851795196533203, -0.03714704513549805, -0.03577613830566406, -0.03440523147583008, -0.033034324645996094, -0.03166341781616211, -0.030292510986328125, -0.02892160415649414, -0.027550697326660156, -0.026179790496826172, -0.024808883666992188, -0.023437976837158203, -0.02206707000732422, -0.020696163177490234, -0.01932525634765625, -0.017954349517822266, -0.01658344268798828, -0.015212535858154297, -0.013841629028320312, -0.012470722198486328, -0.011099815368652344, -0.00972890853881836, -0.008358001708984375, -0.006987094879150391, -0.005616188049316406, -0.004245281219482422, -0.0028743743896484375, -0.0015034675598144531, -0.00013256072998046875, 0.0012383460998535156, 0.0026092529296875, 0.003980159759521484, 0.005351066589355469, 0.006721973419189453, 0.008092880249023438, 0.009463787078857422, 0.010834693908691406, 0.01220560073852539, 0.013576507568359375, 0.01494741439819336, 0.016318321228027344, 0.017689228057861328, 0.019060134887695312, 0.020431041717529297, 0.02180194854736328, 0.023172855377197266, 0.02454376220703125, 0.025914669036865234, 0.02728557586669922, 0.028656482696533203, 0.030027389526367188, 0.03139829635620117, 0.032769203186035156, 0.03414011001586914, 0.035511016845703125, 0.03688192367553711, 0.038252830505371094, 0.03962373733520508, 0.04099464416503906, 0.04236555099487305, 0.04373645782470703, 0.045107364654541016, 0.046478271484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 7.0, 9.0, 10.0, 10.0, 30.0, 38.0, 55.0, 82.0, 129.0, 221.0, 338.0, 691.0, 1310.0, 2776.0, 6231.0, 16597.0, 53464.0, 270453.0, 3196294.0, 528099.0, 79623.0, 22145.0, 8180.0, 3654.0, 1733.0, 867.0, 486.0, 266.0, 173.0, 102.0, 60.0, 43.0, 29.0, 23.0, 11.0, 15.0, 12.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177001953125, -0.17103195190429688, -0.16506195068359375, -0.15909194946289062, -0.1531219482421875, -0.14715194702148438, -0.14118194580078125, -0.13521194458007812, -0.129241943359375, -0.12327194213867188, -0.11730194091796875, -0.11133193969726562, -0.1053619384765625, -0.09939193725585938, -0.09342193603515625, -0.08745193481445312, -0.08148193359375, -0.07551193237304688, -0.06954193115234375, -0.06357192993164062, -0.0576019287109375, -0.051631927490234375, -0.04566192626953125, -0.039691925048828125, -0.033721923828125, -0.027751922607421875, -0.02178192138671875, -0.015811920166015625, -0.0098419189453125, -0.003871917724609375, 0.00209808349609375, 0.008068084716796875, 0.0140380859375, 0.020008087158203125, 0.02597808837890625, 0.031948089599609375, 0.0379180908203125, 0.043888092041015625, 0.04985809326171875, 0.055828094482421875, 0.061798095703125, 0.06776809692382812, 0.07373809814453125, 0.07970809936523438, 0.0856781005859375, 0.09164810180664062, 0.09761810302734375, 0.10358810424804688, 0.10955810546875, 0.11552810668945312, 0.12149810791015625, 0.12746810913085938, 0.1334381103515625, 0.13940811157226562, 0.14537811279296875, 0.15134811401367188, 0.157318115234375, 0.16328811645507812, 0.16925811767578125, 0.17522811889648438, 0.1811981201171875, 0.18716812133789062, 0.19313812255859375, 0.19910812377929688, 0.205078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 6.0, 11.0, 18.0, 21.0, 18.0, 30.0, 50.0, 66.0, 94.0, 174.0, 238.0, 579.0, 1470.0, 588.0, 250.0, 148.0, 106.0, 58.0, 29.0, 30.0, 12.0, 12.0, 9.0, 12.0, 7.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.049163818359375, -0.04730653762817383, -0.045449256896972656, -0.043591976165771484, -0.04173469543457031, -0.03987741470336914, -0.03802013397216797, -0.0361628532409668, -0.034305572509765625, -0.03244829177856445, -0.03059101104736328, -0.02873373031616211, -0.026876449584960938, -0.025019168853759766, -0.023161888122558594, -0.021304607391357422, -0.01944732666015625, -0.017590045928955078, -0.015732765197753906, -0.013875484466552734, -0.012018203735351562, -0.01016092300415039, -0.008303642272949219, -0.006446361541748047, -0.004589080810546875, -0.002731800079345703, -0.0008745193481445312, 0.0009827613830566406, 0.0028400421142578125, 0.004697322845458984, 0.006554603576660156, 0.008411884307861328, 0.0102691650390625, 0.012126445770263672, 0.013983726501464844, 0.015841007232666016, 0.017698287963867188, 0.01955556869506836, 0.02141284942626953, 0.023270130157470703, 0.025127410888671875, 0.026984691619873047, 0.02884197235107422, 0.03069925308227539, 0.03255653381347656, 0.034413814544677734, 0.036271095275878906, 0.03812837600708008, 0.03998565673828125, 0.04184293746948242, 0.043700218200683594, 0.045557498931884766, 0.04741477966308594, 0.04927206039428711, 0.05112934112548828, 0.05298662185668945, 0.054843902587890625, 0.0567011833190918, 0.05855846405029297, 0.06041574478149414, 0.06227302551269531, 0.06413030624389648, 0.06598758697509766, 0.06784486770629883, 0.0697021484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 9.0, 13.0, 36.0, 46.0, 100.0, 129.0, 143.0, 145.0, 138.0, 93.0, 58.0, 42.0, 15.0, 12.0, 14.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25761300325393677, -0.2436131238937378, -0.2296132594347, -0.21561338007450104, -0.20161351561546326, -0.18761363625526428, -0.1736137568950653, -0.15961389243602753, -0.14561402797698975, -0.13161414861679077, -0.11761428415775299, -0.10361440479755402, -0.08961454033851624, -0.07561466097831726, -0.06161478906869888, -0.047614917159080505, -0.03361503779888153, -0.019615165889263153, -0.005615292116999626, 0.0083845816552639, 0.02238445356488228, 0.036384329199790955, 0.05038420110940933, 0.06438407301902771, 0.07838394492864609, 0.09238381683826447, 0.10638368874788284, 0.12038356065750122, 0.1343834400177002, 0.14838331937789917, 0.16238318383693695, 0.17638304829597473, 0.1903829276561737, 0.20438280701637268, 0.21838267147541046, 0.23238255083560944, 0.24638241529464722, 0.2603822946548462, 0.27438217401504517, 0.28838205337524414, 0.3023819029331207, 0.3163817822933197, 0.3303816616535187, 0.34438151121139526, 0.35838139057159424, 0.3723812699317932, 0.3863811492919922, 0.40038102865219116, 0.41438090801239014, 0.4283807873725891, 0.4423806667327881, 0.4563805162906647, 0.47038039565086365, 0.4843802750110626, 0.4983801543712616, 0.5123800039291382, 0.5263798832893372, 0.5403797626495361, 0.5543796420097351, 0.5683795213699341, 0.5823794007301331, 0.596379280090332, 0.6103790998458862, 0.6243789792060852, 0.6383788585662842]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 2.0, 6.0, 5.0, 9.0, 13.0, 6.0, 8.0, 15.0, 13.0, 33.0, 22.0, 30.0, 30.0, 42.0, 32.0, 52.0, 44.0, 45.0, 42.0, 30.0, 44.0, 42.0, 43.0, 35.0, 36.0, 39.0, 33.0, 28.0, 36.0, 32.0, 22.0, 22.0, 19.0, 18.0, 17.0, 16.0, 7.0, 2.0, 9.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.21582037210464478, -0.20919713377952576, -0.20257388055324554, -0.19595062732696533, -0.1893273890018463, -0.1827041506767273, -0.17608089745044708, -0.16945764422416687, -0.16283440589904785, -0.15621116757392883, -0.14958791434764862, -0.1429646611213684, -0.1363414227962494, -0.12971818447113037, -0.12309493124485016, -0.11647168546915054, -0.10984843969345093, -0.10322519391775131, -0.0966019481420517, -0.08997870236635208, -0.08335545659065247, -0.07673221081495285, -0.07010896503925323, -0.06348571926355362, -0.056862473487854004, -0.05023922771215439, -0.04361598193645477, -0.03699273616075516, -0.030369490385055542, -0.023746244609355927, -0.01712299883365631, -0.010499753057956696, -0.00387650728225708, 0.0027467384934425354, 0.009369984269142151, 0.015993230044841766, 0.022616475820541382, 0.029239721596240997, 0.03586296737194061, 0.04248621314764023, 0.049109458923339844, 0.05573270469903946, 0.062355950474739075, 0.06897919625043869, 0.0756024420261383, 0.08222568780183792, 0.08884893357753754, 0.09547217935323715, 0.10209542512893677, 0.10871867090463638, 0.115341916680336, 0.12196516245603561, 0.12858840823173523, 0.13521164655685425, 0.14183489978313446, 0.14845815300941467, 0.1550813913345337, 0.1617046296596527, 0.16832788288593292, 0.17495113611221313, 0.18157437443733215, 0.18819761276245117, 0.19482086598873138, 0.2014441192150116, 0.20806735754013062]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 12.0, 7.0, 11.0, 17.0, 19.0, 23.0, 41.0, 59.0, 115.0, 161.0, 252.0, 391.0, 648.0, 1149.0, 2000.0, 3598.0, 7144.0, 14370.0, 29693.0, 62082.0, 128601.0, 238989.0, 264371.0, 150637.0, 73818.0, 34989.0, 17056.0, 8369.0, 4270.0, 2358.0, 1297.0, 754.0, 400.0, 306.0, 173.0, 117.0, 63.0, 61.0, 32.0, 28.0, 20.0, 16.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11712646484375, -0.1134796142578125, -0.109832763671875, -0.1061859130859375, -0.1025390625, -0.0988922119140625, -0.095245361328125, -0.0915985107421875, -0.08795166015625, -0.0843048095703125, -0.080657958984375, -0.0770111083984375, -0.0733642578125, -0.0697174072265625, -0.066070556640625, -0.0624237060546875, -0.05877685546875, -0.0551300048828125, -0.051483154296875, -0.0478363037109375, -0.044189453125, -0.0405426025390625, -0.036895751953125, -0.0332489013671875, -0.02960205078125, -0.0259552001953125, -0.022308349609375, -0.0186614990234375, -0.0150146484375, -0.0113677978515625, -0.007720947265625, -0.0040740966796875, -0.00042724609375, 0.0032196044921875, 0.006866455078125, 0.0105133056640625, 0.01416015625, 0.0178070068359375, 0.021453857421875, 0.0251007080078125, 0.02874755859375, 0.0323944091796875, 0.036041259765625, 0.0396881103515625, 0.0433349609375, 0.0469818115234375, 0.050628662109375, 0.0542755126953125, 0.05792236328125, 0.0615692138671875, 0.065216064453125, 0.0688629150390625, 0.072509765625, 0.0761566162109375, 0.079803466796875, 0.0834503173828125, 0.08709716796875, 0.0907440185546875, 0.094390869140625, 0.0980377197265625, 0.1016845703125, 0.1053314208984375, 0.108978271484375, 0.1126251220703125, 0.11627197265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 3.0, 6.0, 10.0, 12.0, 22.0, 15.0, 25.0, 30.0, 33.0, 17.0, 35.0, 39.0, 38.0, 42.0, 34.0, 57.0, 56.0, 61.0, 46.0, 47.0, 36.0, 51.0, 49.0, 37.0, 26.0, 29.0, 20.0, 22.0, 17.0, 16.0, 13.0, 6.0, 4.0, 9.0, 9.0, 2.0, 3.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.039642333984375, -0.03841400146484375, -0.0371856689453125, -0.03595733642578125, -0.03472900390625, -0.03350067138671875, -0.0322723388671875, -0.03104400634765625, -0.029815673828125, -0.02858734130859375, -0.0273590087890625, -0.02613067626953125, -0.02490234375, -0.02367401123046875, -0.0224456787109375, -0.02121734619140625, -0.019989013671875, -0.01876068115234375, -0.0175323486328125, -0.01630401611328125, -0.01507568359375, -0.01384735107421875, -0.0126190185546875, -0.01139068603515625, -0.010162353515625, -0.00893402099609375, -0.0077056884765625, -0.00647735595703125, -0.0052490234375, -0.00402069091796875, -0.0027923583984375, -0.00156402587890625, -0.000335693359375, 0.00089263916015625, 0.0021209716796875, 0.00334930419921875, 0.00457763671875, 0.00580596923828125, 0.0070343017578125, 0.00826263427734375, 0.009490966796875, 0.01071929931640625, 0.0119476318359375, 0.01317596435546875, 0.014404296875, 0.01563262939453125, 0.0168609619140625, 0.01808929443359375, 0.019317626953125, 0.02054595947265625, 0.0217742919921875, 0.02300262451171875, 0.02423095703125, 0.02545928955078125, 0.0266876220703125, 0.02791595458984375, 0.029144287109375, 0.03037261962890625, 0.0316009521484375, 0.03282928466796875, 0.0340576171875, 0.03528594970703125, 0.0365142822265625, 0.03774261474609375, 0.038970947265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 5.0, 4.0, 14.0, 24.0, 22.0, 34.0, 56.0, 72.0, 104.0, 170.0, 277.0, 419.0, 765.0, 1574.0, 3891.0, 12977.0, 57765.0, 265084.0, 500270.0, 157681.0, 33618.0, 8211.0, 2725.0, 1133.0, 576.0, 370.0, 228.0, 180.0, 108.0, 57.0, 49.0, 22.0, 17.0, 14.0, 9.0, 8.0, 5.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2244873046875, -0.21794700622558594, -0.21140670776367188, -0.2048664093017578, -0.19832611083984375, -0.1917858123779297, -0.18524551391601562, -0.17870521545410156, -0.1721649169921875, -0.16562461853027344, -0.15908432006835938, -0.1525440216064453, -0.14600372314453125, -0.1394634246826172, -0.13292312622070312, -0.12638282775878906, -0.119842529296875, -0.11330223083496094, -0.10676193237304688, -0.10022163391113281, -0.09368133544921875, -0.08714103698730469, -0.08060073852539062, -0.07406044006347656, -0.0675201416015625, -0.06097984313964844, -0.054439544677734375, -0.04789924621582031, -0.04135894775390625, -0.03481864929199219, -0.028278350830078125, -0.021738052368164062, -0.01519775390625, -0.008657455444335938, -0.002117156982421875, 0.0044231414794921875, 0.01096343994140625, 0.017503738403320312, 0.024044036865234375, 0.030584335327148438, 0.0371246337890625, 0.04366493225097656, 0.050205230712890625, 0.05674552917480469, 0.06328582763671875, 0.06982612609863281, 0.07636642456054688, 0.08290672302246094, 0.089447021484375, 0.09598731994628906, 0.10252761840820312, 0.10906791687011719, 0.11560821533203125, 0.12214851379394531, 0.12868881225585938, 0.13522911071777344, 0.1417694091796875, 0.14830970764160156, 0.15485000610351562, 0.1613903045654297, 0.16793060302734375, 0.1744709014892578, 0.18101119995117188, 0.18755149841308594, 0.194091796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 10.0, 7.0, 14.0, 12.0, 13.0, 17.0, 14.0, 26.0, 20.0, 24.0, 35.0, 46.0, 45.0, 48.0, 53.0, 51.0, 49.0, 48.0, 46.0, 47.0, 45.0, 48.0, 30.0, 36.0, 37.0, 31.0, 26.0, 22.0, 17.0, 18.0, 13.0, 12.0, 3.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0], "bins": [-0.205810546875, -0.2001323699951172, -0.19445419311523438, -0.18877601623535156, -0.18309783935546875, -0.17741966247558594, -0.17174148559570312, -0.1660633087158203, -0.1603851318359375, -0.1547069549560547, -0.14902877807617188, -0.14335060119628906, -0.13767242431640625, -0.13199424743652344, -0.12631607055664062, -0.12063789367675781, -0.114959716796875, -0.10928153991699219, -0.10360336303710938, -0.09792518615722656, -0.09224700927734375, -0.08656883239746094, -0.08089065551757812, -0.07521247863769531, -0.0695343017578125, -0.06385612487792969, -0.058177947998046875, -0.05249977111816406, -0.04682159423828125, -0.04114341735839844, -0.035465240478515625, -0.029787063598632812, -0.02410888671875, -0.018430709838867188, -0.012752532958984375, -0.0070743560791015625, -0.00139617919921875, 0.0042819976806640625, 0.009960174560546875, 0.015638351440429688, 0.0213165283203125, 0.026994705200195312, 0.032672882080078125, 0.03835105895996094, 0.04402923583984375, 0.04970741271972656, 0.055385589599609375, 0.06106376647949219, 0.066741943359375, 0.07242012023925781, 0.07809829711914062, 0.08377647399902344, 0.08945465087890625, 0.09513282775878906, 0.10081100463867188, 0.10648918151855469, 0.1121673583984375, 0.11784553527832031, 0.12352371215820312, 0.12920188903808594, 0.13488006591796875, 0.14055824279785156, 0.14623641967773438, 0.1519145965576172, 0.1575927734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 13.0, 22.0, 40.0, 66.0, 170.0, 392.0, 1154.0, 4639.0, 25900.0, 235833.0, 677263.0, 87075.0, 12116.0, 2616.0, 759.0, 253.0, 103.0, 62.0, 30.0, 10.0, 13.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177978515625, -0.17293548583984375, -0.1678924560546875, -0.16284942626953125, -0.157806396484375, -0.15276336669921875, -0.1477203369140625, -0.14267730712890625, -0.13763427734375, -0.13259124755859375, -0.1275482177734375, -0.12250518798828125, -0.117462158203125, -0.11241912841796875, -0.1073760986328125, -0.10233306884765625, -0.0972900390625, -0.09224700927734375, -0.0872039794921875, -0.08216094970703125, -0.077117919921875, -0.07207489013671875, -0.0670318603515625, -0.06198883056640625, -0.05694580078125, -0.05190277099609375, -0.0468597412109375, -0.04181671142578125, -0.036773681640625, -0.03173065185546875, -0.0266876220703125, -0.02164459228515625, -0.0166015625, -0.01155853271484375, -0.0065155029296875, -0.00147247314453125, 0.003570556640625, 0.00861358642578125, 0.0136566162109375, 0.01869964599609375, 0.02374267578125, 0.02878570556640625, 0.0338287353515625, 0.03887176513671875, 0.043914794921875, 0.04895782470703125, 0.0540008544921875, 0.05904388427734375, 0.0640869140625, 0.06912994384765625, 0.0741729736328125, 0.07921600341796875, 0.084259033203125, 0.08930206298828125, 0.0943450927734375, 0.09938812255859375, 0.10443115234375, 0.10947418212890625, 0.1145172119140625, 0.11956024169921875, 0.124603271484375, 0.12964630126953125, 0.1346893310546875, 0.13973236083984375, 0.144775390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 6.0, 5.0, 13.0, 10.0, 24.0, 26.0, 42.0, 50.0, 58.0, 79.0, 112.0, 116.0, 100.0, 74.0, 67.0, 49.0, 37.0, 29.0, 21.0, 21.0, 13.0, 13.0, 9.0, 7.0, 3.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010138750076293945, -9.847059845924377e-05, -9.55536961555481e-05, -9.263679385185242e-05, -8.971989154815674e-05, -8.680298924446106e-05, -8.388608694076538e-05, -8.09691846370697e-05, -7.805228233337402e-05, -7.513538002967834e-05, -7.221847772598267e-05, -6.930157542228699e-05, -6.638467311859131e-05, -6.346777081489563e-05, -6.055086851119995e-05, -5.763396620750427e-05, -5.4717063903808594e-05, -5.1800161600112915e-05, -4.8883259296417236e-05, -4.596635699272156e-05, -4.304945468902588e-05, -4.01325523853302e-05, -3.721565008163452e-05, -3.429874777793884e-05, -3.1381845474243164e-05, -2.8464943170547485e-05, -2.5548040866851807e-05, -2.2631138563156128e-05, -1.971423625946045e-05, -1.679733395576477e-05, -1.3880431652069092e-05, -1.0963529348373413e-05, -8.046627044677734e-06, -5.129724740982056e-06, -2.212822437286377e-06, 7.040798664093018e-07, 3.6209821701049805e-06, 6.537884473800659e-06, 9.454786777496338e-06, 1.2371689081192017e-05, 1.5288591384887695e-05, 1.8205493688583374e-05, 2.1122395992279053e-05, 2.403929829597473e-05, 2.695620059967041e-05, 2.987310290336609e-05, 3.279000520706177e-05, 3.5706907510757446e-05, 3.8623809814453125e-05, 4.1540712118148804e-05, 4.445761442184448e-05, 4.737451672554016e-05, 5.029141902923584e-05, 5.320832133293152e-05, 5.61252236366272e-05, 5.9042125940322876e-05, 6.195902824401855e-05, 6.487593054771423e-05, 6.779283285140991e-05, 7.070973515510559e-05, 7.362663745880127e-05, 7.654353976249695e-05, 7.946044206619263e-05, 8.23773443698883e-05, 8.529424667358398e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 8.0, 14.0, 17.0, 28.0, 47.0, 86.0, 135.0, 253.0, 534.0, 1172.0, 3112.0, 11662.0, 77383.0, 665004.0, 253441.0, 26704.0, 5609.0, 1817.0, 734.0, 351.0, 171.0, 99.0, 72.0, 27.0, 16.0, 10.0, 14.0, 11.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1688232421875, -0.1642284393310547, -0.15963363647460938, -0.15503883361816406, -0.15044403076171875, -0.14584922790527344, -0.14125442504882812, -0.1366596221923828, -0.1320648193359375, -0.1274700164794922, -0.12287521362304688, -0.11828041076660156, -0.11368560791015625, -0.10909080505371094, -0.10449600219726562, -0.09990119934082031, -0.095306396484375, -0.09071159362792969, -0.08611679077148438, -0.08152198791503906, -0.07692718505859375, -0.07233238220214844, -0.06773757934570312, -0.06314277648925781, -0.0585479736328125, -0.05395317077636719, -0.049358367919921875, -0.04476356506347656, -0.04016876220703125, -0.03557395935058594, -0.030979156494140625, -0.026384353637695312, -0.02178955078125, -0.017194747924804688, -0.012599945068359375, -0.008005142211914062, -0.00341033935546875, 0.0011844635009765625, 0.005779266357421875, 0.010374069213867188, 0.0149688720703125, 0.019563674926757812, 0.024158477783203125, 0.028753280639648438, 0.03334808349609375, 0.03794288635253906, 0.042537689208984375, 0.04713249206542969, 0.051727294921875, 0.05632209777832031, 0.060916900634765625, 0.06551170349121094, 0.07010650634765625, 0.07470130920410156, 0.07929611206054688, 0.08389091491699219, 0.0884857177734375, 0.09308052062988281, 0.09767532348632812, 0.10227012634277344, 0.10686492919921875, 0.11145973205566406, 0.11605453491210938, 0.12064933776855469, 0.125244140625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 14.0, 22.0, 29.0, 39.0, 55.0, 78.0, 104.0, 116.0, 135.0, 105.0, 89.0, 71.0, 33.0, 34.0, 14.0, 12.0, 13.0, 6.0, 3.0, 3.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07080078125, -0.0678701400756836, -0.06493949890136719, -0.06200885772705078, -0.059078216552734375, -0.05614757537841797, -0.05321693420410156, -0.050286293029785156, -0.04735565185546875, -0.044425010681152344, -0.04149436950683594, -0.03856372833251953, -0.035633087158203125, -0.03270244598388672, -0.029771804809570312, -0.026841163635253906, -0.0239105224609375, -0.020979881286621094, -0.018049240112304688, -0.015118598937988281, -0.012187957763671875, -0.009257316589355469, -0.0063266754150390625, -0.0033960342407226562, -0.00046539306640625, 0.0024652481079101562, 0.0053958892822265625, 0.008326530456542969, 0.011257171630859375, 0.014187812805175781, 0.017118453979492188, 0.020049095153808594, 0.022979736328125, 0.025910377502441406, 0.028841018676757812, 0.03177165985107422, 0.034702301025390625, 0.03763294219970703, 0.04056358337402344, 0.043494224548339844, 0.04642486572265625, 0.049355506896972656, 0.05228614807128906, 0.05521678924560547, 0.058147430419921875, 0.06107807159423828, 0.06400871276855469, 0.0669393539428711, 0.0698699951171875, 0.0728006362915039, 0.07573127746582031, 0.07866191864013672, 0.08159255981445312, 0.08452320098876953, 0.08745384216308594, 0.09038448333740234, 0.09331512451171875, 0.09624576568603516, 0.09917640686035156, 0.10210704803466797, 0.10503768920898438, 0.10796833038330078, 0.11089897155761719, 0.1138296127319336, 0.11676025390625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 18.0, 61.0, 169.0, 280.0, 248.0, 149.0, 56.0, 21.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5243494510650635, -1.4398808479309082, -1.3554123640060425, -1.2709437608718872, -1.1864752769470215, -1.1020066738128662, -1.017538070678711, -0.9330695271492004, -0.8486009836196899, -0.7641324400901794, -0.679663896560669, -0.5951952934265137, -0.5107267498970032, -0.4262582063674927, -0.3417896032333374, -0.2573210597038269, -0.1728525161743164, -0.08838395774364471, -0.0039153993129730225, 0.08055317401885986, 0.16502171754837036, 0.24949026107788086, 0.33395886421203613, 0.41842740774154663, 0.5028959512710571, 0.5873644948005676, 0.6718330383300781, 0.7563016414642334, 0.8407701849937439, 0.9252387285232544, 1.0097073316574097, 1.0941758155822754, 1.1786446571350098, 1.263113260269165, 1.3475817441940308, 1.432050347328186, 1.5165188312530518, 1.600987434387207, 1.6854560375213623, 1.7699246406555176, 1.8543931245803833, 1.9388617277145386, 2.0233302116394043, 2.1077988147735596, 2.192267417907715, 2.276735782623291, 2.3612046241760254, 2.4456729888916016, 2.530141592025757, 2.614610195159912, 2.6990787982940674, 2.7835474014282227, 2.868015766143799, 2.952484369277954, 3.0369529724121094, 3.1214215755462646, 3.20589017868042, 3.290358781814575, 3.3748273849487305, 3.4592957496643066, 3.543764352798462, 3.628232955932617, 3.7127015590667725, 3.7971701622009277, 3.881638526916504]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 15.0, 12.0, 11.0, 18.0, 22.0, 40.0, 24.0, 43.0, 50.0, 44.0, 47.0, 59.0, 61.0, 57.0, 55.0, 55.0, 48.0, 77.0, 41.0, 45.0, 37.0, 26.0, 20.0, 17.0, 18.0, 13.0, 10.0, 4.0, 10.0, 5.0, 9.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9450921416282654, -0.9084863066673279, -0.8718804717063904, -0.8352746367454529, -0.7986688017845154, -0.7620629668235779, -0.7254571318626404, -0.6888512969017029, -0.6522454619407654, -0.6156396269798279, -0.5790337920188904, -0.5424279570579529, -0.5058221220970154, -0.4692162871360779, -0.4326104521751404, -0.3960046172142029, -0.3593987822532654, -0.3227929472923279, -0.2861871123313904, -0.24958127737045288, -0.21297544240951538, -0.17636960744857788, -0.13976377248764038, -0.10315793752670288, -0.06655210256576538, -0.02994626760482788, 0.006659567356109619, 0.04326540231704712, 0.07987123727798462, 0.11647707223892212, 0.15308290719985962, 0.18968874216079712, 0.22629451751708984, 0.26290035247802734, 0.29950618743896484, 0.33611202239990234, 0.37271785736083984, 0.40932369232177734, 0.44592952728271484, 0.48253536224365234, 0.5191411972045898, 0.5557470321655273, 0.5923528671264648, 0.6289587020874023, 0.6655645370483398, 0.7021703720092773, 0.7387762069702148, 0.7753820419311523, 0.8119878768920898, 0.8485937118530273, 0.8851995468139648, 0.9218053817749023, 0.9584112167358398, 0.9950170516967773, 1.0316228866577148, 1.0682287216186523, 1.1048345565795898, 1.1414403915405273, 1.1780462265014648, 1.2146520614624023, 1.2512578964233398, 1.2878637313842773, 1.3244695663452148, 1.3610754013061523, 1.3976812362670898]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 9.0, 9.0, 12.0, 13.0, 26.0, 29.0, 46.0, 78.0, 116.0, 209.0, 358.0, 630.0, 1102.0, 2377.0, 5396.0, 13851.0, 44381.0, 215730.0, 3271553.0, 525277.0, 77076.0, 21591.0, 7751.0, 3204.0, 1499.0, 807.0, 473.0, 225.0, 156.0, 106.0, 63.0, 39.0, 25.0, 19.0, 20.0, 10.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.182373046875, -0.17623138427734375, -0.1700897216796875, -0.16394805908203125, -0.157806396484375, -0.15166473388671875, -0.1455230712890625, -0.13938140869140625, -0.13323974609375, -0.12709808349609375, -0.1209564208984375, -0.11481475830078125, -0.108673095703125, -0.10253143310546875, -0.0963897705078125, -0.09024810791015625, -0.0841064453125, -0.07796478271484375, -0.0718231201171875, -0.06568145751953125, -0.059539794921875, -0.05339813232421875, -0.0472564697265625, -0.04111480712890625, -0.03497314453125, -0.02883148193359375, -0.0226898193359375, -0.01654815673828125, -0.010406494140625, -0.00426483154296875, 0.0018768310546875, 0.00801849365234375, 0.01416015625, 0.02030181884765625, 0.0264434814453125, 0.03258514404296875, 0.038726806640625, 0.04486846923828125, 0.0510101318359375, 0.05715179443359375, 0.06329345703125, 0.06943511962890625, 0.0755767822265625, 0.08171844482421875, 0.087860107421875, 0.09400177001953125, 0.1001434326171875, 0.10628509521484375, 0.1124267578125, 0.11856842041015625, 0.1247100830078125, 0.13085174560546875, 0.136993408203125, 0.14313507080078125, 0.1492767333984375, 0.15541839599609375, 0.16156005859375, 0.16770172119140625, 0.1738433837890625, 0.17998504638671875, 0.186126708984375, 0.19226837158203125, 0.1984100341796875, 0.20455169677734375, 0.210693359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 4.0, 11.0, 16.0, 15.0, 20.0, 26.0, 35.0, 35.0, 38.0, 56.0, 53.0, 64.0, 51.0, 68.0, 61.0, 54.0, 51.0, 63.0, 48.0, 41.0, 33.0, 26.0, 18.0, 22.0, 18.0, 11.0, 11.0, 7.0, 11.0, 3.0, 3.0, 7.0, 2.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04840087890625, -0.046933650970458984, -0.04546642303466797, -0.04399919509887695, -0.04253196716308594, -0.04106473922729492, -0.039597511291503906, -0.03813028335571289, -0.036663055419921875, -0.03519582748413086, -0.033728599548339844, -0.03226137161254883, -0.030794143676757812, -0.029326915740966797, -0.02785968780517578, -0.026392459869384766, -0.02492523193359375, -0.023458003997802734, -0.02199077606201172, -0.020523548126220703, -0.019056320190429688, -0.017589092254638672, -0.016121864318847656, -0.01465463638305664, -0.013187408447265625, -0.01172018051147461, -0.010252952575683594, -0.008785724639892578, -0.0073184967041015625, -0.005851268768310547, -0.004384040832519531, -0.0029168128967285156, -0.0014495849609375, 1.7642974853515625e-05, 0.0014848709106445312, 0.002952098846435547, 0.0044193267822265625, 0.005886554718017578, 0.007353782653808594, 0.00882101058959961, 0.010288238525390625, 0.01175546646118164, 0.013222694396972656, 0.014689922332763672, 0.016157150268554688, 0.017624378204345703, 0.01909160614013672, 0.020558834075927734, 0.02202606201171875, 0.023493289947509766, 0.02496051788330078, 0.026427745819091797, 0.027894973754882812, 0.029362201690673828, 0.030829429626464844, 0.03229665756225586, 0.033763885498046875, 0.03523111343383789, 0.036698341369628906, 0.03816556930541992, 0.03963279724121094, 0.04110002517700195, 0.04256725311279297, 0.044034481048583984, 0.045501708984375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 8.0, 7.0, 8.0, 11.0, 10.0, 19.0, 34.0, 38.0, 81.0, 104.0, 165.0, 281.0, 465.0, 896.0, 1812.0, 4070.0, 10089.0, 28945.0, 103492.0, 592138.0, 2941353.0, 394411.0, 78149.0, 22788.0, 8160.0, 3394.0, 1519.0, 779.0, 391.0, 256.0, 159.0, 79.0, 55.0, 39.0, 21.0, 22.0, 12.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.176513671875, -0.17152786254882812, -0.16654205322265625, -0.16155624389648438, -0.1565704345703125, -0.15158462524414062, -0.14659881591796875, -0.14161300659179688, -0.136627197265625, -0.13164138793945312, -0.12665557861328125, -0.12166976928710938, -0.1166839599609375, -0.11169815063476562, -0.10671234130859375, -0.10172653198242188, -0.09674072265625, -0.09175491333007812, -0.08676910400390625, -0.08178329467773438, -0.0767974853515625, -0.07181167602539062, -0.06682586669921875, -0.061840057373046875, -0.056854248046875, -0.051868438720703125, -0.04688262939453125, -0.041896820068359375, -0.0369110107421875, -0.031925201416015625, -0.02693939208984375, -0.021953582763671875, -0.0169677734375, -0.011981964111328125, -0.00699615478515625, -0.002010345458984375, 0.0029754638671875, 0.007961273193359375, 0.01294708251953125, 0.017932891845703125, 0.022918701171875, 0.027904510498046875, 0.03289031982421875, 0.037876129150390625, 0.0428619384765625, 0.047847747802734375, 0.05283355712890625, 0.057819366455078125, 0.06280517578125, 0.06779098510742188, 0.07277679443359375, 0.07776260375976562, 0.0827484130859375, 0.08773422241210938, 0.09272003173828125, 0.09770584106445312, 0.102691650390625, 0.10767745971679688, 0.11266326904296875, 0.11764907836914062, 0.1226348876953125, 0.12762069702148438, 0.13260650634765625, 0.13759231567382812, 0.142578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 8.0, 12.0, 8.0, 6.0, 13.0, 19.0, 23.0, 27.0, 48.0, 62.0, 79.0, 164.0, 188.0, 350.0, 582.0, 994.0, 567.0, 282.0, 207.0, 117.0, 81.0, 69.0, 36.0, 38.0, 24.0, 14.0, 12.0, 4.0, 7.0, 5.0, 4.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0775146484375, -0.07538890838623047, -0.07326316833496094, -0.0711374282836914, -0.06901168823242188, -0.06688594818115234, -0.06476020812988281, -0.06263446807861328, -0.06050872802734375, -0.05838298797607422, -0.05625724792480469, -0.054131507873535156, -0.052005767822265625, -0.049880027770996094, -0.04775428771972656, -0.04562854766845703, -0.0435028076171875, -0.04137706756591797, -0.03925132751464844, -0.037125587463378906, -0.034999847412109375, -0.032874107360839844, -0.030748367309570312, -0.02862262725830078, -0.02649688720703125, -0.02437114715576172, -0.022245407104492188, -0.020119667053222656, -0.017993927001953125, -0.015868186950683594, -0.013742446899414062, -0.011616706848144531, -0.009490966796875, -0.007365226745605469, -0.0052394866943359375, -0.0031137466430664062, -0.000988006591796875, 0.0011377334594726562, 0.0032634735107421875, 0.005389213562011719, 0.00751495361328125, 0.009640693664550781, 0.011766433715820312, 0.013892173767089844, 0.016017913818359375, 0.018143653869628906, 0.020269393920898438, 0.02239513397216797, 0.0245208740234375, 0.02664661407470703, 0.028772354125976562, 0.030898094177246094, 0.033023834228515625, 0.035149574279785156, 0.03727531433105469, 0.03940105438232422, 0.04152679443359375, 0.04365253448486328, 0.04577827453613281, 0.047904014587402344, 0.050029754638671875, 0.052155494689941406, 0.05428123474121094, 0.05640697479248047, 0.05853271484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 10.0, 25.0, 48.0, 114.0, 170.0, 232.0, 213.0, 102.0, 40.0, 24.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2824467420578003, -1.2523645162582397, -1.2222822904586792, -1.192199945449829, -1.1621177196502686, -1.132035493850708, -1.1019532680511475, -1.071871042251587, -1.0417888164520264, -1.0117065906524658, -0.9816243052482605, -0.9515420794487, -0.9214598536491394, -0.8913775682449341, -0.8612953424453735, -0.831213116645813, -0.8011308312416077, -0.7710486054420471, -0.7409663200378418, -0.7108840942382812, -0.6808018684387207, -0.6507196426391602, -0.6206373572349548, -0.5905551314353943, -0.560472846031189, -0.5303906202316284, -0.5003083348274231, -0.47022610902786255, -0.440143883228302, -0.41006162762641907, -0.37997937202453613, -0.3498971462249756, -0.3198149800300598, -0.2897327244281769, -0.25965049862861633, -0.2295682430267334, -0.19948600232601166, -0.16940376162528992, -0.13932150602340698, -0.10923926532268524, -0.0791570246219635, -0.04907478019595146, -0.018992535769939423, 0.011089712381362915, 0.041171953082084656, 0.0712541937828064, 0.10133644938468933, 0.13141869008541107, 0.1615009307861328, 0.19158317148685455, 0.2216654121875763, 0.25174766778945923, 0.2818298935890198, 0.3119121491909027, 0.34199440479278564, 0.3720766305923462, 0.4021588861942291, 0.43224114179611206, 0.4623233675956726, 0.49240562319755554, 0.5224878787994385, 0.552570104598999, 0.5826523303985596, 0.6127346158027649, 0.6428168416023254]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 5.0, 6.0, 14.0, 9.0, 15.0, 15.0, 26.0, 20.0, 28.0, 19.0, 22.0, 36.0, 27.0, 46.0, 64.0, 47.0, 48.0, 40.0, 38.0, 36.0, 48.0, 45.0, 36.0, 42.0, 34.0, 42.0, 25.0, 25.0, 27.0, 18.0, 11.0, 19.0, 15.0, 8.0, 9.0, 11.0, 1.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0], "bins": [-0.3536110520362854, -0.3444724678993225, -0.335333913564682, -0.3261953294277191, -0.3170567750930786, -0.3079181909561157, -0.29877960681915283, -0.28964105248451233, -0.28050246834754944, -0.27136388421058655, -0.26222532987594604, -0.25308674573898315, -0.24394817650318146, -0.23480960726737976, -0.22567103803157806, -0.21653246879577637, -0.20739389955997467, -0.19825533032417297, -0.18911676108837128, -0.17997819185256958, -0.1708396077156067, -0.161701038479805, -0.1525624692440033, -0.1434238851070404, -0.1342853307723999, -0.1251467615365982, -0.11600818485021591, -0.10686961561441422, -0.09773103892803192, -0.08859246969223022, -0.07945390045642853, -0.07031532377004623, -0.06117674708366394, -0.052038174122571945, -0.04289960116147995, -0.03376103192567825, -0.024622458964586258, -0.015483886003494263, -0.006345316767692566, 0.002793259918689728, 0.011931829154491425, 0.02107040211558342, 0.030208973214030266, 0.03934754431247711, 0.04848611727356911, 0.0576246902346611, 0.0667632594704628, 0.07590183615684509, 0.08504040539264679, 0.09417897462844849, 0.10331755131483078, 0.11245612055063248, 0.12159469723701477, 0.13073326647281647, 0.13987183570861816, 0.14901041984558105, 0.15814897418022156, 0.16728754341602325, 0.17642611265182495, 0.18556469678878784, 0.19470326602458954, 0.20384183526039124, 0.21298040449619293, 0.22211897373199463, 0.23125755786895752]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 13.0, 11.0, 18.0, 30.0, 37.0, 50.0, 104.0, 162.0, 352.0, 843.0, 2166.0, 7028.0, 26534.0, 120935.0, 547813.0, 269499.0, 53723.0, 13046.0, 3758.0, 1353.0, 502.0, 245.0, 112.0, 68.0, 57.0, 26.0, 24.0, 18.0, 4.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291259765625, -0.2823638916015625, -0.273468017578125, -0.2645721435546875, -0.25567626953125, -0.2467803955078125, -0.237884521484375, -0.2289886474609375, -0.2200927734375, -0.2111968994140625, -0.202301025390625, -0.1934051513671875, -0.18450927734375, -0.1756134033203125, -0.166717529296875, -0.1578216552734375, -0.14892578125, -0.1400299072265625, -0.131134033203125, -0.1222381591796875, -0.11334228515625, -0.1044464111328125, -0.095550537109375, -0.0866546630859375, -0.0777587890625, -0.0688629150390625, -0.059967041015625, -0.0510711669921875, -0.04217529296875, -0.0332794189453125, -0.024383544921875, -0.0154876708984375, -0.006591796875, 0.0023040771484375, 0.011199951171875, 0.0200958251953125, 0.02899169921875, 0.0378875732421875, 0.046783447265625, 0.0556793212890625, 0.0645751953125, 0.0734710693359375, 0.082366943359375, 0.0912628173828125, 0.10015869140625, 0.1090545654296875, 0.117950439453125, 0.1268463134765625, 0.1357421875, 0.1446380615234375, 0.153533935546875, 0.1624298095703125, 0.17132568359375, 0.1802215576171875, 0.189117431640625, 0.1980133056640625, 0.2069091796875, 0.2158050537109375, 0.224700927734375, 0.2335968017578125, 0.24249267578125, 0.2513885498046875, 0.260284423828125, 0.2691802978515625, 0.278076171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 9.0, 6.0, 5.0, 11.0, 15.0, 22.0, 14.0, 27.0, 38.0, 35.0, 47.0, 55.0, 55.0, 48.0, 62.0, 52.0, 55.0, 59.0, 59.0, 56.0, 52.0, 36.0, 30.0, 37.0, 21.0, 21.0, 14.0, 10.0, 10.0, 6.0, 7.0, 6.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.050018310546875, -0.04862022399902344, -0.047222137451171875, -0.04582405090332031, -0.04442596435546875, -0.04302787780761719, -0.041629791259765625, -0.04023170471191406, -0.0388336181640625, -0.03743553161621094, -0.036037445068359375, -0.03463935852050781, -0.03324127197265625, -0.03184318542480469, -0.030445098876953125, -0.029047012329101562, -0.02764892578125, -0.026250839233398438, -0.024852752685546875, -0.023454666137695312, -0.02205657958984375, -0.020658493041992188, -0.019260406494140625, -0.017862319946289062, -0.0164642333984375, -0.015066146850585938, -0.013668060302734375, -0.012269973754882812, -0.01087188720703125, -0.009473800659179688, -0.008075714111328125, -0.0066776275634765625, -0.005279541015625, -0.0038814544677734375, -0.002483367919921875, -0.0010852813720703125, 0.00031280517578125, 0.0017108917236328125, 0.003108978271484375, 0.0045070648193359375, 0.0059051513671875, 0.0073032379150390625, 0.008701324462890625, 0.010099411010742188, 0.01149749755859375, 0.012895584106445312, 0.014293670654296875, 0.015691757202148438, 0.01708984375, 0.018487930297851562, 0.019886016845703125, 0.021284103393554688, 0.02268218994140625, 0.024080276489257812, 0.025478363037109375, 0.026876449584960938, 0.0282745361328125, 0.029672622680664062, 0.031070709228515625, 0.03246879577636719, 0.03386688232421875, 0.03526496887207031, 0.036663055419921875, 0.03806114196777344, 0.039459228515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 10.0, 19.0, 16.0, 32.0, 44.0, 54.0, 90.0, 110.0, 136.0, 205.0, 349.0, 502.0, 832.0, 1426.0, 2572.0, 5054.0, 10922.0, 26211.0, 68829.0, 178729.0, 367701.0, 232196.0, 90076.0, 34404.0, 14123.0, 6261.0, 3135.0, 1709.0, 1003.0, 616.0, 342.0, 261.0, 169.0, 133.0, 83.0, 45.0, 37.0, 34.0, 24.0, 14.0, 14.0, 16.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.134521484375, -0.13027000427246094, -0.12601852416992188, -0.12176704406738281, -0.11751556396484375, -0.11326408386230469, -0.10901260375976562, -0.10476112365722656, -0.1005096435546875, -0.09625816345214844, -0.09200668334960938, -0.08775520324707031, -0.08350372314453125, -0.07925224304199219, -0.07500076293945312, -0.07074928283691406, -0.066497802734375, -0.06224632263183594, -0.057994842529296875, -0.05374336242675781, -0.04949188232421875, -0.04524040222167969, -0.040988922119140625, -0.03673744201660156, -0.0324859619140625, -0.028234481811523438, -0.023983001708984375, -0.019731521606445312, -0.01548004150390625, -0.011228561401367188, -0.006977081298828125, -0.0027256011962890625, 0.00152587890625, 0.0057773590087890625, 0.010028839111328125, 0.014280319213867188, 0.01853179931640625, 0.022783279418945312, 0.027034759521484375, 0.03128623962402344, 0.0355377197265625, 0.03978919982910156, 0.044040679931640625, 0.04829216003417969, 0.05254364013671875, 0.05679512023925781, 0.061046600341796875, 0.06529808044433594, 0.069549560546875, 0.07380104064941406, 0.07805252075195312, 0.08230400085449219, 0.08655548095703125, 0.09080696105957031, 0.09505844116210938, 0.09930992126464844, 0.1035614013671875, 0.10781288146972656, 0.11206436157226562, 0.11631584167480469, 0.12056732177734375, 0.12481880187988281, 0.12907028198242188, 0.13332176208496094, 0.1375732421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 5.0, 11.0, 7.0, 8.0, 13.0, 16.0, 8.0, 13.0, 19.0, 22.0, 22.0, 28.0, 29.0, 29.0, 33.0, 31.0, 47.0, 42.0, 34.0, 52.0, 40.0, 41.0, 42.0, 49.0, 38.0, 36.0, 33.0, 24.0, 34.0, 25.0, 26.0, 20.0, 26.0, 20.0, 19.0, 11.0, 12.0, 8.0, 12.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16650390625, -0.161102294921875, -0.15570068359375, -0.150299072265625, -0.1448974609375, -0.139495849609375, -0.13409423828125, -0.128692626953125, -0.123291015625, -0.117889404296875, -0.11248779296875, -0.107086181640625, -0.1016845703125, -0.096282958984375, -0.09088134765625, -0.085479736328125, -0.080078125, -0.074676513671875, -0.06927490234375, -0.063873291015625, -0.0584716796875, -0.053070068359375, -0.04766845703125, -0.042266845703125, -0.036865234375, -0.031463623046875, -0.02606201171875, -0.020660400390625, -0.0152587890625, -0.009857177734375, -0.00445556640625, 0.000946044921875, 0.00634765625, 0.011749267578125, 0.01715087890625, 0.022552490234375, 0.0279541015625, 0.033355712890625, 0.03875732421875, 0.044158935546875, 0.049560546875, 0.054962158203125, 0.06036376953125, 0.065765380859375, 0.0711669921875, 0.076568603515625, 0.08197021484375, 0.087371826171875, 0.0927734375, 0.098175048828125, 0.10357666015625, 0.108978271484375, 0.1143798828125, 0.119781494140625, 0.12518310546875, 0.130584716796875, 0.135986328125, 0.141387939453125, 0.14678955078125, 0.152191162109375, 0.1575927734375, 0.162994384765625, 0.16839599609375, 0.173797607421875, 0.17919921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 7.0, 8.0, 7.0, 14.0, 23.0, 41.0, 80.0, 127.0, 226.0, 443.0, 1071.0, 3181.0, 12749.0, 71930.0, 585644.0, 321192.0, 40240.0, 7942.0, 2052.0, 777.0, 362.0, 172.0, 104.0, 52.0, 41.0, 24.0, 12.0, 12.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.189453125, -0.1838550567626953, -0.17825698852539062, -0.17265892028808594, -0.16706085205078125, -0.16146278381347656, -0.15586471557617188, -0.1502666473388672, -0.1446685791015625, -0.1390705108642578, -0.13347244262695312, -0.12787437438964844, -0.12227630615234375, -0.11667823791503906, -0.11108016967773438, -0.10548210144042969, -0.099884033203125, -0.09428596496582031, -0.08868789672851562, -0.08308982849121094, -0.07749176025390625, -0.07189369201660156, -0.06629562377929688, -0.06069755554199219, -0.0550994873046875, -0.04950141906738281, -0.043903350830078125, -0.03830528259277344, -0.03270721435546875, -0.027109146118164062, -0.021511077880859375, -0.015913009643554688, -0.01031494140625, -0.0047168731689453125, 0.000881195068359375, 0.0064792633056640625, 0.01207733154296875, 0.017675399780273438, 0.023273468017578125, 0.028871536254882812, 0.0344696044921875, 0.04006767272949219, 0.045665740966796875, 0.05126380920410156, 0.05686187744140625, 0.06245994567871094, 0.06805801391601562, 0.07365608215332031, 0.079254150390625, 0.08485221862792969, 0.09045028686523438, 0.09604835510253906, 0.10164642333984375, 0.10724449157714844, 0.11284255981445312, 0.11844062805175781, 0.1240386962890625, 0.1296367645263672, 0.13523483276367188, 0.14083290100097656, 0.14643096923828125, 0.15202903747558594, 0.15762710571289062, 0.1632251739501953, 0.1688232421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 10.0, 5.0, 6.0, 11.0, 11.0, 7.0, 15.0, 20.0, 31.0, 31.0, 38.0, 45.0, 47.0, 52.0, 68.0, 57.0, 72.0, 60.0, 55.0, 57.0, 59.0, 41.0, 37.0, 42.0, 15.0, 30.0, 14.0, 15.0, 17.0, 8.0, 6.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.282329559326172e-05, -6.113201379776001e-05, -5.94407320022583e-05, -5.774945020675659e-05, -5.605816841125488e-05, -5.4366886615753174e-05, -5.2675604820251465e-05, -5.0984323024749756e-05, -4.929304122924805e-05, -4.760175943374634e-05, -4.591047763824463e-05, -4.421919584274292e-05, -4.252791404724121e-05, -4.08366322517395e-05, -3.914535045623779e-05, -3.7454068660736084e-05, -3.5762786865234375e-05, -3.4071505069732666e-05, -3.238022327423096e-05, -3.068894147872925e-05, -2.899765968322754e-05, -2.730637788772583e-05, -2.561509609222412e-05, -2.3923814296722412e-05, -2.2232532501220703e-05, -2.0541250705718994e-05, -1.8849968910217285e-05, -1.7158687114715576e-05, -1.5467405319213867e-05, -1.3776123523712158e-05, -1.208484172821045e-05, -1.039355993270874e-05, -8.702278137207031e-06, -7.010996341705322e-06, -5.319714546203613e-06, -3.6284327507019043e-06, -1.9371509552001953e-06, -2.4586915969848633e-07, 1.4454126358032227e-06, 3.1366944313049316e-06, 4.827976226806641e-06, 6.51925802230835e-06, 8.210539817810059e-06, 9.901821613311768e-06, 1.1593103408813477e-05, 1.3284385204315186e-05, 1.4975666999816895e-05, 1.6666948795318604e-05, 1.8358230590820312e-05, 2.004951238632202e-05, 2.174079418182373e-05, 2.343207597732544e-05, 2.512335777282715e-05, 2.6814639568328857e-05, 2.8505921363830566e-05, 3.0197203159332275e-05, 3.1888484954833984e-05, 3.357976675033569e-05, 3.52710485458374e-05, 3.696233034133911e-05, 3.865361213684082e-05, 4.034489393234253e-05, 4.203617572784424e-05, 4.372745752334595e-05, 4.5418739318847656e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 7.0, 10.0, 14.0, 24.0, 37.0, 44.0, 62.0, 110.0, 193.0, 342.0, 559.0, 1178.0, 2428.0, 5679.0, 15162.0, 48181.0, 206780.0, 542269.0, 163326.0, 39829.0, 12890.0, 4998.0, 2124.0, 1030.0, 512.0, 267.0, 157.0, 93.0, 78.0, 35.0, 34.0, 29.0, 13.0, 18.0, 8.0, 8.0, 6.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1109619140625, -0.10773849487304688, -0.10451507568359375, -0.10129165649414062, -0.0980682373046875, -0.09484481811523438, -0.09162139892578125, -0.08839797973632812, -0.085174560546875, -0.08195114135742188, -0.07872772216796875, -0.07550430297851562, -0.0722808837890625, -0.06905746459960938, -0.06583404541015625, -0.06261062622070312, -0.05938720703125, -0.056163787841796875, -0.05294036865234375, -0.049716949462890625, -0.0464935302734375, -0.043270111083984375, -0.04004669189453125, -0.036823272705078125, -0.033599853515625, -0.030376434326171875, -0.02715301513671875, -0.023929595947265625, -0.0207061767578125, -0.017482757568359375, -0.01425933837890625, -0.011035919189453125, -0.0078125, -0.004589080810546875, -0.00136566162109375, 0.001857757568359375, 0.0050811767578125, 0.008304595947265625, 0.01152801513671875, 0.014751434326171875, 0.017974853515625, 0.021198272705078125, 0.02442169189453125, 0.027645111083984375, 0.0308685302734375, 0.034091949462890625, 0.03731536865234375, 0.040538787841796875, 0.04376220703125, 0.046985626220703125, 0.05020904541015625, 0.053432464599609375, 0.0566558837890625, 0.059879302978515625, 0.06310272216796875, 0.06632614135742188, 0.069549560546875, 0.07277297973632812, 0.07599639892578125, 0.07921981811523438, 0.0824432373046875, 0.08566665649414062, 0.08889007568359375, 0.09211349487304688, 0.0953369140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 8.0, 4.0, 12.0, 13.0, 18.0, 16.0, 40.0, 45.0, 58.0, 75.0, 97.0, 84.0, 90.0, 76.0, 77.0, 65.0, 56.0, 44.0, 24.0, 29.0, 10.0, 13.0, 6.0, 8.0, 6.0, 5.0, 9.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06866455078125, -0.06606769561767578, -0.06347084045410156, -0.060873985290527344, -0.058277130126953125, -0.055680274963378906, -0.05308341979980469, -0.05048656463623047, -0.04788970947265625, -0.04529285430908203, -0.04269599914550781, -0.040099143981933594, -0.037502288818359375, -0.034905433654785156, -0.03230857849121094, -0.02971172332763672, -0.0271148681640625, -0.02451801300048828, -0.021921157836914062, -0.019324302673339844, -0.016727447509765625, -0.014130592346191406, -0.011533737182617188, -0.008936882019042969, -0.00634002685546875, -0.0037431716918945312, -0.0011463165283203125, 0.0014505386352539062, 0.004047393798828125, 0.006644248962402344, 0.009241104125976562, 0.011837959289550781, 0.014434814453125, 0.01703166961669922, 0.019628524780273438, 0.022225379943847656, 0.024822235107421875, 0.027419090270996094, 0.030015945434570312, 0.03261280059814453, 0.03520965576171875, 0.03780651092529297, 0.04040336608886719, 0.043000221252441406, 0.045597076416015625, 0.048193931579589844, 0.05079078674316406, 0.05338764190673828, 0.0559844970703125, 0.05858135223388672, 0.06117820739746094, 0.06377506256103516, 0.06637191772460938, 0.0689687728881836, 0.07156562805175781, 0.07416248321533203, 0.07675933837890625, 0.07935619354248047, 0.08195304870605469, 0.0845499038696289, 0.08714675903320312, 0.08974361419677734, 0.09234046936035156, 0.09493732452392578, 0.0975341796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 14.0, 12.0, 35.0, 72.0, 108.0, 121.0, 159.0, 153.0, 122.0, 91.0, 53.0, 23.0, 18.0, 12.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7730293273925781, -1.722174048423767, -1.6713188886642456, -1.6204636096954346, -1.569608449935913, -1.518753170967102, -1.467897891998291, -1.4170427322387695, -1.366187572479248, -1.315332293510437, -1.2644771337509155, -1.2136218547821045, -1.162766695022583, -1.111911416053772, -1.061056137084961, -1.0102009773254395, -0.9593456983566284, -0.9084904789924622, -0.8576352596282959, -0.8067799806594849, -0.7559248208999634, -0.7050695419311523, -0.6542143225669861, -0.6033591032028198, -0.5525038838386536, -0.5016486644744873, -0.45079344511032104, -0.3999381959438324, -0.34908297657966614, -0.2982277572154999, -0.24737250804901123, -0.19651728868484497, -0.14566195011138916, -0.0948067232966423, -0.04395149648189545, 0.006903737783432007, 0.05775895714759827, 0.10861417651176453, 0.15946942567825317, 0.21032464504241943, 0.2611798644065857, 0.31203508377075195, 0.3628903031349182, 0.41374555230140686, 0.4646007716655731, 0.515455961227417, 0.566311240196228, 0.6171664595603943, 0.6680216789245605, 0.7188768982887268, 0.7697321176528931, 0.8205873966217041, 0.8714425563812256, 0.9222978353500366, 0.9731530547142029, 1.0240082740783691, 1.0748634338378906, 1.1257187128067017, 1.1765738725662231, 1.2274291515350342, 1.2782843112945557, 1.3291395902633667, 1.3799948692321777, 1.4308500289916992, 1.4817053079605103]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 11.0, 15.0, 17.0, 27.0, 21.0, 29.0, 29.0, 37.0, 39.0, 54.0, 54.0, 67.0, 69.0, 52.0, 63.0, 59.0, 50.0, 43.0, 47.0, 32.0, 42.0, 30.0, 31.0, 20.0, 14.0, 16.0, 10.0, 4.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4824278354644775, -1.4419621229171753, -1.401496410369873, -1.3610308170318604, -1.320565104484558, -1.2800993919372559, -1.2396336793899536, -1.1991679668426514, -1.1587023735046387, -1.1182366609573364, -1.0777709484100342, -1.0373053550720215, -0.9968396425247192, -0.956373929977417, -0.9159082174301147, -0.8754425048828125, -0.8349767923355103, -0.794511079788208, -0.7540454268455505, -0.7135797142982483, -0.6731140613555908, -0.6326483488082886, -0.5921826362609863, -0.5517169237136841, -0.5112512707710266, -0.47078558802604675, -0.4303199052810669, -0.38985419273376465, -0.3493885099887848, -0.30892282724380493, -0.2684571146965027, -0.22799143195152283, -0.18752574920654297, -0.1470600664615631, -0.10659436881542206, -0.0661286786198616, -0.025662988424301147, 0.014802694320678711, 0.05526839196681976, 0.09573408961296082, 0.13619977235794067, 0.17666545510292053, 0.21713115274906158, 0.25759685039520264, 0.2980625331401825, 0.33852821588516235, 0.3789939284324646, 0.41945961117744446, 0.4599252939224243, 0.5003910064697266, 0.540856659412384, 0.5813223719596863, 0.6217880249023438, 0.662253737449646, 0.7027194499969482, 0.7431851625442505, 0.783650815486908, 0.8241165280342102, 0.8645821809768677, 0.9050478935241699, 0.9455136060714722, 0.9859792590141296, 1.026444911956787, 1.0669106245040894, 1.1073763370513916]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 5.0, 3.0, 2.0, 5.0, 6.0, 9.0, 16.0, 18.0, 24.0, 35.0, 34.0, 73.0, 103.0, 184.0, 237.0, 348.0, 567.0, 981.0, 1688.0, 3220.0, 6551.0, 15370.0, 44261.0, 208364.0, 3436588.0, 375649.0, 62900.0, 19890.0, 8089.0, 4010.0, 2082.0, 1159.0, 680.0, 407.0, 268.0, 160.0, 100.0, 67.0, 38.0, 39.0, 23.0, 9.0, 8.0, 9.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186767578125, -0.1810436248779297, -0.17531967163085938, -0.16959571838378906, -0.16387176513671875, -0.15814781188964844, -0.15242385864257812, -0.1466999053955078, -0.1409759521484375, -0.1352519989013672, -0.12952804565429688, -0.12380409240722656, -0.11808013916015625, -0.11235618591308594, -0.10663223266601562, -0.10090827941894531, -0.095184326171875, -0.08946037292480469, -0.08373641967773438, -0.07801246643066406, -0.07228851318359375, -0.06656455993652344, -0.060840606689453125, -0.05511665344238281, -0.0493927001953125, -0.04366874694824219, -0.037944793701171875, -0.03222084045410156, -0.02649688720703125, -0.020772933959960938, -0.015048980712890625, -0.009325027465820312, -0.00360107421875, 0.0021228790283203125, 0.007846832275390625, 0.013570785522460938, 0.01929473876953125, 0.025018692016601562, 0.030742645263671875, 0.03646659851074219, 0.0421905517578125, 0.04791450500488281, 0.053638458251953125, 0.05936241149902344, 0.06508636474609375, 0.07081031799316406, 0.07653427124023438, 0.08225822448730469, 0.087982177734375, 0.09370613098144531, 0.09943008422851562, 0.10515403747558594, 0.11087799072265625, 0.11660194396972656, 0.12232589721679688, 0.1280498504638672, 0.1337738037109375, 0.1394977569580078, 0.14522171020507812, 0.15094566345214844, 0.15666961669921875, 0.16239356994628906, 0.16811752319335938, 0.1738414764404297, 0.1795654296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 7.0, 16.0, 22.0, 26.0, 22.0, 37.0, 45.0, 31.0, 42.0, 49.0, 63.0, 49.0, 59.0, 66.0, 57.0, 58.0, 58.0, 50.0, 38.0, 37.0, 19.0, 31.0, 14.0, 22.0, 6.0, 12.0, 11.0, 3.0, 8.0, 6.0, 4.0, 6.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0498046875, -0.048293113708496094, -0.04678153991699219, -0.04526996612548828, -0.043758392333984375, -0.04224681854248047, -0.04073524475097656, -0.039223670959472656, -0.03771209716796875, -0.036200523376464844, -0.03468894958496094, -0.03317737579345703, -0.031665802001953125, -0.03015422821044922, -0.028642654418945312, -0.027131080627441406, -0.0256195068359375, -0.024107933044433594, -0.022596359252929688, -0.02108478546142578, -0.019573211669921875, -0.01806163787841797, -0.016550064086914062, -0.015038490295410156, -0.01352691650390625, -0.012015342712402344, -0.010503768920898438, -0.008992195129394531, -0.007480621337890625, -0.005969047546386719, -0.0044574737548828125, -0.0029458999633789062, -0.001434326171875, 7.724761962890625e-05, 0.0015888214111328125, 0.0031003952026367188, 0.004611968994140625, 0.006123542785644531, 0.0076351165771484375, 0.009146690368652344, 0.01065826416015625, 0.012169837951660156, 0.013681411743164062, 0.015192985534667969, 0.016704559326171875, 0.01821613311767578, 0.019727706909179688, 0.021239280700683594, 0.0227508544921875, 0.024262428283691406, 0.025774002075195312, 0.02728557586669922, 0.028797149658203125, 0.03030872344970703, 0.03182029724121094, 0.033331871032714844, 0.03484344482421875, 0.036355018615722656, 0.03786659240722656, 0.03937816619873047, 0.040889739990234375, 0.04240131378173828, 0.04391288757324219, 0.045424461364746094, 0.04693603515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 15.0, 11.0, 15.0, 22.0, 27.0, 38.0, 71.0, 95.0, 115.0, 174.0, 248.0, 391.0, 621.0, 998.0, 1631.0, 2917.0, 5498.0, 11448.0, 25666.0, 68843.0, 241242.0, 2519673.0, 1058666.0, 163493.0, 51514.0, 20568.0, 9319.0, 4647.0, 2485.0, 1396.0, 851.0, 530.0, 334.0, 231.0, 155.0, 94.0, 73.0, 54.0, 23.0, 25.0, 15.0, 17.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.143798828125, -0.13942337036132812, -0.13504791259765625, -0.13067245483398438, -0.1262969970703125, -0.12192153930664062, -0.11754608154296875, -0.11317062377929688, -0.108795166015625, -0.10441970825195312, -0.10004425048828125, -0.09566879272460938, -0.0912933349609375, -0.08691787719726562, -0.08254241943359375, -0.07816696166992188, -0.07379150390625, -0.06941604614257812, -0.06504058837890625, -0.060665130615234375, -0.0562896728515625, -0.051914215087890625, -0.04753875732421875, -0.043163299560546875, -0.038787841796875, -0.034412384033203125, -0.03003692626953125, -0.025661468505859375, -0.0212860107421875, -0.016910552978515625, -0.01253509521484375, -0.008159637451171875, -0.0037841796875, 0.000591278076171875, 0.00496673583984375, 0.009342193603515625, 0.0137176513671875, 0.018093109130859375, 0.02246856689453125, 0.026844024658203125, 0.031219482421875, 0.035594940185546875, 0.03997039794921875, 0.044345855712890625, 0.0487213134765625, 0.053096771240234375, 0.05747222900390625, 0.061847686767578125, 0.06622314453125, 0.07059860229492188, 0.07497406005859375, 0.07934951782226562, 0.0837249755859375, 0.08810043334960938, 0.09247589111328125, 0.09685134887695312, 0.101226806640625, 0.10560226440429688, 0.10997772216796875, 0.11435317993164062, 0.1187286376953125, 0.12310409545898438, 0.12747955322265625, 0.13185501098632812, 0.13623046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 7.0, 5.0, 9.0, 9.0, 14.0, 18.0, 23.0, 28.0, 27.0, 50.0, 61.0, 106.0, 175.0, 320.0, 798.0, 1307.0, 454.0, 245.0, 130.0, 96.0, 44.0, 32.0, 30.0, 18.0, 19.0, 8.0, 10.0, 6.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.07843017578125, -0.076202392578125, -0.073974609375, -0.071746826171875, -0.06951904296875, -0.067291259765625, -0.0650634765625, -0.062835693359375, -0.06060791015625, -0.058380126953125, -0.05615234375, -0.053924560546875, -0.05169677734375, -0.049468994140625, -0.0472412109375, -0.045013427734375, -0.04278564453125, -0.040557861328125, -0.038330078125, -0.036102294921875, -0.03387451171875, -0.031646728515625, -0.0294189453125, -0.027191162109375, -0.02496337890625, -0.022735595703125, -0.0205078125, -0.018280029296875, -0.01605224609375, -0.013824462890625, -0.0115966796875, -0.009368896484375, -0.00714111328125, -0.004913330078125, -0.002685546875, -0.000457763671875, 0.00177001953125, 0.003997802734375, 0.0062255859375, 0.008453369140625, 0.01068115234375, 0.012908935546875, 0.01513671875, 0.017364501953125, 0.01959228515625, 0.021820068359375, 0.0240478515625, 0.026275634765625, 0.02850341796875, 0.030731201171875, 0.032958984375, 0.035186767578125, 0.03741455078125, 0.039642333984375, 0.0418701171875, 0.044097900390625, 0.04632568359375, 0.048553466796875, 0.05078125, 0.053009033203125, 0.05523681640625, 0.057464599609375, 0.0596923828125, 0.061920166015625, 0.06414794921875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 13.0, 16.0, 34.0, 48.0, 66.0, 79.0, 95.0, 92.0, 103.0, 101.0, 89.0, 87.0, 52.0, 37.0, 24.0, 20.0, 10.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3733952045440674, -0.35986822843551636, -0.34634125232696533, -0.3328142762184143, -0.3192873001098633, -0.30576032400131226, -0.29223334789276123, -0.2787063717842102, -0.2651793956756592, -0.25165241956710815, -0.23812544345855713, -0.2245984673500061, -0.21107149124145508, -0.19754451513290405, -0.18401755392551422, -0.1704905778169632, -0.15696361660957336, -0.14343664050102234, -0.1299096643924713, -0.11638269573450089, -0.10285571962594986, -0.08932874351739883, -0.0758017748594284, -0.06227479875087738, -0.048747822642326355, -0.03522084653377533, -0.021693874150514603, -0.008166901767253876, 0.00536007434129715, 0.018887050449848175, 0.032414019107818604, 0.04594099521636963, 0.05946794152259827, 0.07299491763114929, 0.08652189373970032, 0.10004886239767075, 0.11357583850622177, 0.1271028220653534, 0.14062978327274323, 0.15415675938129425, 0.16768373548984528, 0.1812107115983963, 0.19473768770694733, 0.20826464891433716, 0.22179162502288818, 0.2353186011314392, 0.24884557723999023, 0.26237255334854126, 0.2758995294570923, 0.2894265055656433, 0.30295348167419434, 0.31648045778274536, 0.3300074338912964, 0.3435344099998474, 0.35706138610839844, 0.37058836221694946, 0.3841153383255005, 0.3976423144340515, 0.41116929054260254, 0.42469626665115356, 0.4382232427597046, 0.4517502188682556, 0.46527719497680664, 0.47880417108535767, 0.4923311173915863]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 2.0, 13.0, 6.0, 11.0, 10.0, 13.0, 15.0, 19.0, 34.0, 27.0, 22.0, 34.0, 33.0, 31.0, 36.0, 36.0, 45.0, 40.0, 42.0, 32.0, 34.0, 44.0, 36.0, 33.0, 46.0, 33.0, 28.0, 34.0, 27.0, 23.0, 23.0, 17.0, 18.0, 21.0, 10.0, 15.0, 10.0, 10.0, 5.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22394448518753052, -0.2160816788673401, -0.20821885764598846, -0.20035603642463684, -0.1924932301044464, -0.18463042378425598, -0.17676760256290436, -0.16890478134155273, -0.1610419750213623, -0.15317916870117188, -0.14531634747982025, -0.13745352625846863, -0.1295907199382782, -0.12172790616750717, -0.11386509239673615, -0.10600227862596512, -0.09813946485519409, -0.09027665108442307, -0.08241383731365204, -0.07455102354288101, -0.06668820977210999, -0.05882539600133896, -0.05096258223056793, -0.043099768459796906, -0.03523695468902588, -0.027374140918254852, -0.019511327147483826, -0.011648513376712799, -0.0037856996059417725, 0.004077114164829254, 0.01193992793560028, 0.019802741706371307, 0.027665555477142334, 0.03552836924791336, 0.04339118301868439, 0.051253996789455414, 0.05911681056022644, 0.06697962433099747, 0.0748424381017685, 0.08270525187253952, 0.09056806564331055, 0.09843087941408157, 0.1062936931848526, 0.11415650695562363, 0.12201932072639465, 0.12988212704658508, 0.1377449482679367, 0.14560776948928833, 0.15347057580947876, 0.1613333821296692, 0.1691962033510208, 0.17705902457237244, 0.18492183089256287, 0.1927846372127533, 0.20064745843410492, 0.20851027965545654, 0.21637308597564697, 0.2242358922958374, 0.23209871351718903, 0.23996153473854065, 0.24782434105873108, 0.2556871473789215, 0.2635499835014343, 0.27141278982162476, 0.2792755961418152]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 15.0, 18.0, 31.0, 35.0, 74.0, 129.0, 183.0, 310.0, 562.0, 965.0, 1841.0, 3500.0, 6742.0, 13667.0, 27426.0, 55606.0, 112224.0, 229189.0, 292245.0, 152645.0, 75911.0, 37570.0, 18262.0, 9180.0, 4743.0, 2375.0, 1338.0, 756.0, 377.0, 250.0, 142.0, 84.0, 57.0, 37.0, 23.0, 16.0, 7.0, 11.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1485595703125, -0.14434146881103516, -0.1401233673095703, -0.13590526580810547, -0.13168716430664062, -0.12746906280517578, -0.12325096130371094, -0.1190328598022461, -0.11481475830078125, -0.1105966567993164, -0.10637855529785156, -0.10216045379638672, -0.09794235229492188, -0.09372425079345703, -0.08950614929199219, -0.08528804779052734, -0.0810699462890625, -0.07685184478759766, -0.07263374328613281, -0.06841564178466797, -0.06419754028320312, -0.05997943878173828, -0.05576133728027344, -0.051543235778808594, -0.04732513427734375, -0.043107032775878906, -0.03888893127441406, -0.03467082977294922, -0.030452728271484375, -0.02623462677001953, -0.022016525268554688, -0.017798423767089844, -0.013580322265625, -0.009362220764160156, -0.0051441192626953125, -0.0009260177612304688, 0.003292083740234375, 0.007510185241699219, 0.011728286743164062, 0.015946388244628906, 0.02016448974609375, 0.024382591247558594, 0.028600692749023438, 0.03281879425048828, 0.037036895751953125, 0.04125499725341797, 0.04547309875488281, 0.049691200256347656, 0.0539093017578125, 0.058127403259277344, 0.06234550476074219, 0.06656360626220703, 0.07078170776367188, 0.07499980926513672, 0.07921791076660156, 0.0834360122680664, 0.08765411376953125, 0.0918722152709961, 0.09609031677246094, 0.10030841827392578, 0.10452651977539062, 0.10874462127685547, 0.11296272277832031, 0.11718082427978516, 0.12139892578125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 11.0, 13.0, 19.0, 20.0, 24.0, 27.0, 20.0, 38.0, 48.0, 48.0, 49.0, 38.0, 44.0, 52.0, 51.0, 58.0, 54.0, 61.0, 46.0, 39.0, 34.0, 35.0, 23.0, 33.0, 17.0, 20.0, 12.0, 8.0, 11.0, 10.0, 3.0, 6.0, 3.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.047576904296875, -0.046154022216796875, -0.04473114013671875, -0.043308258056640625, -0.0418853759765625, -0.040462493896484375, -0.03903961181640625, -0.037616729736328125, -0.03619384765625, -0.034770965576171875, -0.03334808349609375, -0.031925201416015625, -0.0305023193359375, -0.029079437255859375, -0.02765655517578125, -0.026233673095703125, -0.024810791015625, -0.023387908935546875, -0.02196502685546875, -0.020542144775390625, -0.0191192626953125, -0.017696380615234375, -0.01627349853515625, -0.014850616455078125, -0.013427734375, -0.012004852294921875, -0.01058197021484375, -0.009159088134765625, -0.0077362060546875, -0.006313323974609375, -0.00489044189453125, -0.003467559814453125, -0.002044677734375, -0.000621795654296875, 0.00080108642578125, 0.002223968505859375, 0.0036468505859375, 0.005069732666015625, 0.00649261474609375, 0.007915496826171875, 0.00933837890625, 0.010761260986328125, 0.01218414306640625, 0.013607025146484375, 0.0150299072265625, 0.016452789306640625, 0.01787567138671875, 0.019298553466796875, 0.020721435546875, 0.022144317626953125, 0.02356719970703125, 0.024990081787109375, 0.0264129638671875, 0.027835845947265625, 0.02925872802734375, 0.030681610107421875, 0.0321044921875, 0.033527374267578125, 0.03495025634765625, 0.036373138427734375, 0.0377960205078125, 0.039218902587890625, 0.04064178466796875, 0.042064666748046875, 0.043487548828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 2.0, 4.0, 8.0, 10.0, 14.0, 24.0, 29.0, 31.0, 39.0, 71.0, 58.0, 102.0, 144.0, 227.0, 350.0, 520.0, 943.0, 1866.0, 4623.0, 15741.0, 63439.0, 250382.0, 486325.0, 165009.0, 40917.0, 10623.0, 3362.0, 1442.0, 754.0, 499.0, 282.0, 195.0, 149.0, 120.0, 67.0, 47.0, 38.0, 30.0, 17.0, 12.0, 13.0, 9.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.219970703125, -0.21356582641601562, -0.20716094970703125, -0.20075607299804688, -0.1943511962890625, -0.18794631958007812, -0.18154144287109375, -0.17513656616210938, -0.168731689453125, -0.16232681274414062, -0.15592193603515625, -0.14951705932617188, -0.1431121826171875, -0.13670730590820312, -0.13030242919921875, -0.12389755249023438, -0.11749267578125, -0.11108779907226562, -0.10468292236328125, -0.09827804565429688, -0.0918731689453125, -0.08546829223632812, -0.07906341552734375, -0.07265853881835938, -0.066253662109375, -0.059848785400390625, -0.05344390869140625, -0.047039031982421875, -0.0406341552734375, -0.034229278564453125, -0.02782440185546875, -0.021419525146484375, -0.0150146484375, -0.008609771728515625, -0.00220489501953125, 0.004199981689453125, 0.0106048583984375, 0.017009735107421875, 0.02341461181640625, 0.029819488525390625, 0.036224365234375, 0.042629241943359375, 0.04903411865234375, 0.055438995361328125, 0.0618438720703125, 0.06824874877929688, 0.07465362548828125, 0.08105850219726562, 0.08746337890625, 0.09386825561523438, 0.10027313232421875, 0.10667800903320312, 0.1130828857421875, 0.11948776245117188, 0.12589263916015625, 0.13229751586914062, 0.138702392578125, 0.14510726928710938, 0.15151214599609375, 0.15791702270507812, 0.1643218994140625, 0.17072677612304688, 0.17713165283203125, 0.18353652954101562, 0.18994140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 6.0, 12.0, 15.0, 15.0, 19.0, 25.0, 33.0, 24.0, 30.0, 29.0, 34.0, 47.0, 35.0, 48.0, 55.0, 46.0, 45.0, 46.0, 50.0, 38.0, 30.0, 37.0, 38.0, 37.0, 34.0, 26.0, 31.0, 21.0, 13.0, 15.0, 13.0, 6.0, 5.0, 7.0, 4.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.1577930450439453, -0.15188980102539062, -0.14598655700683594, -0.14008331298828125, -0.13418006896972656, -0.12827682495117188, -0.12237358093261719, -0.1164703369140625, -0.11056709289550781, -0.10466384887695312, -0.09876060485839844, -0.09285736083984375, -0.08695411682128906, -0.08105087280273438, -0.07514762878417969, -0.069244384765625, -0.06334114074707031, -0.057437896728515625, -0.05153465270996094, -0.04563140869140625, -0.03972816467285156, -0.033824920654296875, -0.027921676635742188, -0.0220184326171875, -0.016115188598632812, -0.010211944580078125, -0.0043087005615234375, 0.00159454345703125, 0.0074977874755859375, 0.013401031494140625, 0.019304275512695312, 0.02520751953125, 0.031110763549804688, 0.037014007568359375, 0.04291725158691406, 0.04882049560546875, 0.05472373962402344, 0.060626983642578125, 0.06653022766113281, 0.0724334716796875, 0.07833671569824219, 0.08423995971679688, 0.09014320373535156, 0.09604644775390625, 0.10194969177246094, 0.10785293579101562, 0.11375617980957031, 0.119659423828125, 0.1255626678466797, 0.13146591186523438, 0.13736915588378906, 0.14327239990234375, 0.14917564392089844, 0.15507888793945312, 0.1609821319580078, 0.1668853759765625, 0.1727886199951172, 0.17869186401367188, 0.18459510803222656, 0.19049835205078125, 0.19640159606933594, 0.20230484008789062, 0.2082080841064453, 0.214111328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 7.0, 17.0, 24.0, 17.0, 49.0, 54.0, 95.0, 169.0, 221.0, 378.0, 653.0, 1232.0, 2420.0, 5434.0, 13416.0, 41961.0, 186219.0, 558195.0, 175201.0, 39299.0, 12839.0, 5285.0, 2443.0, 1187.0, 660.0, 408.0, 221.0, 163.0, 81.0, 60.0, 42.0, 31.0, 28.0, 18.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11572265625, -0.11179733276367188, -0.10787200927734375, -0.10394668579101562, -0.1000213623046875, -0.09609603881835938, -0.09217071533203125, -0.08824539184570312, -0.084320068359375, -0.08039474487304688, -0.07646942138671875, -0.07254409790039062, -0.0686187744140625, -0.06469345092773438, -0.06076812744140625, -0.056842803955078125, -0.05291748046875, -0.048992156982421875, -0.04506683349609375, -0.041141510009765625, -0.0372161865234375, -0.033290863037109375, -0.02936553955078125, -0.025440216064453125, -0.021514892578125, -0.017589569091796875, -0.01366424560546875, -0.009738922119140625, -0.0058135986328125, -0.001888275146484375, 0.00203704833984375, 0.005962371826171875, 0.0098876953125, 0.013813018798828125, 0.01773834228515625, 0.021663665771484375, 0.0255889892578125, 0.029514312744140625, 0.03343963623046875, 0.037364959716796875, 0.041290283203125, 0.045215606689453125, 0.04914093017578125, 0.053066253662109375, 0.0569915771484375, 0.060916900634765625, 0.06484222412109375, 0.06876754760742188, 0.07269287109375, 0.07661819458007812, 0.08054351806640625, 0.08446884155273438, 0.0883941650390625, 0.09231948852539062, 0.09624481201171875, 0.10017013549804688, 0.104095458984375, 0.10802078247070312, 0.11194610595703125, 0.11587142944335938, 0.1197967529296875, 0.12372207641601562, 0.12764739990234375, 0.13157272338867188, 0.135498046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 3.0, 2.0, 5.0, 4.0, 7.0, 4.0, 7.0, 8.0, 14.0, 28.0, 20.0, 25.0, 29.0, 49.0, 42.0, 52.0, 39.0, 73.0, 52.0, 57.0, 55.0, 74.0, 54.0, 58.0, 31.0, 43.0, 25.0, 29.0, 18.0, 19.0, 19.0, 8.0, 9.0, 6.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-5.7697296142578125e-05, -5.596969276666641e-05, -5.42420893907547e-05, -5.251448601484299e-05, -5.0786882638931274e-05, -4.905927926301956e-05, -4.733167588710785e-05, -4.5604072511196136e-05, -4.3876469135284424e-05, -4.214886575937271e-05, -4.0421262383461e-05, -3.8693659007549286e-05, -3.696605563163757e-05, -3.523845225572586e-05, -3.351084887981415e-05, -3.1783245503902435e-05, -3.0055642127990723e-05, -2.832803875207901e-05, -2.6600435376167297e-05, -2.4872832000255585e-05, -2.3145228624343872e-05, -2.141762524843216e-05, -1.9690021872520447e-05, -1.7962418496608734e-05, -1.623481512069702e-05, -1.4507211744785309e-05, -1.2779608368873596e-05, -1.1052004992961884e-05, -9.324401617050171e-06, -7.596798241138458e-06, -5.869194865226746e-06, -4.141591489315033e-06, -2.4139881134033203e-06, -6.863847374916077e-07, 1.041218638420105e-06, 2.7688220143318176e-06, 4.49642539024353e-06, 6.224028766155243e-06, 7.951632142066956e-06, 9.679235517978668e-06, 1.1406838893890381e-05, 1.3134442269802094e-05, 1.4862045645713806e-05, 1.658964902162552e-05, 1.831725239753723e-05, 2.0044855773448944e-05, 2.1772459149360657e-05, 2.350006252527237e-05, 2.5227665901184082e-05, 2.6955269277095795e-05, 2.8682872653007507e-05, 3.041047602891922e-05, 3.213807940483093e-05, 3.3865682780742645e-05, 3.559328615665436e-05, 3.732088953256607e-05, 3.904849290847778e-05, 4.0776096284389496e-05, 4.250369966030121e-05, 4.423130303621292e-05, 4.5958906412124634e-05, 4.7686509788036346e-05, 4.941411316394806e-05, 5.114171653985977e-05, 5.2869319915771484e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 15.0, 15.0, 21.0, 29.0, 42.0, 59.0, 80.0, 116.0, 202.0, 390.0, 769.0, 1668.0, 4286.0, 13076.0, 51713.0, 389074.0, 496643.0, 66137.0, 15336.0, 4981.0, 1953.0, 858.0, 383.0, 271.0, 130.0, 90.0, 58.0, 50.0, 24.0, 8.0, 13.0, 14.0, 7.0, 8.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.1431884765625, -0.13872337341308594, -0.13425827026367188, -0.1297931671142578, -0.12532806396484375, -0.12086296081542969, -0.11639785766601562, -0.11193275451660156, -0.1074676513671875, -0.10300254821777344, -0.09853744506835938, -0.09407234191894531, -0.08960723876953125, -0.08514213562011719, -0.08067703247070312, -0.07621192932128906, -0.071746826171875, -0.06728172302246094, -0.06281661987304688, -0.05835151672363281, -0.05388641357421875, -0.04942131042480469, -0.044956207275390625, -0.04049110412597656, -0.0360260009765625, -0.03156089782714844, -0.027095794677734375, -0.022630691528320312, -0.01816558837890625, -0.013700485229492188, -0.009235382080078125, -0.0047702789306640625, -0.00030517578125, 0.0041599273681640625, 0.008625030517578125, 0.013090133666992188, 0.01755523681640625, 0.022020339965820312, 0.026485443115234375, 0.030950546264648438, 0.0354156494140625, 0.03988075256347656, 0.044345855712890625, 0.04881095886230469, 0.05327606201171875, 0.05774116516113281, 0.062206268310546875, 0.06667137145996094, 0.071136474609375, 0.07560157775878906, 0.08006668090820312, 0.08453178405761719, 0.08899688720703125, 0.09346199035644531, 0.09792709350585938, 0.10239219665527344, 0.1068572998046875, 0.11132240295410156, 0.11578750610351562, 0.12025260925292969, 0.12471771240234375, 0.1291828155517578, 0.13364791870117188, 0.13811302185058594, 0.142578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 4.0, 6.0, 5.0, 11.0, 16.0, 27.0, 54.0, 61.0, 113.0, 142.0, 170.0, 127.0, 85.0, 60.0, 36.0, 23.0, 14.0, 11.0, 13.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1988525390625, -0.19436073303222656, -0.18986892700195312, -0.1853771209716797, -0.18088531494140625, -0.1763935089111328, -0.17190170288085938, -0.16740989685058594, -0.1629180908203125, -0.15842628479003906, -0.15393447875976562, -0.1494426727294922, -0.14495086669921875, -0.1404590606689453, -0.13596725463867188, -0.13147544860839844, -0.126983642578125, -0.12249183654785156, -0.11800003051757812, -0.11350822448730469, -0.10901641845703125, -0.10452461242675781, -0.10003280639648438, -0.09554100036621094, -0.0910491943359375, -0.08655738830566406, -0.08206558227539062, -0.07757377624511719, -0.07308197021484375, -0.06859016418457031, -0.06409835815429688, -0.05960655212402344, -0.05511474609375, -0.05062294006347656, -0.046131134033203125, -0.04163932800292969, -0.03714752197265625, -0.03265571594238281, -0.028163909912109375, -0.023672103881835938, -0.0191802978515625, -0.014688491821289062, -0.010196685791015625, -0.0057048797607421875, -0.00121307373046875, 0.0032787322998046875, 0.007770538330078125, 0.012262344360351562, 0.016754150390625, 0.021245956420898438, 0.025737762451171875, 0.030229568481445312, 0.03472137451171875, 0.03921318054199219, 0.043704986572265625, 0.04819679260253906, 0.0526885986328125, 0.05718040466308594, 0.061672210693359375, 0.06616401672363281, 0.07065582275390625, 0.07514762878417969, 0.07963943481445312, 0.08413124084472656, 0.088623046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 13.0, 24.0, 54.0, 84.0, 152.0, 189.0, 166.0, 131.0, 82.0, 59.0, 25.0, 12.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.302182197570801, -2.243377685546875, -2.18457293510437, -2.1257684230804443, -2.0669639110565186, -2.0081591606140137, -1.949354648590088, -1.890550136566162, -1.8317455053329468, -1.7729408740997314, -1.7141363620758057, -1.6553317308425903, -1.5965272188186646, -1.5377225875854492, -1.4789180755615234, -1.420113444328308, -1.3613088130950928, -1.3025041818618774, -1.2436996698379517, -1.1848950386047363, -1.1260905265808105, -1.0672858953475952, -1.0084812641143799, -0.9496767520904541, -0.8908722400665283, -0.8320676684379578, -0.7732630968093872, -0.7144584655761719, -0.6556538939476013, -0.5968493223190308, -0.5380447506904602, -0.47924014925956726, -0.4204355478286743, -0.36163097620010376, -0.3028263747692108, -0.24402180314064026, -0.1852172166109085, -0.12641263008117676, -0.0676080584526062, -0.008803457021713257, 0.0500011146068573, 0.10880570113658905, 0.1676102876663208, 0.22641485929489136, 0.2852194309234619, 0.34402403235435486, 0.4028286039829254, 0.46163320541381836, 0.5204377770423889, 0.5792423486709595, 0.63804692029953, 0.6968514919281006, 0.7556561231613159, 0.8144606947898865, 0.873265266418457, 0.9320698976516724, 0.9908744096755981, 1.0496790409088135, 1.1084835529327393, 1.1672881841659546, 1.2260926961898804, 1.2848973274230957, 1.3437018394470215, 1.4025064706802368, 1.4613111019134521]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 12.0, 8.0, 6.0, 5.0, 5.0, 15.0, 14.0, 29.0, 14.0, 24.0, 26.0, 41.0, 34.0, 33.0, 41.0, 28.0, 32.0, 29.0, 41.0, 40.0, 37.0, 42.0, 37.0, 44.0, 36.0, 31.0, 26.0, 27.0, 24.0, 29.0, 31.0, 24.0, 15.0, 20.0, 11.0, 12.0, 11.0, 11.0, 9.0, 7.0, 3.0, 6.0, 9.0, 0.0, 9.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.9869225025177002, -0.9588083028793335, -0.9306941628456116, -0.9025799632072449, -0.8744657635688782, -0.8463516235351562, -0.8182374238967896, -0.7901232242584229, -0.7620090246200562, -0.7338948249816895, -0.7057806849479675, -0.6776664853096008, -0.6495522856712341, -0.6214381456375122, -0.5933239459991455, -0.5652097463607788, -0.5370956063270569, -0.5089814066886902, -0.4808672368526459, -0.45275306701660156, -0.42463886737823486, -0.39652469754219055, -0.36841052770614624, -0.34029632806777954, -0.31218215823173523, -0.2840679883956909, -0.2559537887573242, -0.2278396189212799, -0.1997254341840744, -0.1716112494468689, -0.14349707961082458, -0.11538289487361908, -0.08726876974105835, -0.05915458872914314, -0.031040407717227936, -0.0029262304306030273, 0.025187954306602478, 0.05330213904380798, 0.0814163088798523, 0.1095304936170578, 0.1376446783542633, 0.1657588630914688, 0.19387304782867432, 0.22198721766471863, 0.25010138750076294, 0.27821558713912964, 0.30632975697517395, 0.33444392681121826, 0.36255812644958496, 0.3906722962856293, 0.41878649592399597, 0.4469006657600403, 0.475014865398407, 0.5031290054321289, 0.5312432050704956, 0.5593574047088623, 0.587471604347229, 0.6155858039855957, 0.6436999440193176, 0.6718141436576843, 0.699928343296051, 0.728042483329773, 0.7561566829681396, 0.7842708826065063, 0.8123850226402283]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 8.0, 10.0, 4.0, 23.0, 23.0, 43.0, 60.0, 107.0, 125.0, 204.0, 376.0, 544.0, 1024.0, 1751.0, 3501.0, 7321.0, 17220.0, 47364.0, 172935.0, 2597360.0, 1141655.0, 133953.0, 39854.0, 15121.0, 6508.0, 3117.0, 1732.0, 915.0, 508.0, 301.0, 203.0, 131.0, 81.0, 58.0, 44.0, 26.0, 18.0, 14.0, 9.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.148193359375, -0.14323997497558594, -0.13828659057617188, -0.1333332061767578, -0.12837982177734375, -0.12342643737792969, -0.11847305297851562, -0.11351966857910156, -0.1085662841796875, -0.10361289978027344, -0.09865951538085938, -0.09370613098144531, -0.08875274658203125, -0.08379936218261719, -0.07884597778320312, -0.07389259338378906, -0.068939208984375, -0.06398582458496094, -0.059032440185546875, -0.05407905578613281, -0.04912567138671875, -0.04417228698730469, -0.039218902587890625, -0.03426551818847656, -0.0293121337890625, -0.024358749389648438, -0.019405364990234375, -0.014451980590820312, -0.00949859619140625, -0.0045452117919921875, 0.000408172607421875, 0.0053615570068359375, 0.01031494140625, 0.015268325805664062, 0.020221710205078125, 0.025175094604492188, 0.03012847900390625, 0.03508186340332031, 0.040035247802734375, 0.04498863220214844, 0.0499420166015625, 0.05489540100097656, 0.059848785400390625, 0.06480216979980469, 0.06975555419921875, 0.07470893859863281, 0.07966232299804688, 0.08461570739746094, 0.089569091796875, 0.09452247619628906, 0.09947586059570312, 0.10442924499511719, 0.10938262939453125, 0.11433601379394531, 0.11928939819335938, 0.12424278259277344, 0.1291961669921875, 0.13414955139160156, 0.13910293579101562, 0.1440563201904297, 0.14900970458984375, 0.1539630889892578, 0.15891647338867188, 0.16386985778808594, 0.1688232421875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 7.0, 14.0, 12.0, 23.0, 19.0, 31.0, 24.0, 36.0, 44.0, 36.0, 56.0, 45.0, 44.0, 70.0, 60.0, 64.0, 63.0, 52.0, 46.0, 38.0, 40.0, 39.0, 23.0, 22.0, 17.0, 14.0, 9.0, 8.0, 10.0, 7.0, 4.0, 3.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04901123046875, -0.04739570617675781, -0.045780181884765625, -0.04416465759277344, -0.04254913330078125, -0.04093360900878906, -0.039318084716796875, -0.03770256042480469, -0.0360870361328125, -0.03447151184082031, -0.032855987548828125, -0.031240463256835938, -0.02962493896484375, -0.028009414672851562, -0.026393890380859375, -0.024778366088867188, -0.023162841796875, -0.021547317504882812, -0.019931793212890625, -0.018316268920898438, -0.01670074462890625, -0.015085220336914062, -0.013469696044921875, -0.011854171752929688, -0.0102386474609375, -0.008623123168945312, -0.007007598876953125, -0.0053920745849609375, -0.00377655029296875, -0.0021610260009765625, -0.000545501708984375, 0.0010700225830078125, 0.002685546875, 0.0043010711669921875, 0.005916595458984375, 0.0075321197509765625, 0.00914764404296875, 0.010763168334960938, 0.012378692626953125, 0.013994216918945312, 0.0156097412109375, 0.017225265502929688, 0.018840789794921875, 0.020456314086914062, 0.02207183837890625, 0.023687362670898438, 0.025302886962890625, 0.026918411254882812, 0.028533935546875, 0.030149459838867188, 0.031764984130859375, 0.03338050842285156, 0.03499603271484375, 0.03661155700683594, 0.038227081298828125, 0.03984260559082031, 0.0414581298828125, 0.04307365417480469, 0.044689178466796875, 0.04630470275878906, 0.04792022705078125, 0.04953575134277344, 0.051151275634765625, 0.05276679992675781, 0.05438232421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 6.0, 10.0, 13.0, 28.0, 25.0, 42.0, 71.0, 80.0, 171.0, 245.0, 413.0, 569.0, 1016.0, 1877.0, 3399.0, 7033.0, 15267.0, 36543.0, 102563.0, 386745.0, 2705067.0, 695706.0, 149714.0, 49771.0, 19435.0, 8859.0, 4178.0, 2242.0, 1195.0, 713.0, 471.0, 270.0, 184.0, 117.0, 79.0, 53.0, 31.0, 26.0, 13.0, 9.0, 11.0, 8.0, 1.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1383056640625, -0.13407135009765625, -0.1298370361328125, -0.12560272216796875, -0.121368408203125, -0.11713409423828125, -0.1128997802734375, -0.10866546630859375, -0.10443115234375, -0.10019683837890625, -0.0959625244140625, -0.09172821044921875, -0.087493896484375, -0.08325958251953125, -0.0790252685546875, -0.07479095458984375, -0.070556640625, -0.06632232666015625, -0.0620880126953125, -0.05785369873046875, -0.053619384765625, -0.04938507080078125, -0.0451507568359375, -0.04091644287109375, -0.03668212890625, -0.03244781494140625, -0.0282135009765625, -0.02397918701171875, -0.019744873046875, -0.01551055908203125, -0.0112762451171875, -0.00704193115234375, -0.0028076171875, 0.00142669677734375, 0.0056610107421875, 0.00989532470703125, 0.014129638671875, 0.01836395263671875, 0.0225982666015625, 0.02683258056640625, 0.03106689453125, 0.03530120849609375, 0.0395355224609375, 0.04376983642578125, 0.048004150390625, 0.05223846435546875, 0.0564727783203125, 0.06070709228515625, 0.06494140625, 0.06917572021484375, 0.0734100341796875, 0.07764434814453125, 0.081878662109375, 0.08611297607421875, 0.0903472900390625, 0.09458160400390625, 0.09881591796875, 0.10305023193359375, 0.1072845458984375, 0.11151885986328125, 0.115753173828125, 0.11998748779296875, 0.1242218017578125, 0.12845611572265625, 0.1326904296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 9.0, 7.0, 9.0, 10.0, 19.0, 25.0, 25.0, 42.0, 63.0, 70.0, 101.0, 177.0, 261.0, 457.0, 1065.0, 766.0, 330.0, 195.0, 142.0, 87.0, 53.0, 45.0, 32.0, 21.0, 14.0, 13.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0841064453125, -0.08154487609863281, -0.07898330688476562, -0.07642173767089844, -0.07386016845703125, -0.07129859924316406, -0.06873703002929688, -0.06617546081542969, -0.0636138916015625, -0.06105232238769531, -0.058490753173828125, -0.05592918395996094, -0.05336761474609375, -0.05080604553222656, -0.048244476318359375, -0.04568290710449219, -0.043121337890625, -0.04055976867675781, -0.037998199462890625, -0.03543663024902344, -0.03287506103515625, -0.030313491821289062, -0.027751922607421875, -0.025190353393554688, -0.0226287841796875, -0.020067214965820312, -0.017505645751953125, -0.014944076538085938, -0.01238250732421875, -0.009820938110351562, -0.007259368896484375, -0.0046977996826171875, -0.00213623046875, 0.0004253387451171875, 0.002986907958984375, 0.0055484771728515625, 0.00811004638671875, 0.010671615600585938, 0.013233184814453125, 0.015794754028320312, 0.0183563232421875, 0.020917892456054688, 0.023479461669921875, 0.026041030883789062, 0.02860260009765625, 0.031164169311523438, 0.033725738525390625, 0.03628730773925781, 0.038848876953125, 0.04141044616699219, 0.043972015380859375, 0.04653358459472656, 0.04909515380859375, 0.05165672302246094, 0.054218292236328125, 0.05677986145019531, 0.0593414306640625, 0.06190299987792969, 0.06446456909179688, 0.06702613830566406, 0.06958770751953125, 0.07214927673339844, 0.07471084594726562, 0.07727241516113281, 0.079833984375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 12.0, 28.0, 47.0, 68.0, 120.0, 137.0, 136.0, 116.0, 125.0, 88.0, 58.0, 29.0, 15.0, 9.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.1035006046295166, -1.0809924602508545, -1.058484435081482, -1.0359762907028198, -1.0134681463241577, -0.9909600615501404, -0.968451976776123, -0.9459438323974609, -0.9234357476234436, -0.9009276628494263, -0.8784195184707642, -0.8559114336967468, -0.8334033489227295, -0.8108952045440674, -0.78838711977005, -0.7658790349960327, -0.7433708906173706, -0.7208628058433533, -0.6983546614646912, -0.6758465766906738, -0.6533384323120117, -0.6308303475379944, -0.608322262763977, -0.5858141183853149, -0.5633060336112976, -0.5407979488372803, -0.5182898044586182, -0.49578171968460083, -0.4732736051082611, -0.4507654905319214, -0.42825740575790405, -0.40574929118156433, -0.3832412362098694, -0.36073312163352966, -0.33822500705718994, -0.3157169222831726, -0.2932088077068329, -0.27070069313049316, -0.24819259345531464, -0.2256844937801361, -0.2031763792037964, -0.18066826462745667, -0.15816016495227814, -0.1356520652770996, -0.11314395070075989, -0.09063584357500076, -0.06812773644924164, -0.04561963677406311, -0.02311152219772339, -0.0006034150719642639, 0.02190469205379486, 0.044412799179553986, 0.06692090630531311, 0.08942901343107224, 0.11193712055683136, 0.1344452202320099, 0.1569533348083496, 0.17946144938468933, 0.20196954905986786, 0.2244776487350464, 0.2469857633113861, 0.26949387788772583, 0.29200196266174316, 0.3145100772380829, 0.3370181918144226]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 2.0, 11.0, 7.0, 10.0, 20.0, 19.0, 18.0, 16.0, 25.0, 23.0, 31.0, 36.0, 43.0, 39.0, 45.0, 52.0, 46.0, 44.0, 45.0, 43.0, 45.0, 45.0, 44.0, 39.0, 26.0, 27.0, 35.0, 21.0, 23.0, 20.0, 21.0, 10.0, 10.0, 4.0, 4.0, 9.0, 14.0, 5.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31915968656539917, -0.3087106943130493, -0.2982616722583771, -0.28781265020370483, -0.277363657951355, -0.2669146656990051, -0.2564656436443329, -0.24601663649082184, -0.2355676293373108, -0.22511862218379974, -0.2146696150302887, -0.20422060787677765, -0.1937716007232666, -0.18332259356975555, -0.1728735864162445, -0.16242457926273346, -0.1519755721092224, -0.14152656495571136, -0.13107755780220032, -0.12062855064868927, -0.11017954349517822, -0.09973053634166718, -0.08928152918815613, -0.07883252203464508, -0.06838351488113403, -0.057934507727622986, -0.04748550057411194, -0.03703649342060089, -0.026587486267089844, -0.016138479113578796, -0.005689471960067749, 0.004759535193443298, 0.015208542346954346, 0.025657549500465393, 0.03610655665397644, 0.04655556380748749, 0.057004570960998535, 0.06745357811450958, 0.07790258526802063, 0.08835159242153168, 0.09880059957504272, 0.10924960672855377, 0.11969861388206482, 0.13014762103557587, 0.14059662818908691, 0.15104563534259796, 0.161494642496109, 0.17194364964962006, 0.1823926568031311, 0.19284166395664215, 0.2032906711101532, 0.21373967826366425, 0.2241886854171753, 0.23463769257068634, 0.2450866997241974, 0.25553572177886963, 0.2659847140312195, 0.27643370628356934, 0.2868827283382416, 0.2973317503929138, 0.30778074264526367, 0.3182297348976135, 0.32867875695228577, 0.339127779006958, 0.34957677125930786]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 11.0, 12.0, 18.0, 33.0, 44.0, 58.0, 111.0, 173.0, 312.0, 523.0, 968.0, 1898.0, 3993.0, 8796.0, 21329.0, 58272.0, 212845.0, 551891.0, 120120.0, 39230.0, 15138.0, 6468.0, 2992.0, 1477.0, 808.0, 399.0, 253.0, 122.0, 85.0, 60.0, 31.0, 34.0, 21.0, 8.0, 4.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2281494140625, -0.22150039672851562, -0.21485137939453125, -0.20820236206054688, -0.2015533447265625, -0.19490432739257812, -0.18825531005859375, -0.18160629272460938, -0.174957275390625, -0.16830825805664062, -0.16165924072265625, -0.15501022338867188, -0.1483612060546875, -0.14171218872070312, -0.13506317138671875, -0.12841415405273438, -0.12176513671875, -0.11511611938476562, -0.10846710205078125, -0.10181808471679688, -0.0951690673828125, -0.08852005004882812, -0.08187103271484375, -0.07522201538085938, -0.068572998046875, -0.061923980712890625, -0.05527496337890625, -0.048625946044921875, -0.0419769287109375, -0.035327911376953125, -0.02867889404296875, -0.022029876708984375, -0.015380859375, -0.008731842041015625, -0.00208282470703125, 0.004566192626953125, 0.0112152099609375, 0.017864227294921875, 0.02451324462890625, 0.031162261962890625, 0.037811279296875, 0.044460296630859375, 0.05110931396484375, 0.057758331298828125, 0.0644073486328125, 0.07105636596679688, 0.07770538330078125, 0.08435440063476562, 0.09100341796875, 0.09765243530273438, 0.10430145263671875, 0.11095046997070312, 0.1175994873046875, 0.12424850463867188, 0.13089752197265625, 0.13754653930664062, 0.144195556640625, 0.15084457397460938, 0.15749359130859375, 0.16414260864257812, 0.1707916259765625, 0.17744064331054688, 0.18408966064453125, 0.19073867797851562, 0.1973876953125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 17.0, 8.0, 14.0, 21.0, 22.0, 24.0, 30.0, 38.0, 49.0, 32.0, 46.0, 59.0, 53.0, 62.0, 58.0, 66.0, 62.0, 57.0, 51.0, 41.0, 39.0, 27.0, 15.0, 18.0, 24.0, 14.0, 9.0, 9.0, 8.0, 6.0, 4.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050811767578125, -0.049180030822753906, -0.04754829406738281, -0.04591655731201172, -0.044284820556640625, -0.04265308380126953, -0.04102134704589844, -0.039389610290527344, -0.03775787353515625, -0.036126136779785156, -0.03449440002441406, -0.03286266326904297, -0.031230926513671875, -0.02959918975830078, -0.027967453002929688, -0.026335716247558594, -0.0247039794921875, -0.023072242736816406, -0.021440505981445312, -0.01980876922607422, -0.018177032470703125, -0.01654529571533203, -0.014913558959960938, -0.013281822204589844, -0.01165008544921875, -0.010018348693847656, -0.008386611938476562, -0.006754875183105469, -0.005123138427734375, -0.0034914016723632812, -0.0018596649169921875, -0.00022792816162109375, 0.00140380859375, 0.0030355453491210938, 0.0046672821044921875, 0.006299018859863281, 0.007930755615234375, 0.009562492370605469, 0.011194229125976562, 0.012825965881347656, 0.01445770263671875, 0.016089439392089844, 0.017721176147460938, 0.01935291290283203, 0.020984649658203125, 0.02261638641357422, 0.024248123168945312, 0.025879859924316406, 0.0275115966796875, 0.029143333435058594, 0.030775070190429688, 0.03240680694580078, 0.034038543701171875, 0.03567028045654297, 0.03730201721191406, 0.038933753967285156, 0.04056549072265625, 0.042197227478027344, 0.04382896423339844, 0.04546070098876953, 0.047092437744140625, 0.04872417449951172, 0.05035591125488281, 0.051987648010253906, 0.053619384765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 6.0, 10.0, 15.0, 14.0, 19.0, 38.0, 31.0, 67.0, 66.0, 123.0, 161.0, 260.0, 377.0, 629.0, 1057.0, 2268.0, 6077.0, 20622.0, 95847.0, 631167.0, 231454.0, 40868.0, 10110.0, 3574.0, 1572.0, 744.0, 432.0, 281.0, 201.0, 128.0, 84.0, 63.0, 45.0, 44.0, 26.0, 24.0, 17.0, 9.0, 9.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2386474609375, -0.2308826446533203, -0.22311782836914062, -0.21535301208496094, -0.20758819580078125, -0.19982337951660156, -0.19205856323242188, -0.1842937469482422, -0.1765289306640625, -0.1687641143798828, -0.16099929809570312, -0.15323448181152344, -0.14546966552734375, -0.13770484924316406, -0.12994003295898438, -0.12217521667480469, -0.114410400390625, -0.10664558410644531, -0.09888076782226562, -0.09111595153808594, -0.08335113525390625, -0.07558631896972656, -0.06782150268554688, -0.06005668640136719, -0.0522918701171875, -0.04452705383300781, -0.036762237548828125, -0.028997421264648438, -0.02123260498046875, -0.013467788696289062, -0.005702972412109375, 0.0020618438720703125, 0.00982666015625, 0.017591476440429688, 0.025356292724609375, 0.03312110900878906, 0.04088592529296875, 0.04865074157714844, 0.056415557861328125, 0.06418037414550781, 0.0719451904296875, 0.07971000671386719, 0.08747482299804688, 0.09523963928222656, 0.10300445556640625, 0.11076927185058594, 0.11853408813476562, 0.1262989044189453, 0.134063720703125, 0.1418285369873047, 0.14959335327148438, 0.15735816955566406, 0.16512298583984375, 0.17288780212402344, 0.18065261840820312, 0.1884174346923828, 0.1961822509765625, 0.2039470672607422, 0.21171188354492188, 0.21947669982910156, 0.22724151611328125, 0.23500633239746094, 0.24277114868164062, 0.2505359649658203, 0.25830078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 6.0, 11.0, 14.0, 13.0, 15.0, 17.0, 21.0, 38.0, 34.0, 46.0, 46.0, 34.0, 56.0, 68.0, 57.0, 70.0, 54.0, 39.0, 44.0, 47.0, 47.0, 32.0, 30.0, 39.0, 29.0, 16.0, 16.0, 19.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2044677734375, -0.19736862182617188, -0.19026947021484375, -0.18317031860351562, -0.1760711669921875, -0.16897201538085938, -0.16187286376953125, -0.15477371215820312, -0.147674560546875, -0.14057540893554688, -0.13347625732421875, -0.12637710571289062, -0.1192779541015625, -0.11217880249023438, -0.10507965087890625, -0.09798049926757812, -0.09088134765625, -0.08378219604492188, -0.07668304443359375, -0.06958389282226562, -0.0624847412109375, -0.055385589599609375, -0.04828643798828125, -0.041187286376953125, -0.034088134765625, -0.026988983154296875, -0.01988983154296875, -0.012790679931640625, -0.0056915283203125, 0.001407623291015625, 0.00850677490234375, 0.015605926513671875, 0.022705078125, 0.029804229736328125, 0.03690338134765625, 0.044002532958984375, 0.0511016845703125, 0.058200836181640625, 0.06529998779296875, 0.07239913940429688, 0.079498291015625, 0.08659744262695312, 0.09369659423828125, 0.10079574584960938, 0.1078948974609375, 0.11499404907226562, 0.12209320068359375, 0.12919235229492188, 0.13629150390625, 0.14339065551757812, 0.15048980712890625, 0.15758895874023438, 0.1646881103515625, 0.17178726196289062, 0.17888641357421875, 0.18598556518554688, 0.193084716796875, 0.20018386840820312, 0.20728302001953125, 0.21438217163085938, 0.2214813232421875, 0.22858047485351562, 0.23567962646484375, 0.24277877807617188, 0.2498779296875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 4.0, 7.0, 9.0, 17.0, 24.0, 37.0, 39.0, 72.0, 90.0, 141.0, 250.0, 462.0, 891.0, 2057.0, 5000.0, 13755.0, 43751.0, 222556.0, 634906.0, 85686.0, 24515.0, 8199.0, 3171.0, 1343.0, 643.0, 344.0, 205.0, 119.0, 70.0, 41.0, 36.0, 21.0, 22.0, 18.0, 11.0, 10.0, 3.0, 3.0, 6.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.1353759765625, -0.1314239501953125, -0.127471923828125, -0.1235198974609375, -0.11956787109375, -0.1156158447265625, -0.111663818359375, -0.1077117919921875, -0.103759765625, -0.0998077392578125, -0.095855712890625, -0.0919036865234375, -0.08795166015625, -0.0839996337890625, -0.080047607421875, -0.0760955810546875, -0.0721435546875, -0.0681915283203125, -0.064239501953125, -0.0602874755859375, -0.05633544921875, -0.0523834228515625, -0.048431396484375, -0.0444793701171875, -0.04052734375, -0.0365753173828125, -0.032623291015625, -0.0286712646484375, -0.02471923828125, -0.0207672119140625, -0.016815185546875, -0.0128631591796875, -0.0089111328125, -0.0049591064453125, -0.001007080078125, 0.0029449462890625, 0.00689697265625, 0.0108489990234375, 0.014801025390625, 0.0187530517578125, 0.022705078125, 0.0266571044921875, 0.030609130859375, 0.0345611572265625, 0.03851318359375, 0.0424652099609375, 0.046417236328125, 0.0503692626953125, 0.0543212890625, 0.0582733154296875, 0.062225341796875, 0.0661773681640625, 0.07012939453125, 0.0740814208984375, 0.078033447265625, 0.0819854736328125, 0.0859375, 0.0898895263671875, 0.093841552734375, 0.0977935791015625, 0.10174560546875, 0.1056976318359375, 0.109649658203125, 0.1136016845703125, 0.1175537109375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 12.0, 5.0, 10.0, 19.0, 43.0, 64.0, 95.0, 130.0, 163.0, 118.0, 108.0, 72.0, 55.0, 30.0, 17.0, 13.0, 10.0, 9.0, 3.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010323524475097656, -9.97716560959816e-05, -9.630806744098663e-05, -9.284447878599167e-05, -8.93808901309967e-05, -8.591730147600174e-05, -8.245371282100677e-05, -7.899012416601181e-05, -7.552653551101685e-05, -7.206294685602188e-05, -6.859935820102692e-05, -6.513576954603195e-05, -6.167218089103699e-05, -5.820859223604202e-05, -5.474500358104706e-05, -5.1281414926052094e-05, -4.781782627105713e-05, -4.4354237616062164e-05, -4.08906489610672e-05, -3.7427060306072235e-05, -3.396347165107727e-05, -3.0499882996082306e-05, -2.703629434108734e-05, -2.3572705686092377e-05, -2.0109117031097412e-05, -1.6645528376102448e-05, -1.3181939721107483e-05, -9.718351066112518e-06, -6.254762411117554e-06, -2.791173756122589e-06, 6.724148988723755e-07, 4.13600355386734e-06, 7.599592208862305e-06, 1.106318086385727e-05, 1.4526769518852234e-05, 1.79903581738472e-05, 2.1453946828842163e-05, 2.4917535483837128e-05, 2.8381124138832092e-05, 3.184471279382706e-05, 3.530830144882202e-05, 3.8771890103816986e-05, 4.223547875881195e-05, 4.5699067413806915e-05, 4.916265606880188e-05, 5.2626244723796844e-05, 5.608983337879181e-05, 5.9553422033786774e-05, 6.301701068878174e-05, 6.64805993437767e-05, 6.994418799877167e-05, 7.340777665376663e-05, 7.68713653087616e-05, 8.033495396375656e-05, 8.379854261875153e-05, 8.726213127374649e-05, 9.072571992874146e-05, 9.418930858373642e-05, 9.765289723873138e-05, 0.00010111648589372635, 0.00010458007454872131, 0.00010804366320371628, 0.00011150725185871124, 0.00011497084051370621, 0.00011843442916870117]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 12.0, 10.0, 14.0, 35.0, 59.0, 113.0, 183.0, 344.0, 836.0, 2126.0, 7674.0, 39488.0, 481664.0, 466170.0, 38558.0, 7550.0, 2049.0, 818.0, 349.0, 189.0, 112.0, 71.0, 39.0, 39.0, 16.0, 9.0, 4.0, 11.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1719970703125, -0.16678428649902344, -0.16157150268554688, -0.1563587188720703, -0.15114593505859375, -0.1459331512451172, -0.14072036743164062, -0.13550758361816406, -0.1302947998046875, -0.12508201599121094, -0.11986923217773438, -0.11465644836425781, -0.10944366455078125, -0.10423088073730469, -0.09901809692382812, -0.09380531311035156, -0.088592529296875, -0.08337974548339844, -0.07816696166992188, -0.07295417785644531, -0.06774139404296875, -0.06252861022949219, -0.057315826416015625, -0.05210304260253906, -0.0468902587890625, -0.04167747497558594, -0.036464691162109375, -0.03125190734863281, -0.02603912353515625, -0.020826339721679688, -0.015613555908203125, -0.010400772094726562, -0.00518798828125, 2.47955322265625e-05, 0.005237579345703125, 0.010450363159179688, 0.01566314697265625, 0.020875930786132812, 0.026088714599609375, 0.03130149841308594, 0.0365142822265625, 0.04172706604003906, 0.046939849853515625, 0.05215263366699219, 0.05736541748046875, 0.06257820129394531, 0.06779098510742188, 0.07300376892089844, 0.078216552734375, 0.08342933654785156, 0.08864212036132812, 0.09385490417480469, 0.09906768798828125, 0.10428047180175781, 0.10949325561523438, 0.11470603942871094, 0.1199188232421875, 0.12513160705566406, 0.13034439086914062, 0.1355571746826172, 0.14076995849609375, 0.1459827423095703, 0.15119552612304688, 0.15640830993652344, 0.16162109375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 7.0, 7.0, 10.0, 14.0, 9.0, 11.0, 11.0, 20.0, 22.0, 38.0, 50.0, 75.0, 136.0, 135.0, 125.0, 92.0, 64.0, 42.0, 35.0, 15.0, 18.0, 12.0, 14.0, 12.0, 5.0, 1.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.091064453125, -0.08809089660644531, -0.08511734008789062, -0.08214378356933594, -0.07917022705078125, -0.07619667053222656, -0.07322311401367188, -0.07024955749511719, -0.0672760009765625, -0.06430244445800781, -0.061328887939453125, -0.05835533142089844, -0.05538177490234375, -0.05240821838378906, -0.049434661865234375, -0.04646110534667969, -0.043487548828125, -0.04051399230957031, -0.037540435791015625, -0.03456687927246094, -0.03159332275390625, -0.028619766235351562, -0.025646209716796875, -0.022672653198242188, -0.0196990966796875, -0.016725540161132812, -0.013751983642578125, -0.010778427124023438, -0.00780487060546875, -0.0048313140869140625, -0.001857757568359375, 0.0011157989501953125, 0.00408935546875, 0.0070629119873046875, 0.010036468505859375, 0.013010025024414062, 0.01598358154296875, 0.018957138061523438, 0.021930694580078125, 0.024904251098632812, 0.0278778076171875, 0.030851364135742188, 0.033824920654296875, 0.03679847717285156, 0.03977203369140625, 0.04274559020996094, 0.045719146728515625, 0.04869270324707031, 0.051666259765625, 0.05463981628417969, 0.057613372802734375, 0.06058692932128906, 0.06356048583984375, 0.06653404235839844, 0.06950759887695312, 0.07248115539550781, 0.0754547119140625, 0.07842826843261719, 0.08140182495117188, 0.08437538146972656, 0.08734893798828125, 0.09032249450683594, 0.09329605102539062, 0.09626960754394531, 0.0992431640625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 13.0, 21.0, 43.0, 69.0, 112.0, 137.0, 176.0, 148.0, 108.0, 76.0, 44.0, 26.0, 12.0, 12.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.679431676864624, -1.6258400678634644, -1.5722485780715942, -1.5186569690704346, -1.465065360069275, -1.4114737510681152, -1.3578822612762451, -1.3042906522750854, -1.2506990432739258, -1.1971074342727661, -1.143515944480896, -1.0899243354797363, -1.0363327264785767, -0.9827411770820618, -0.9291496276855469, -0.8755580186843872, -0.8219665288925171, -0.7683749794960022, -0.7147833704948425, -0.6611918210983276, -0.607600212097168, -0.5540086627006531, -0.5004171133041382, -0.4468255341053009, -0.3932339549064636, -0.33964237570762634, -0.28605079650878906, -0.23245924711227417, -0.1788676679134369, -0.1252760887145996, -0.07168453931808472, -0.018092960119247437, 0.035498738288879395, 0.08909031003713608, 0.14268188178539276, 0.19627344608306885, 0.24986502528190613, 0.3034566044807434, 0.3570481538772583, 0.4106397330760956, 0.46423131227493286, 0.5178228616714478, 0.5714144706726074, 0.6250060200691223, 0.6785975694656372, 0.7321891784667969, 0.7857807278633118, 0.8393722772598267, 0.8929638862609863, 0.9465554356575012, 1.0001469850540161, 1.0537385940551758, 1.1073302030563354, 1.1609218120574951, 1.2145133018493652, 1.268104910850525, 1.3216965198516846, 1.3752881288528442, 1.4288796186447144, 1.482471227645874, 1.5360628366470337, 1.5896544456481934, 1.6432459354400635, 1.6968375444412231, 1.7504290342330933]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 8.0, 7.0, 5.0, 12.0, 10.0, 7.0, 15.0, 30.0, 23.0, 41.0, 29.0, 20.0, 39.0, 40.0, 38.0, 29.0, 42.0, 39.0, 38.0, 48.0, 64.0, 48.0, 38.0, 39.0, 34.0, 29.0, 32.0, 31.0, 21.0, 31.0, 19.0, 11.0, 21.0, 14.0, 10.0, 10.0, 10.0, 5.0, 8.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0763580799102783, -1.04521906375885, -1.0140800476074219, -0.9829409718513489, -0.9518018960952759, -0.9206628799438477, -0.8895238041877747, -0.8583847880363464, -0.8272457122802734, -0.7961066961288452, -0.7649676203727722, -0.733828604221344, -0.702689528465271, -0.6715505123138428, -0.6404114365577698, -0.6092724204063416, -0.5781333446502686, -0.5469943284988403, -0.5158552527427673, -0.4847162067890167, -0.4535771608352661, -0.4224381446838379, -0.3912990689277649, -0.36016005277633667, -0.32902103662490845, -0.29788199067115784, -0.2667429447174072, -0.23560389876365662, -0.204464852809906, -0.1733258217573166, -0.14218677580356598, -0.11104772984981537, -0.07990866899490356, -0.048769623041152954, -0.017630580812692642, 0.01350846141576767, 0.04464750736951828, 0.0757865458726883, 0.1069255918264389, 0.13806463778018951, 0.16920368373394012, 0.20034272968769073, 0.23148177564144135, 0.26262080669403076, 0.29375985264778137, 0.324898898601532, 0.3560379445552826, 0.3871769905090332, 0.4183160364627838, 0.4494550824165344, 0.48059412837028503, 0.5117331743240356, 0.5428721904754639, 0.5740112662315369, 0.6051502823829651, 0.6362893581390381, 0.6674283742904663, 0.6985673904418945, 0.7297064661979675, 0.7608454823493958, 0.7919845581054688, 0.823123574256897, 0.85426265001297, 0.8854016661643982, 0.9165407419204712]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 9.0, 7.0, 10.0, 4.0, 10.0, 16.0, 37.0, 45.0, 80.0, 118.0, 188.0, 256.0, 391.0, 670.0, 1011.0, 1825.0, 3231.0, 5862.0, 11367.0, 23507.0, 57239.0, 183316.0, 2663310.0, 1009977.0, 141477.0, 47735.0, 20495.0, 9952.0, 5104.0, 2908.0, 1581.0, 964.0, 556.0, 348.0, 229.0, 149.0, 106.0, 64.0, 41.0, 30.0, 17.0, 13.0, 7.0, 10.0, 3.0, 4.0, 9.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1431884765625, -0.13896560668945312, -0.13474273681640625, -0.13051986694335938, -0.1262969970703125, -0.12207412719726562, -0.11785125732421875, -0.11362838745117188, -0.109405517578125, -0.10518264770507812, -0.10095977783203125, -0.09673690795898438, -0.0925140380859375, -0.08829116821289062, -0.08406829833984375, -0.07984542846679688, -0.07562255859375, -0.07139968872070312, -0.06717681884765625, -0.06295394897460938, -0.0587310791015625, -0.054508209228515625, -0.05028533935546875, -0.046062469482421875, -0.041839599609375, -0.037616729736328125, -0.03339385986328125, -0.029170989990234375, -0.0249481201171875, -0.020725250244140625, -0.01650238037109375, -0.012279510498046875, -0.008056640625, -0.003833770751953125, 0.00038909912109375, 0.004611968994140625, 0.0088348388671875, 0.013057708740234375, 0.01728057861328125, 0.021503448486328125, 0.025726318359375, 0.029949188232421875, 0.03417205810546875, 0.038394927978515625, 0.0426177978515625, 0.046840667724609375, 0.05106353759765625, 0.055286407470703125, 0.05950927734375, 0.06373214721679688, 0.06795501708984375, 0.07217788696289062, 0.0764007568359375, 0.08062362670898438, 0.08484649658203125, 0.08906936645507812, 0.093292236328125, 0.09751510620117188, 0.10173797607421875, 0.10596084594726562, 0.1101837158203125, 0.11440658569335938, 0.11862945556640625, 0.12285232543945312, 0.1270751953125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 8.0, 7.0, 10.0, 15.0, 16.0, 22.0, 26.0, 27.0, 37.0, 30.0, 32.0, 45.0, 40.0, 47.0, 50.0, 47.0, 45.0, 43.0, 56.0, 52.0, 51.0, 49.0, 37.0, 35.0, 44.0, 28.0, 12.0, 18.0, 13.0, 6.0, 12.0, 6.0, 11.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052215576171875, -0.050655364990234375, -0.04909515380859375, -0.047534942626953125, -0.0459747314453125, -0.044414520263671875, -0.04285430908203125, -0.041294097900390625, -0.03973388671875, -0.038173675537109375, -0.03661346435546875, -0.035053253173828125, -0.0334930419921875, -0.031932830810546875, -0.03037261962890625, -0.028812408447265625, -0.027252197265625, -0.025691986083984375, -0.02413177490234375, -0.022571563720703125, -0.0210113525390625, -0.019451141357421875, -0.01789093017578125, -0.016330718994140625, -0.0147705078125, -0.013210296630859375, -0.01165008544921875, -0.010089874267578125, -0.0085296630859375, -0.006969451904296875, -0.00540924072265625, -0.003849029541015625, -0.002288818359375, -0.000728607177734375, 0.00083160400390625, 0.002391815185546875, 0.0039520263671875, 0.005512237548828125, 0.00707244873046875, 0.008632659912109375, 0.01019287109375, 0.011753082275390625, 0.01331329345703125, 0.014873504638671875, 0.0164337158203125, 0.017993927001953125, 0.01955413818359375, 0.021114349365234375, 0.022674560546875, 0.024234771728515625, 0.02579498291015625, 0.027355194091796875, 0.0289154052734375, 0.030475616455078125, 0.03203582763671875, 0.033596038818359375, 0.03515625, 0.036716461181640625, 0.03827667236328125, 0.039836883544921875, 0.0413970947265625, 0.042957305908203125, 0.04451751708984375, 0.046077728271484375, 0.047637939453125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 8.0, 14.0, 17.0, 24.0, 53.0, 44.0, 80.0, 118.0, 183.0, 222.0, 392.0, 555.0, 871.0, 1347.0, 2425.0, 4150.0, 8156.0, 16919.0, 40728.0, 119891.0, 614775.0, 2944332.0, 303307.0, 78312.0, 29183.0, 12983.0, 6263.0, 3564.0, 1927.0, 1199.0, 710.0, 424.0, 350.0, 243.0, 151.0, 109.0, 81.0, 60.0, 30.0, 34.0, 13.0, 14.0, 6.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.1624755859375, -0.15774154663085938, -0.15300750732421875, -0.14827346801757812, -0.1435394287109375, -0.13880538940429688, -0.13407135009765625, -0.12933731079101562, -0.124603271484375, -0.11986923217773438, -0.11513519287109375, -0.11040115356445312, -0.1056671142578125, -0.10093307495117188, -0.09619903564453125, -0.09146499633789062, -0.08673095703125, -0.08199691772460938, -0.07726287841796875, -0.07252883911132812, -0.0677947998046875, -0.06306076049804688, -0.05832672119140625, -0.053592681884765625, -0.048858642578125, -0.044124603271484375, -0.03939056396484375, -0.034656524658203125, -0.0299224853515625, -0.025188446044921875, -0.02045440673828125, -0.015720367431640625, -0.010986328125, -0.006252288818359375, -0.00151824951171875, 0.003215789794921875, 0.0079498291015625, 0.012683868408203125, 0.01741790771484375, 0.022151947021484375, 0.026885986328125, 0.031620025634765625, 0.03635406494140625, 0.041088104248046875, 0.0458221435546875, 0.050556182861328125, 0.05529022216796875, 0.060024261474609375, 0.06475830078125, 0.06949234008789062, 0.07422637939453125, 0.07896041870117188, 0.0836944580078125, 0.08842849731445312, 0.09316253662109375, 0.09789657592773438, 0.102630615234375, 0.10736465454101562, 0.11209869384765625, 0.11683273315429688, 0.1215667724609375, 0.12630081176757812, 0.13103485107421875, 0.13576889038085938, 0.1405029296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 7.0, 12.0, 17.0, 30.0, 36.0, 61.0, 84.0, 158.0, 344.0, 1219.0, 1300.0, 365.0, 166.0, 103.0, 58.0, 27.0, 18.0, 19.0, 10.0, 9.0, 4.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.12310791015625, -0.11959266662597656, -0.11607742309570312, -0.11256217956542969, -0.10904693603515625, -0.10553169250488281, -0.10201644897460938, -0.09850120544433594, -0.0949859619140625, -0.09147071838378906, -0.08795547485351562, -0.08444023132324219, -0.08092498779296875, -0.07740974426269531, -0.07389450073242188, -0.07037925720214844, -0.066864013671875, -0.06334877014160156, -0.059833526611328125, -0.05631828308105469, -0.05280303955078125, -0.04928779602050781, -0.045772552490234375, -0.04225730895996094, -0.0387420654296875, -0.03522682189941406, -0.031711578369140625, -0.028196334838867188, -0.02468109130859375, -0.021165847778320312, -0.017650604248046875, -0.014135360717773438, -0.0106201171875, -0.0071048736572265625, -0.003589630126953125, -7.43865966796875e-05, 0.00344085693359375, 0.0069561004638671875, 0.010471343994140625, 0.013986587524414062, 0.0175018310546875, 0.021017074584960938, 0.024532318115234375, 0.028047561645507812, 0.03156280517578125, 0.03507804870605469, 0.038593292236328125, 0.04210853576660156, 0.045623779296875, 0.04913902282714844, 0.052654266357421875, 0.05616950988769531, 0.05968475341796875, 0.06319999694824219, 0.06671524047851562, 0.07023048400878906, 0.0737457275390625, 0.07726097106933594, 0.08077621459960938, 0.08429145812988281, 0.08780670166015625, 0.09132194519042969, 0.09483718872070312, 0.09835243225097656, 0.10186767578125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 9.0, 21.0, 28.0, 52.0, 68.0, 96.0, 112.0, 121.0, 129.0, 111.0, 69.0, 51.0, 40.0, 30.0, 11.0, 13.0, 6.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5777998566627502, -0.5606703758239746, -0.543540894985199, -0.5264114141464233, -0.5092819333076477, -0.49215245246887207, -0.47502294182777405, -0.4578934609889984, -0.4407639801502228, -0.42363449931144714, -0.4065050184726715, -0.3893755376338959, -0.37224602699279785, -0.3551165461540222, -0.3379870653152466, -0.32085758447647095, -0.3037281036376953, -0.2865986227989197, -0.26946914196014404, -0.2523396611213684, -0.23521016538143158, -0.21808068454265594, -0.20095118880271912, -0.18382170796394348, -0.16669222712516785, -0.1495627462863922, -0.13243326544761658, -0.11530376970767975, -0.09817428886890411, -0.08104480803012848, -0.06391531974077225, -0.046785831451416016, -0.02965635061264038, -0.012526866048574448, 0.004602618515491486, 0.02173210307955742, 0.03886158764362335, 0.05599106848239899, 0.07312055677175522, 0.09025004506111145, 0.10737952589988708, 0.12450900673866272, 0.14163848757743835, 0.15876798331737518, 0.17589746415615082, 0.19302694499492645, 0.21015644073486328, 0.22728592157363892, 0.24441540241241455, 0.2615448832511902, 0.2786743640899658, 0.29580384492874146, 0.3129333257675171, 0.3300628066062927, 0.34719231724739075, 0.3643217980861664, 0.381451278924942, 0.39858075976371765, 0.4157102406024933, 0.4328397214412689, 0.44996923208236694, 0.4670987129211426, 0.4842281937599182, 0.5013576745986938, 0.5184871554374695]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 16.0, 18.0, 12.0, 12.0, 22.0, 13.0, 22.0, 22.0, 30.0, 23.0, 32.0, 42.0, 44.0, 45.0, 31.0, 55.0, 51.0, 50.0, 38.0, 51.0, 33.0, 41.0, 26.0, 39.0, 28.0, 23.0, 35.0, 12.0, 15.0, 27.0, 16.0, 8.0, 11.0, 10.0, 11.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.32235443592071533, -0.3130477964878082, -0.3037411570549011, -0.294434517621994, -0.2851278781890869, -0.2758212685585022, -0.2665145993232727, -0.257207989692688, -0.24790135025978088, -0.23859471082687378, -0.22928807139396667, -0.21998143196105957, -0.21067480742931366, -0.20136816799640656, -0.19206152856349945, -0.18275490403175354, -0.17344824969768524, -0.16414161026477814, -0.15483497083187103, -0.14552834630012512, -0.13622170686721802, -0.1269150674343109, -0.11760842800140381, -0.1083017960190773, -0.0989951565861702, -0.08968851715326309, -0.08038188517093658, -0.07107524573802948, -0.061768610030412674, -0.05246197432279587, -0.04315533488988876, -0.033848702907562256, -0.02454206347465515, -0.01523542683571577, -0.00592879019677639, 0.003377847373485565, 0.012684483081102371, 0.021991118788719177, 0.03129775822162628, 0.04060439020395279, 0.049911029636859894, 0.0592176653444767, 0.0685243010520935, 0.07783094048500061, 0.08713757991790771, 0.09644421190023422, 0.10575085133314133, 0.11505748331546783, 0.12436412274837494, 0.13367076218128204, 0.14297740161418915, 0.15228402614593506, 0.16159066557884216, 0.17089730501174927, 0.18020394444465637, 0.18951058387756348, 0.19881722331047058, 0.20812386274337769, 0.2174305021762848, 0.2267371416091919, 0.2360437661409378, 0.2453504055738449, 0.2546570301055908, 0.2639636695384979, 0.27327030897140503]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 11.0, 15.0, 17.0, 15.0, 36.0, 39.0, 66.0, 98.0, 173.0, 270.0, 648.0, 1452.0, 3746.0, 10120.0, 27465.0, 83558.0, 437707.0, 369806.0, 73505.0, 24616.0, 9085.0, 3494.0, 1311.0, 583.0, 276.0, 157.0, 95.0, 72.0, 31.0, 25.0, 18.0, 11.0, 11.0, 3.0, 1.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.197265625, -0.19127845764160156, -0.18529129028320312, -0.1793041229248047, -0.17331695556640625, -0.1673297882080078, -0.16134262084960938, -0.15535545349121094, -0.1493682861328125, -0.14338111877441406, -0.13739395141601562, -0.1314067840576172, -0.12541961669921875, -0.11943244934082031, -0.11344528198242188, -0.10745811462402344, -0.101470947265625, -0.09548377990722656, -0.08949661254882812, -0.08350944519042969, -0.07752227783203125, -0.07153511047363281, -0.06554794311523438, -0.05956077575683594, -0.0535736083984375, -0.04758644104003906, -0.041599273681640625, -0.03561210632324219, -0.02962493896484375, -0.023637771606445312, -0.017650604248046875, -0.011663436889648438, -0.00567626953125, 0.0003108978271484375, 0.006298065185546875, 0.012285232543945312, 0.01827239990234375, 0.024259567260742188, 0.030246734619140625, 0.03623390197753906, 0.0422210693359375, 0.04820823669433594, 0.054195404052734375, 0.06018257141113281, 0.06616973876953125, 0.07215690612792969, 0.07814407348632812, 0.08413124084472656, 0.090118408203125, 0.09610557556152344, 0.10209274291992188, 0.10807991027832031, 0.11406707763671875, 0.12005424499511719, 0.12604141235351562, 0.13202857971191406, 0.1380157470703125, 0.14400291442871094, 0.14999008178710938, 0.1559772491455078, 0.16196441650390625, 0.1679515838623047, 0.17393875122070312, 0.17992591857910156, 0.1859130859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 5.0, 6.0, 18.0, 17.0, 18.0, 19.0, 15.0, 27.0, 36.0, 31.0, 36.0, 50.0, 40.0, 39.0, 58.0, 54.0, 58.0, 40.0, 49.0, 47.0, 50.0, 36.0, 36.0, 40.0, 40.0, 18.0, 18.0, 15.0, 16.0, 14.0, 11.0, 13.0, 4.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.052520751953125, -0.05094099044799805, -0.049361228942871094, -0.04778146743774414, -0.04620170593261719, -0.044621944427490234, -0.04304218292236328, -0.04146242141723633, -0.039882659912109375, -0.03830289840698242, -0.03672313690185547, -0.035143375396728516, -0.03356361389160156, -0.03198385238647461, -0.030404090881347656, -0.028824329376220703, -0.02724456787109375, -0.025664806365966797, -0.024085044860839844, -0.02250528335571289, -0.020925521850585938, -0.019345760345458984, -0.01776599884033203, -0.016186237335205078, -0.014606475830078125, -0.013026714324951172, -0.011446952819824219, -0.009867191314697266, -0.008287429809570312, -0.006707668304443359, -0.005127906799316406, -0.003548145294189453, -0.0019683837890625, -0.0003886222839355469, 0.0011911392211914062, 0.0027709007263183594, 0.0043506622314453125, 0.005930423736572266, 0.007510185241699219, 0.009089946746826172, 0.010669708251953125, 0.012249469757080078, 0.013829231262207031, 0.015408992767333984, 0.016988754272460938, 0.01856851577758789, 0.020148277282714844, 0.021728038787841797, 0.02330780029296875, 0.024887561798095703, 0.026467323303222656, 0.02804708480834961, 0.029626846313476562, 0.031206607818603516, 0.03278636932373047, 0.03436613082885742, 0.035945892333984375, 0.03752565383911133, 0.03910541534423828, 0.040685176849365234, 0.04226493835449219, 0.04384469985961914, 0.045424461364746094, 0.04700422286987305, 0.048583984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 4.0, 11.0, 11.0, 14.0, 21.0, 20.0, 34.0, 35.0, 67.0, 84.0, 129.0, 228.0, 355.0, 637.0, 1275.0, 2537.0, 5699.0, 12946.0, 30417.0, 87118.0, 525656.0, 283734.0, 56825.0, 22615.0, 9479.0, 4267.0, 1974.0, 982.0, 468.0, 284.0, 189.0, 132.0, 76.0, 53.0, 34.0, 37.0, 23.0, 20.0, 16.0, 8.0, 11.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1845703125, -0.17894744873046875, -0.1733245849609375, -0.16770172119140625, -0.162078857421875, -0.15645599365234375, -0.1508331298828125, -0.14521026611328125, -0.13958740234375, -0.13396453857421875, -0.1283416748046875, -0.12271881103515625, -0.117095947265625, -0.11147308349609375, -0.1058502197265625, -0.10022735595703125, -0.0946044921875, -0.08898162841796875, -0.0833587646484375, -0.07773590087890625, -0.072113037109375, -0.06649017333984375, -0.0608673095703125, -0.05524444580078125, -0.04962158203125, -0.04399871826171875, -0.0383758544921875, -0.03275299072265625, -0.027130126953125, -0.02150726318359375, -0.0158843994140625, -0.01026153564453125, -0.004638671875, 0.00098419189453125, 0.0066070556640625, 0.01222991943359375, 0.017852783203125, 0.02347564697265625, 0.0290985107421875, 0.03472137451171875, 0.04034423828125, 0.04596710205078125, 0.0515899658203125, 0.05721282958984375, 0.062835693359375, 0.06845855712890625, 0.0740814208984375, 0.07970428466796875, 0.0853271484375, 0.09095001220703125, 0.0965728759765625, 0.10219573974609375, 0.107818603515625, 0.11344146728515625, 0.1190643310546875, 0.12468719482421875, 0.13031005859375, 0.13593292236328125, 0.1415557861328125, 0.14717864990234375, 0.152801513671875, 0.15842437744140625, 0.1640472412109375, 0.16967010498046875, 0.17529296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 1.0, 9.0, 7.0, 6.0, 9.0, 13.0, 11.0, 17.0, 16.0, 23.0, 29.0, 27.0, 31.0, 44.0, 38.0, 40.0, 37.0, 45.0, 50.0, 46.0, 37.0, 49.0, 44.0, 48.0, 33.0, 38.0, 33.0, 35.0, 21.0, 28.0, 25.0, 21.0, 19.0, 15.0, 10.0, 6.0, 11.0, 5.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.220947265625, -0.21445846557617188, -0.20796966552734375, -0.20148086547851562, -0.1949920654296875, -0.18850326538085938, -0.18201446533203125, -0.17552566528320312, -0.169036865234375, -0.16254806518554688, -0.15605926513671875, -0.14957046508789062, -0.1430816650390625, -0.13659286499023438, -0.13010406494140625, -0.12361526489257812, -0.11712646484375, -0.11063766479492188, -0.10414886474609375, -0.09766006469726562, -0.0911712646484375, -0.08468246459960938, -0.07819366455078125, -0.07170486450195312, -0.065216064453125, -0.058727264404296875, -0.05223846435546875, -0.045749664306640625, -0.0392608642578125, -0.032772064208984375, -0.02628326416015625, -0.019794464111328125, -0.0133056640625, -0.006816864013671875, -0.00032806396484375, 0.006160736083984375, 0.0126495361328125, 0.019138336181640625, 0.02562713623046875, 0.032115936279296875, 0.038604736328125, 0.045093536376953125, 0.05158233642578125, 0.058071136474609375, 0.0645599365234375, 0.07104873657226562, 0.07753753662109375, 0.08402633666992188, 0.09051513671875, 0.09700393676757812, 0.10349273681640625, 0.10998153686523438, 0.1164703369140625, 0.12295913696289062, 0.12944793701171875, 0.13593673706054688, 0.142425537109375, 0.14891433715820312, 0.15540313720703125, 0.16189193725585938, 0.1683807373046875, 0.17486953735351562, 0.18135833740234375, 0.18784713745117188, 0.1943359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 12.0, 6.0, 14.0, 23.0, 25.0, 33.0, 65.0, 103.0, 163.0, 282.0, 530.0, 931.0, 1892.0, 4160.0, 9224.0, 21380.0, 51593.0, 272314.0, 559298.0, 74862.0, 28782.0, 12379.0, 5380.0, 2447.0, 1134.0, 661.0, 362.0, 175.0, 106.0, 94.0, 45.0, 30.0, 17.0, 12.0, 14.0, 5.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0955810546875, -0.09278392791748047, -0.08998680114746094, -0.0871896743774414, -0.08439254760742188, -0.08159542083740234, -0.07879829406738281, -0.07600116729736328, -0.07320404052734375, -0.07040691375732422, -0.06760978698730469, -0.06481266021728516, -0.062015533447265625, -0.059218406677246094, -0.05642127990722656, -0.05362415313720703, -0.0508270263671875, -0.04802989959716797, -0.04523277282714844, -0.042435646057128906, -0.039638519287109375, -0.036841392517089844, -0.03404426574707031, -0.03124713897705078, -0.02845001220703125, -0.02565288543701172, -0.022855758666992188, -0.020058631896972656, -0.017261505126953125, -0.014464378356933594, -0.011667251586914062, -0.008870124816894531, -0.006072998046875, -0.0032758712768554688, -0.0004787445068359375, 0.0023183822631835938, 0.005115509033203125, 0.007912635803222656, 0.010709762573242188, 0.013506889343261719, 0.01630401611328125, 0.01910114288330078, 0.021898269653320312, 0.024695396423339844, 0.027492523193359375, 0.030289649963378906, 0.03308677673339844, 0.03588390350341797, 0.0386810302734375, 0.04147815704345703, 0.04427528381347656, 0.047072410583496094, 0.049869537353515625, 0.052666664123535156, 0.05546379089355469, 0.05826091766357422, 0.06105804443359375, 0.06385517120361328, 0.06665229797363281, 0.06944942474365234, 0.07224655151367188, 0.0750436782836914, 0.07784080505371094, 0.08063793182373047, 0.08343505859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 11.0, 9.0, 18.0, 23.0, 32.0, 38.0, 57.0, 87.0, 114.0, 106.0, 92.0, 85.0, 82.0, 60.0, 39.0, 37.0, 31.0, 22.0, 10.0, 13.0, 4.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.00010013580322265625, -9.7629614174366e-05, -9.512342512607574e-05, -9.261723607778549e-05, -9.011104702949524e-05, -8.760485798120499e-05, -8.509866893291473e-05, -8.259247988462448e-05, -8.008629083633423e-05, -7.758010178804398e-05, -7.507391273975372e-05, -7.256772369146347e-05, -7.006153464317322e-05, -6.755534559488297e-05, -6.504915654659271e-05, -6.254296749830246e-05, -6.003677845001221e-05, -5.7530589401721954e-05, -5.50244003534317e-05, -5.251821130514145e-05, -5.0012022256851196e-05, -4.7505833208560944e-05, -4.499964416027069e-05, -4.249345511198044e-05, -3.9987266063690186e-05, -3.748107701539993e-05, -3.497488796710968e-05, -3.246869891881943e-05, -2.9962509870529175e-05, -2.7456320822238922e-05, -2.495013177394867e-05, -2.2443942725658417e-05, -1.9937753677368164e-05, -1.743156462907791e-05, -1.4925375580787659e-05, -1.2419186532497406e-05, -9.912997484207153e-06, -7.406808435916901e-06, -4.900619387626648e-06, -2.3944303393363953e-06, 1.1175870895385742e-07, 2.61794775724411e-06, 5.124136805534363e-06, 7.630325853824615e-06, 1.0136514902114868e-05, 1.2642703950405121e-05, 1.5148892998695374e-05, 1.7655082046985626e-05, 2.016127109527588e-05, 2.266746014356613e-05, 2.5173649191856384e-05, 2.7679838240146637e-05, 3.018602728843689e-05, 3.269221633672714e-05, 3.5198405385017395e-05, 3.770459443330765e-05, 4.02107834815979e-05, 4.271697252988815e-05, 4.5223161578178406e-05, 4.772935062646866e-05, 5.023553967475891e-05, 5.2741728723049164e-05, 5.5247917771339417e-05, 5.775410681962967e-05, 6.026029586791992e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 3.0, 6.0, 11.0, 13.0, 14.0, 28.0, 64.0, 61.0, 116.0, 177.0, 301.0, 592.0, 1162.0, 2901.0, 8085.0, 24248.0, 87975.0, 727625.0, 145267.0, 32746.0, 10431.0, 3632.0, 1517.0, 703.0, 339.0, 201.0, 124.0, 78.0, 40.0, 32.0, 14.0, 22.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0928955078125, -0.08953285217285156, -0.08617019653320312, -0.08280754089355469, -0.07944488525390625, -0.07608222961425781, -0.07271957397460938, -0.06935691833496094, -0.0659942626953125, -0.06263160705566406, -0.059268951416015625, -0.05590629577636719, -0.05254364013671875, -0.04918098449707031, -0.045818328857421875, -0.04245567321777344, -0.039093017578125, -0.03573036193847656, -0.032367706298828125, -0.029005050659179688, -0.02564239501953125, -0.022279739379882812, -0.018917083740234375, -0.015554428100585938, -0.0121917724609375, -0.008829116821289062, -0.005466461181640625, -0.0021038055419921875, 0.00125885009765625, 0.0046215057373046875, 0.007984161376953125, 0.011346817016601562, 0.01470947265625, 0.018072128295898438, 0.021434783935546875, 0.024797439575195312, 0.02816009521484375, 0.03152275085449219, 0.034885406494140625, 0.03824806213378906, 0.0416107177734375, 0.04497337341308594, 0.048336029052734375, 0.05169868469238281, 0.05506134033203125, 0.05842399597167969, 0.061786651611328125, 0.06514930725097656, 0.068511962890625, 0.07187461853027344, 0.07523727416992188, 0.07859992980957031, 0.08196258544921875, 0.08532524108886719, 0.08868789672851562, 0.09205055236816406, 0.0954132080078125, 0.09877586364746094, 0.10213851928710938, 0.10550117492675781, 0.10886383056640625, 0.11222648620605469, 0.11558914184570312, 0.11895179748535156, 0.122314453125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 9.0, 9.0, 8.0, 13.0, 12.0, 12.0, 21.0, 45.0, 63.0, 130.0, 180.0, 180.0, 126.0, 59.0, 38.0, 22.0, 15.0, 10.0, 10.0, 5.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1019287109375, -0.09862804412841797, -0.09532737731933594, -0.0920267105102539, -0.08872604370117188, -0.08542537689208984, -0.08212471008300781, -0.07882404327392578, -0.07552337646484375, -0.07222270965576172, -0.06892204284667969, -0.06562137603759766, -0.062320709228515625, -0.059020042419433594, -0.05571937561035156, -0.05241870880126953, -0.0491180419921875, -0.04581737518310547, -0.04251670837402344, -0.039216041564941406, -0.035915374755859375, -0.032614707946777344, -0.029314041137695312, -0.02601337432861328, -0.02271270751953125, -0.01941204071044922, -0.016111373901367188, -0.012810707092285156, -0.009510040283203125, -0.006209373474121094, -0.0029087066650390625, 0.00039196014404296875, 0.003692626953125, 0.006993293762207031, 0.010293960571289062, 0.013594627380371094, 0.016895294189453125, 0.020195960998535156, 0.023496627807617188, 0.02679729461669922, 0.03009796142578125, 0.03339862823486328, 0.03669929504394531, 0.039999961853027344, 0.043300628662109375, 0.046601295471191406, 0.04990196228027344, 0.05320262908935547, 0.0565032958984375, 0.05980396270751953, 0.06310462951660156, 0.0664052963256836, 0.06970596313476562, 0.07300662994384766, 0.07630729675292969, 0.07960796356201172, 0.08290863037109375, 0.08620929718017578, 0.08950996398925781, 0.09281063079833984, 0.09611129760742188, 0.0994119644165039, 0.10271263122558594, 0.10601329803466797, 0.10931396484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 13.0, 40.0, 62.0, 95.0, 133.0, 162.0, 170.0, 130.0, 92.0, 50.0, 22.0, 11.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.187971591949463, -2.1345534324645996, -2.0811355113983154, -2.027717351913452, -1.9742993116378784, -1.9208812713623047, -1.8674631118774414, -1.8140450716018677, -1.760627031326294, -1.7072089910507202, -1.653790831565857, -1.6003727912902832, -1.5469547510147095, -1.4935367107391357, -1.4401185512542725, -1.3867005109786987, -1.333282470703125, -1.2798644304275513, -1.226446270942688, -1.1730282306671143, -1.1196101903915405, -1.0661921501159668, -1.0127739906311035, -0.9593559503555298, -0.9059377908706665, -0.852519690990448, -0.7991016507148743, -0.7456835508346558, -0.692265510559082, -0.6388474106788635, -0.585429310798645, -0.5320112705230713, -0.47859323024749756, -0.42517516016960144, -0.3717570900917053, -0.3183389902114868, -0.2649209499359131, -0.21150285005569458, -0.15808477997779846, -0.10466670989990234, -0.051248639822006226, 0.002169433981180191, 0.05558750778436661, 0.10900558531284332, 0.16242365539073944, 0.21584174036979675, 0.26925981044769287, 0.322677880525589, 0.3760959506034851, 0.4295140206813812, 0.48293209075927734, 0.5363501906394958, 0.5897682309150696, 0.6431863307952881, 0.6966043710708618, 0.7500224709510803, 0.8034405708312988, 0.8568586707115173, 0.9102767109870911, 0.9636948108673096, 1.0171128511428833, 1.070530891418457, 1.1239490509033203, 1.177367091178894, 1.2307851314544678]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 5.0, 3.0, 9.0, 12.0, 15.0, 15.0, 16.0, 23.0, 28.0, 27.0, 33.0, 37.0, 44.0, 46.0, 40.0, 38.0, 44.0, 47.0, 34.0, 46.0, 39.0, 30.0, 44.0, 35.0, 39.0, 37.0, 30.0, 25.0, 23.0, 23.0, 17.0, 24.0, 8.0, 13.0, 11.0, 10.0, 7.0, 0.0, 4.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.9527403116226196, -0.9240773916244507, -0.8954145312309265, -0.8667516112327576, -0.8380887508392334, -0.8094258308410645, -0.7807629108428955, -0.7520999908447266, -0.7234371304512024, -0.6947742104530334, -0.6661113500595093, -0.6374484300613403, -0.6087855100631714, -0.5801226496696472, -0.5514597296714783, -0.5227968692779541, -0.49413394927978516, -0.4654710590839386, -0.43680816888809204, -0.4081452488899231, -0.37948235869407654, -0.35081946849823, -0.32215654850006104, -0.2934936583042145, -0.2648307681083679, -0.23616787791252136, -0.2075049728155136, -0.17884206771850586, -0.1501791775226593, -0.12151628732681274, -0.09285338222980499, -0.06419047713279724, -0.03552752733230591, -0.006864629685878754, 0.0217982679605484, 0.050461165606975555, 0.07912406325340271, 0.10778695344924927, 0.13644985854625702, 0.16511276364326477, 0.19377565383911133, 0.22243854403495789, 0.25110143423080444, 0.2797643542289734, 0.30842724442481995, 0.3370901346206665, 0.36575305461883545, 0.394415944814682, 0.42307883501052856, 0.4517417252063751, 0.4804046154022217, 0.5090675354003906, 0.5377304553985596, 0.5663933157920837, 0.5950562357902527, 0.6237190961837769, 0.6523820161819458, 0.6810449361801147, 0.7097077965736389, 0.7383707165718079, 0.767033576965332, 0.795696496963501, 0.8243594169616699, 0.8530223369598389, 0.881685197353363]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 7.0, 4.0, 6.0, 13.0, 18.0, 20.0, 24.0, 38.0, 55.0, 106.0, 139.0, 184.0, 347.0, 508.0, 813.0, 1365.0, 2384.0, 4421.0, 8805.0, 17998.0, 43305.0, 131267.0, 986459.0, 2741983.0, 161614.0, 50654.0, 20711.0, 9770.0, 4918.0, 2565.0, 1448.0, 845.0, 529.0, 340.0, 220.0, 115.0, 84.0, 57.0, 39.0, 23.0, 21.0, 17.0, 16.0, 10.0, 8.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.181640625, -0.1759777069091797, -0.17031478881835938, -0.16465187072753906, -0.15898895263671875, -0.15332603454589844, -0.14766311645507812, -0.1420001983642578, -0.1363372802734375, -0.1306743621826172, -0.12501144409179688, -0.11934852600097656, -0.11368560791015625, -0.10802268981933594, -0.10235977172851562, -0.09669685363769531, -0.091033935546875, -0.08537101745605469, -0.07970809936523438, -0.07404518127441406, -0.06838226318359375, -0.06271934509277344, -0.057056427001953125, -0.05139350891113281, -0.0457305908203125, -0.04006767272949219, -0.034404754638671875, -0.028741836547851562, -0.02307891845703125, -0.017416000366210938, -0.011753082275390625, -0.0060901641845703125, -0.00042724609375, 0.0052356719970703125, 0.010898590087890625, 0.016561508178710938, 0.02222442626953125, 0.027887344360351562, 0.033550262451171875, 0.03921318054199219, 0.0448760986328125, 0.05053901672363281, 0.056201934814453125, 0.06186485290527344, 0.06752777099609375, 0.07319068908691406, 0.07885360717773438, 0.08451652526855469, 0.090179443359375, 0.09584236145019531, 0.10150527954101562, 0.10716819763183594, 0.11283111572265625, 0.11849403381347656, 0.12415695190429688, 0.1298198699951172, 0.1354827880859375, 0.1411457061767578, 0.14680862426757812, 0.15247154235839844, 0.15813446044921875, 0.16379737854003906, 0.16946029663085938, 0.1751232147216797, 0.1807861328125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 13.0, 14.0, 18.0, 18.0, 19.0, 20.0, 21.0, 27.0, 19.0, 41.0, 46.0, 50.0, 38.0, 49.0, 54.0, 56.0, 52.0, 45.0, 52.0, 48.0, 58.0, 33.0, 34.0, 28.0, 19.0, 28.0, 17.0, 14.0, 15.0, 7.0, 8.0, 7.0, 8.0, 4.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0518798828125, -0.05023765563964844, -0.048595428466796875, -0.04695320129394531, -0.04531097412109375, -0.04366874694824219, -0.042026519775390625, -0.04038429260253906, -0.0387420654296875, -0.03709983825683594, -0.035457611083984375, -0.03381538391113281, -0.03217315673828125, -0.030530929565429688, -0.028888702392578125, -0.027246475219726562, -0.025604248046875, -0.023962020874023438, -0.022319793701171875, -0.020677566528320312, -0.01903533935546875, -0.017393112182617188, -0.015750885009765625, -0.014108657836914062, -0.0124664306640625, -0.010824203491210938, -0.009181976318359375, -0.0075397491455078125, -0.00589752197265625, -0.0042552947998046875, -0.002613067626953125, -0.0009708404541015625, 0.00067138671875, 0.0023136138916015625, 0.003955841064453125, 0.0055980682373046875, 0.00724029541015625, 0.008882522583007812, 0.010524749755859375, 0.012166976928710938, 0.0138092041015625, 0.015451431274414062, 0.017093658447265625, 0.018735885620117188, 0.02037811279296875, 0.022020339965820312, 0.023662567138671875, 0.025304794311523438, 0.026947021484375, 0.028589248657226562, 0.030231475830078125, 0.03187370300292969, 0.03351593017578125, 0.03515815734863281, 0.036800384521484375, 0.03844261169433594, 0.0400848388671875, 0.04172706604003906, 0.043369293212890625, 0.04501152038574219, 0.04665374755859375, 0.04829597473144531, 0.049938201904296875, 0.05158042907714844, 0.05322265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 3.0, 6.0, 2.0, 4.0, 9.0, 12.0, 11.0, 22.0, 19.0, 38.0, 36.0, 53.0, 62.0, 89.0, 120.0, 170.0, 322.0, 613.0, 1239.0, 2790.0, 7135.0, 21469.0, 91021.0, 1172408.0, 2745620.0, 111592.0, 25245.0, 8125.0, 3013.0, 1342.0, 648.0, 367.0, 177.0, 132.0, 94.0, 54.0, 45.0, 37.0, 31.0, 22.0, 18.0, 18.0, 13.0, 13.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.339599609375, -0.3293266296386719, -0.31905364990234375, -0.3087806701660156, -0.2985076904296875, -0.2882347106933594, -0.27796173095703125, -0.2676887512207031, -0.257415771484375, -0.24714279174804688, -0.23686981201171875, -0.22659683227539062, -0.2163238525390625, -0.20605087280273438, -0.19577789306640625, -0.18550491333007812, -0.17523193359375, -0.16495895385742188, -0.15468597412109375, -0.14441299438476562, -0.1341400146484375, -0.12386703491210938, -0.11359405517578125, -0.10332107543945312, -0.093048095703125, -0.08277511596679688, -0.07250213623046875, -0.062229156494140625, -0.0519561767578125, -0.041683197021484375, -0.03141021728515625, -0.021137237548828125, -0.0108642578125, -0.000591278076171875, 0.00968170166015625, 0.019954681396484375, 0.0302276611328125, 0.040500640869140625, 0.05077362060546875, 0.061046600341796875, 0.071319580078125, 0.08159255981445312, 0.09186553955078125, 0.10213851928710938, 0.1124114990234375, 0.12268447875976562, 0.13295745849609375, 0.14323043823242188, 0.15350341796875, 0.16377639770507812, 0.17404937744140625, 0.18432235717773438, 0.1945953369140625, 0.20486831665039062, 0.21514129638671875, 0.22541427612304688, 0.235687255859375, 0.24596023559570312, 0.25623321533203125, 0.2665061950683594, 0.2767791748046875, 0.2870521545410156, 0.29732513427734375, 0.3075981140136719, 0.31787109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 8.0, 9.0, 6.0, 16.0, 17.0, 42.0, 63.0, 136.0, 249.0, 992.0, 1847.0, 327.0, 149.0, 80.0, 47.0, 19.0, 25.0, 14.0, 16.0, 6.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.206298828125, -0.20088577270507812, -0.19547271728515625, -0.19005966186523438, -0.1846466064453125, -0.17923355102539062, -0.17382049560546875, -0.16840744018554688, -0.162994384765625, -0.15758132934570312, -0.15216827392578125, -0.14675521850585938, -0.1413421630859375, -0.13592910766601562, -0.13051605224609375, -0.12510299682617188, -0.11968994140625, -0.11427688598632812, -0.10886383056640625, -0.10345077514648438, -0.0980377197265625, -0.09262466430664062, -0.08721160888671875, -0.08179855346679688, -0.076385498046875, -0.07097244262695312, -0.06555938720703125, -0.060146331787109375, -0.0547332763671875, -0.049320220947265625, -0.04390716552734375, -0.038494110107421875, -0.0330810546875, -0.027667999267578125, -0.02225494384765625, -0.016841888427734375, -0.0114288330078125, -0.006015777587890625, -0.00060272216796875, 0.004810333251953125, 0.010223388671875, 0.015636444091796875, 0.02104949951171875, 0.026462554931640625, 0.0318756103515625, 0.037288665771484375, 0.04270172119140625, 0.048114776611328125, 0.05352783203125, 0.058940887451171875, 0.06435394287109375, 0.06976699829101562, 0.0751800537109375, 0.08059310913085938, 0.08600616455078125, 0.09141921997070312, 0.096832275390625, 0.10224533081054688, 0.10765838623046875, 0.11307144165039062, 0.1184844970703125, 0.12389755249023438, 0.12931060791015625, 0.13472366333007812, 0.14013671875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 5.0, 5.0, 6.0, 7.0, 16.0, 20.0, 34.0, 36.0, 64.0, 79.0, 108.0, 116.0, 119.0, 103.0, 77.0, 69.0, 45.0, 22.0, 20.0, 12.0, 10.0, 11.0, 4.0, 3.0, 9.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44253700971603394, -0.4220002591609955, -0.40146347880363464, -0.3809267282485962, -0.36038994789123535, -0.3398531973361969, -0.31931644678115845, -0.2987796664237976, -0.27824291586875916, -0.2577061653137207, -0.23716938495635986, -0.2166326344013214, -0.19609586894512177, -0.17555910348892212, -0.15502235293388367, -0.13448558747768402, -0.11394882202148438, -0.09341205656528473, -0.07287529855966568, -0.05233853682875633, -0.031801775097846985, -0.011265009641647339, 0.00927174836397171, 0.02980850636959076, 0.050345271825790405, 0.07088203728199005, 0.0914187952876091, 0.11195555329322815, 0.1324923187494278, 0.15302908420562744, 0.1735658347606659, 0.19410260021686554, 0.2146393060684204, 0.23517607152462006, 0.2557128369808197, 0.27624958753585815, 0.296786367893219, 0.31732311844825745, 0.3378598690032959, 0.35839664936065674, 0.3789333999156952, 0.39947015047073364, 0.4200069308280945, 0.44054368138313293, 0.4610804319381714, 0.4816172122955322, 0.5021539926528931, 0.5226907134056091, 0.54322749376297, 0.5637642741203308, 0.5843009948730469, 0.6048377752304077, 0.6253745555877686, 0.6459113359451294, 0.6664480566978455, 0.6869848370552063, 0.7075215578079224, 0.7280583381652832, 0.7485950589179993, 0.7691318392753601, 0.789668619632721, 0.810205340385437, 0.8307421207427979, 0.8512789011001587, 0.8718156814575195]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 5.0, 5.0, 5.0, 11.0, 6.0, 10.0, 15.0, 12.0, 15.0, 18.0, 25.0, 14.0, 22.0, 29.0, 24.0, 24.0, 29.0, 42.0, 42.0, 47.0, 42.0, 44.0, 33.0, 37.0, 51.0, 48.0, 37.0, 39.0, 35.0, 29.0, 37.0, 27.0, 31.0, 20.0, 15.0, 14.0, 16.0, 13.0, 8.0, 8.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348694384098053, -0.3364925682544708, -0.32429075241088867, -0.31208890676498413, -0.299887090921402, -0.2876852750778198, -0.27548345923423767, -0.2632816433906555, -0.251079797744751, -0.23887798190116882, -0.22667615115642548, -0.21447433531284332, -0.20227250456809998, -0.19007068872451782, -0.17786887288093567, -0.16566704213619232, -0.15346522629261017, -0.14126341044902802, -0.12906157970428467, -0.11685976386070251, -0.10465793311595917, -0.09245611727237701, -0.08025429397821426, -0.06805247068405151, -0.05585064738988876, -0.04364882409572601, -0.03144700080156326, -0.01924518123269081, -0.007043357938528061, 0.005158465355634689, 0.01736028492450714, 0.02956210821866989, 0.04176393151283264, 0.05396575480699539, 0.06616757810115814, 0.0783693939447403, 0.09057122468948364, 0.1027730405330658, 0.11497486382722855, 0.1271766871213913, 0.13937851786613464, 0.1515803337097168, 0.16378216445446014, 0.1759839802980423, 0.18818581104278564, 0.2003876268863678, 0.21258944272994995, 0.2247912734746933, 0.23699308931827545, 0.2491949051618576, 0.26139673590660095, 0.2735985517501831, 0.28580036759376526, 0.2980022132396698, 0.31020402908325195, 0.3224058449268341, 0.33460766077041626, 0.3468094766139984, 0.35901129245758057, 0.3712131381034851, 0.38341495394706726, 0.3956167697906494, 0.40781858563423157, 0.4200204014778137, 0.43222224712371826]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 5.0, 12.0, 15.0, 10.0, 31.0, 47.0, 66.0, 89.0, 136.0, 206.0, 332.0, 568.0, 863.0, 1404.0, 2450.0, 4215.0, 7644.0, 13814.0, 25203.0, 45690.0, 81530.0, 149181.0, 267475.0, 203805.0, 107782.0, 59706.0, 33626.0, 18618.0, 10418.0, 5736.0, 3152.0, 1835.0, 1126.0, 647.0, 397.0, 268.0, 153.0, 103.0, 72.0, 47.0, 24.0, 16.0, 10.0, 9.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11859130859375, -0.11485481262207031, -0.11111831665039062, -0.10738182067871094, -0.10364532470703125, -0.09990882873535156, -0.09617233276367188, -0.09243583679199219, -0.0886993408203125, -0.08496284484863281, -0.08122634887695312, -0.07748985290527344, -0.07375335693359375, -0.07001686096191406, -0.06628036499023438, -0.06254386901855469, -0.058807373046875, -0.05507087707519531, -0.051334381103515625, -0.04759788513183594, -0.04386138916015625, -0.04012489318847656, -0.036388397216796875, -0.03265190124511719, -0.0289154052734375, -0.025178909301757812, -0.021442413330078125, -0.017705917358398438, -0.01396942138671875, -0.010232925415039062, -0.006496429443359375, -0.0027599334716796875, 0.0009765625, 0.0047130584716796875, 0.008449554443359375, 0.012186050415039062, 0.01592254638671875, 0.019659042358398438, 0.023395538330078125, 0.027132034301757812, 0.0308685302734375, 0.03460502624511719, 0.038341522216796875, 0.04207801818847656, 0.04581451416015625, 0.04955101013183594, 0.053287506103515625, 0.05702400207519531, 0.060760498046875, 0.06449699401855469, 0.06823348999023438, 0.07196998596191406, 0.07570648193359375, 0.07944297790527344, 0.08317947387695312, 0.08691596984863281, 0.0906524658203125, 0.09438896179199219, 0.09812545776367188, 0.10186195373535156, 0.10559844970703125, 0.10933494567871094, 0.11307144165039062, 0.11680793762207031, 0.12054443359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 13.0, 11.0, 16.0, 21.0, 27.0, 31.0, 28.0, 33.0, 32.0, 35.0, 29.0, 41.0, 50.0, 51.0, 55.0, 46.0, 53.0, 49.0, 45.0, 27.0, 37.0, 43.0, 34.0, 35.0, 24.0, 17.0, 18.0, 16.0, 8.0, 11.0, 9.0, 6.0, 11.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0548095703125, -0.053148746490478516, -0.05148792266845703, -0.04982709884643555, -0.04816627502441406, -0.04650545120239258, -0.044844627380371094, -0.04318380355834961, -0.041522979736328125, -0.03986215591430664, -0.038201332092285156, -0.03654050827026367, -0.03487968444824219, -0.0332188606262207, -0.03155803680419922, -0.029897212982177734, -0.02823638916015625, -0.026575565338134766, -0.02491474151611328, -0.023253917694091797, -0.021593093872070312, -0.019932270050048828, -0.018271446228027344, -0.01661062240600586, -0.014949798583984375, -0.01328897476196289, -0.011628150939941406, -0.009967327117919922, -0.008306503295898438, -0.006645679473876953, -0.004984855651855469, -0.0033240318298339844, -0.0016632080078125, -2.384185791015625e-06, 0.0016584396362304688, 0.003319263458251953, 0.0049800872802734375, 0.006640911102294922, 0.008301734924316406, 0.00996255874633789, 0.011623382568359375, 0.01328420639038086, 0.014945030212402344, 0.016605854034423828, 0.018266677856445312, 0.019927501678466797, 0.02158832550048828, 0.023249149322509766, 0.02490997314453125, 0.026570796966552734, 0.02823162078857422, 0.029892444610595703, 0.03155326843261719, 0.03321409225463867, 0.034874916076660156, 0.03653573989868164, 0.038196563720703125, 0.03985738754272461, 0.041518211364746094, 0.04317903518676758, 0.04483985900878906, 0.04650068283081055, 0.04816150665283203, 0.049822330474853516, 0.051483154296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 16.0, 19.0, 29.0, 40.0, 48.0, 71.0, 118.0, 121.0, 200.0, 292.0, 451.0, 712.0, 1167.0, 2622.0, 7088.0, 26073.0, 111909.0, 524565.0, 285357.0, 63190.0, 15364.0, 4529.0, 1846.0, 952.0, 579.0, 376.0, 230.0, 137.0, 113.0, 82.0, 56.0, 38.0, 33.0, 23.0, 18.0, 11.0, 18.0, 14.0, 2.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.263671875, -0.2551116943359375, -0.246551513671875, -0.2379913330078125, -0.22943115234375, -0.2208709716796875, -0.212310791015625, -0.2037506103515625, -0.1951904296875, -0.1866302490234375, -0.178070068359375, -0.1695098876953125, -0.16094970703125, -0.1523895263671875, -0.143829345703125, -0.1352691650390625, -0.126708984375, -0.1181488037109375, -0.109588623046875, -0.1010284423828125, -0.09246826171875, -0.0839080810546875, -0.075347900390625, -0.0667877197265625, -0.0582275390625, -0.0496673583984375, -0.041107177734375, -0.0325469970703125, -0.02398681640625, -0.0154266357421875, -0.006866455078125, 0.0016937255859375, 0.01025390625, 0.0188140869140625, 0.027374267578125, 0.0359344482421875, 0.04449462890625, 0.0530548095703125, 0.061614990234375, 0.0701751708984375, 0.0787353515625, 0.0872955322265625, 0.095855712890625, 0.1044158935546875, 0.11297607421875, 0.1215362548828125, 0.130096435546875, 0.1386566162109375, 0.147216796875, 0.1557769775390625, 0.164337158203125, 0.1728973388671875, 0.18145751953125, 0.1900177001953125, 0.198577880859375, 0.2071380615234375, 0.2156982421875, 0.2242584228515625, 0.232818603515625, 0.2413787841796875, 0.24993896484375, 0.2584991455078125, 0.267059326171875, 0.2756195068359375, 0.2841796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 7.0, 3.0, 7.0, 9.0, 15.0, 17.0, 21.0, 23.0, 23.0, 28.0, 40.0, 47.0, 31.0, 45.0, 38.0, 46.0, 52.0, 53.0, 59.0, 67.0, 46.0, 47.0, 47.0, 29.0, 36.0, 21.0, 23.0, 20.0, 21.0, 10.0, 13.0, 19.0, 11.0, 8.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298583984375, -0.29010009765625, -0.2816162109375, -0.27313232421875, -0.2646484375, -0.25616455078125, -0.2476806640625, -0.23919677734375, -0.230712890625, -0.22222900390625, -0.2137451171875, -0.20526123046875, -0.19677734375, -0.18829345703125, -0.1798095703125, -0.17132568359375, -0.162841796875, -0.15435791015625, -0.1458740234375, -0.13739013671875, -0.12890625, -0.12042236328125, -0.1119384765625, -0.10345458984375, -0.094970703125, -0.08648681640625, -0.0780029296875, -0.06951904296875, -0.06103515625, -0.05255126953125, -0.0440673828125, -0.03558349609375, -0.027099609375, -0.01861572265625, -0.0101318359375, -0.00164794921875, 0.0068359375, 0.01531982421875, 0.0238037109375, 0.03228759765625, 0.040771484375, 0.04925537109375, 0.0577392578125, 0.06622314453125, 0.07470703125, 0.08319091796875, 0.0916748046875, 0.10015869140625, 0.108642578125, 0.11712646484375, 0.1256103515625, 0.13409423828125, 0.142578125, 0.15106201171875, 0.1595458984375, 0.16802978515625, 0.176513671875, 0.18499755859375, 0.1934814453125, 0.20196533203125, 0.21044921875, 0.21893310546875, 0.2274169921875, 0.23590087890625, 0.244384765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 0.0, 3.0, 8.0, 11.0, 22.0, 28.0, 48.0, 84.0, 172.0, 381.0, 937.0, 2669.0, 10322.0, 80894.0, 711119.0, 212262.0, 22752.0, 4402.0, 1406.0, 533.0, 229.0, 128.0, 58.0, 44.0, 24.0, 5.0, 7.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2254638671875, -0.218353271484375, -0.21124267578125, -0.204132080078125, -0.197021484375, -0.189910888671875, -0.18280029296875, -0.175689697265625, -0.1685791015625, -0.161468505859375, -0.15435791015625, -0.147247314453125, -0.14013671875, -0.133026123046875, -0.12591552734375, -0.118804931640625, -0.1116943359375, -0.104583740234375, -0.09747314453125, -0.090362548828125, -0.083251953125, -0.076141357421875, -0.06903076171875, -0.061920166015625, -0.0548095703125, -0.047698974609375, -0.04058837890625, -0.033477783203125, -0.0263671875, -0.019256591796875, -0.01214599609375, -0.005035400390625, 0.0020751953125, 0.009185791015625, 0.01629638671875, 0.023406982421875, 0.030517578125, 0.037628173828125, 0.04473876953125, 0.051849365234375, 0.0589599609375, 0.066070556640625, 0.07318115234375, 0.080291748046875, 0.08740234375, 0.094512939453125, 0.10162353515625, 0.108734130859375, 0.1158447265625, 0.122955322265625, 0.13006591796875, 0.137176513671875, 0.144287109375, 0.151397705078125, 0.15850830078125, 0.165618896484375, 0.1727294921875, 0.179840087890625, 0.18695068359375, 0.194061279296875, 0.201171875, 0.208282470703125, 0.21539306640625, 0.222503662109375, 0.2296142578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 13.0, 16.0, 10.0, 35.0, 27.0, 35.0, 59.0, 74.0, 82.0, 98.0, 74.0, 86.0, 66.0, 74.0, 52.0, 47.0, 26.0, 35.0, 22.0, 28.0, 9.0, 10.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6862831115722656e-05, -5.464628338813782e-05, -5.242973566055298e-05, -5.021318793296814e-05, -4.79966402053833e-05, -4.578009247779846e-05, -4.356354475021362e-05, -4.1346997022628784e-05, -3.9130449295043945e-05, -3.6913901567459106e-05, -3.469735383987427e-05, -3.248080611228943e-05, -3.026425838470459e-05, -2.804771065711975e-05, -2.5831162929534912e-05, -2.3614615201950073e-05, -2.1398067474365234e-05, -1.9181519746780396e-05, -1.6964972019195557e-05, -1.4748424291610718e-05, -1.2531876564025879e-05, -1.031532883644104e-05, -8.098781108856201e-06, -5.882233381271362e-06, -3.6656856536865234e-06, -1.4491379261016846e-06, 7.674098014831543e-07, 2.983957529067993e-06, 5.200505256652832e-06, 7.417052984237671e-06, 9.63360071182251e-06, 1.1850148439407349e-05, 1.4066696166992188e-05, 1.6283243894577026e-05, 1.8499791622161865e-05, 2.0716339349746704e-05, 2.2932887077331543e-05, 2.5149434804916382e-05, 2.736598253250122e-05, 2.958253026008606e-05, 3.17990779876709e-05, 3.401562571525574e-05, 3.6232173442840576e-05, 3.8448721170425415e-05, 4.0665268898010254e-05, 4.288181662559509e-05, 4.509836435317993e-05, 4.731491208076477e-05, 4.953145980834961e-05, 5.174800753593445e-05, 5.396455526351929e-05, 5.6181102991104126e-05, 5.8397650718688965e-05, 6.0614198446273804e-05, 6.283074617385864e-05, 6.504729390144348e-05, 6.726384162902832e-05, 6.948038935661316e-05, 7.1696937084198e-05, 7.391348481178284e-05, 7.613003253936768e-05, 7.834658026695251e-05, 8.056312799453735e-05, 8.277967572212219e-05, 8.499622344970703e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 7.0, 11.0, 25.0, 22.0, 25.0, 38.0, 58.0, 100.0, 137.0, 242.0, 340.0, 749.0, 1654.0, 4003.0, 12820.0, 59535.0, 361456.0, 497028.0, 84222.0, 17208.0, 4943.0, 1887.0, 860.0, 470.0, 260.0, 143.0, 91.0, 69.0, 45.0, 25.0, 30.0, 17.0, 10.0, 6.0, 2.0, 4.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.172119140625, -0.16721534729003906, -0.16231155395507812, -0.1574077606201172, -0.15250396728515625, -0.1476001739501953, -0.14269638061523438, -0.13779258728027344, -0.1328887939453125, -0.12798500061035156, -0.12308120727539062, -0.11817741394042969, -0.11327362060546875, -0.10836982727050781, -0.10346603393554688, -0.09856224060058594, -0.093658447265625, -0.08875465393066406, -0.08385086059570312, -0.07894706726074219, -0.07404327392578125, -0.06913948059082031, -0.06423568725585938, -0.05933189392089844, -0.0544281005859375, -0.04952430725097656, -0.044620513916015625, -0.03971672058105469, -0.03481292724609375, -0.029909133911132812, -0.025005340576171875, -0.020101547241210938, -0.01519775390625, -0.010293960571289062, -0.005390167236328125, -0.0004863739013671875, 0.00441741943359375, 0.009321212768554688, 0.014225006103515625, 0.019128799438476562, 0.0240325927734375, 0.028936386108398438, 0.033840179443359375, 0.03874397277832031, 0.04364776611328125, 0.04855155944824219, 0.053455352783203125, 0.05835914611816406, 0.063262939453125, 0.06816673278808594, 0.07307052612304688, 0.07797431945800781, 0.08287811279296875, 0.08778190612792969, 0.09268569946289062, 0.09758949279785156, 0.1024932861328125, 0.10739707946777344, 0.11230087280273438, 0.11720466613769531, 0.12210845947265625, 0.1270122528076172, 0.13191604614257812, 0.13681983947753906, 0.1417236328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 8.0, 5.0, 8.0, 14.0, 15.0, 18.0, 23.0, 28.0, 34.0, 37.0, 46.0, 68.0, 74.0, 99.0, 77.0, 84.0, 63.0, 56.0, 42.0, 42.0, 36.0, 15.0, 18.0, 10.0, 18.0, 7.0, 7.0, 11.0, 9.0, 10.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10479736328125, -0.10106563568115234, -0.09733390808105469, -0.09360218048095703, -0.08987045288085938, -0.08613872528076172, -0.08240699768066406, -0.0786752700805664, -0.07494354248046875, -0.0712118148803711, -0.06748008728027344, -0.06374835968017578, -0.060016632080078125, -0.05628490447998047, -0.05255317687988281, -0.048821449279785156, -0.0450897216796875, -0.041357994079589844, -0.03762626647949219, -0.03389453887939453, -0.030162811279296875, -0.02643108367919922, -0.022699356079101562, -0.018967628479003906, -0.01523590087890625, -0.011504173278808594, -0.0077724456787109375, -0.004040718078613281, -0.000308990478515625, 0.0034227371215820312, 0.0071544647216796875, 0.010886192321777344, 0.014617919921875, 0.018349647521972656, 0.022081375122070312, 0.02581310272216797, 0.029544830322265625, 0.03327655792236328, 0.03700828552246094, 0.040740013122558594, 0.04447174072265625, 0.048203468322753906, 0.05193519592285156, 0.05566692352294922, 0.059398651123046875, 0.06313037872314453, 0.06686210632324219, 0.07059383392333984, 0.0743255615234375, 0.07805728912353516, 0.08178901672363281, 0.08552074432373047, 0.08925247192382812, 0.09298419952392578, 0.09671592712402344, 0.1004476547241211, 0.10417938232421875, 0.1079111099243164, 0.11164283752441406, 0.11537456512451172, 0.11910629272460938, 0.12283802032470703, 0.1265697479248047, 0.13030147552490234, 0.134033203125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 21.0, 41.0, 68.0, 112.0, 138.0, 149.0, 140.0, 131.0, 71.0, 47.0, 32.0, 26.0, 9.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6079115867614746, -2.5323643684387207, -2.456817150115967, -2.381269931793213, -2.305722713470459, -2.230175733566284, -2.1546285152435303, -2.0790812969207764, -2.0035340785980225, -1.9279868602752686, -1.8524396419525146, -1.7768925428390503, -1.7013453245162964, -1.6257981061935425, -1.5502510070800781, -1.4747037887573242, -1.3991565704345703, -1.3236093521118164, -1.2480621337890625, -1.1725150346755981, -1.0969678163528442, -1.0214205980300903, -0.9458734393119812, -0.8703262805938721, -0.7947790622711182, -0.7192318439483643, -0.6436846852302551, -0.568137526512146, -0.4925903081893921, -0.41704311966896057, -0.34149593114852905, -0.2659487724304199, -0.19040131568908691, -0.1148541271686554, -0.03930693864822388, 0.03624024987220764, 0.11178743839263916, 0.18733462691307068, 0.2628818154335022, 0.33842897415161133, 0.41397619247436523, 0.48952338099479675, 0.5650705695152283, 0.6406177282333374, 0.7161649465560913, 0.7917121648788452, 0.8672593235969543, 0.9428064823150635, 1.0183537006378174, 1.0939009189605713, 1.1694481372833252, 1.2449952363967896, 1.3205424547195435, 1.3960896730422974, 1.4716367721557617, 1.5471839904785156, 1.6227312088012695, 1.6982784271240234, 1.7738256454467773, 1.8493727445602417, 1.9249199628829956, 2.00046706199646, 2.076014280319214, 2.1515614986419678, 2.2271087169647217]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 4.0, 9.0, 14.0, 10.0, 16.0, 15.0, 20.0, 15.0, 22.0, 30.0, 27.0, 35.0, 36.0, 36.0, 47.0, 41.0, 37.0, 54.0, 37.0, 49.0, 42.0, 41.0, 32.0, 44.0, 40.0, 29.0, 29.0, 24.0, 32.0, 20.0, 18.0, 16.0, 18.0, 6.0, 7.0, 7.0, 7.0, 5.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0], "bins": [-1.4591898918151855, -1.4181658029556274, -1.3771418333053589, -1.3361177444458008, -1.2950937747955322, -1.2540696859359741, -1.213045597076416, -1.1720216274261475, -1.1309975385665894, -1.0899734497070312, -1.0489494800567627, -1.0079253911972046, -0.9669013619422913, -0.9258773326873779, -0.8848533034324646, -0.8438292741775513, -0.8028052449226379, -0.7617812156677246, -0.7207571864128113, -0.679733157157898, -0.6387090682983398, -0.5976850390434265, -0.5566610097885132, -0.5156369209289551, -0.47461292147636414, -0.4335888922214508, -0.3925648331642151, -0.35154080390930176, -0.3105167746543884, -0.2694927155971527, -0.22846868634223938, -0.18744462728500366, -0.14642059803009033, -0.10539655387401581, -0.06437251716852188, -0.023348480463027954, 0.01767556369304657, 0.058699607849121094, 0.09972363710403442, 0.14074769616127014, 0.18177172541618347, 0.222795769572258, 0.2638198137283325, 0.30484384298324585, 0.3458678722381592, 0.3868919312953949, 0.4279159605503082, 0.46894001960754395, 0.5099640488624573, 0.5509880781173706, 0.5920121073722839, 0.6330361366271973, 0.6740602254867554, 0.7150842547416687, 0.756108283996582, 0.7971323728561401, 0.8381563425064087, 0.879180371761322, 0.9202044010162354, 0.9612284898757935, 1.002252459526062, 1.0432765483856201, 1.0843005180358887, 1.1253246068954468, 1.1663486957550049]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 7.0, 13.0, 23.0, 16.0, 33.0, 38.0, 60.0, 72.0, 128.0, 190.0, 309.0, 493.0, 735.0, 1283.0, 2280.0, 4286.0, 8756.0, 19914.0, 53330.0, 195645.0, 2829591.0, 877274.0, 128091.0, 40027.0, 15906.0, 7166.0, 3631.0, 1973.0, 1113.0, 653.0, 390.0, 279.0, 177.0, 103.0, 76.0, 63.0, 39.0, 24.0, 19.0, 16.0, 13.0, 8.0, 8.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.190185546875, -0.18421554565429688, -0.17824554443359375, -0.17227554321289062, -0.1663055419921875, -0.16033554077148438, -0.15436553955078125, -0.14839553833007812, -0.142425537109375, -0.13645553588867188, -0.13048553466796875, -0.12451553344726562, -0.1185455322265625, -0.11257553100585938, -0.10660552978515625, -0.10063552856445312, -0.09466552734375, -0.08869552612304688, -0.08272552490234375, -0.07675552368164062, -0.0707855224609375, -0.06481552124023438, -0.05884552001953125, -0.052875518798828125, -0.046905517578125, -0.040935516357421875, -0.03496551513671875, -0.028995513916015625, -0.0230255126953125, -0.017055511474609375, -0.01108551025390625, -0.005115509033203125, 0.0008544921875, 0.006824493408203125, 0.01279449462890625, 0.018764495849609375, 0.0247344970703125, 0.030704498291015625, 0.03667449951171875, 0.042644500732421875, 0.048614501953125, 0.054584503173828125, 0.06055450439453125, 0.06652450561523438, 0.0724945068359375, 0.07846450805664062, 0.08443450927734375, 0.09040451049804688, 0.09637451171875, 0.10234451293945312, 0.10831451416015625, 0.11428451538085938, 0.1202545166015625, 0.12622451782226562, 0.13219451904296875, 0.13816452026367188, 0.144134521484375, 0.15010452270507812, 0.15607452392578125, 0.16204452514648438, 0.1680145263671875, 0.17398452758789062, 0.17995452880859375, 0.18592453002929688, 0.19189453125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 6.0, 0.0, 5.0, 1.0, 3.0, 6.0, 6.0, 11.0, 15.0, 18.0, 15.0, 12.0, 19.0, 16.0, 29.0, 31.0, 33.0, 51.0, 32.0, 38.0, 33.0, 52.0, 47.0, 52.0, 40.0, 50.0, 40.0, 30.0, 33.0, 45.0, 38.0, 26.0, 28.0, 20.0, 21.0, 16.0, 15.0, 19.0, 9.0, 13.0, 7.0, 11.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.052093505859375, -0.05044746398925781, -0.048801422119140625, -0.04715538024902344, -0.04550933837890625, -0.04386329650878906, -0.042217254638671875, -0.04057121276855469, -0.0389251708984375, -0.03727912902832031, -0.035633087158203125, -0.03398704528808594, -0.03234100341796875, -0.030694961547851562, -0.029048919677734375, -0.027402877807617188, -0.0257568359375, -0.024110794067382812, -0.022464752197265625, -0.020818710327148438, -0.01917266845703125, -0.017526626586914062, -0.015880584716796875, -0.014234542846679688, -0.0125885009765625, -0.010942459106445312, -0.009296417236328125, -0.0076503753662109375, -0.00600433349609375, -0.0043582916259765625, -0.002712249755859375, -0.0010662078857421875, 0.000579833984375, 0.0022258758544921875, 0.003871917724609375, 0.0055179595947265625, 0.00716400146484375, 0.008810043334960938, 0.010456085205078125, 0.012102127075195312, 0.0137481689453125, 0.015394210815429688, 0.017040252685546875, 0.018686294555664062, 0.02033233642578125, 0.021978378295898438, 0.023624420166015625, 0.025270462036132812, 0.02691650390625, 0.028562545776367188, 0.030208587646484375, 0.03185462951660156, 0.03350067138671875, 0.03514671325683594, 0.036792755126953125, 0.03843879699707031, 0.0400848388671875, 0.04173088073730469, 0.043376922607421875, 0.04502296447753906, 0.04666900634765625, 0.04831504821777344, 0.049961090087890625, 0.05160713195800781, 0.053253173828125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 14.0, 12.0, 19.0, 29.0, 32.0, 75.0, 91.0, 140.0, 217.0, 371.0, 542.0, 839.0, 1578.0, 2834.0, 6090.0, 15226.0, 46514.0, 202239.0, 2797936.0, 945123.0, 120697.0, 31672.0, 11226.0, 4980.0, 2373.0, 1333.0, 777.0, 445.0, 286.0, 192.0, 111.0, 85.0, 56.0, 37.0, 31.0, 17.0, 17.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280029296875, -0.2715034484863281, -0.26297760009765625, -0.2544517517089844, -0.2459259033203125, -0.23740005493164062, -0.22887420654296875, -0.22034835815429688, -0.211822509765625, -0.20329666137695312, -0.19477081298828125, -0.18624496459960938, -0.1777191162109375, -0.16919326782226562, -0.16066741943359375, -0.15214157104492188, -0.14361572265625, -0.13508987426757812, -0.12656402587890625, -0.11803817749023438, -0.1095123291015625, -0.10098648071289062, -0.09246063232421875, -0.08393478393554688, -0.075408935546875, -0.06688308715820312, -0.05835723876953125, -0.049831390380859375, -0.0413055419921875, -0.032779693603515625, -0.02425384521484375, -0.015727996826171875, -0.0072021484375, 0.001323699951171875, 0.00984954833984375, 0.018375396728515625, 0.0269012451171875, 0.035427093505859375, 0.04395294189453125, 0.052478790283203125, 0.061004638671875, 0.06953048706054688, 0.07805633544921875, 0.08658218383789062, 0.0951080322265625, 0.10363388061523438, 0.11215972900390625, 0.12068557739257812, 0.12921142578125, 0.13773727416992188, 0.14626312255859375, 0.15478897094726562, 0.1633148193359375, 0.17184066772460938, 0.18036651611328125, 0.18889236450195312, 0.197418212890625, 0.20594406127929688, 0.21446990966796875, 0.22299575805664062, 0.2315216064453125, 0.24004745483398438, 0.24857330322265625, 0.2570991516113281, 0.265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 6.0, 7.0, 13.0, 18.0, 17.0, 34.0, 73.0, 105.0, 202.0, 443.0, 1716.0, 766.0, 318.0, 131.0, 84.0, 50.0, 34.0, 11.0, 9.0, 11.0, 10.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.200927734375, -0.19438552856445312, -0.18784332275390625, -0.18130111694335938, -0.1747589111328125, -0.16821670532226562, -0.16167449951171875, -0.15513229370117188, -0.148590087890625, -0.14204788208007812, -0.13550567626953125, -0.12896347045898438, -0.1224212646484375, -0.11587905883789062, -0.10933685302734375, -0.10279464721679688, -0.09625244140625, -0.08971023559570312, -0.08316802978515625, -0.07662582397460938, -0.0700836181640625, -0.06354141235351562, -0.05699920654296875, -0.050457000732421875, -0.043914794921875, -0.037372589111328125, -0.03083038330078125, -0.024288177490234375, -0.0177459716796875, -0.011203765869140625, -0.00466156005859375, 0.001880645751953125, 0.0084228515625, 0.014965057373046875, 0.02150726318359375, 0.028049468994140625, 0.0345916748046875, 0.041133880615234375, 0.04767608642578125, 0.054218292236328125, 0.060760498046875, 0.06730270385742188, 0.07384490966796875, 0.08038711547851562, 0.0869293212890625, 0.09347152709960938, 0.10001373291015625, 0.10655593872070312, 0.11309814453125, 0.11964035034179688, 0.12618255615234375, 0.13272476196289062, 0.1392669677734375, 0.14580917358398438, 0.15235137939453125, 0.15889358520507812, 0.165435791015625, 0.17197799682617188, 0.17852020263671875, 0.18506240844726562, 0.1916046142578125, 0.19814682006835938, 0.20468902587890625, 0.21123123168945312, 0.2177734375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 11.0, 30.0, 38.0, 62.0, 93.0, 106.0, 129.0, 150.0, 119.0, 88.0, 74.0, 41.0, 22.0, 20.0, 6.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5917373895645142, -0.5554035902023315, -0.5190697908401489, -0.4827359914779663, -0.4464021921157837, -0.4100683927536011, -0.37373459339141846, -0.33740079402923584, -0.3010669946670532, -0.2647331953048706, -0.228399395942688, -0.19206559658050537, -0.15573179721832275, -0.11939799785614014, -0.08306419849395752, -0.0467303991317749, -0.010396599769592285, 0.025937199592590332, 0.06227099895477295, 0.09860479831695557, 0.13493859767913818, 0.1712723970413208, 0.20760619640350342, 0.24393999576568604, 0.28027379512786865, 0.31660759449005127, 0.3529413938522339, 0.3892751932144165, 0.4256089925765991, 0.46194279193878174, 0.49827659130096436, 0.534610390663147, 0.5709443092346191, 0.6072781085968018, 0.6436119079589844, 0.679945707321167, 0.7162795066833496, 0.7526133060455322, 0.7889471054077148, 0.8252809047698975, 0.8616147041320801, 0.8979485034942627, 0.9342823028564453, 0.9706161022186279, 1.0069499015808105, 1.0432837009429932, 1.0796175003051758, 1.1159512996673584, 1.152285099029541, 1.1886188983917236, 1.2249526977539062, 1.2612864971160889, 1.2976202964782715, 1.333954095840454, 1.3702878952026367, 1.4066216945648193, 1.442955493927002, 1.4792892932891846, 1.5156230926513672, 1.5519568920135498, 1.5882906913757324, 1.624624490737915, 1.6609582901000977, 1.6972920894622803, 1.733625888824463]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 5.0, 8.0, 8.0, 13.0, 10.0, 14.0, 18.0, 15.0, 15.0, 25.0, 29.0, 28.0, 48.0, 36.0, 36.0, 41.0, 44.0, 43.0, 57.0, 50.0, 46.0, 45.0, 28.0, 30.0, 39.0, 31.0, 38.0, 29.0, 25.0, 18.0, 30.0, 19.0, 20.0, 10.0, 7.0, 8.0, 9.0, 7.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4947463870048523, -0.476949006319046, -0.45915162563323975, -0.44135424494743347, -0.4235568642616272, -0.4057595133781433, -0.38796213269233704, -0.37016475200653076, -0.3523673713207245, -0.3345699906349182, -0.31677260994911194, -0.29897522926330566, -0.2811778783798218, -0.2633804678916931, -0.24558311700820923, -0.22778573632240295, -0.20998835563659668, -0.1921909749507904, -0.17439359426498413, -0.15659622848033905, -0.13879884779453278, -0.1210014671087265, -0.10320409387350082, -0.08540672063827515, -0.06760933995246887, -0.049811962991952896, -0.03201458603143692, -0.014217209070920944, 0.0035801678895950317, 0.021377548575401306, 0.039174921810626984, 0.05697229504585266, 0.07476961612701416, 0.09256699681282043, 0.11036437004804611, 0.1281617432832718, 0.14595912396907806, 0.16375650465488434, 0.18155387043952942, 0.1993512511253357, 0.21714863181114197, 0.23494601249694824, 0.2527433931827545, 0.2705407738685608, 0.2883381247520447, 0.30613553524017334, 0.3239328861236572, 0.3417302668094635, 0.3595276474952698, 0.37732502818107605, 0.3951224088668823, 0.4129197895526886, 0.4307171702384949, 0.44851452112197876, 0.46631190180778503, 0.4841092824935913, 0.5019066333770752, 0.5197039842605591, 0.5375013947486877, 0.5552987456321716, 0.5730961561203003, 0.5908935070037842, 0.6086909174919128, 0.6264882683753967, 0.6442856788635254]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 7.0, 11.0, 19.0, 21.0, 41.0, 49.0, 64.0, 97.0, 165.0, 219.0, 338.0, 546.0, 867.0, 1444.0, 2486.0, 4168.0, 7517.0, 14060.0, 26987.0, 51927.0, 96208.0, 168435.0, 227097.0, 192823.0, 116802.0, 63609.0, 32887.0, 17654.0, 9446.0, 5127.0, 2878.0, 1708.0, 989.0, 615.0, 434.0, 237.0, 162.0, 116.0, 101.0, 57.0, 42.0, 28.0, 19.0, 16.0, 10.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1314697265625, -0.1271820068359375, -0.122894287109375, -0.1186065673828125, -0.11431884765625, -0.1100311279296875, -0.105743408203125, -0.1014556884765625, -0.09716796875, -0.0928802490234375, -0.088592529296875, -0.0843048095703125, -0.08001708984375, -0.0757293701171875, -0.071441650390625, -0.0671539306640625, -0.0628662109375, -0.0585784912109375, -0.054290771484375, -0.0500030517578125, -0.04571533203125, -0.0414276123046875, -0.037139892578125, -0.0328521728515625, -0.028564453125, -0.0242767333984375, -0.019989013671875, -0.0157012939453125, -0.01141357421875, -0.0071258544921875, -0.002838134765625, 0.0014495849609375, 0.0057373046875, 0.0100250244140625, 0.014312744140625, 0.0186004638671875, 0.02288818359375, 0.0271759033203125, 0.031463623046875, 0.0357513427734375, 0.0400390625, 0.0443267822265625, 0.048614501953125, 0.0529022216796875, 0.05718994140625, 0.0614776611328125, 0.065765380859375, 0.0700531005859375, 0.0743408203125, 0.0786285400390625, 0.082916259765625, 0.0872039794921875, 0.09149169921875, 0.0957794189453125, 0.100067138671875, 0.1043548583984375, 0.108642578125, 0.1129302978515625, 0.117218017578125, 0.1215057373046875, 0.12579345703125, 0.1300811767578125, 0.134368896484375, 0.1386566162109375, 0.1429443359375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 3.0, 8.0, 10.0, 15.0, 5.0, 26.0, 12.0, 18.0, 22.0, 25.0, 23.0, 45.0, 34.0, 38.0, 45.0, 47.0, 43.0, 49.0, 45.0, 44.0, 53.0, 50.0, 40.0, 40.0, 37.0, 28.0, 36.0, 38.0, 13.0, 16.0, 14.0, 10.0, 21.0, 5.0, 15.0, 5.0, 5.0, 6.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055511474609375, -0.0535426139831543, -0.051573753356933594, -0.04960489273071289, -0.04763603210449219, -0.045667171478271484, -0.04369831085205078, -0.04172945022583008, -0.039760589599609375, -0.03779172897338867, -0.03582286834716797, -0.033854007720947266, -0.03188514709472656, -0.02991628646850586, -0.027947425842285156, -0.025978565216064453, -0.02400970458984375, -0.022040843963623047, -0.020071983337402344, -0.01810312271118164, -0.016134262084960938, -0.014165401458740234, -0.012196540832519531, -0.010227680206298828, -0.008258819580078125, -0.006289958953857422, -0.004321098327636719, -0.0023522377014160156, -0.0003833770751953125, 0.0015854835510253906, 0.0035543441772460938, 0.005523204803466797, 0.0074920654296875, 0.009460926055908203, 0.011429786682128906, 0.01339864730834961, 0.015367507934570312, 0.017336368560791016, 0.01930522918701172, 0.021274089813232422, 0.023242950439453125, 0.025211811065673828, 0.02718067169189453, 0.029149532318115234, 0.031118392944335938, 0.03308725357055664, 0.035056114196777344, 0.03702497482299805, 0.03899383544921875, 0.04096269607543945, 0.042931556701660156, 0.04490041732788086, 0.04686927795410156, 0.048838138580322266, 0.05080699920654297, 0.05277585983276367, 0.054744720458984375, 0.05671358108520508, 0.05868244171142578, 0.060651302337646484, 0.06262016296386719, 0.06458902359008789, 0.0665578842163086, 0.0685267448425293, 0.07049560546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 8.0, 13.0, 21.0, 25.0, 37.0, 38.0, 64.0, 80.0, 127.0, 185.0, 279.0, 481.0, 805.0, 1683.0, 4762.0, 19146.0, 110461.0, 522701.0, 317940.0, 53292.0, 10357.0, 2998.0, 1226.0, 642.0, 416.0, 279.0, 150.0, 110.0, 70.0, 38.0, 29.0, 28.0, 13.0, 12.0, 7.0, 10.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329345703125, -0.31790924072265625, -0.3064727783203125, -0.29503631591796875, -0.283599853515625, -0.27216339111328125, -0.2607269287109375, -0.24929046630859375, -0.23785400390625, -0.22641754150390625, -0.2149810791015625, -0.20354461669921875, -0.192108154296875, -0.18067169189453125, -0.1692352294921875, -0.15779876708984375, -0.1463623046875, -0.13492584228515625, -0.1234893798828125, -0.11205291748046875, -0.100616455078125, -0.08917999267578125, -0.0777435302734375, -0.06630706787109375, -0.05487060546875, -0.04343414306640625, -0.0319976806640625, -0.02056121826171875, -0.009124755859375, 0.00231170654296875, 0.0137481689453125, 0.02518463134765625, 0.03662109375, 0.04805755615234375, 0.0594940185546875, 0.07093048095703125, 0.082366943359375, 0.09380340576171875, 0.1052398681640625, 0.11667633056640625, 0.12811279296875, 0.13954925537109375, 0.1509857177734375, 0.16242218017578125, 0.173858642578125, 0.18529510498046875, 0.1967315673828125, 0.20816802978515625, 0.2196044921875, 0.23104095458984375, 0.2424774169921875, 0.25391387939453125, 0.265350341796875, 0.27678680419921875, 0.2882232666015625, 0.29965972900390625, 0.31109619140625, 0.32253265380859375, 0.3339691162109375, 0.34540557861328125, 0.356842041015625, 0.36827850341796875, 0.3797149658203125, 0.39115142822265625, 0.402587890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 5.0, 8.0, 15.0, 3.0, 16.0, 10.0, 14.0, 20.0, 18.0, 15.0, 29.0, 24.0, 34.0, 30.0, 36.0, 43.0, 36.0, 48.0, 48.0, 53.0, 50.0, 34.0, 43.0, 50.0, 39.0, 29.0, 36.0, 28.0, 30.0, 24.0, 15.0, 14.0, 18.0, 23.0, 17.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.344482421875, -0.3341560363769531, -0.32382965087890625, -0.3135032653808594, -0.3031768798828125, -0.2928504943847656, -0.28252410888671875, -0.2721977233886719, -0.261871337890625, -0.2515449523925781, -0.24121856689453125, -0.23089218139648438, -0.2205657958984375, -0.21023941040039062, -0.19991302490234375, -0.18958663940429688, -0.17926025390625, -0.16893386840820312, -0.15860748291015625, -0.14828109741210938, -0.1379547119140625, -0.12762832641601562, -0.11730194091796875, -0.10697555541992188, -0.096649169921875, -0.08632278442382812, -0.07599639892578125, -0.06567001342773438, -0.0553436279296875, -0.045017242431640625, -0.03469085693359375, -0.024364471435546875, -0.0140380859375, -0.003711700439453125, 0.00661468505859375, 0.016941070556640625, 0.0272674560546875, 0.037593841552734375, 0.04792022705078125, 0.058246612548828125, 0.068572998046875, 0.07889938354492188, 0.08922576904296875, 0.09955215454101562, 0.1098785400390625, 0.12020492553710938, 0.13053131103515625, 0.14085769653320312, 0.15118408203125, 0.16151046752929688, 0.17183685302734375, 0.18216323852539062, 0.1924896240234375, 0.20281600952148438, 0.21314239501953125, 0.22346878051757812, 0.233795166015625, 0.24412155151367188, 0.25444793701171875, 0.2647743225097656, 0.2751007080078125, 0.2854270935058594, 0.29575347900390625, 0.3060798645019531, 0.31640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 12.0, 1.0, 12.0, 14.0, 10.0, 33.0, 42.0, 46.0, 100.0, 127.0, 205.0, 347.0, 626.0, 1289.0, 2791.0, 7116.0, 23598.0, 119434.0, 516269.0, 300482.0, 54477.0, 13049.0, 4461.0, 1869.0, 954.0, 475.0, 261.0, 175.0, 97.0, 62.0, 29.0, 33.0, 24.0, 8.0, 8.0, 6.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.18505859375, -0.17923355102539062, -0.17340850830078125, -0.16758346557617188, -0.1617584228515625, -0.15593338012695312, -0.15010833740234375, -0.14428329467773438, -0.138458251953125, -0.13263320922851562, -0.12680816650390625, -0.12098312377929688, -0.1151580810546875, -0.10933303833007812, -0.10350799560546875, -0.09768295288085938, -0.09185791015625, -0.08603286743164062, -0.08020782470703125, -0.07438278198242188, -0.0685577392578125, -0.06273269653320312, -0.05690765380859375, -0.051082611083984375, -0.045257568359375, -0.039432525634765625, -0.03360748291015625, -0.027782440185546875, -0.0219573974609375, -0.016132354736328125, -0.01030731201171875, -0.004482269287109375, 0.0013427734375, 0.007167816162109375, 0.01299285888671875, 0.018817901611328125, 0.0246429443359375, 0.030467987060546875, 0.03629302978515625, 0.042118072509765625, 0.047943115234375, 0.053768157958984375, 0.05959320068359375, 0.06541824340820312, 0.0712432861328125, 0.07706832885742188, 0.08289337158203125, 0.08871841430664062, 0.09454345703125, 0.10036849975585938, 0.10619354248046875, 0.11201858520507812, 0.1178436279296875, 0.12366867065429688, 0.12949371337890625, 0.13531875610351562, 0.141143798828125, 0.14696884155273438, 0.15279388427734375, 0.15861892700195312, 0.1644439697265625, 0.17026901245117188, 0.17609405517578125, 0.18191909790039062, 0.187744140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 6.0, 12.0, 12.0, 17.0, 24.0, 23.0, 26.0, 32.0, 43.0, 55.0, 55.0, 67.0, 76.0, 59.0, 62.0, 76.0, 60.0, 46.0, 47.0, 38.0, 42.0, 26.0, 18.0, 12.0, 13.0, 10.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.11679458618164e-05, -6.905663758516312e-05, -6.694532930850983e-05, -6.483402103185654e-05, -6.272271275520325e-05, -6.061140447854996e-05, -5.850009620189667e-05, -5.638878792524338e-05, -5.427747964859009e-05, -5.21661713719368e-05, -5.005486309528351e-05, -4.794355481863022e-05, -4.583224654197693e-05, -4.372093826532364e-05, -4.160962998867035e-05, -3.949832171201706e-05, -3.738701343536377e-05, -3.527570515871048e-05, -3.316439688205719e-05, -3.10530886054039e-05, -2.894178032875061e-05, -2.683047205209732e-05, -2.471916377544403e-05, -2.260785549879074e-05, -2.049654722213745e-05, -1.838523894548416e-05, -1.627393066883087e-05, -1.4162622392177582e-05, -1.2051314115524292e-05, -9.940005838871002e-06, -7.828697562217712e-06, -5.717389285564423e-06, -3.606081008911133e-06, -1.494772732257843e-06, 6.165355443954468e-07, 2.7278438210487366e-06, 4.839152097702026e-06, 6.950460374355316e-06, 9.061768651008606e-06, 1.1173076927661896e-05, 1.3284385204315186e-05, 1.5395693480968475e-05, 1.7507001757621765e-05, 1.9618310034275055e-05, 2.1729618310928345e-05, 2.3840926587581635e-05, 2.5952234864234924e-05, 2.8063543140888214e-05, 3.0174851417541504e-05, 3.2286159694194794e-05, 3.4397467970848083e-05, 3.650877624750137e-05, 3.862008452415466e-05, 4.073139280080795e-05, 4.284270107746124e-05, 4.495400935411453e-05, 4.706531763076782e-05, 4.917662590742111e-05, 5.12879341840744e-05, 5.339924246072769e-05, 5.551055073738098e-05, 5.762185901403427e-05, 5.973316729068756e-05, 6.184447556734085e-05, 6.395578384399414e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 6.0, 13.0, 12.0, 15.0, 29.0, 43.0, 58.0, 109.0, 195.0, 331.0, 707.0, 1652.0, 4507.0, 16301.0, 97994.0, 599505.0, 278869.0, 35457.0, 7953.0, 2649.0, 1023.0, 496.0, 245.0, 133.0, 88.0, 61.0, 31.0, 15.0, 16.0, 7.0, 5.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21728515625, -0.21043968200683594, -0.20359420776367188, -0.1967487335205078, -0.18990325927734375, -0.1830577850341797, -0.17621231079101562, -0.16936683654785156, -0.1625213623046875, -0.15567588806152344, -0.14883041381835938, -0.1419849395751953, -0.13513946533203125, -0.1282939910888672, -0.12144851684570312, -0.11460304260253906, -0.107757568359375, -0.10091209411621094, -0.09406661987304688, -0.08722114562988281, -0.08037567138671875, -0.07353019714355469, -0.06668472290039062, -0.05983924865722656, -0.0529937744140625, -0.04614830017089844, -0.039302825927734375, -0.03245735168457031, -0.02561187744140625, -0.018766403198242188, -0.011920928955078125, -0.0050754547119140625, 0.00177001953125, 0.008615493774414062, 0.015460968017578125, 0.022306442260742188, 0.02915191650390625, 0.03599739074707031, 0.042842864990234375, 0.04968833923339844, 0.0565338134765625, 0.06337928771972656, 0.07022476196289062, 0.07707023620605469, 0.08391571044921875, 0.09076118469238281, 0.09760665893554688, 0.10445213317871094, 0.111297607421875, 0.11814308166503906, 0.12498855590820312, 0.1318340301513672, 0.13867950439453125, 0.1455249786376953, 0.15237045288085938, 0.15921592712402344, 0.1660614013671875, 0.17290687561035156, 0.17975234985351562, 0.1865978240966797, 0.19344329833984375, 0.2002887725830078, 0.20713424682617188, 0.21397972106933594, 0.2208251953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 4.0, 8.0, 6.0, 10.0, 22.0, 32.0, 34.0, 63.0, 80.0, 93.0, 108.0, 117.0, 103.0, 82.0, 58.0, 56.0, 34.0, 27.0, 19.0, 12.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155029296875, -0.148895263671875, -0.14276123046875, -0.136627197265625, -0.1304931640625, -0.124359130859375, -0.11822509765625, -0.112091064453125, -0.10595703125, -0.099822998046875, -0.09368896484375, -0.087554931640625, -0.0814208984375, -0.075286865234375, -0.06915283203125, -0.063018798828125, -0.056884765625, -0.050750732421875, -0.04461669921875, -0.038482666015625, -0.0323486328125, -0.026214599609375, -0.02008056640625, -0.013946533203125, -0.0078125, -0.001678466796875, 0.00445556640625, 0.010589599609375, 0.0167236328125, 0.022857666015625, 0.02899169921875, 0.035125732421875, 0.041259765625, 0.047393798828125, 0.05352783203125, 0.059661865234375, 0.0657958984375, 0.071929931640625, 0.07806396484375, 0.084197998046875, 0.09033203125, 0.096466064453125, 0.10260009765625, 0.108734130859375, 0.1148681640625, 0.121002197265625, 0.12713623046875, 0.133270263671875, 0.139404296875, 0.145538330078125, 0.15167236328125, 0.157806396484375, 0.1639404296875, 0.170074462890625, 0.17620849609375, 0.182342529296875, 0.1884765625, 0.194610595703125, 0.20074462890625, 0.206878662109375, 0.2130126953125, 0.219146728515625, 0.22528076171875, 0.231414794921875, 0.237548828125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 11.0, 16.0, 23.0, 38.0, 61.0, 86.0, 83.0, 124.0, 105.0, 112.0, 104.0, 85.0, 41.0, 34.0, 29.0, 18.0, 6.0, 7.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.481602907180786, -2.4121639728546143, -2.3427250385284424, -2.2732861042022705, -2.2038471698760986, -2.1344079971313477, -2.064969062805176, -1.9955302476882935, -1.926091194152832, -1.8566522598266602, -1.7872133255004883, -1.7177743911743164, -1.648335337638855, -1.578896403312683, -1.5094574689865112, -1.4400185346603394, -1.3705796003341675, -1.3011406660079956, -1.2317017316818237, -1.1622626781463623, -1.0928237438201904, -1.0233848094940186, -0.9539458751678467, -0.8845069408416748, -0.8150679469108582, -0.7456290125846863, -0.6761900186538696, -0.6067510843276978, -0.5373121500015259, -0.46787315607070923, -0.39843422174453735, -0.3289952576160431, -0.25955629348754883, -0.19011732935905457, -0.1206783801317215, -0.05123943090438843, 0.018199533224105835, 0.0876384973526001, 0.15707743167877197, 0.22651639580726624, 0.2959553599357605, 0.36539432406425476, 0.434833288192749, 0.5042722225189209, 0.5737111568450928, 0.6431501507759094, 0.7125890851020813, 0.782028079032898, 0.8514670133590698, 0.9209059476852417, 0.9903449416160583, 1.059783935546875, 1.1292228698730469, 1.1986618041992188, 1.2681007385253906, 1.3375396728515625, 1.4069786071777344, 1.4764175415039062, 1.5458564758300781, 1.61529541015625, 1.6847344636917114, 1.7541733980178833, 1.8236123323440552, 1.893051266670227, 1.9624903202056885]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 7.0, 6.0, 6.0, 14.0, 18.0, 17.0, 20.0, 29.0, 24.0, 32.0, 27.0, 31.0, 33.0, 48.0, 49.0, 35.0, 45.0, 49.0, 47.0, 43.0, 48.0, 35.0, 55.0, 34.0, 36.0, 31.0, 34.0, 25.0, 11.0, 21.0, 21.0, 11.0, 14.0, 9.0, 7.0, 9.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.795438528060913, -1.7371033430099487, -1.6787681579589844, -1.62043297290802, -1.5620977878570557, -1.5037624835968018, -1.445427417755127, -1.387092113494873, -1.3287569284439087, -1.2704217433929443, -1.21208655834198, -1.1537513732910156, -1.0954161882400513, -1.037081003189087, -0.9787457585334778, -0.9204105138778687, -0.8620753884315491, -0.8037402033805847, -0.7454050183296204, -0.6870697736740112, -0.6287345886230469, -0.5703994035720825, -0.5120642185211182, -0.4537290036678314, -0.39539381861686707, -0.3370586335659027, -0.27872341871261597, -0.2203882336616516, -0.16205303370952606, -0.10371783375740051, -0.04538264870643616, 0.012952566146850586, 0.07128775119781494, 0.1296229511499405, 0.18795815110206604, 0.2462933361530304, 0.30462855100631714, 0.3629637360572815, 0.42129892110824585, 0.4796341359615326, 0.5379693508148193, 0.5963045358657837, 0.654639720916748, 0.7129749059677124, 0.7713101506233215, 0.8296453356742859, 0.8879805207252502, 0.9463157653808594, 1.0046508312225342, 1.0629860162734985, 1.121321201324463, 1.1796563863754272, 1.2379915714263916, 1.2963268756866455, 1.3546619415283203, 1.4129972457885742, 1.4713324308395386, 1.529667615890503, 1.5880028009414673, 1.6463379859924316, 1.704673171043396, 1.7630083560943604, 1.8213436603546143, 1.8796788454055786, 1.938014030456543]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 13.0, 21.0, 15.0, 34.0, 24.0, 44.0, 59.0, 82.0, 104.0, 154.0, 216.0, 330.0, 494.0, 680.0, 974.0, 1467.0, 2337.0, 4004.0, 7228.0, 14993.0, 40464.0, 260288.0, 3743869.0, 71913.0, 21323.0, 9543.0, 4973.0, 2980.0, 1764.0, 1197.0, 775.0, 530.0, 407.0, 267.0, 189.0, 144.0, 91.0, 78.0, 50.0, 39.0, 28.0, 24.0, 18.0, 17.0, 9.0, 11.0, 4.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0], "bins": [-0.2125244140625, -0.20592498779296875, -0.1993255615234375, -0.19272613525390625, -0.186126708984375, -0.17952728271484375, -0.1729278564453125, -0.16632843017578125, -0.15972900390625, -0.15312957763671875, -0.1465301513671875, -0.13993072509765625, -0.133331298828125, -0.12673187255859375, -0.1201324462890625, -0.11353302001953125, -0.10693359375, -0.10033416748046875, -0.0937347412109375, -0.08713531494140625, -0.080535888671875, -0.07393646240234375, -0.0673370361328125, -0.06073760986328125, -0.05413818359375, -0.04753875732421875, -0.0409393310546875, -0.03433990478515625, -0.027740478515625, -0.02114105224609375, -0.0145416259765625, -0.00794219970703125, -0.0013427734375, 0.00525665283203125, 0.0118560791015625, 0.01845550537109375, 0.025054931640625, 0.03165435791015625, 0.0382537841796875, 0.04485321044921875, 0.05145263671875, 0.05805206298828125, 0.0646514892578125, 0.07125091552734375, 0.077850341796875, 0.08444976806640625, 0.0910491943359375, 0.09764862060546875, 0.104248046875, 0.11084747314453125, 0.1174468994140625, 0.12404632568359375, 0.130645751953125, 0.13724517822265625, 0.1438446044921875, 0.15044403076171875, 0.15704345703125, 0.16364288330078125, 0.1702423095703125, 0.17684173583984375, 0.183441162109375, 0.19004058837890625, 0.1966400146484375, 0.20323944091796875, 0.2098388671875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 12.0, 6.0, 5.0, 6.0, 9.0, 10.0, 11.0, 18.0, 9.0, 21.0, 20.0, 25.0, 19.0, 33.0, 27.0, 47.0, 32.0, 42.0, 40.0, 49.0, 53.0, 41.0, 46.0, 53.0, 29.0, 33.0, 35.0, 38.0, 36.0, 32.0, 25.0, 23.0, 26.0, 21.0, 12.0, 9.0, 15.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06488037109375, -0.06279945373535156, -0.060718536376953125, -0.05863761901855469, -0.05655670166015625, -0.05447578430175781, -0.052394866943359375, -0.05031394958496094, -0.0482330322265625, -0.04615211486816406, -0.044071197509765625, -0.04199028015136719, -0.03990936279296875, -0.03782844543457031, -0.035747528076171875, -0.03366661071777344, -0.031585693359375, -0.029504776000976562, -0.027423858642578125, -0.025342941284179688, -0.02326202392578125, -0.021181106567382812, -0.019100189208984375, -0.017019271850585938, -0.0149383544921875, -0.012857437133789062, -0.010776519775390625, -0.008695602416992188, -0.00661468505859375, -0.0045337677001953125, -0.002452850341796875, -0.0003719329833984375, 0.001708984375, 0.0037899017333984375, 0.005870819091796875, 0.007951736450195312, 0.01003265380859375, 0.012113571166992188, 0.014194488525390625, 0.016275405883789062, 0.0183563232421875, 0.020437240600585938, 0.022518157958984375, 0.024599075317382812, 0.02667999267578125, 0.028760910034179688, 0.030841827392578125, 0.03292274475097656, 0.035003662109375, 0.03708457946777344, 0.039165496826171875, 0.04124641418457031, 0.04332733154296875, 0.04540824890136719, 0.047489166259765625, 0.04957008361816406, 0.0516510009765625, 0.05373191833496094, 0.055812835693359375, 0.05789375305175781, 0.05997467041015625, 0.06205558776855469, 0.06413650512695312, 0.06621742248535156, 0.06829833984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 8.0, 8.0, 16.0, 16.0, 32.0, 22.0, 30.0, 50.0, 53.0, 73.0, 93.0, 136.0, 205.0, 273.0, 410.0, 658.0, 1113.0, 2492.0, 6826.0, 38394.0, 3937090.0, 183114.0, 14816.0, 3929.0, 1739.0, 956.0, 538.0, 356.0, 235.0, 173.0, 105.0, 69.0, 55.0, 44.0, 41.0, 30.0, 20.0, 16.0, 8.0, 3.0, 6.0, 6.0, 4.0, 3.0, 3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58251953125, -0.5635833740234375, -0.544647216796875, -0.5257110595703125, -0.50677490234375, -0.4878387451171875, -0.468902587890625, -0.4499664306640625, -0.4310302734375, -0.4120941162109375, -0.393157958984375, -0.3742218017578125, -0.35528564453125, -0.3363494873046875, -0.317413330078125, -0.2984771728515625, -0.279541015625, -0.2606048583984375, -0.241668701171875, -0.2227325439453125, -0.20379638671875, -0.1848602294921875, -0.165924072265625, -0.1469879150390625, -0.1280517578125, -0.1091156005859375, -0.090179443359375, -0.0712432861328125, -0.05230712890625, -0.0333709716796875, -0.014434814453125, 0.0045013427734375, 0.0234375, 0.0423736572265625, 0.061309814453125, 0.0802459716796875, 0.09918212890625, 0.1181182861328125, 0.137054443359375, 0.1559906005859375, 0.1749267578125, 0.1938629150390625, 0.212799072265625, 0.2317352294921875, 0.25067138671875, 0.2696075439453125, 0.288543701171875, 0.3074798583984375, 0.326416015625, 0.3453521728515625, 0.364288330078125, 0.3832244873046875, 0.40216064453125, 0.4210968017578125, 0.440032958984375, 0.4589691162109375, 0.4779052734375, 0.4968414306640625, 0.515777587890625, 0.5347137451171875, 0.55364990234375, 0.5725860595703125, 0.591522216796875, 0.6104583740234375, 0.62939453125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 7.0, 4.0, 19.0, 46.0, 133.0, 3339.0, 385.0, 96.0, 20.0, 9.0, 11.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26171875, -0.2558755874633789, -0.2500324249267578, -0.24418926239013672, -0.23834609985351562, -0.23250293731689453, -0.22665977478027344, -0.22081661224365234, -0.21497344970703125, -0.20913028717041016, -0.20328712463378906, -0.19744396209716797, -0.19160079956054688, -0.18575763702392578, -0.1799144744873047, -0.1740713119506836, -0.1682281494140625, -0.1623849868774414, -0.1565418243408203, -0.15069866180419922, -0.14485549926757812, -0.13901233673095703, -0.13316917419433594, -0.12732601165771484, -0.12148284912109375, -0.11563968658447266, -0.10979652404785156, -0.10395336151123047, -0.09811019897460938, -0.09226703643798828, -0.08642387390136719, -0.0805807113647461, -0.074737548828125, -0.0688943862915039, -0.06305122375488281, -0.05720806121826172, -0.051364898681640625, -0.04552173614501953, -0.03967857360839844, -0.033835411071777344, -0.02799224853515625, -0.022149085998535156, -0.016305923461914062, -0.010462760925292969, -0.004619598388671875, 0.0012235641479492188, 0.0070667266845703125, 0.012909889221191406, 0.0187530517578125, 0.024596214294433594, 0.030439376831054688, 0.03628253936767578, 0.042125701904296875, 0.04796886444091797, 0.05381202697753906, 0.059655189514160156, 0.06549835205078125, 0.07134151458740234, 0.07718467712402344, 0.08302783966064453, 0.08887100219726562, 0.09471416473388672, 0.10055732727050781, 0.1064004898071289, 0.11224365234375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 5.0, 9.0, 12.0, 13.0, 23.0, 65.0, 59.0, 65.0, 58.0, 90.0, 106.0, 110.0, 95.0, 73.0, 66.0, 53.0, 26.0, 21.0, 11.0, 11.0, 9.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.25623372197151184, -0.24541980028152466, -0.23460589349269867, -0.2237919718027115, -0.2129780650138855, -0.20216414332389832, -0.19135022163391113, -0.18053629994392395, -0.16972239315509796, -0.15890847146511078, -0.1480945646762848, -0.1372806429862976, -0.12646672129631042, -0.11565281450748444, -0.10483889281749725, -0.09402497857809067, -0.08321106433868408, -0.0723971500992775, -0.06158323213458061, -0.05076931416988373, -0.03995539993047714, -0.029141485691070557, -0.018327564001083374, -0.007513649761676788, 0.0033002644777297974, 0.014114180579781532, 0.024928096681833267, 0.03574201464653015, 0.04655592888593674, 0.05736984312534332, 0.0681837648153305, 0.07899767905473709, 0.08981156349182129, 0.10062547773122787, 0.11143939197063446, 0.12225331366062164, 0.13306722044944763, 0.14388114213943481, 0.154695063829422, 0.16550898551940918, 0.17632289230823517, 0.18713681399822235, 0.19795072078704834, 0.20876464247703552, 0.2195785641670227, 0.2303924709558487, 0.24120639264583588, 0.25202029943466187, 0.26283422112464905, 0.27364814281463623, 0.2844620645046234, 0.2952759861946106, 0.3060898780822754, 0.3169037997722626, 0.32771772146224976, 0.33853164315223694, 0.3493455648422241, 0.3601594865322113, 0.3709734082221985, 0.3817873001098633, 0.39260122179985046, 0.40341514348983765, 0.41422906517982483, 0.425042986869812, 0.4358568787574768]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 12.0, 5.0, 8.0, 8.0, 11.0, 11.0, 17.0, 19.0, 22.0, 19.0, 24.0, 26.0, 24.0, 21.0, 29.0, 35.0, 36.0, 39.0, 33.0, 41.0, 34.0, 38.0, 38.0, 39.0, 34.0, 29.0, 34.0, 36.0, 40.0, 21.0, 23.0, 27.0, 22.0, 14.0, 23.0, 12.0, 14.0, 18.0, 11.0, 11.0, 11.0, 5.0, 10.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.2018650770187378, -0.19580957293510437, -0.18975405395030975, -0.18369854986667633, -0.1776430308818817, -0.1715875267982483, -0.16553202271461487, -0.15947651863098145, -0.15342099964618683, -0.1473654955625534, -0.1413099765777588, -0.13525447249412537, -0.12919896841049194, -0.12314344942569733, -0.1170879453420639, -0.11103243380784988, -0.10497692227363586, -0.09892141073942184, -0.09286589920520782, -0.0868103951215744, -0.08075488358736038, -0.07469937205314636, -0.06864386796951294, -0.06258835643529892, -0.0565328449010849, -0.05047733336687088, -0.04442182555794716, -0.03836631774902344, -0.03231080621480942, -0.026255296543240547, -0.020199786871671677, -0.014144279062747955, -0.008088767528533936, -0.002033257856965065, 0.0040222518146038055, 0.010077761486172676, 0.016133271157741547, 0.022188780829310417, 0.028244290500879288, 0.03429979830980301, 0.04035530984401703, 0.04641082137823105, 0.05246632918715477, 0.05852183699607849, 0.06457734853029251, 0.07063286006450653, 0.07668836414813995, 0.08274387568235397, 0.088799387216568, 0.09485489875078201, 0.10091041028499603, 0.10696591436862946, 0.11302142590284348, 0.1190769374370575, 0.12513244152069092, 0.13118794560432434, 0.13724346458911896, 0.14329896867275238, 0.149354487657547, 0.15540999174118042, 0.16146549582481384, 0.16752101480960846, 0.17357651889324188, 0.1796320378780365, 0.18568754196166992]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 12.0, 7.0, 13.0, 12.0, 15.0, 29.0, 34.0, 69.0, 128.0, 246.0, 381.0, 741.0, 1380.0, 3023.0, 6265.0, 13289.0, 28625.0, 61810.0, 126473.0, 219902.0, 250813.0, 169439.0, 87982.0, 41475.0, 19024.0, 8781.0, 4197.0, 2076.0, 1036.0, 521.0, 305.0, 182.0, 84.0, 61.0, 28.0, 14.0, 14.0, 9.0, 8.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.1739501953125, -0.1687164306640625, -0.163482666015625, -0.1582489013671875, -0.15301513671875, -0.1477813720703125, -0.142547607421875, -0.1373138427734375, -0.132080078125, -0.1268463134765625, -0.121612548828125, -0.1163787841796875, -0.11114501953125, -0.1059112548828125, -0.100677490234375, -0.0954437255859375, -0.0902099609375, -0.0849761962890625, -0.079742431640625, -0.0745086669921875, -0.06927490234375, -0.0640411376953125, -0.058807373046875, -0.0535736083984375, -0.04833984375, -0.0431060791015625, -0.037872314453125, -0.0326385498046875, -0.02740478515625, -0.0221710205078125, -0.016937255859375, -0.0117034912109375, -0.0064697265625, -0.0012359619140625, 0.003997802734375, 0.0092315673828125, 0.01446533203125, 0.0196990966796875, 0.024932861328125, 0.0301666259765625, 0.035400390625, 0.0406341552734375, 0.045867919921875, 0.0511016845703125, 0.05633544921875, 0.0615692138671875, 0.066802978515625, 0.0720367431640625, 0.0772705078125, 0.0825042724609375, 0.087738037109375, 0.0929718017578125, 0.09820556640625, 0.1034393310546875, 0.108673095703125, 0.1139068603515625, 0.119140625, 0.1243743896484375, 0.129608154296875, 0.1348419189453125, 0.14007568359375, 0.1453094482421875, 0.150543212890625, 0.1557769775390625, 0.1610107421875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 4.0, 9.0, 11.0, 12.0, 6.0, 12.0, 9.0, 21.0, 27.0, 20.0, 19.0, 19.0, 23.0, 29.0, 41.0, 26.0, 38.0, 35.0, 30.0, 52.0, 36.0, 34.0, 39.0, 49.0, 40.0, 31.0, 38.0, 34.0, 29.0, 29.0, 28.0, 31.0, 21.0, 16.0, 25.0, 13.0, 14.0, 9.0, 4.0, 6.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.07330322265625, -0.07108592987060547, -0.06886863708496094, -0.0666513442993164, -0.06443405151367188, -0.062216758728027344, -0.05999946594238281, -0.05778217315673828, -0.05556488037109375, -0.05334758758544922, -0.05113029479980469, -0.048913002014160156, -0.046695709228515625, -0.044478416442871094, -0.04226112365722656, -0.04004383087158203, -0.0378265380859375, -0.03560924530029297, -0.03339195251464844, -0.031174659729003906, -0.028957366943359375, -0.026740074157714844, -0.024522781372070312, -0.02230548858642578, -0.02008819580078125, -0.01787090301513672, -0.015653610229492188, -0.013436317443847656, -0.011219024658203125, -0.009001731872558594, -0.0067844390869140625, -0.004567146301269531, -0.002349853515625, -0.00013256072998046875, 0.0020847320556640625, 0.004302024841308594, 0.006519317626953125, 0.008736610412597656, 0.010953903198242188, 0.013171195983886719, 0.01538848876953125, 0.01760578155517578, 0.019823074340820312, 0.022040367126464844, 0.024257659912109375, 0.026474952697753906, 0.028692245483398438, 0.03090953826904297, 0.0331268310546875, 0.03534412384033203, 0.03756141662597656, 0.039778709411621094, 0.041996002197265625, 0.044213294982910156, 0.04643058776855469, 0.04864788055419922, 0.05086517333984375, 0.05308246612548828, 0.05529975891113281, 0.057517051696777344, 0.059734344482421875, 0.061951637268066406, 0.06416893005371094, 0.06638622283935547, 0.068603515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 7.0, 5.0, 13.0, 16.0, 16.0, 25.0, 32.0, 43.0, 57.0, 79.0, 107.0, 141.0, 212.0, 298.0, 523.0, 790.0, 1285.0, 2868.0, 8393.0, 34649.0, 185715.0, 563839.0, 197340.0, 36592.0, 8805.0, 3069.0, 1407.0, 728.0, 490.0, 277.0, 205.0, 125.0, 103.0, 66.0, 57.0, 46.0, 26.0, 25.0, 19.0, 9.0, 17.0, 9.0, 5.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.364013671875, -0.3531532287597656, -0.34229278564453125, -0.3314323425292969, -0.3205718994140625, -0.3097114562988281, -0.29885101318359375, -0.2879905700683594, -0.277130126953125, -0.2662696838378906, -0.25540924072265625, -0.24454879760742188, -0.2336883544921875, -0.22282791137695312, -0.21196746826171875, -0.20110702514648438, -0.19024658203125, -0.17938613891601562, -0.16852569580078125, -0.15766525268554688, -0.1468048095703125, -0.13594436645507812, -0.12508392333984375, -0.11422348022460938, -0.103363037109375, -0.09250259399414062, -0.08164215087890625, -0.07078170776367188, -0.0599212646484375, -0.049060821533203125, -0.03820037841796875, -0.027339935302734375, -0.0164794921875, -0.005619049072265625, 0.00524139404296875, 0.016101837158203125, 0.0269622802734375, 0.037822723388671875, 0.04868316650390625, 0.059543609619140625, 0.070404052734375, 0.08126449584960938, 0.09212493896484375, 0.10298538208007812, 0.1138458251953125, 0.12470626831054688, 0.13556671142578125, 0.14642715454101562, 0.15728759765625, 0.16814804077148438, 0.17900848388671875, 0.18986892700195312, 0.2007293701171875, 0.21158981323242188, 0.22245025634765625, 0.23331069946289062, 0.244171142578125, 0.2550315856933594, 0.26589202880859375, 0.2767524719238281, 0.2876129150390625, 0.2984733581542969, 0.30933380126953125, 0.3201942443847656, 0.3310546875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 5.0, 10.0, 8.0, 6.0, 12.0, 7.0, 12.0, 23.0, 27.0, 19.0, 29.0, 29.0, 24.0, 48.0, 47.0, 43.0, 35.0, 39.0, 51.0, 42.0, 39.0, 58.0, 41.0, 34.0, 46.0, 29.0, 38.0, 30.0, 28.0, 24.0, 20.0, 18.0, 16.0, 21.0, 9.0, 9.0, 10.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.392822265625, -0.37941741943359375, -0.3660125732421875, -0.35260772705078125, -0.339202880859375, -0.32579803466796875, -0.3123931884765625, -0.29898834228515625, -0.28558349609375, -0.27217864990234375, -0.2587738037109375, -0.24536895751953125, -0.231964111328125, -0.21855926513671875, -0.2051544189453125, -0.19174957275390625, -0.1783447265625, -0.16493988037109375, -0.1515350341796875, -0.13813018798828125, -0.124725341796875, -0.11132049560546875, -0.0979156494140625, -0.08451080322265625, -0.07110595703125, -0.05770111083984375, -0.0442962646484375, -0.03089141845703125, -0.017486572265625, -0.00408172607421875, 0.0093231201171875, 0.02272796630859375, 0.0361328125, 0.04953765869140625, 0.0629425048828125, 0.07634735107421875, 0.089752197265625, 0.10315704345703125, 0.1165618896484375, 0.12996673583984375, 0.14337158203125, 0.15677642822265625, 0.1701812744140625, 0.18358612060546875, 0.196990966796875, 0.21039581298828125, 0.2238006591796875, 0.23720550537109375, 0.2506103515625, 0.26401519775390625, 0.2774200439453125, 0.29082489013671875, 0.304229736328125, 0.31763458251953125, 0.3310394287109375, 0.34444427490234375, 0.35784912109375, 0.37125396728515625, 0.3846588134765625, 0.39806365966796875, 0.411468505859375, 0.42487335205078125, 0.4382781982421875, 0.45168304443359375, 0.465087890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 10.0, 9.0, 13.0, 10.0, 18.0, 18.0, 35.0, 59.0, 73.0, 101.0, 152.0, 249.0, 434.0, 837.0, 1625.0, 3400.0, 8213.0, 24460.0, 92304.0, 374199.0, 400835.0, 99532.0, 25892.0, 8657.0, 3598.0, 1695.0, 839.0, 488.0, 293.0, 178.0, 103.0, 84.0, 44.0, 38.0, 18.0, 12.0, 11.0, 5.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.14990234375, -0.14522171020507812, -0.14054107666015625, -0.13586044311523438, -0.1311798095703125, -0.12649917602539062, -0.12181854248046875, -0.11713790893554688, -0.112457275390625, -0.10777664184570312, -0.10309600830078125, -0.09841537475585938, -0.0937347412109375, -0.08905410766601562, -0.08437347412109375, -0.07969284057617188, -0.07501220703125, -0.07033157348632812, -0.06565093994140625, -0.060970306396484375, -0.0562896728515625, -0.051609039306640625, -0.04692840576171875, -0.042247772216796875, -0.037567138671875, -0.032886505126953125, -0.02820587158203125, -0.023525238037109375, -0.0188446044921875, -0.014163970947265625, -0.00948333740234375, -0.004802703857421875, -0.0001220703125, 0.004558563232421875, 0.00923919677734375, 0.013919830322265625, 0.0186004638671875, 0.023281097412109375, 0.02796173095703125, 0.032642364501953125, 0.037322998046875, 0.042003631591796875, 0.04668426513671875, 0.051364898681640625, 0.0560455322265625, 0.060726165771484375, 0.06540679931640625, 0.07008743286132812, 0.07476806640625, 0.07944869995117188, 0.08412933349609375, 0.08880996704101562, 0.0934906005859375, 0.09817123413085938, 0.10285186767578125, 0.10753250122070312, 0.112213134765625, 0.11689376831054688, 0.12157440185546875, 0.12625503540039062, 0.1309356689453125, 0.13561630249023438, 0.14029693603515625, 0.14497756958007812, 0.149658203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 4.0, 3.0, 17.0, 9.0, 9.0, 13.0, 17.0, 38.0, 18.0, 24.0, 26.0, 32.0, 34.0, 40.0, 45.0, 45.0, 49.0, 53.0, 50.0, 49.0, 50.0, 52.0, 56.0, 25.0, 43.0, 32.0, 38.0, 13.0, 23.0, 14.0, 8.0, 12.0, 8.0, 11.0, 9.0, 7.0, 9.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.0187110900878906e-05, -4.8590824007987976e-05, -4.6994537115097046e-05, -4.5398250222206116e-05, -4.3801963329315186e-05, -4.2205676436424255e-05, -4.0609389543533325e-05, -3.9013102650642395e-05, -3.7416815757751465e-05, -3.5820528864860535e-05, -3.4224241971969604e-05, -3.2627955079078674e-05, -3.1031668186187744e-05, -2.9435381293296814e-05, -2.7839094400405884e-05, -2.6242807507514954e-05, -2.4646520614624023e-05, -2.3050233721733093e-05, -2.1453946828842163e-05, -1.9857659935951233e-05, -1.8261373043060303e-05, -1.6665086150169373e-05, -1.5068799257278442e-05, -1.3472512364387512e-05, -1.1876225471496582e-05, -1.0279938578605652e-05, -8.683651685714722e-06, -7.0873647928237915e-06, -5.491077899932861e-06, -3.894791007041931e-06, -2.298504114151001e-06, -7.022172212600708e-07, 8.940696716308594e-07, 2.4903565645217896e-06, 4.08664345741272e-06, 5.68293035030365e-06, 7.27921724319458e-06, 8.87550413608551e-06, 1.047179102897644e-05, 1.206807792186737e-05, 1.36643648147583e-05, 1.526065170764923e-05, 1.685693860054016e-05, 1.845322549343109e-05, 2.004951238632202e-05, 2.164579927921295e-05, 2.3242086172103882e-05, 2.4838373064994812e-05, 2.6434659957885742e-05, 2.8030946850776672e-05, 2.9627233743667603e-05, 3.122352063655853e-05, 3.281980752944946e-05, 3.441609442234039e-05, 3.601238131523132e-05, 3.7608668208122253e-05, 3.9204955101013184e-05, 4.0801241993904114e-05, 4.2397528886795044e-05, 4.3993815779685974e-05, 4.5590102672576904e-05, 4.7186389565467834e-05, 4.8782676458358765e-05, 5.0378963351249695e-05, 5.1975250244140625e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 12.0, 14.0, 18.0, 23.0, 28.0, 56.0, 67.0, 91.0, 167.0, 270.0, 503.0, 1000.0, 2388.0, 7735.0, 38499.0, 311109.0, 579998.0, 86304.0, 13712.0, 3615.0, 1350.0, 669.0, 340.0, 201.0, 122.0, 70.0, 50.0, 32.0, 35.0, 20.0, 22.0, 9.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1832275390625, -0.17695236206054688, -0.17067718505859375, -0.16440200805664062, -0.1581268310546875, -0.15185165405273438, -0.14557647705078125, -0.13930130004882812, -0.133026123046875, -0.12675094604492188, -0.12047576904296875, -0.11420059204101562, -0.1079254150390625, -0.10165023803710938, -0.09537506103515625, -0.08909988403320312, -0.08282470703125, -0.07654953002929688, -0.07027435302734375, -0.06399917602539062, -0.0577239990234375, -0.051448822021484375, -0.04517364501953125, -0.038898468017578125, -0.032623291015625, -0.026348114013671875, -0.02007293701171875, -0.013797760009765625, -0.0075225830078125, -0.001247406005859375, 0.00502777099609375, 0.011302947998046875, 0.017578125, 0.023853302001953125, 0.03012847900390625, 0.036403656005859375, 0.0426788330078125, 0.048954010009765625, 0.05522918701171875, 0.061504364013671875, 0.067779541015625, 0.07405471801757812, 0.08032989501953125, 0.08660507202148438, 0.0928802490234375, 0.09915542602539062, 0.10543060302734375, 0.11170578002929688, 0.11798095703125, 0.12425613403320312, 0.13053131103515625, 0.13680648803710938, 0.1430816650390625, 0.14935684204101562, 0.15563201904296875, 0.16190719604492188, 0.168182373046875, 0.17445755004882812, 0.18073272705078125, 0.18700790405273438, 0.1932830810546875, 0.19955825805664062, 0.20583343505859375, 0.21210861206054688, 0.2183837890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 7.0, 9.0, 9.0, 20.0, 16.0, 27.0, 29.0, 45.0, 52.0, 73.0, 72.0, 82.0, 94.0, 78.0, 79.0, 64.0, 44.0, 52.0, 33.0, 27.0, 17.0, 16.0, 14.0, 15.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166015625, -0.16053009033203125, -0.1550445556640625, -0.14955902099609375, -0.144073486328125, -0.13858795166015625, -0.1331024169921875, -0.12761688232421875, -0.12213134765625, -0.11664581298828125, -0.1111602783203125, -0.10567474365234375, -0.100189208984375, -0.09470367431640625, -0.0892181396484375, -0.08373260498046875, -0.0782470703125, -0.07276153564453125, -0.0672760009765625, -0.06179046630859375, -0.056304931640625, -0.05081939697265625, -0.0453338623046875, -0.03984832763671875, -0.03436279296875, -0.02887725830078125, -0.0233917236328125, -0.01790618896484375, -0.012420654296875, -0.00693511962890625, -0.0014495849609375, 0.00403594970703125, 0.009521484375, 0.01500701904296875, 0.0204925537109375, 0.02597808837890625, 0.031463623046875, 0.03694915771484375, 0.0424346923828125, 0.04792022705078125, 0.05340576171875, 0.05889129638671875, 0.0643768310546875, 0.06986236572265625, 0.075347900390625, 0.08083343505859375, 0.0863189697265625, 0.09180450439453125, 0.0972900390625, 0.10277557373046875, 0.1082611083984375, 0.11374664306640625, 0.119232177734375, 0.12471771240234375, 0.1302032470703125, 0.13568878173828125, 0.14117431640625, 0.14665985107421875, 0.1521453857421875, 0.15763092041015625, 0.163116455078125, 0.16860198974609375, 0.1740875244140625, 0.17957305908203125, 0.18505859375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 10.0, 31.0, 50.0, 106.0, 143.0, 188.0, 171.0, 140.0, 88.0, 44.0, 14.0, 8.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.472292900085449, -2.3467941284179688, -2.2212953567504883, -2.095796585083008, -1.970297932624817, -1.8447991609573364, -1.7193005084991455, -1.593801736831665, -1.4683029651641846, -1.342804193496704, -1.2173054218292236, -1.0918067693710327, -0.9663079977035522, -0.8408092260360718, -0.7153105139732361, -0.5898118019104004, -0.4643130302429199, -0.33881428837776184, -0.21331554651260376, -0.08781680464744568, 0.0376819372177124, 0.16318070888519287, 0.28867942094802856, 0.41417813301086426, 0.5396769046783447, 0.6651756763458252, 0.7906743884086609, 0.9161731004714966, 1.041671872138977, 1.1671706438064575, 1.2926692962646484, 1.418168067932129, 1.5436668395996094, 1.6691656112670898, 1.7946643829345703, 1.9201630353927612, 2.0456619262695312, 2.1711606979370117, 2.296659231185913, 2.4221580028533936, 2.547656774520874, 2.6731555461883545, 2.798654317855835, 2.9241530895233154, 3.049651622772217, 3.1751503944396973, 3.3006491661071777, 3.426147937774658, 3.5516467094421387, 3.677145481109619, 3.8026442527770996, 3.92814302444458, 4.0536417961120605, 4.179140567779541, 4.3046393394470215, 4.430137634277344, 4.555636405944824, 4.681135177612305, 4.806633949279785, 4.932132720947266, 5.057631492614746, 5.183130264282227, 5.308629035949707, 5.4341278076171875, 5.559626579284668]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 7.0, 5.0, 14.0, 14.0, 16.0, 21.0, 21.0, 25.0, 28.0, 33.0, 35.0, 38.0, 35.0, 33.0, 53.0, 44.0, 60.0, 52.0, 49.0, 48.0, 43.0, 34.0, 42.0, 38.0, 24.0, 30.0, 20.0, 22.0, 17.0, 15.0, 17.0, 14.0, 6.0, 8.0, 2.0, 3.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.229708671569824, -2.1599161624908447, -2.0901236534118652, -2.0203311443328857, -1.9505386352539062, -1.8807461261749268, -1.8109536170959473, -1.7411611080169678, -1.6713685989379883, -1.6015760898590088, -1.5317835807800293, -1.4619910717010498, -1.3921985626220703, -1.3224060535430908, -1.2526135444641113, -1.1828210353851318, -1.113028645515442, -1.0432361364364624, -0.9734436273574829, -0.9036511182785034, -0.8338586091995239, -0.7640661001205444, -0.6942736506462097, -0.6244811415672302, -0.5546886324882507, -0.48489612340927124, -0.41510361433029175, -0.34531113505363464, -0.27551862597465515, -0.20572611689567566, -0.13593363761901855, -0.06614112854003906, 0.0036513805389404297, 0.07344388216733932, 0.14323638379573822, 0.21302887797355652, 0.282821387052536, 0.3526138961315155, 0.4224063754081726, 0.4921988844871521, 0.5619913935661316, 0.6317839026451111, 0.7015764117240906, 0.7713688611984253, 0.8411613702774048, 0.9109538793563843, 0.9807463884353638, 1.0505388975143433, 1.1203314065933228, 1.1901239156723022, 1.2599164247512817, 1.3297089338302612, 1.3995014429092407, 1.4692939519882202, 1.5390863418579102, 1.6088788509368896, 1.6786713600158691, 1.7484638690948486, 1.8182563781738281, 1.8880488872528076, 1.957841396331787, 2.0276339054107666, 2.097426414489746, 2.1672189235687256, 2.237011432647705]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 9.0, 13.0, 19.0, 37.0, 53.0, 88.0, 110.0, 259.0, 406.0, 682.0, 1164.0, 1979.0, 3813.0, 7517.0, 18462.0, 74654.0, 3864265.0, 171732.0, 28420.0, 9999.0, 4644.0, 2517.0, 1395.0, 821.0, 471.0, 299.0, 157.0, 111.0, 59.0, 39.0, 33.0, 21.0, 12.0, 6.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294921875, -0.285614013671875, -0.27630615234375, -0.266998291015625, -0.2576904296875, -0.248382568359375, -0.23907470703125, -0.229766845703125, -0.220458984375, -0.211151123046875, -0.20184326171875, -0.192535400390625, -0.1832275390625, -0.173919677734375, -0.16461181640625, -0.155303955078125, -0.14599609375, -0.136688232421875, -0.12738037109375, -0.118072509765625, -0.1087646484375, -0.099456787109375, -0.09014892578125, -0.080841064453125, -0.071533203125, -0.062225341796875, -0.05291748046875, -0.043609619140625, -0.0343017578125, -0.024993896484375, -0.01568603515625, -0.006378173828125, 0.0029296875, 0.012237548828125, 0.02154541015625, 0.030853271484375, 0.0401611328125, 0.049468994140625, 0.05877685546875, 0.068084716796875, 0.077392578125, 0.086700439453125, 0.09600830078125, 0.105316162109375, 0.1146240234375, 0.123931884765625, 0.13323974609375, 0.142547607421875, 0.15185546875, 0.161163330078125, 0.17047119140625, 0.179779052734375, 0.1890869140625, 0.198394775390625, 0.20770263671875, 0.217010498046875, 0.226318359375, 0.235626220703125, 0.24493408203125, 0.254241943359375, 0.2635498046875, 0.272857666015625, 0.28216552734375, 0.291473388671875, 0.30078125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 10.0, 8.0, 8.0, 6.0, 12.0, 15.0, 22.0, 16.0, 26.0, 24.0, 37.0, 35.0, 32.0, 51.0, 42.0, 54.0, 50.0, 53.0, 46.0, 57.0, 55.0, 39.0, 43.0, 49.0, 36.0, 28.0, 23.0, 33.0, 9.0, 15.0, 13.0, 9.0, 10.0, 9.0, 8.0, 1.0, 3.0, 7.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10260009765625, -0.09972858428955078, -0.09685707092285156, -0.09398555755615234, -0.09111404418945312, -0.0882425308227539, -0.08537101745605469, -0.08249950408935547, -0.07962799072265625, -0.07675647735595703, -0.07388496398925781, -0.0710134506225586, -0.06814193725585938, -0.06527042388916016, -0.06239891052246094, -0.05952739715576172, -0.0566558837890625, -0.05378437042236328, -0.05091285705566406, -0.048041343688964844, -0.045169830322265625, -0.042298316955566406, -0.03942680358886719, -0.03655529022216797, -0.03368377685546875, -0.03081226348876953, -0.027940750122070312, -0.025069236755371094, -0.022197723388671875, -0.019326210021972656, -0.016454696655273438, -0.013583183288574219, -0.010711669921875, -0.007840156555175781, -0.0049686431884765625, -0.0020971298217773438, 0.000774383544921875, 0.0036458969116210938, 0.0065174102783203125, 0.009388923645019531, 0.01226043701171875, 0.015131950378417969, 0.018003463745117188, 0.020874977111816406, 0.023746490478515625, 0.026618003845214844, 0.029489517211914062, 0.03236103057861328, 0.0352325439453125, 0.03810405731201172, 0.04097557067871094, 0.043847084045410156, 0.046718597412109375, 0.049590110778808594, 0.05246162414550781, 0.05533313751220703, 0.05820465087890625, 0.06107616424560547, 0.06394767761230469, 0.0668191909790039, 0.06969070434570312, 0.07256221771240234, 0.07543373107910156, 0.07830524444580078, 0.0811767578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 9.0, 20.0, 29.0, 35.0, 42.0, 65.0, 103.0, 168.0, 217.0, 337.0, 594.0, 988.0, 1800.0, 3271.0, 6528.0, 15826.0, 53264.0, 592962.0, 3418180.0, 65860.0, 18289.0, 7297.0, 3672.0, 1884.0, 1067.0, 659.0, 364.0, 247.0, 166.0, 118.0, 85.0, 47.0, 26.0, 20.0, 15.0, 9.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4052734375, -0.39434051513671875, -0.3834075927734375, -0.37247467041015625, -0.361541748046875, -0.35060882568359375, -0.3396759033203125, -0.32874298095703125, -0.31781005859375, -0.30687713623046875, -0.2959442138671875, -0.28501129150390625, -0.274078369140625, -0.26314544677734375, -0.2522125244140625, -0.24127960205078125, -0.2303466796875, -0.21941375732421875, -0.2084808349609375, -0.19754791259765625, -0.186614990234375, -0.17568206787109375, -0.1647491455078125, -0.15381622314453125, -0.14288330078125, -0.13195037841796875, -0.1210174560546875, -0.11008453369140625, -0.099151611328125, -0.08821868896484375, -0.0772857666015625, -0.06635284423828125, -0.055419921875, -0.04448699951171875, -0.0335540771484375, -0.02262115478515625, -0.011688232421875, -0.00075531005859375, 0.0101776123046875, 0.02111053466796875, 0.03204345703125, 0.04297637939453125, 0.0539093017578125, 0.06484222412109375, 0.075775146484375, 0.08670806884765625, 0.0976409912109375, 0.10857391357421875, 0.1195068359375, 0.13043975830078125, 0.1413726806640625, 0.15230560302734375, 0.163238525390625, 0.17417144775390625, 0.1851043701171875, 0.19603729248046875, 0.20697021484375, 0.21790313720703125, 0.2288360595703125, 0.23976898193359375, 0.250701904296875, 0.26163482666015625, 0.2725677490234375, 0.28350067138671875, 0.29443359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 1.0, 7.0, 10.0, 11.0, 18.0, 32.0, 48.0, 84.0, 152.0, 2473.0, 863.0, 166.0, 81.0, 32.0, 23.0, 23.0, 8.0, 7.0, 8.0, 6.0, 0.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09405517578125, -0.09080886840820312, -0.08756256103515625, -0.08431625366210938, -0.0810699462890625, -0.07782363891601562, -0.07457733154296875, -0.07133102416992188, -0.068084716796875, -0.06483840942382812, -0.06159210205078125, -0.058345794677734375, -0.0550994873046875, -0.051853179931640625, -0.04860687255859375, -0.045360565185546875, -0.0421142578125, -0.038867950439453125, -0.03562164306640625, -0.032375335693359375, -0.0291290283203125, -0.025882720947265625, -0.02263641357421875, -0.019390106201171875, -0.016143798828125, -0.012897491455078125, -0.00965118408203125, -0.006404876708984375, -0.0031585693359375, 8.7738037109375e-05, 0.00333404541015625, 0.006580352783203125, 0.00982666015625, 0.013072967529296875, 0.01631927490234375, 0.019565582275390625, 0.0228118896484375, 0.026058197021484375, 0.02930450439453125, 0.032550811767578125, 0.035797119140625, 0.039043426513671875, 0.04228973388671875, 0.045536041259765625, 0.0487823486328125, 0.052028656005859375, 0.05527496337890625, 0.058521270751953125, 0.061767578125, 0.06501388549804688, 0.06826019287109375, 0.07150650024414062, 0.0747528076171875, 0.07799911499023438, 0.08124542236328125, 0.08449172973632812, 0.087738037109375, 0.09098434448242188, 0.09423065185546875, 0.09747695922851562, 0.1007232666015625, 0.10396957397460938, 0.10721588134765625, 0.11046218872070312, 0.11370849609375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 4.0, 11.0, 9.0, 12.0, 19.0, 32.0, 47.0, 42.0, 69.0, 75.0, 103.0, 98.0, 78.0, 83.0, 67.0, 58.0, 46.0, 48.0, 32.0, 12.0, 18.0, 7.0, 5.0, 5.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342792272567749, -0.3319152593612671, -0.32103821635246277, -0.31016120314598083, -0.2992841601371765, -0.2884071469306946, -0.27753013372421265, -0.2666530907154083, -0.2557760775089264, -0.24489904940128326, -0.23402202129364014, -0.2231450080871582, -0.21226797997951508, -0.20139095187187195, -0.19051392376422882, -0.1796368956565857, -0.16875986754894257, -0.15788283944129944, -0.1470058113336563, -0.13612878322601318, -0.12525177001953125, -0.11437474191188812, -0.103497713804245, -0.09262069314718246, -0.08174366503953934, -0.07086663693189621, -0.05998961627483368, -0.04911258816719055, -0.03823556378483772, -0.027358539402484894, -0.016481511294841766, -0.005604490637779236, 0.005272537469863892, 0.01614956185221672, 0.0270265880972147, 0.03790361434221268, 0.048780638724565506, 0.059657663106918335, 0.07053469121456146, 0.08141171187162399, 0.09228873997926712, 0.10316576808691025, 0.11404278874397278, 0.1249198168516159, 0.13579684495925903, 0.14667385816574097, 0.1575509011745453, 0.16842791438102722, 0.17930494248867035, 0.19018197059631348, 0.2010589987039566, 0.21193602681159973, 0.22281304001808167, 0.2336900681257248, 0.24456709623336792, 0.25544410943984985, 0.2663211524486542, 0.2771981656551361, 0.28807520866394043, 0.29895222187042236, 0.3098292648792267, 0.3207062780857086, 0.33158332109451294, 0.3424603343009949, 0.3533373475074768]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 0.0, 6.0, 7.0, 4.0, 8.0, 9.0, 8.0, 10.0, 19.0, 16.0, 18.0, 29.0, 32.0, 26.0, 25.0, 33.0, 37.0, 32.0, 45.0, 49.0, 38.0, 32.0, 34.0, 46.0, 51.0, 46.0, 33.0, 34.0, 30.0, 38.0, 22.0, 28.0, 26.0, 17.0, 17.0, 15.0, 14.0, 12.0, 7.0, 9.0, 8.0, 6.0, 7.0, 4.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.23529881238937378, -0.2280694842338562, -0.22084017097949982, -0.21361084282398224, -0.20638152956962585, -0.19915220141410828, -0.1919228732585907, -0.18469354510307312, -0.17746423184871674, -0.17023490369319916, -0.16300559043884277, -0.1557762622833252, -0.14854693412780762, -0.14131762087345123, -0.13408829271793365, -0.12685897946357727, -0.11962965130805969, -0.11240033060312271, -0.10517100989818573, -0.09794168174266815, -0.09071236103773117, -0.08348304033279419, -0.07625371217727661, -0.06902439147233963, -0.06179507076740265, -0.05456575006246567, -0.04733642563223839, -0.04010710120201111, -0.03287778049707413, -0.025648459792137146, -0.018419135361909866, -0.011189810931682587, -0.0039604902267456055, 0.003268832340836525, 0.010498154908418655, 0.017727477476000786, 0.024956800043582916, 0.0321861207485199, 0.03941544517874718, 0.04664476960897446, 0.05387409031391144, 0.06110341101884842, 0.0683327317237854, 0.07556205987930298, 0.08279138058423996, 0.09002070128917694, 0.09725002944469452, 0.1044793501496315, 0.11170867085456848, 0.11893799155950546, 0.12616731226444244, 0.13339664041996002, 0.1406259536743164, 0.14785528182983398, 0.15508460998535156, 0.16231393814086914, 0.16954325139522552, 0.1767725795507431, 0.1840018928050995, 0.19123122096061707, 0.19846054911613464, 0.20568986237049103, 0.2129191905260086, 0.220148503780365, 0.22737783193588257]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 12.0, 15.0, 11.0, 19.0, 36.0, 42.0, 94.0, 166.0, 261.0, 601.0, 1179.0, 2419.0, 5292.0, 12211.0, 27793.0, 65738.0, 151572.0, 280425.0, 263886.0, 134965.0, 57762.0, 24468.0, 10551.0, 4708.0, 2138.0, 1060.0, 504.0, 264.0, 147.0, 73.0, 48.0, 33.0, 16.0, 11.0, 11.0, 10.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.17845535278320312, -0.17319488525390625, -0.16793441772460938, -0.1626739501953125, -0.15741348266601562, -0.15215301513671875, -0.14689254760742188, -0.141632080078125, -0.13637161254882812, -0.13111114501953125, -0.12585067749023438, -0.1205902099609375, -0.11532974243164062, -0.11006927490234375, -0.10480880737304688, -0.09954833984375, -0.09428787231445312, -0.08902740478515625, -0.08376693725585938, -0.0785064697265625, -0.07324600219726562, -0.06798553466796875, -0.06272506713867188, -0.057464599609375, -0.052204132080078125, -0.04694366455078125, -0.041683197021484375, -0.0364227294921875, -0.031162261962890625, -0.02590179443359375, -0.020641326904296875, -0.015380859375, -0.010120391845703125, -0.00485992431640625, 0.000400543212890625, 0.0056610107421875, 0.010921478271484375, 0.01618194580078125, 0.021442413330078125, 0.026702880859375, 0.031963348388671875, 0.03722381591796875, 0.042484283447265625, 0.0477447509765625, 0.053005218505859375, 0.05826568603515625, 0.06352615356445312, 0.06878662109375, 0.07404708862304688, 0.07930755615234375, 0.08456802368164062, 0.0898284912109375, 0.09508895874023438, 0.10034942626953125, 0.10560989379882812, 0.110870361328125, 0.11613082885742188, 0.12139129638671875, 0.12665176391601562, 0.1319122314453125, 0.13717269897460938, 0.14243316650390625, 0.14769363403320312, 0.1529541015625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 8.0, 7.0, 13.0, 11.0, 16.0, 13.0, 26.0, 28.0, 39.0, 41.0, 37.0, 46.0, 58.0, 59.0, 61.0, 59.0, 49.0, 63.0, 58.0, 62.0, 38.0, 30.0, 34.0, 28.0, 31.0, 16.0, 13.0, 16.0, 11.0, 7.0, 7.0, 7.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1104736328125, -0.10685920715332031, -0.10324478149414062, -0.09963035583496094, -0.09601593017578125, -0.09240150451660156, -0.08878707885742188, -0.08517265319824219, -0.0815582275390625, -0.07794380187988281, -0.07432937622070312, -0.07071495056152344, -0.06710052490234375, -0.06348609924316406, -0.059871673583984375, -0.05625724792480469, -0.052642822265625, -0.04902839660644531, -0.045413970947265625, -0.04179954528808594, -0.03818511962890625, -0.03457069396972656, -0.030956268310546875, -0.027341842651367188, -0.0237274169921875, -0.020112991333007812, -0.016498565673828125, -0.012884140014648438, -0.00926971435546875, -0.0056552886962890625, -0.002040863037109375, 0.0015735626220703125, 0.00518798828125, 0.008802413940429688, 0.012416839599609375, 0.016031265258789062, 0.01964569091796875, 0.023260116577148438, 0.026874542236328125, 0.030488967895507812, 0.0341033935546875, 0.03771781921386719, 0.041332244873046875, 0.04494667053222656, 0.04856109619140625, 0.05217552185058594, 0.055789947509765625, 0.05940437316894531, 0.063018798828125, 0.06663322448730469, 0.07024765014648438, 0.07386207580566406, 0.07747650146484375, 0.08109092712402344, 0.08470535278320312, 0.08831977844238281, 0.0919342041015625, 0.09554862976074219, 0.09916305541992188, 0.10277748107910156, 0.10639190673828125, 0.11000633239746094, 0.11362075805664062, 0.11723518371582031, 0.120849609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 5.0, 2.0, 3.0, 8.0, 9.0, 6.0, 18.0, 34.0, 41.0, 57.0, 68.0, 105.0, 117.0, 172.0, 260.0, 414.0, 653.0, 1087.0, 2431.0, 7831.0, 42756.0, 357773.0, 545822.0, 70867.0, 11497.0, 3079.0, 1350.0, 706.0, 442.0, 277.0, 190.0, 130.0, 83.0, 76.0, 54.0, 39.0, 31.0, 24.0, 15.0, 10.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.390380859375, -0.3789405822753906, -0.36750030517578125, -0.3560600280761719, -0.3446197509765625, -0.3331794738769531, -0.32173919677734375, -0.3102989196777344, -0.298858642578125, -0.2874183654785156, -0.27597808837890625, -0.2645378112792969, -0.2530975341796875, -0.24165725708007812, -0.23021697998046875, -0.21877670288085938, -0.20733642578125, -0.19589614868164062, -0.18445587158203125, -0.17301559448242188, -0.1615753173828125, -0.15013504028320312, -0.13869476318359375, -0.12725448608398438, -0.115814208984375, -0.10437393188476562, -0.09293365478515625, -0.08149337768554688, -0.0700531005859375, -0.058612823486328125, -0.04717254638671875, -0.035732269287109375, -0.0242919921875, -0.012851715087890625, -0.00141143798828125, 0.010028839111328125, 0.0214691162109375, 0.032909393310546875, 0.04434967041015625, 0.055789947509765625, 0.067230224609375, 0.07867050170898438, 0.09011077880859375, 0.10155105590820312, 0.1129913330078125, 0.12443161010742188, 0.13587188720703125, 0.14731216430664062, 0.15875244140625, 0.17019271850585938, 0.18163299560546875, 0.19307327270507812, 0.2045135498046875, 0.21595382690429688, 0.22739410400390625, 0.23883438110351562, 0.250274658203125, 0.2617149353027344, 0.27315521240234375, 0.2845954895019531, 0.2960357666015625, 0.3074760437011719, 0.31891632080078125, 0.3303565979003906, 0.341796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 1.0, 9.0, 8.0, 13.0, 17.0, 18.0, 15.0, 21.0, 18.0, 24.0, 21.0, 31.0, 31.0, 50.0, 40.0, 24.0, 41.0, 41.0, 44.0, 46.0, 49.0, 43.0, 41.0, 46.0, 42.0, 34.0, 24.0, 36.0, 34.0, 18.0, 14.0, 12.0, 14.0, 17.0, 15.0, 12.0, 8.0, 5.0, 8.0, 9.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.42236328125, -0.4081764221191406, -0.39398956298828125, -0.3798027038574219, -0.3656158447265625, -0.3514289855957031, -0.33724212646484375, -0.3230552673339844, -0.308868408203125, -0.2946815490722656, -0.28049468994140625, -0.2663078308105469, -0.2521209716796875, -0.23793411254882812, -0.22374725341796875, -0.20956039428710938, -0.19537353515625, -0.18118667602539062, -0.16699981689453125, -0.15281295776367188, -0.1386260986328125, -0.12443923950195312, -0.11025238037109375, -0.09606552124023438, -0.081878662109375, -0.06769180297851562, -0.05350494384765625, -0.039318084716796875, -0.0251312255859375, -0.010944366455078125, 0.00324249267578125, 0.017429351806640625, 0.0316162109375, 0.045803070068359375, 0.05998992919921875, 0.07417678833007812, 0.0883636474609375, 0.10255050659179688, 0.11673736572265625, 0.13092422485351562, 0.145111083984375, 0.15929794311523438, 0.17348480224609375, 0.18767166137695312, 0.2018585205078125, 0.21604537963867188, 0.23023223876953125, 0.24441909790039062, 0.25860595703125, 0.2727928161621094, 0.28697967529296875, 0.3011665344238281, 0.3153533935546875, 0.3295402526855469, 0.34372711181640625, 0.3579139709472656, 0.372100830078125, 0.3862876892089844, 0.40047454833984375, 0.4146614074707031, 0.4288482666015625, 0.4430351257324219, 0.45722198486328125, 0.4714088439941406, 0.485595703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 3.0, 4.0, 6.0, 1.0, 10.0, 14.0, 28.0, 34.0, 45.0, 69.0, 133.0, 219.0, 398.0, 865.0, 2224.0, 8808.0, 55843.0, 553876.0, 378830.0, 37300.0, 6407.0, 1865.0, 702.0, 342.0, 204.0, 117.0, 76.0, 40.0, 26.0, 22.0, 16.0, 11.0, 5.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1405029296875, -0.13408851623535156, -0.12767410278320312, -0.12125968933105469, -0.11484527587890625, -0.10843086242675781, -0.10201644897460938, -0.09560203552246094, -0.0891876220703125, -0.08277320861816406, -0.07635879516601562, -0.06994438171386719, -0.06352996826171875, -0.05711555480957031, -0.050701141357421875, -0.04428672790527344, -0.037872314453125, -0.03145790100097656, -0.025043487548828125, -0.018629074096679688, -0.01221466064453125, -0.0058002471923828125, 0.000614166259765625, 0.0070285797119140625, 0.0134429931640625, 0.019857406616210938, 0.026271820068359375, 0.03268623352050781, 0.03910064697265625, 0.04551506042480469, 0.051929473876953125, 0.05834388732910156, 0.06475830078125, 0.07117271423339844, 0.07758712768554688, 0.08400154113769531, 0.09041595458984375, 0.09683036804199219, 0.10324478149414062, 0.10965919494628906, 0.1160736083984375, 0.12248802185058594, 0.12890243530273438, 0.1353168487548828, 0.14173126220703125, 0.1481456756591797, 0.15456008911132812, 0.16097450256347656, 0.167388916015625, 0.17380332946777344, 0.18021774291992188, 0.1866321563720703, 0.19304656982421875, 0.1994609832763672, 0.20587539672851562, 0.21228981018066406, 0.2187042236328125, 0.22511863708496094, 0.23153305053710938, 0.2379474639892578, 0.24436187744140625, 0.2507762908935547, 0.2571907043457031, 0.26360511779785156, 0.27001953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 12.0, 9.0, 14.0, 21.0, 22.0, 36.0, 48.0, 51.0, 67.0, 74.0, 80.0, 74.0, 85.0, 83.0, 79.0, 81.0, 44.0, 40.0, 25.0, 20.0, 10.0, 5.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.178285598754883e-05, -3.941543400287628e-05, -3.7048012018203735e-05, -3.468059003353119e-05, -3.231316804885864e-05, -2.9945746064186096e-05, -2.757832407951355e-05, -2.5210902094841003e-05, -2.2843480110168457e-05, -2.047605812549591e-05, -1.8108636140823364e-05, -1.5741214156150818e-05, -1.3373792171478271e-05, -1.1006370186805725e-05, -8.638948202133179e-06, -6.271526217460632e-06, -3.904104232788086e-06, -1.5366822481155396e-06, 8.307397365570068e-07, 3.1981617212295532e-06, 5.5655837059021e-06, 7.933005690574646e-06, 1.0300427675247192e-05, 1.2667849659919739e-05, 1.5035271644592285e-05, 1.740269362926483e-05, 1.9770115613937378e-05, 2.2137537598609924e-05, 2.450495958328247e-05, 2.6872381567955017e-05, 2.9239803552627563e-05, 3.160722553730011e-05, 3.3974647521972656e-05, 3.63420695066452e-05, 3.870949149131775e-05, 4.1076913475990295e-05, 4.344433546066284e-05, 4.581175744533539e-05, 4.8179179430007935e-05, 5.054660141468048e-05, 5.291402339935303e-05, 5.5281445384025574e-05, 5.764886736869812e-05, 6.0016289353370667e-05, 6.238371133804321e-05, 6.475113332271576e-05, 6.71185553073883e-05, 6.948597729206085e-05, 7.18533992767334e-05, 7.422082126140594e-05, 7.658824324607849e-05, 7.895566523075104e-05, 8.132308721542358e-05, 8.369050920009613e-05, 8.605793118476868e-05, 8.842535316944122e-05, 9.079277515411377e-05, 9.316019713878632e-05, 9.552761912345886e-05, 9.789504110813141e-05, 0.00010026246309280396, 0.0001026298850774765, 0.00010499730706214905, 0.0001073647290468216, 0.00010973215103149414]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 7.0, 8.0, 11.0, 21.0, 47.0, 90.0, 181.0, 507.0, 1505.0, 7903.0, 212198.0, 797738.0, 24248.0, 2761.0, 756.0, 308.0, 131.0, 58.0, 29.0, 25.0, 18.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340087890625, -0.329193115234375, -0.31829833984375, -0.307403564453125, -0.2965087890625, -0.285614013671875, -0.27471923828125, -0.263824462890625, -0.2529296875, -0.242034912109375, -0.23114013671875, -0.220245361328125, -0.2093505859375, -0.198455810546875, -0.18756103515625, -0.176666259765625, -0.165771484375, -0.154876708984375, -0.14398193359375, -0.133087158203125, -0.1221923828125, -0.111297607421875, -0.10040283203125, -0.089508056640625, -0.07861328125, -0.067718505859375, -0.05682373046875, -0.045928955078125, -0.0350341796875, -0.024139404296875, -0.01324462890625, -0.002349853515625, 0.008544921875, 0.019439697265625, 0.03033447265625, 0.041229248046875, 0.0521240234375, 0.063018798828125, 0.07391357421875, 0.084808349609375, 0.095703125, 0.106597900390625, 0.11749267578125, 0.128387451171875, 0.1392822265625, 0.150177001953125, 0.16107177734375, 0.171966552734375, 0.182861328125, 0.193756103515625, 0.20465087890625, 0.215545654296875, 0.2264404296875, 0.237335205078125, 0.24822998046875, 0.259124755859375, 0.27001953125, 0.280914306640625, 0.29180908203125, 0.302703857421875, 0.3135986328125, 0.324493408203125, 0.33538818359375, 0.346282958984375, 0.357177734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 11.0, 19.0, 45.0, 77.0, 137.0, 159.0, 159.0, 136.0, 107.0, 68.0, 39.0, 15.0, 10.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13671875, -0.12723922729492188, -0.11775970458984375, -0.10828018188476562, -0.0988006591796875, -0.08932113647460938, -0.07984161376953125, -0.07036209106445312, -0.060882568359375, -0.051403045654296875, -0.04192352294921875, -0.032444000244140625, -0.0229644775390625, -0.013484954833984375, -0.00400543212890625, 0.005474090576171875, 0.01495361328125, 0.024433135986328125, 0.03391265869140625, 0.043392181396484375, 0.0528717041015625, 0.062351226806640625, 0.07183074951171875, 0.08131027221679688, 0.090789794921875, 0.10026931762695312, 0.10974884033203125, 0.11922836303710938, 0.1287078857421875, 0.13818740844726562, 0.14766693115234375, 0.15714645385742188, 0.1666259765625, 0.17610549926757812, 0.18558502197265625, 0.19506454467773438, 0.2045440673828125, 0.21402359008789062, 0.22350311279296875, 0.23298263549804688, 0.242462158203125, 0.2519416809082031, 0.26142120361328125, 0.2709007263183594, 0.2803802490234375, 0.2898597717285156, 0.29933929443359375, 0.3088188171386719, 0.31829833984375, 0.3277778625488281, 0.33725738525390625, 0.3467369079589844, 0.3562164306640625, 0.3656959533691406, 0.37517547607421875, 0.3846549987792969, 0.394134521484375, 0.4036140441894531, 0.41309356689453125, 0.4225730895996094, 0.4320526123046875, 0.4415321350097656, 0.45101165771484375, 0.4604911804199219, 0.469970703125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 9.0, 7.0, 15.0, 37.0, 43.0, 88.0, 100.0, 113.0, 118.0, 108.0, 109.0, 95.0, 50.0, 38.0, 26.0, 17.0, 5.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0187923908233643, -0.9427394866943359, -0.8666865825653076, -0.7906336784362793, -0.714580774307251, -0.6385278701782227, -0.5624749660491943, -0.486422061920166, -0.4103691577911377, -0.3343162536621094, -0.25826334953308105, -0.18221044540405273, -0.10615754127502441, -0.030104637145996094, 0.04594826698303223, 0.12200117111206055, 0.19805407524108887, 0.2741069793701172, 0.3501598834991455, 0.42621278762817383, 0.5022656917572021, 0.5783185958862305, 0.6543715000152588, 0.7304244041442871, 0.8064773082733154, 0.8825302124023438, 0.9585831165313721, 1.0346360206604004, 1.1106889247894287, 1.186741828918457, 1.2627947330474854, 1.3388476371765137, 1.414900779724121, 1.4909536838531494, 1.5670065879821777, 1.643059492111206, 1.7191123962402344, 1.7951653003692627, 1.871218204498291, 1.9472711086273193, 2.0233240127563477, 2.099376916885376, 2.1754298210144043, 2.2514827251434326, 2.327535629272461, 2.4035885334014893, 2.4796414375305176, 2.555694341659546, 2.631747245788574, 2.7078001499176025, 2.783853054046631, 2.859905958175659, 2.9359588623046875, 3.012011766433716, 3.088064670562744, 3.1641175746917725, 3.240170478820801, 3.316223382949829, 3.3922762870788574, 3.4683291912078857, 3.544382095336914, 3.6204349994659424, 3.6964879035949707, 3.772540807723999, 3.8485937118530273]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 4.0, 3.0, 8.0, 4.0, 11.0, 8.0, 11.0, 13.0, 13.0, 19.0, 24.0, 34.0, 35.0, 36.0, 48.0, 46.0, 44.0, 37.0, 54.0, 50.0, 57.0, 46.0, 38.0, 48.0, 43.0, 46.0, 40.0, 31.0, 23.0, 28.0, 30.0, 12.0, 9.0, 15.0, 11.0, 5.0, 6.0, 4.0, 1.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2285633087158203, -2.160181760787964, -2.0918002128601074, -2.023418664932251, -1.955036997795105, -1.8866554498672485, -1.818273901939392, -1.7498923540115356, -1.6815106868743896, -1.6131291389465332, -1.5447475910186768, -1.4763660430908203, -1.4079843759536743, -1.3396028280258179, -1.2712212800979614, -1.202839732170105, -1.1344581842422485, -1.066076636314392, -0.9976950287818909, -0.9293134808540344, -0.8609318733215332, -0.7925503253936768, -0.7241687774658203, -0.6557872295379639, -0.5874056220054626, -0.5190240740776062, -0.450642466545105, -0.38226091861724854, -0.3138793408870697, -0.24549776315689087, -0.17711621522903442, -0.10873463749885559, -0.04035305976867676, 0.02802851051092148, 0.09641008079051971, 0.16479164361953735, 0.2331732213497162, 0.301554799079895, 0.36993634700775146, 0.4383179247379303, 0.5066995024681091, 0.5750810503959656, 0.6434626579284668, 0.7118442058563232, 0.7802257537841797, 0.8486073613166809, 0.9169889092445374, 0.9853705167770386, 1.053752064704895, 1.1221336126327515, 1.190515160560608, 1.258896827697754, 1.3272783756256104, 1.3956599235534668, 1.4640414714813232, 1.5324230194091797, 1.6008045673370361, 1.6691861152648926, 1.737567663192749, 1.8059492111206055, 1.8743308782577515, 1.942712426185608, 2.011094093322754, 2.0794756412506104, 2.147857189178467]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 20.0, 14.0, 21.0, 41.0, 41.0, 70.0, 107.0, 203.0, 282.0, 569.0, 922.0, 1769.0, 3784.0, 8388.0, 25997.0, 3717734.0, 394931.0, 23998.0, 7989.0, 3476.0, 1715.0, 905.0, 516.0, 328.0, 144.0, 126.0, 52.0, 48.0, 26.0, 19.0, 10.0, 12.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328857421875, -0.3175048828125, -0.30615234375, -0.2947998046875, -0.283447265625, -0.2720947265625, -0.2607421875, -0.2493896484375, -0.238037109375, -0.2266845703125, -0.21533203125, -0.2039794921875, -0.192626953125, -0.1812744140625, -0.169921875, -0.1585693359375, -0.147216796875, -0.1358642578125, -0.12451171875, -0.1131591796875, -0.101806640625, -0.0904541015625, -0.0791015625, -0.0677490234375, -0.056396484375, -0.0450439453125, -0.03369140625, -0.0223388671875, -0.010986328125, 0.0003662109375, 0.01171875, 0.0230712890625, 0.034423828125, 0.0457763671875, 0.05712890625, 0.0684814453125, 0.079833984375, 0.0911865234375, 0.1025390625, 0.1138916015625, 0.125244140625, 0.1365966796875, 0.14794921875, 0.1593017578125, 0.170654296875, 0.1820068359375, 0.193359375, 0.2047119140625, 0.216064453125, 0.2274169921875, 0.23876953125, 0.2501220703125, 0.261474609375, 0.2728271484375, 0.2841796875, 0.2955322265625, 0.306884765625, 0.3182373046875, 0.32958984375, 0.3409423828125, 0.352294921875, 0.3636474609375, 0.375, 0.3863525390625, 0.397705078125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 5.0, 10.0, 16.0, 10.0, 18.0, 25.0, 24.0, 31.0, 40.0, 47.0, 46.0, 55.0, 49.0, 54.0, 56.0, 68.0, 55.0, 55.0, 44.0, 54.0, 49.0, 23.0, 29.0, 25.0, 22.0, 17.0, 12.0, 10.0, 9.0, 15.0, 7.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1337890625, -0.1301727294921875, -0.126556396484375, -0.1229400634765625, -0.11932373046875, -0.1157073974609375, -0.112091064453125, -0.1084747314453125, -0.1048583984375, -0.1012420654296875, -0.097625732421875, -0.0940093994140625, -0.09039306640625, -0.0867767333984375, -0.083160400390625, -0.0795440673828125, -0.075927734375, -0.0723114013671875, -0.068695068359375, -0.0650787353515625, -0.06146240234375, -0.0578460693359375, -0.054229736328125, -0.0506134033203125, -0.0469970703125, -0.0433807373046875, -0.039764404296875, -0.0361480712890625, -0.03253173828125, -0.0289154052734375, -0.025299072265625, -0.0216827392578125, -0.01806640625, -0.0144500732421875, -0.010833740234375, -0.0072174072265625, -0.00360107421875, 1.52587890625e-05, 0.003631591796875, 0.0072479248046875, 0.0108642578125, 0.0144805908203125, 0.018096923828125, 0.0217132568359375, 0.02532958984375, 0.0289459228515625, 0.032562255859375, 0.0361785888671875, 0.039794921875, 0.0434112548828125, 0.047027587890625, 0.0506439208984375, 0.05426025390625, 0.0578765869140625, 0.061492919921875, 0.0651092529296875, 0.0687255859375, 0.0723419189453125, 0.075958251953125, 0.0795745849609375, 0.08319091796875, 0.0868072509765625, 0.090423583984375, 0.0940399169921875, 0.09765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 4.0, 4.0, 9.0, 5.0, 16.0, 20.0, 21.0, 25.0, 43.0, 58.0, 90.0, 120.0, 163.0, 226.0, 405.0, 844.0, 1590.0, 3962.0, 15873.0, 327568.0, 3814307.0, 20378.0, 4606.0, 1740.0, 848.0, 454.0, 295.0, 157.0, 124.0, 73.0, 56.0, 39.0, 31.0, 20.0, 19.0, 18.0, 12.0, 14.0, 10.0, 7.0, 8.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6671829223632812, -0.6463775634765625, -0.6255722045898438, -0.604766845703125, -0.5839614868164062, -0.5631561279296875, -0.5423507690429688, -0.52154541015625, -0.5007400512695312, -0.4799346923828125, -0.45912933349609375, -0.438323974609375, -0.41751861572265625, -0.3967132568359375, -0.37590789794921875, -0.3551025390625, -0.33429718017578125, -0.3134918212890625, -0.29268646240234375, -0.271881103515625, -0.25107574462890625, -0.2302703857421875, -0.20946502685546875, -0.18865966796875, -0.16785430908203125, -0.1470489501953125, -0.12624359130859375, -0.105438232421875, -0.08463287353515625, -0.0638275146484375, -0.04302215576171875, -0.022216796875, -0.00141143798828125, 0.0193939208984375, 0.04019927978515625, 0.061004638671875, 0.08180999755859375, 0.1026153564453125, 0.12342071533203125, 0.14422607421875, 0.16503143310546875, 0.1858367919921875, 0.20664215087890625, 0.227447509765625, 0.24825286865234375, 0.2690582275390625, 0.28986358642578125, 0.3106689453125, 0.33147430419921875, 0.3522796630859375, 0.37308502197265625, 0.393890380859375, 0.41469573974609375, 0.4355010986328125, 0.45630645751953125, 0.47711181640625, 0.49791717529296875, 0.5187225341796875, 0.5395278930664062, 0.560333251953125, 0.5811386108398438, 0.6019439697265625, 0.6227493286132812, 0.6435546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 5.0, 10.0, 22.0, 48.0, 143.0, 3571.0, 164.0, 61.0, 22.0, 12.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177001953125, -0.170806884765625, -0.16461181640625, -0.158416748046875, -0.1522216796875, -0.146026611328125, -0.13983154296875, -0.133636474609375, -0.12744140625, -0.121246337890625, -0.11505126953125, -0.108856201171875, -0.1026611328125, -0.096466064453125, -0.09027099609375, -0.084075927734375, -0.077880859375, -0.071685791015625, -0.06549072265625, -0.059295654296875, -0.0531005859375, -0.046905517578125, -0.04071044921875, -0.034515380859375, -0.0283203125, -0.022125244140625, -0.01593017578125, -0.009735107421875, -0.0035400390625, 0.002655029296875, 0.00885009765625, 0.015045166015625, 0.021240234375, 0.027435302734375, 0.03363037109375, 0.039825439453125, 0.0460205078125, 0.052215576171875, 0.05841064453125, 0.064605712890625, 0.07080078125, 0.076995849609375, 0.08319091796875, 0.089385986328125, 0.0955810546875, 0.101776123046875, 0.10797119140625, 0.114166259765625, 0.120361328125, 0.126556396484375, 0.13275146484375, 0.138946533203125, 0.1451416015625, 0.151336669921875, 0.15753173828125, 0.163726806640625, 0.169921875, 0.176116943359375, 0.18231201171875, 0.188507080078125, 0.1947021484375, 0.200897216796875, 0.20709228515625, 0.213287353515625, 0.219482421875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 10.0, 8.0, 6.0, 16.0, 23.0, 38.0, 40.0, 53.0, 53.0, 70.0, 84.0, 105.0, 94.0, 84.0, 75.0, 58.0, 52.0, 40.0, 22.0, 23.0, 9.0, 12.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3961038589477539, -0.38502028584480286, -0.3739367127418518, -0.36285313963890076, -0.3517695665359497, -0.34068599343299866, -0.3296024203300476, -0.31851884722709656, -0.3074352741241455, -0.29635170102119446, -0.2852681279182434, -0.27418455481529236, -0.2631009817123413, -0.25201740860939026, -0.2409338355064392, -0.22985026240348816, -0.2187667042016983, -0.20768313109874725, -0.1965995579957962, -0.18551598489284515, -0.1744324117898941, -0.16334883868694305, -0.1522652804851532, -0.14118170738220215, -0.1300981342792511, -0.11901456117630005, -0.107930988073349, -0.09684741497039795, -0.0857638418674469, -0.07468026876449585, -0.0635967031121254, -0.05251313000917435, -0.0414295494556427, -0.03034597635269165, -0.01926240511238575, -0.00817883387207985, 0.0029047392308712006, 0.01398831233382225, 0.025071881711483, 0.03615545481443405, 0.0472390279173851, 0.05832260102033615, 0.0694061741232872, 0.08048973977565765, 0.0915733128786087, 0.10265688598155975, 0.1137404590845108, 0.12482403218746185, 0.1359076052904129, 0.14699117839336395, 0.158074751496315, 0.16915832459926605, 0.1802418977022171, 0.19132547080516815, 0.202409029006958, 0.21349260210990906, 0.2245761752128601, 0.23565974831581116, 0.2467433214187622, 0.25782689452171326, 0.2689104676246643, 0.27999404072761536, 0.2910776138305664, 0.30216118693351746, 0.3132447600364685]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 10.0, 7.0, 7.0, 7.0, 8.0, 8.0, 18.0, 21.0, 18.0, 18.0, 19.0, 25.0, 31.0, 22.0, 29.0, 38.0, 38.0, 31.0, 48.0, 42.0, 34.0, 30.0, 34.0, 36.0, 37.0, 39.0, 40.0, 38.0, 32.0, 23.0, 23.0, 24.0, 25.0, 19.0, 19.0, 13.0, 11.0, 11.0, 9.0, 9.0, 7.0, 6.0, 7.0, 3.0, 0.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.24584299325942993, -0.23785537481307983, -0.22986775636672974, -0.22188012301921844, -0.21389250457286835, -0.20590488612651825, -0.19791725277900696, -0.18992963433265686, -0.18194201588630676, -0.17395439743995667, -0.16596677899360657, -0.15797914564609528, -0.14999152719974518, -0.14200390875339508, -0.1340162754058838, -0.1260286569595337, -0.1180410385131836, -0.1100534200668335, -0.1020657941699028, -0.0940781682729721, -0.08609054982662201, -0.07810293138027191, -0.07011530548334122, -0.06212768331170082, -0.054140061140060425, -0.04615243896842003, -0.03816481679677963, -0.030177194625139236, -0.02218957245349884, -0.014201950281858444, -0.006214328110218048, 0.001773294061422348, 0.009760916233062744, 0.01774853840470314, 0.025736160576343536, 0.03372378274798393, 0.04171140491962433, 0.049699027091264725, 0.05768664926290512, 0.06567427515983582, 0.07366189360618591, 0.08164951205253601, 0.0896371379494667, 0.0976247638463974, 0.1056123822927475, 0.1136000007390976, 0.12158762663602829, 0.12957525253295898, 0.13756287097930908, 0.14555048942565918, 0.15353810787200928, 0.16152574121952057, 0.16951335966587067, 0.17750097811222076, 0.18548861145973206, 0.19347622990608215, 0.20146384835243225, 0.20945146679878235, 0.21743908524513245, 0.22542671859264374, 0.23341433703899384, 0.24140195548534393, 0.24938958883285522, 0.2573772072792053, 0.2653648257255554]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 8.0, 11.0, 16.0, 32.0, 34.0, 49.0, 66.0, 126.0, 246.0, 420.0, 655.0, 1251.0, 2580.0, 5164.0, 10967.0, 25008.0, 58428.0, 136417.0, 283623.0, 282887.0, 135859.0, 58057.0, 24921.0, 11057.0, 5068.0, 2546.0, 1316.0, 710.0, 396.0, 232.0, 128.0, 83.0, 61.0, 44.0, 25.0, 10.0, 13.0, 9.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.151123046875, -0.14624786376953125, -0.1413726806640625, -0.13649749755859375, -0.131622314453125, -0.12674713134765625, -0.1218719482421875, -0.11699676513671875, -0.11212158203125, -0.10724639892578125, -0.1023712158203125, -0.09749603271484375, -0.092620849609375, -0.08774566650390625, -0.0828704833984375, -0.07799530029296875, -0.0731201171875, -0.06824493408203125, -0.0633697509765625, -0.05849456787109375, -0.053619384765625, -0.04874420166015625, -0.0438690185546875, -0.03899383544921875, -0.03411865234375, -0.02924346923828125, -0.0243682861328125, -0.01949310302734375, -0.014617919921875, -0.00974273681640625, -0.0048675537109375, 7.62939453125e-06, 0.0048828125, 0.00975799560546875, 0.0146331787109375, 0.01950836181640625, 0.024383544921875, 0.02925872802734375, 0.0341339111328125, 0.03900909423828125, 0.04388427734375, 0.04875946044921875, 0.0536346435546875, 0.05850982666015625, 0.063385009765625, 0.06826019287109375, 0.0731353759765625, 0.07801055908203125, 0.0828857421875, 0.08776092529296875, 0.0926361083984375, 0.09751129150390625, 0.102386474609375, 0.10726165771484375, 0.1121368408203125, 0.11701202392578125, 0.12188720703125, 0.12676239013671875, 0.1316375732421875, 0.13651275634765625, 0.141387939453125, 0.14626312255859375, 0.1511383056640625, 0.15601348876953125, 0.160888671875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 9.0, 3.0, 6.0, 7.0, 11.0, 8.0, 13.0, 11.0, 18.0, 25.0, 23.0, 41.0, 51.0, 40.0, 45.0, 47.0, 46.0, 59.0, 57.0, 53.0, 45.0, 54.0, 48.0, 47.0, 34.0, 34.0, 26.0, 24.0, 21.0, 23.0, 12.0, 10.0, 11.0, 10.0, 8.0, 4.0, 2.0, 6.0, 6.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1190185546875, -0.11527347564697266, -0.11152839660644531, -0.10778331756591797, -0.10403823852539062, -0.10029315948486328, -0.09654808044433594, -0.0928030014038086, -0.08905792236328125, -0.0853128433227539, -0.08156776428222656, -0.07782268524169922, -0.07407760620117188, -0.07033252716064453, -0.06658744812011719, -0.06284236907958984, -0.0590972900390625, -0.055352210998535156, -0.05160713195800781, -0.04786205291748047, -0.044116973876953125, -0.04037189483642578, -0.03662681579589844, -0.032881736755371094, -0.02913665771484375, -0.025391578674316406, -0.021646499633789062, -0.01790142059326172, -0.014156341552734375, -0.010411262512207031, -0.0066661834716796875, -0.0029211044311523438, 0.000823974609375, 0.004569053649902344, 0.008314132690429688, 0.012059211730957031, 0.015804290771484375, 0.01954936981201172, 0.023294448852539062, 0.027039527893066406, 0.03078460693359375, 0.034529685974121094, 0.03827476501464844, 0.04201984405517578, 0.045764923095703125, 0.04951000213623047, 0.05325508117675781, 0.057000160217285156, 0.0607452392578125, 0.06449031829833984, 0.06823539733886719, 0.07198047637939453, 0.07572555541992188, 0.07947063446044922, 0.08321571350097656, 0.0869607925415039, 0.09070587158203125, 0.0944509506225586, 0.09819602966308594, 0.10194110870361328, 0.10568618774414062, 0.10943126678466797, 0.11317634582519531, 0.11692142486572266, 0.12066650390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 10.0, 12.0, 8.0, 22.0, 24.0, 40.0, 52.0, 89.0, 127.0, 193.0, 280.0, 489.0, 834.0, 1564.0, 4500.0, 29300.0, 452135.0, 517109.0, 32897.0, 4940.0, 1664.0, 878.0, 469.0, 288.0, 216.0, 132.0, 90.0, 50.0, 43.0, 31.0, 25.0, 10.0, 13.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.351318359375, -0.33831787109375, -0.3253173828125, -0.31231689453125, -0.29931640625, -0.28631591796875, -0.2733154296875, -0.26031494140625, -0.247314453125, -0.23431396484375, -0.2213134765625, -0.20831298828125, -0.1953125, -0.18231201171875, -0.1693115234375, -0.15631103515625, -0.143310546875, -0.13031005859375, -0.1173095703125, -0.10430908203125, -0.09130859375, -0.07830810546875, -0.0653076171875, -0.05230712890625, -0.039306640625, -0.02630615234375, -0.0133056640625, -0.00030517578125, 0.0126953125, 0.02569580078125, 0.0386962890625, 0.05169677734375, 0.064697265625, 0.07769775390625, 0.0906982421875, 0.10369873046875, 0.11669921875, 0.12969970703125, 0.1427001953125, 0.15570068359375, 0.168701171875, 0.18170166015625, 0.1947021484375, 0.20770263671875, 0.220703125, 0.23370361328125, 0.2467041015625, 0.25970458984375, 0.272705078125, 0.28570556640625, 0.2987060546875, 0.31170654296875, 0.32470703125, 0.33770751953125, 0.3507080078125, 0.36370849609375, 0.376708984375, 0.38970947265625, 0.4027099609375, 0.41571044921875, 0.4287109375, 0.44171142578125, 0.4547119140625, 0.46771240234375, 0.480712890625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 12.0, 5.0, 10.0, 16.0, 13.0, 18.0, 18.0, 26.0, 32.0, 40.0, 41.0, 41.0, 54.0, 47.0, 44.0, 49.0, 41.0, 47.0, 39.0, 37.0, 44.0, 44.0, 34.0, 34.0, 31.0, 28.0, 22.0, 28.0, 17.0, 8.0, 10.0, 13.0, 8.0, 5.0, 5.0, 4.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55078125, -0.5348014831542969, -0.5188217163085938, -0.5028419494628906, -0.4868621826171875, -0.4708824157714844, -0.45490264892578125, -0.4389228820800781, -0.422943115234375, -0.4069633483886719, -0.39098358154296875, -0.3750038146972656, -0.3590240478515625, -0.3430442810058594, -0.32706451416015625, -0.3110847473144531, -0.29510498046875, -0.2791252136230469, -0.26314544677734375, -0.24716567993164062, -0.2311859130859375, -0.21520614624023438, -0.19922637939453125, -0.18324661254882812, -0.167266845703125, -0.15128707885742188, -0.13530731201171875, -0.11932754516601562, -0.1033477783203125, -0.08736801147460938, -0.07138824462890625, -0.055408477783203125, -0.0394287109375, -0.023448944091796875, -0.00746917724609375, 0.008510589599609375, 0.0244903564453125, 0.040470123291015625, 0.05644989013671875, 0.07242965698242188, 0.088409423828125, 0.10438919067382812, 0.12036895751953125, 0.13634872436523438, 0.1523284912109375, 0.16830825805664062, 0.18428802490234375, 0.20026779174804688, 0.21624755859375, 0.23222732543945312, 0.24820709228515625, 0.2641868591308594, 0.2801666259765625, 0.2961463928222656, 0.31212615966796875, 0.3281059265136719, 0.344085693359375, 0.3600654602050781, 0.37604522705078125, 0.3920249938964844, 0.4080047607421875, 0.4239845275878906, 0.43996429443359375, 0.4559440612792969, 0.471923828125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 12.0, 8.0, 18.0, 18.0, 44.0, 70.0, 120.0, 256.0, 686.0, 2312.0, 17229.0, 547814.0, 461142.0, 15492.0, 2179.0, 630.0, 260.0, 100.0, 68.0, 36.0, 15.0, 8.0, 11.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.2543373107910156, -0.24524688720703125, -0.23615646362304688, -0.2270660400390625, -0.21797561645507812, -0.20888519287109375, -0.19979476928710938, -0.190704345703125, -0.18161392211914062, -0.17252349853515625, -0.16343307495117188, -0.1543426513671875, -0.14525222778320312, -0.13616180419921875, -0.12707138061523438, -0.11798095703125, -0.10889053344726562, -0.09980010986328125, -0.09070968627929688, -0.0816192626953125, -0.07252883911132812, -0.06343841552734375, -0.054347991943359375, -0.045257568359375, -0.036167144775390625, -0.02707672119140625, -0.017986297607421875, -0.0088958740234375, 0.000194549560546875, 0.00928497314453125, 0.018375396728515625, 0.0274658203125, 0.036556243896484375, 0.04564666748046875, 0.054737091064453125, 0.0638275146484375, 0.07291793823242188, 0.08200836181640625, 0.09109878540039062, 0.100189208984375, 0.10927963256835938, 0.11837005615234375, 0.12746047973632812, 0.1365509033203125, 0.14564132690429688, 0.15473175048828125, 0.16382217407226562, 0.17291259765625, 0.18200302124023438, 0.19109344482421875, 0.20018386840820312, 0.2092742919921875, 0.21836471557617188, 0.22745513916015625, 0.23654556274414062, 0.245635986328125, 0.2547264099121094, 0.26381683349609375, 0.2729072570800781, 0.2819976806640625, 0.2910881042480469, 0.30017852783203125, 0.3092689514160156, 0.318359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 4.0, 13.0, 8.0, 14.0, 11.0, 18.0, 23.0, 29.0, 40.0, 54.0, 58.0, 78.0, 74.0, 73.0, 66.0, 75.0, 54.0, 54.0, 40.0, 35.0, 19.0, 22.0, 18.0, 18.0, 12.0, 16.0, 7.0, 10.0, 8.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.756450653076172e-05, -4.602503031492233e-05, -4.448555409908295e-05, -4.294607788324356e-05, -4.1406601667404175e-05, -3.986712545156479e-05, -3.83276492357254e-05, -3.678817301988602e-05, -3.524869680404663e-05, -3.3709220588207245e-05, -3.216974437236786e-05, -3.063026815652847e-05, -2.9090791940689087e-05, -2.75513157248497e-05, -2.6011839509010315e-05, -2.447236329317093e-05, -2.2932887077331543e-05, -2.1393410861492157e-05, -1.985393464565277e-05, -1.8314458429813385e-05, -1.6774982213974e-05, -1.5235505998134613e-05, -1.3696029782295227e-05, -1.2156553566455841e-05, -1.0617077350616455e-05, -9.077601134777069e-06, -7.538124918937683e-06, -5.998648703098297e-06, -4.459172487258911e-06, -2.919696271419525e-06, -1.3802200555801392e-06, 1.5925616025924683e-07, 1.6987323760986328e-06, 3.238208591938019e-06, 4.777684807777405e-06, 6.317161023616791e-06, 7.856637239456177e-06, 9.396113455295563e-06, 1.0935589671134949e-05, 1.2475065886974335e-05, 1.401454210281372e-05, 1.5554018318653107e-05, 1.7093494534492493e-05, 1.863297075033188e-05, 2.0172446966171265e-05, 2.171192318201065e-05, 2.3251399397850037e-05, 2.4790875613689423e-05, 2.633035182952881e-05, 2.7869828045368195e-05, 2.940930426120758e-05, 3.0948780477046967e-05, 3.248825669288635e-05, 3.402773290872574e-05, 3.5567209124565125e-05, 3.710668534040451e-05, 3.8646161556243896e-05, 4.018563777208328e-05, 4.172511398792267e-05, 4.3264590203762054e-05, 4.480406641960144e-05, 4.6343542635440826e-05, 4.788301885128021e-05, 4.94224950671196e-05, 5.0961971282958984e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 8.0, 12.0, 13.0, 16.0, 35.0, 40.0, 61.0, 110.0, 185.0, 313.0, 573.0, 1127.0, 2843.0, 9704.0, 59346.0, 563640.0, 360983.0, 37655.0, 7338.0, 2372.0, 1013.0, 466.0, 266.0, 151.0, 83.0, 64.0, 35.0, 39.0, 20.0, 9.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1944580078125, -0.18888473510742188, -0.18331146240234375, -0.17773818969726562, -0.1721649169921875, -0.16659164428710938, -0.16101837158203125, -0.15544509887695312, -0.149871826171875, -0.14429855346679688, -0.13872528076171875, -0.13315200805664062, -0.1275787353515625, -0.12200546264648438, -0.11643218994140625, -0.11085891723632812, -0.10528564453125, -0.09971237182617188, -0.09413909912109375, -0.08856582641601562, -0.0829925537109375, -0.07741928100585938, -0.07184600830078125, -0.06627273559570312, -0.060699462890625, -0.055126190185546875, -0.04955291748046875, -0.043979644775390625, -0.0384063720703125, -0.032833099365234375, -0.02725982666015625, -0.021686553955078125, -0.01611328125, -0.010540008544921875, -0.00496673583984375, 0.000606536865234375, 0.0061798095703125, 0.011753082275390625, 0.01732635498046875, 0.022899627685546875, 0.028472900390625, 0.034046173095703125, 0.03961944580078125, 0.045192718505859375, 0.0507659912109375, 0.056339263916015625, 0.06191253662109375, 0.06748580932617188, 0.07305908203125, 0.07863235473632812, 0.08420562744140625, 0.08977890014648438, 0.0953521728515625, 0.10092544555664062, 0.10649871826171875, 0.11207199096679688, 0.117645263671875, 0.12321853637695312, 0.12879180908203125, 0.13436508178710938, 0.1399383544921875, 0.14551162719726562, 0.15108489990234375, 0.15665817260742188, 0.1622314453125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 8.0, 14.0, 20.0, 24.0, 30.0, 26.0, 64.0, 70.0, 109.0, 103.0, 106.0, 102.0, 82.0, 85.0, 60.0, 25.0, 26.0, 16.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228759765625, -0.22261810302734375, -0.2164764404296875, -0.21033477783203125, -0.204193115234375, -0.19805145263671875, -0.1919097900390625, -0.18576812744140625, -0.17962646484375, -0.17348480224609375, -0.1673431396484375, -0.16120147705078125, -0.155059814453125, -0.14891815185546875, -0.1427764892578125, -0.13663482666015625, -0.1304931640625, -0.12435150146484375, -0.1182098388671875, -0.11206817626953125, -0.105926513671875, -0.09978485107421875, -0.0936431884765625, -0.08750152587890625, -0.08135986328125, -0.07521820068359375, -0.0690765380859375, -0.06293487548828125, -0.056793212890625, -0.05065155029296875, -0.0445098876953125, -0.03836822509765625, -0.0322265625, -0.02608489990234375, -0.0199432373046875, -0.01380157470703125, -0.007659912109375, -0.00151824951171875, 0.0046234130859375, 0.01076507568359375, 0.01690673828125, 0.02304840087890625, 0.0291900634765625, 0.03533172607421875, 0.041473388671875, 0.04761505126953125, 0.0537567138671875, 0.05989837646484375, 0.0660400390625, 0.07218170166015625, 0.0783233642578125, 0.08446502685546875, 0.090606689453125, 0.09674835205078125, 0.1028900146484375, 0.10903167724609375, 0.11517333984375, 0.12131500244140625, 0.1274566650390625, 0.13359832763671875, 0.139739990234375, 0.14588165283203125, 0.1520233154296875, 0.15816497802734375, 0.164306640625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 6.0, 17.0, 46.0, 74.0, 151.0, 186.0, 173.0, 141.0, 103.0, 42.0, 35.0, 18.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1499881744384766, -2.0461342334747314, -1.9422802925109863, -1.8384263515472412, -1.7345725297927856, -1.6307185888290405, -1.5268646478652954, -1.4230108261108398, -1.3191568851470947, -1.2153029441833496, -1.1114490032196045, -1.0075950622558594, -0.9037412405014038, -0.7998872995376587, -0.6960333585739136, -0.5921794772148132, -0.48832547664642334, -0.3844715654850006, -0.2806176543235779, -0.17676371335983276, -0.07290980219841003, 0.030944108963012695, 0.1347980499267578, 0.23865193128585815, 0.34250587224960327, 0.446359783411026, 0.5502136945724487, 0.6540676355361938, 0.757921576499939, 0.8617754578590393, 0.9656293988227844, 1.0694832801818848, 1.1733372211456299, 1.277191162109375, 1.3810451030731201, 1.4848990440368652, 1.5887528657913208, 1.692606806755066, 1.796460747718811, 1.9003145694732666, 2.0041685104370117, 2.108022451400757, 2.211876392364502, 2.315730333328247, 2.419584274291992, 2.523437976837158, 2.6272921562194824, 2.7311458587646484, 2.8350000381469727, 2.9388539791107178, 3.042707920074463, 3.146561861038208, 3.250415802001953, 3.354269504547119, 3.4581236839294434, 3.5619773864746094, 3.6658313274383545, 3.7696852684020996, 3.8735392093658447, 3.97739315032959, 4.081246852874756, 4.18510103225708, 4.288954734802246, 4.39280891418457, 4.496662616729736]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 4.0, 10.0, 11.0, 21.0, 20.0, 30.0, 40.0, 42.0, 56.0, 60.0, 66.0, 55.0, 73.0, 81.0, 76.0, 64.0, 60.0, 49.0, 32.0, 30.0, 27.0, 18.0, 19.0, 10.0, 14.0, 11.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.448465585708618, -3.346440315246582, -3.244414806365967, -3.1423892974853516, -3.0403640270233154, -2.9383387565612793, -2.836313247680664, -2.734287738800049, -2.6322624683380127, -2.5302371978759766, -2.4282116889953613, -2.326186180114746, -2.22416090965271, -2.122135639190674, -2.0201101303100586, -1.918084740638733, -1.8160593509674072, -1.7140339612960815, -1.6120085716247559, -1.5099831819534302, -1.4079577922821045, -1.3059324026107788, -1.2039070129394531, -1.1018816232681274, -0.9998562335968018, -0.8978308439254761, -0.7958054542541504, -0.6937800645828247, -0.591754674911499, -0.48972928524017334, -0.38770389556884766, -0.285678505897522, -0.1836533546447754, -0.08162796497344971, 0.020397424697875977, 0.12242281436920166, 0.22444820404052734, 0.326473593711853, 0.4284989833831787, 0.5305243730545044, 0.6325497627258301, 0.7345751523971558, 0.8366005420684814, 0.9386259317398071, 1.0406513214111328, 1.1426767110824585, 1.2447021007537842, 1.3467274904251099, 1.4487528800964355, 1.5507782697677612, 1.652803659439087, 1.7548290491104126, 1.8568544387817383, 1.958879828453064, 2.0609052181243896, 2.162930488586426, 2.264955997467041, 2.3669815063476562, 2.4690067768096924, 2.5710320472717285, 2.6730575561523438, 2.775083065032959, 2.877108335494995, 2.9791336059570312, 3.0811591148376465]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 0.0, 5.0, 6.0, 5.0, 8.0, 20.0, 22.0, 27.0, 44.0, 63.0, 88.0, 146.0, 169.0, 271.0, 404.0, 585.0, 989.0, 1573.0, 2886.0, 5665.0, 14227.0, 48686.0, 1776052.0, 2266472.0, 48711.0, 14034.0, 5807.0, 2877.0, 1589.0, 961.0, 598.0, 415.0, 268.0, 187.0, 128.0, 96.0, 61.0, 43.0, 31.0, 25.0, 10.0, 7.0, 14.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.30615234375, -0.2974052429199219, -0.28865814208984375, -0.2799110412597656, -0.2711639404296875, -0.2624168395996094, -0.25366973876953125, -0.24492263793945312, -0.236175537109375, -0.22742843627929688, -0.21868133544921875, -0.20993423461914062, -0.2011871337890625, -0.19244003295898438, -0.18369293212890625, -0.17494583129882812, -0.16619873046875, -0.15745162963867188, -0.14870452880859375, -0.13995742797851562, -0.1312103271484375, -0.12246322631835938, -0.11371612548828125, -0.10496902465820312, -0.096221923828125, -0.08747482299804688, -0.07872772216796875, -0.06998062133789062, -0.0612335205078125, -0.052486419677734375, -0.04373931884765625, -0.034992218017578125, -0.0262451171875, -0.017498016357421875, -0.00875091552734375, -3.814697265625e-06, 0.0087432861328125, 0.017490386962890625, 0.02623748779296875, 0.034984588623046875, 0.043731689453125, 0.052478790283203125, 0.06122589111328125, 0.06997299194335938, 0.0787200927734375, 0.08746719360351562, 0.09621429443359375, 0.10496139526367188, 0.11370849609375, 0.12245559692382812, 0.13120269775390625, 0.13994979858398438, 0.1486968994140625, 0.15744400024414062, 0.16619110107421875, 0.17493820190429688, 0.183685302734375, 0.19243240356445312, 0.20117950439453125, 0.20992660522460938, 0.2186737060546875, 0.22742080688476562, 0.23616790771484375, 0.24491500854492188, 0.253662109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 4.0, 5.0, 6.0, 11.0, 11.0, 13.0, 26.0, 34.0, 36.0, 35.0, 52.0, 51.0, 67.0, 65.0, 56.0, 68.0, 67.0, 47.0, 59.0, 47.0, 40.0, 44.0, 29.0, 27.0, 24.0, 13.0, 11.0, 14.0, 12.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1328125, -0.12845802307128906, -0.12410354614257812, -0.11974906921386719, -0.11539459228515625, -0.11104011535644531, -0.10668563842773438, -0.10233116149902344, -0.0979766845703125, -0.09362220764160156, -0.08926773071289062, -0.08491325378417969, -0.08055877685546875, -0.07620429992675781, -0.07184982299804688, -0.06749534606933594, -0.063140869140625, -0.05878639221191406, -0.054431915283203125, -0.05007743835449219, -0.04572296142578125, -0.04136848449707031, -0.037014007568359375, -0.03265953063964844, -0.0283050537109375, -0.023950576782226562, -0.019596099853515625, -0.015241622924804688, -0.01088714599609375, -0.0065326690673828125, -0.002178192138671875, 0.0021762847900390625, 0.00653076171875, 0.010885238647460938, 0.015239715576171875, 0.019594192504882812, 0.02394866943359375, 0.028303146362304688, 0.032657623291015625, 0.03701210021972656, 0.0413665771484375, 0.04572105407714844, 0.050075531005859375, 0.05443000793457031, 0.05878448486328125, 0.06313896179199219, 0.06749343872070312, 0.07184791564941406, 0.076202392578125, 0.08055686950683594, 0.08491134643554688, 0.08926582336425781, 0.09362030029296875, 0.09797477722167969, 0.10232925415039062, 0.10668373107910156, 0.1110382080078125, 0.11539268493652344, 0.11974716186523438, 0.12410163879394531, 0.12845611572265625, 0.1328105926513672, 0.13716506958007812, 0.14151954650878906, 0.1458740234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 6.0, 9.0, 8.0, 26.0, 26.0, 20.0, 34.0, 31.0, 59.0, 67.0, 98.0, 157.0, 375.0, 712.0, 1883.0, 7053.0, 55074.0, 4000047.0, 113681.0, 10464.0, 2468.0, 870.0, 423.0, 204.0, 121.0, 86.0, 68.0, 39.0, 31.0, 20.0, 19.0, 16.0, 14.0, 13.0, 10.0, 8.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6396484375, -0.6206207275390625, -0.601593017578125, -0.5825653076171875, -0.56353759765625, -0.5445098876953125, -0.525482177734375, -0.5064544677734375, -0.4874267578125, -0.4683990478515625, -0.449371337890625, -0.4303436279296875, -0.41131591796875, -0.3922882080078125, -0.373260498046875, -0.3542327880859375, -0.335205078125, -0.3161773681640625, -0.297149658203125, -0.2781219482421875, -0.25909423828125, -0.2400665283203125, -0.221038818359375, -0.2020111083984375, -0.1829833984375, -0.1639556884765625, -0.144927978515625, -0.1259002685546875, -0.10687255859375, -0.0878448486328125, -0.068817138671875, -0.0497894287109375, -0.03076171875, -0.0117340087890625, 0.007293701171875, 0.0263214111328125, 0.04534912109375, 0.0643768310546875, 0.083404541015625, 0.1024322509765625, 0.1214599609375, 0.1404876708984375, 0.159515380859375, 0.1785430908203125, 0.19757080078125, 0.2165985107421875, 0.235626220703125, 0.2546539306640625, 0.273681640625, 0.2927093505859375, 0.311737060546875, 0.3307647705078125, 0.34979248046875, 0.3688201904296875, 0.387847900390625, 0.4068756103515625, 0.4259033203125, 0.4449310302734375, 0.463958740234375, 0.4829864501953125, 0.50201416015625, 0.5210418701171875, 0.540069580078125, 0.5590972900390625, 0.578125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 10.0, 10.0, 27.0, 60.0, 110.0, 561.0, 2984.0, 200.0, 55.0, 29.0, 11.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2200927734375, -0.21060752868652344, -0.20112228393554688, -0.1916370391845703, -0.18215179443359375, -0.1726665496826172, -0.16318130493164062, -0.15369606018066406, -0.1442108154296875, -0.13472557067871094, -0.12524032592773438, -0.11575508117675781, -0.10626983642578125, -0.09678459167480469, -0.08729934692382812, -0.07781410217285156, -0.068328857421875, -0.05884361267089844, -0.049358367919921875, -0.03987312316894531, -0.03038787841796875, -0.020902633666992188, -0.011417388916015625, -0.0019321441650390625, 0.0075531005859375, 0.017038345336914062, 0.026523590087890625, 0.03600883483886719, 0.04549407958984375, 0.05497932434082031, 0.06446456909179688, 0.07394981384277344, 0.08343505859375, 0.09292030334472656, 0.10240554809570312, 0.11189079284667969, 0.12137603759765625, 0.1308612823486328, 0.14034652709960938, 0.14983177185058594, 0.1593170166015625, 0.16880226135253906, 0.17828750610351562, 0.1877727508544922, 0.19725799560546875, 0.2067432403564453, 0.21622848510742188, 0.22571372985839844, 0.235198974609375, 0.24468421936035156, 0.2541694641113281, 0.2636547088623047, 0.27313995361328125, 0.2826251983642578, 0.2921104431152344, 0.30159568786621094, 0.3110809326171875, 0.32056617736816406, 0.3300514221191406, 0.3395366668701172, 0.34902191162109375, 0.3585071563720703, 0.3679924011230469, 0.37747764587402344, 0.386962890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 10.0, 28.0, 36.0, 69.0, 89.0, 100.0, 130.0, 129.0, 105.0, 96.0, 55.0, 40.0, 31.0, 17.0, 20.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6400371789932251, -0.6159711480140686, -0.5919051170349121, -0.5678390264511108, -0.5437729954719543, -0.5197069644927979, -0.49564090371131897, -0.4715748429298401, -0.4475088119506836, -0.4234427809715271, -0.3993767201900482, -0.37531065940856934, -0.35124462842941284, -0.32717859745025635, -0.30311253666877747, -0.2790464758872986, -0.2549804449081421, -0.2309143990278244, -0.2068483531475067, -0.18278230726718903, -0.15871626138687134, -0.13465021550655365, -0.11058416962623596, -0.08651812374591827, -0.062452077865600586, -0.0383860319852829, -0.01431998610496521, 0.009746059775352478, 0.033812105655670166, 0.057878151535987854, 0.08194419741630554, 0.10601024329662323, 0.13007628917694092, 0.1541423350572586, 0.1782083809375763, 0.20227442681789398, 0.22634047269821167, 0.25040650367736816, 0.27447256445884705, 0.2985386252403259, 0.3226046562194824, 0.3466706871986389, 0.3707367479801178, 0.3948028087615967, 0.4188688397407532, 0.44293487071990967, 0.46700093150138855, 0.49106699228286743, 0.5151330232620239, 0.5391990542411804, 0.5632650852203369, 0.5873311758041382, 0.6113972067832947, 0.6354632377624512, 0.6595293283462524, 0.6835953593254089, 0.7076613903045654, 0.7317274212837219, 0.7557934522628784, 0.7798595428466797, 0.8039255738258362, 0.8279916048049927, 0.852057695388794, 0.8761237263679504, 0.9001897573471069]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 12.0, 11.0, 12.0, 9.0, 12.0, 17.0, 27.0, 27.0, 34.0, 35.0, 39.0, 34.0, 37.0, 40.0, 53.0, 42.0, 57.0, 43.0, 56.0, 47.0, 40.0, 31.0, 39.0, 29.0, 22.0, 29.0, 19.0, 25.0, 21.0, 19.0, 16.0, 15.0, 14.0, 14.0, 3.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.48975038528442383, -0.47480884194374084, -0.45986732840538025, -0.44492578506469727, -0.42998427152633667, -0.4150427281856537, -0.4001011848449707, -0.3851596713066101, -0.3702181279659271, -0.35527658462524414, -0.34033507108688354, -0.32539352774620056, -0.3104519844055176, -0.295510470867157, -0.280568927526474, -0.265627384185791, -0.2506858706474304, -0.23574434220790863, -0.22080281376838684, -0.20586127042770386, -0.19091974198818207, -0.17597821354866028, -0.1610366702079773, -0.1460951417684555, -0.13115361332893372, -0.11621208488941193, -0.10127054899930954, -0.08632901310920715, -0.07138748466968536, -0.056445956230163574, -0.04150442034006119, -0.0265628844499588, -0.011621356010437012, 0.0033201761543750763, 0.018261708319187164, 0.03320324048399925, 0.04814477264881134, 0.06308630108833313, 0.07802783697843552, 0.0929693728685379, 0.10791090130805969, 0.12285242974758148, 0.13779395818710327, 0.15273550152778625, 0.16767702996730804, 0.18261855840682983, 0.19756010174751282, 0.2125016301870346, 0.2274431586265564, 0.24238468706607819, 0.2573262155056, 0.27226775884628296, 0.28720927238464355, 0.30215081572532654, 0.3170923590660095, 0.3320338726043701, 0.3469754159450531, 0.3619169592857361, 0.3768584728240967, 0.39180001616477966, 0.40674155950546265, 0.42168307304382324, 0.4366246163845062, 0.4515661597251892, 0.4665076732635498]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 11.0, 16.0, 16.0, 46.0, 59.0, 76.0, 138.0, 213.0, 431.0, 812.0, 1488.0, 2973.0, 6415.0, 14439.0, 32453.0, 77755.0, 191703.0, 382725.0, 196866.0, 79546.0, 33131.0, 14297.0, 6536.0, 3111.0, 1528.0, 736.0, 409.0, 233.0, 144.0, 94.0, 43.0, 39.0, 25.0, 12.0, 4.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2498779296875, -0.24263763427734375, -0.2353973388671875, -0.22815704345703125, -0.220916748046875, -0.21367645263671875, -0.2064361572265625, -0.19919586181640625, -0.19195556640625, -0.18471527099609375, -0.1774749755859375, -0.17023468017578125, -0.162994384765625, -0.15575408935546875, -0.1485137939453125, -0.14127349853515625, -0.134033203125, -0.12679290771484375, -0.1195526123046875, -0.11231231689453125, -0.105072021484375, -0.09783172607421875, -0.0905914306640625, -0.08335113525390625, -0.07611083984375, -0.06887054443359375, -0.0616302490234375, -0.05438995361328125, -0.047149658203125, -0.03990936279296875, -0.0326690673828125, -0.02542877197265625, -0.0181884765625, -0.01094818115234375, -0.0037078857421875, 0.00353240966796875, 0.010772705078125, 0.01801300048828125, 0.0252532958984375, 0.03249359130859375, 0.03973388671875, 0.04697418212890625, 0.0542144775390625, 0.06145477294921875, 0.068695068359375, 0.07593536376953125, 0.0831756591796875, 0.09041595458984375, 0.09765625, 0.10489654541015625, 0.1121368408203125, 0.11937713623046875, 0.126617431640625, 0.13385772705078125, 0.1410980224609375, 0.14833831787109375, 0.15557861328125, 0.16281890869140625, 0.1700592041015625, 0.17729949951171875, 0.184539794921875, 0.19178009033203125, 0.1990203857421875, 0.20626068115234375, 0.2135009765625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 5.0, 10.0, 16.0, 13.0, 20.0, 17.0, 25.0, 44.0, 32.0, 40.0, 43.0, 46.0, 51.0, 44.0, 47.0, 49.0, 50.0, 65.0, 49.0, 50.0, 38.0, 41.0, 30.0, 24.0, 19.0, 22.0, 23.0, 10.0, 18.0, 9.0, 7.0, 4.0, 11.0, 8.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125244140625, -0.12140560150146484, -0.11756706237792969, -0.11372852325439453, -0.10988998413085938, -0.10605144500732422, -0.10221290588378906, -0.0983743667602539, -0.09453582763671875, -0.0906972885131836, -0.08685874938964844, -0.08302021026611328, -0.07918167114257812, -0.07534313201904297, -0.07150459289550781, -0.06766605377197266, -0.0638275146484375, -0.059988975524902344, -0.05615043640136719, -0.05231189727783203, -0.048473358154296875, -0.04463481903076172, -0.04079627990722656, -0.036957740783691406, -0.03311920166015625, -0.029280662536621094, -0.025442123413085938, -0.02160358428955078, -0.017765045166015625, -0.013926506042480469, -0.010087966918945312, -0.006249427795410156, -0.002410888671875, 0.0014276504516601562, 0.0052661895751953125, 0.009104728698730469, 0.012943267822265625, 0.01678180694580078, 0.020620346069335938, 0.024458885192871094, 0.02829742431640625, 0.032135963439941406, 0.03597450256347656, 0.03981304168701172, 0.043651580810546875, 0.04749011993408203, 0.05132865905761719, 0.055167198181152344, 0.0590057373046875, 0.06284427642822266, 0.06668281555175781, 0.07052135467529297, 0.07435989379882812, 0.07819843292236328, 0.08203697204589844, 0.0858755111694336, 0.08971405029296875, 0.0935525894165039, 0.09739112854003906, 0.10122966766357422, 0.10506820678710938, 0.10890674591064453, 0.11274528503417969, 0.11658382415771484, 0.12042236328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 7.0, 6.0, 14.0, 13.0, 26.0, 36.0, 43.0, 58.0, 79.0, 112.0, 214.0, 260.0, 417.0, 720.0, 1187.0, 2491.0, 6404.0, 27639.0, 208071.0, 673426.0, 102061.0, 16147.0, 4453.0, 1900.0, 1007.0, 584.0, 366.0, 263.0, 161.0, 100.0, 74.0, 67.0, 40.0, 31.0, 19.0, 12.0, 16.0, 9.0, 7.0, 6.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353271484375, -0.3408050537109375, -0.328338623046875, -0.3158721923828125, -0.30340576171875, -0.2909393310546875, -0.278472900390625, -0.2660064697265625, -0.2535400390625, -0.2410736083984375, -0.228607177734375, -0.2161407470703125, -0.20367431640625, -0.1912078857421875, -0.178741455078125, -0.1662750244140625, -0.15380859375, -0.1413421630859375, -0.128875732421875, -0.1164093017578125, -0.10394287109375, -0.0914764404296875, -0.079010009765625, -0.0665435791015625, -0.0540771484375, -0.0416107177734375, -0.029144287109375, -0.0166778564453125, -0.00421142578125, 0.0082550048828125, 0.020721435546875, 0.0331878662109375, 0.045654296875, 0.0581207275390625, 0.070587158203125, 0.0830535888671875, 0.09552001953125, 0.1079864501953125, 0.120452880859375, 0.1329193115234375, 0.1453857421875, 0.1578521728515625, 0.170318603515625, 0.1827850341796875, 0.19525146484375, 0.2077178955078125, 0.220184326171875, 0.2326507568359375, 0.2451171875, 0.2575836181640625, 0.270050048828125, 0.2825164794921875, 0.29498291015625, 0.3074493408203125, 0.319915771484375, 0.3323822021484375, 0.3448486328125, 0.3573150634765625, 0.369781494140625, 0.3822479248046875, 0.39471435546875, 0.4071807861328125, 0.419647216796875, 0.4321136474609375, 0.444580078125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 5.0, 6.0, 8.0, 8.0, 11.0, 13.0, 19.0, 22.0, 29.0, 31.0, 25.0, 34.0, 32.0, 32.0, 39.0, 51.0, 52.0, 42.0, 50.0, 39.0, 45.0, 39.0, 35.0, 43.0, 28.0, 30.0, 29.0, 42.0, 35.0, 22.0, 18.0, 14.0, 16.0, 8.0, 9.0, 8.0, 8.0, 9.0, 5.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.50732421875, -0.4927558898925781, -0.47818756103515625, -0.4636192321777344, -0.4490509033203125, -0.4344825744628906, -0.41991424560546875, -0.4053459167480469, -0.390777587890625, -0.3762092590332031, -0.36164093017578125, -0.3470726013183594, -0.3325042724609375, -0.3179359436035156, -0.30336761474609375, -0.2887992858886719, -0.27423095703125, -0.2596626281738281, -0.24509429931640625, -0.23052597045898438, -0.2159576416015625, -0.20138931274414062, -0.18682098388671875, -0.17225265502929688, -0.157684326171875, -0.14311599731445312, -0.12854766845703125, -0.11397933959960938, -0.0994110107421875, -0.08484268188476562, -0.07027435302734375, -0.055706024169921875, -0.0411376953125, -0.026569366455078125, -0.01200103759765625, 0.002567291259765625, 0.0171356201171875, 0.031703948974609375, 0.04627227783203125, 0.060840606689453125, 0.075408935546875, 0.08997726440429688, 0.10454559326171875, 0.11911392211914062, 0.1336822509765625, 0.14825057983398438, 0.16281890869140625, 0.17738723754882812, 0.19195556640625, 0.20652389526367188, 0.22109222412109375, 0.23566055297851562, 0.2502288818359375, 0.2647972106933594, 0.27936553955078125, 0.2939338684082031, 0.308502197265625, 0.3230705261230469, 0.33763885498046875, 0.3522071838378906, 0.3667755126953125, 0.3813438415527344, 0.39591217041015625, 0.4104804992675781, 0.425048828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 14.0, 10.0, 20.0, 27.0, 47.0, 59.0, 88.0, 130.0, 203.0, 332.0, 547.0, 1050.0, 2058.0, 4922.0, 13190.0, 43790.0, 167780.0, 533523.0, 202642.0, 52160.0, 15156.0, 5646.0, 2285.0, 1136.0, 651.0, 359.0, 231.0, 161.0, 99.0, 70.0, 44.0, 28.0, 26.0, 15.0, 14.0, 10.0, 4.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09375, -0.0904684066772461, -0.08718681335449219, -0.08390522003173828, -0.08062362670898438, -0.07734203338623047, -0.07406044006347656, -0.07077884674072266, -0.06749725341796875, -0.06421566009521484, -0.06093406677246094, -0.05765247344970703, -0.054370880126953125, -0.05108928680419922, -0.04780769348144531, -0.044526100158691406, -0.0412445068359375, -0.037962913513183594, -0.03468132019042969, -0.03139972686767578, -0.028118133544921875, -0.02483654022216797, -0.021554946899414062, -0.018273353576660156, -0.01499176025390625, -0.011710166931152344, -0.008428573608398438, -0.005146980285644531, -0.001865386962890625, 0.0014162063598632812, 0.0046977996826171875, 0.007979393005371094, 0.011260986328125, 0.014542579650878906, 0.017824172973632812, 0.02110576629638672, 0.024387359619140625, 0.02766895294189453, 0.030950546264648438, 0.034232139587402344, 0.03751373291015625, 0.040795326232910156, 0.04407691955566406, 0.04735851287841797, 0.050640106201171875, 0.05392169952392578, 0.05720329284667969, 0.060484886169433594, 0.0637664794921875, 0.0670480728149414, 0.07032966613769531, 0.07361125946044922, 0.07689285278320312, 0.08017444610595703, 0.08345603942871094, 0.08673763275146484, 0.09001922607421875, 0.09330081939697266, 0.09658241271972656, 0.09986400604248047, 0.10314559936523438, 0.10642719268798828, 0.10970878601074219, 0.1129903793334961, 0.11627197265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 14.0, 4.0, 7.0, 18.0, 16.0, 18.0, 15.0, 12.0, 20.0, 25.0, 43.0, 59.0, 62.0, 74.0, 81.0, 101.0, 61.0, 52.0, 49.0, 47.0, 38.0, 25.0, 26.0, 28.0, 26.0, 19.0, 14.0, 9.0, 10.0, 4.0, 4.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.7756900787353516e-05, -5.601998418569565e-05, -5.428306758403778e-05, -5.254615098237991e-05, -5.0809234380722046e-05, -4.907231777906418e-05, -4.733540117740631e-05, -4.5598484575748444e-05, -4.3861567974090576e-05, -4.212465137243271e-05, -4.038773477077484e-05, -3.8650818169116974e-05, -3.6913901567459106e-05, -3.517698496580124e-05, -3.344006836414337e-05, -3.1703151762485504e-05, -2.9966235160827637e-05, -2.822931855916977e-05, -2.6492401957511902e-05, -2.4755485355854034e-05, -2.3018568754196167e-05, -2.12816521525383e-05, -1.9544735550880432e-05, -1.7807818949222565e-05, -1.6070902347564697e-05, -1.433398574590683e-05, -1.2597069144248962e-05, -1.0860152542591095e-05, -9.123235940933228e-06, -7.38631933927536e-06, -5.649402737617493e-06, -3.912486135959625e-06, -2.175569534301758e-06, -4.386529326438904e-07, 1.298263669013977e-06, 3.0351802706718445e-06, 4.772096872329712e-06, 6.509013473987579e-06, 8.245930075645447e-06, 9.982846677303314e-06, 1.1719763278961182e-05, 1.3456679880619049e-05, 1.5193596482276917e-05, 1.6930513083934784e-05, 1.866742968559265e-05, 2.040434628725052e-05, 2.2141262888908386e-05, 2.3878179490566254e-05, 2.561509609222412e-05, 2.735201269388199e-05, 2.9088929295539856e-05, 3.0825845897197723e-05, 3.256276249885559e-05, 3.429967910051346e-05, 3.6036595702171326e-05, 3.777351230382919e-05, 3.951042890548706e-05, 4.124734550714493e-05, 4.2984262108802795e-05, 4.472117871046066e-05, 4.645809531211853e-05, 4.81950119137764e-05, 4.9931928515434265e-05, 5.166884511709213e-05, 5.340576171875e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 9.0, 7.0, 18.0, 24.0, 45.0, 66.0, 155.0, 240.0, 472.0, 1153.0, 3454.0, 16878.0, 192524.0, 744443.0, 75962.0, 9189.0, 2176.0, 861.0, 415.0, 195.0, 108.0, 65.0, 29.0, 20.0, 13.0, 8.0, 4.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1632080078125, -0.15723609924316406, -0.15126419067382812, -0.1452922821044922, -0.13932037353515625, -0.1333484649658203, -0.12737655639648438, -0.12140464782714844, -0.1154327392578125, -0.10946083068847656, -0.10348892211914062, -0.09751701354980469, -0.09154510498046875, -0.08557319641113281, -0.07960128784179688, -0.07362937927246094, -0.067657470703125, -0.06168556213378906, -0.055713653564453125, -0.04974174499511719, -0.04376983642578125, -0.03779792785644531, -0.031826019287109375, -0.025854110717773438, -0.0198822021484375, -0.013910293579101562, -0.007938385009765625, -0.0019664764404296875, 0.00400543212890625, 0.009977340698242188, 0.015949249267578125, 0.021921157836914062, 0.02789306640625, 0.03386497497558594, 0.039836883544921875, 0.04580879211425781, 0.05178070068359375, 0.05775260925292969, 0.06372451782226562, 0.06969642639160156, 0.0756683349609375, 0.08164024353027344, 0.08761215209960938, 0.09358406066894531, 0.09955596923828125, 0.10552787780761719, 0.11149978637695312, 0.11747169494628906, 0.123443603515625, 0.12941551208496094, 0.13538742065429688, 0.1413593292236328, 0.14733123779296875, 0.1533031463623047, 0.15927505493164062, 0.16524696350097656, 0.1712188720703125, 0.17719078063964844, 0.18316268920898438, 0.1891345977783203, 0.19510650634765625, 0.2010784149169922, 0.20705032348632812, 0.21302223205566406, 0.218994140625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 11.0, 6.0, 12.0, 19.0, 19.0, 25.0, 31.0, 35.0, 42.0, 56.0, 69.0, 80.0, 77.0, 76.0, 80.0, 68.0, 60.0, 44.0, 42.0, 47.0, 22.0, 15.0, 18.0, 15.0, 9.0, 6.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.184814453125, -0.18032455444335938, -0.17583465576171875, -0.17134475708007812, -0.1668548583984375, -0.16236495971679688, -0.15787506103515625, -0.15338516235351562, -0.148895263671875, -0.14440536499023438, -0.13991546630859375, -0.13542556762695312, -0.1309356689453125, -0.12644577026367188, -0.12195587158203125, -0.11746597290039062, -0.11297607421875, -0.10848617553710938, -0.10399627685546875, -0.09950637817382812, -0.0950164794921875, -0.09052658081054688, -0.08603668212890625, -0.08154678344726562, -0.077056884765625, -0.07256698608398438, -0.06807708740234375, -0.06358718872070312, -0.0590972900390625, -0.054607391357421875, -0.05011749267578125, -0.045627593994140625, -0.0411376953125, -0.036647796630859375, -0.03215789794921875, -0.027667999267578125, -0.0231781005859375, -0.018688201904296875, -0.01419830322265625, -0.009708404541015625, -0.005218505859375, -0.000728607177734375, 0.00376129150390625, 0.008251190185546875, 0.0127410888671875, 0.017230987548828125, 0.02172088623046875, 0.026210784912109375, 0.03070068359375, 0.035190582275390625, 0.03968048095703125, 0.044170379638671875, 0.0486602783203125, 0.053150177001953125, 0.05764007568359375, 0.062129974365234375, 0.066619873046875, 0.07110977172851562, 0.07559967041015625, 0.08008956909179688, 0.0845794677734375, 0.08906936645507812, 0.09355926513671875, 0.09804916381835938, 0.1025390625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 10.0, 19.0, 34.0, 49.0, 74.0, 93.0, 98.0, 140.0, 125.0, 110.0, 88.0, 56.0, 34.0, 17.0, 22.0, 8.0, 4.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.698230504989624, -2.6213791370391846, -2.544527769088745, -2.4676764011383057, -2.390825033187866, -2.3139736652374268, -2.2371222972869873, -2.160270929336548, -2.0834195613861084, -2.006568193435669, -1.9297168254852295, -1.85286545753479, -1.7760140895843506, -1.6991627216339111, -1.6223113536834717, -1.5454599857330322, -1.4686086177825928, -1.3917572498321533, -1.3149058818817139, -1.2380545139312744, -1.161203145980835, -1.0843517780303955, -1.007500410079956, -0.9306490421295166, -0.8537976741790771, -0.7769463062286377, -0.7000949382781982, -0.6232435703277588, -0.5463922023773193, -0.4695408344268799, -0.39268946647644043, -0.315838098526001, -0.23898696899414062, -0.16213560104370117, -0.08528423309326172, -0.008432865142822266, 0.06841850280761719, 0.14526987075805664, 0.2221212387084961, 0.29897260665893555, 0.375823974609375, 0.45267534255981445, 0.5295267105102539, 0.6063780784606934, 0.6832294464111328, 0.7600808143615723, 0.8369321823120117, 0.9137835502624512, 0.9906349182128906, 1.06748628616333, 1.1443376541137695, 1.221189022064209, 1.2980403900146484, 1.374891757965088, 1.4517431259155273, 1.5285944938659668, 1.6054458618164062, 1.6822972297668457, 1.7591485977172852, 1.8359999656677246, 1.912851333618164, 1.9897027015686035, 2.066554069519043, 2.1434054374694824, 2.220256805419922]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 6.0, 6.0, 7.0, 12.0, 10.0, 15.0, 19.0, 30.0, 34.0, 38.0, 36.0, 42.0, 47.0, 47.0, 52.0, 66.0, 57.0, 67.0, 69.0, 45.0, 46.0, 55.0, 34.0, 22.0, 28.0, 25.0, 11.0, 17.0, 13.0, 8.0, 9.0, 3.0, 3.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.6690609455108643, -2.5888559818267822, -2.5086510181427, -2.428445816040039, -2.348240852355957, -2.268035888671875, -2.187830924987793, -2.107625961303711, -2.027420997619629, -1.9472160339355469, -1.8670109510421753, -1.7868059873580933, -1.7066009044647217, -1.6263959407806396, -1.5461909770965576, -1.4659860134124756, -1.3857808113098145, -1.3055758476257324, -1.2253707647323608, -1.1451658010482788, -1.0649607181549072, -0.9847557544708252, -0.9045507907867432, -0.8243457674980164, -0.7441407442092896, -0.6639357209205627, -0.5837306976318359, -0.5035257339477539, -0.4233207106590271, -0.3431156873703003, -0.2629106938838959, -0.18270570039749146, -0.10250043869018555, -0.022295430302619934, 0.05790957808494568, 0.1381145864725113, 0.2183195948600769, 0.2985246181488037, 0.37872961163520813, 0.45893460512161255, 0.5391396284103394, 0.6193446516990662, 0.699549674987793, 0.779754638671875, 0.8599596619606018, 0.9401646852493286, 1.0203696489334106, 1.1005747318267822, 1.1807796955108643, 1.2609846591949463, 1.3411897420883179, 1.4213947057724, 1.5015997886657715, 1.5818047523498535, 1.6620097160339355, 1.7422146797180176, 1.8224197626113892, 1.9026247262954712, 1.9828298091888428, 2.063034772872925, 2.143239736557007, 2.223444938659668, 2.30364990234375, 2.383854866027832, 2.464059829711914]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 10.0, 11.0, 25.0, 20.0, 38.0, 39.0, 60.0, 81.0, 143.0, 244.0, 381.0, 731.0, 1245.0, 2344.0, 4602.0, 9979.0, 23620.0, 67940.0, 306300.0, 2507142.0, 1056663.0, 142270.0, 40254.0, 15700.0, 6850.0, 3292.0, 1770.0, 973.0, 587.0, 338.0, 184.0, 129.0, 85.0, 62.0, 40.0, 30.0, 29.0, 14.0, 10.0, 9.0, 8.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1614990234375, -0.15588760375976562, -0.15027618408203125, -0.14466476440429688, -0.1390533447265625, -0.13344192504882812, -0.12783050537109375, -0.12221908569335938, -0.116607666015625, -0.11099624633789062, -0.10538482666015625, -0.09977340698242188, -0.0941619873046875, -0.08855056762695312, -0.08293914794921875, -0.07732772827148438, -0.07171630859375, -0.06610488891601562, -0.06049346923828125, -0.054882049560546875, -0.0492706298828125, -0.043659210205078125, -0.03804779052734375, -0.032436370849609375, -0.026824951171875, -0.021213531494140625, -0.01560211181640625, -0.009990692138671875, -0.0043792724609375, 0.001232147216796875, 0.00684356689453125, 0.012454986572265625, 0.01806640625, 0.023677825927734375, 0.02928924560546875, 0.034900665283203125, 0.0405120849609375, 0.046123504638671875, 0.05173492431640625, 0.057346343994140625, 0.062957763671875, 0.06856918334960938, 0.07418060302734375, 0.07979202270507812, 0.0854034423828125, 0.09101486206054688, 0.09662628173828125, 0.10223770141601562, 0.10784912109375, 0.11346054077148438, 0.11907196044921875, 0.12468338012695312, 0.1302947998046875, 0.13590621948242188, 0.14151763916015625, 0.14712905883789062, 0.152740478515625, 0.15835189819335938, 0.16396331787109375, 0.16957473754882812, 0.1751861572265625, 0.18079757690429688, 0.18640899658203125, 0.19202041625976562, 0.1976318359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 8.0, 5.0, 12.0, 16.0, 12.0, 22.0, 33.0, 17.0, 29.0, 34.0, 26.0, 41.0, 47.0, 42.0, 46.0, 53.0, 52.0, 51.0, 50.0, 51.0, 45.0, 43.0, 39.0, 35.0, 25.0, 27.0, 26.0, 18.0, 18.0, 15.0, 16.0, 10.0, 6.0, 7.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0947265625, -0.09137535095214844, -0.08802413940429688, -0.08467292785644531, -0.08132171630859375, -0.07797050476074219, -0.07461929321289062, -0.07126808166503906, -0.0679168701171875, -0.06456565856933594, -0.061214447021484375, -0.05786323547363281, -0.05451202392578125, -0.05116081237792969, -0.047809600830078125, -0.04445838928222656, -0.041107177734375, -0.03775596618652344, -0.034404754638671875, -0.031053543090820312, -0.02770233154296875, -0.024351119995117188, -0.020999908447265625, -0.017648696899414062, -0.0142974853515625, -0.010946273803710938, -0.007595062255859375, -0.0042438507080078125, -0.00089263916015625, 0.0024585723876953125, 0.005809783935546875, 0.009160995483398438, 0.01251220703125, 0.015863418579101562, 0.019214630126953125, 0.022565841674804688, 0.02591705322265625, 0.029268264770507812, 0.032619476318359375, 0.03597068786621094, 0.0393218994140625, 0.04267311096191406, 0.046024322509765625, 0.04937553405761719, 0.05272674560546875, 0.05607795715332031, 0.059429168701171875, 0.06278038024902344, 0.066131591796875, 0.06948280334472656, 0.07283401489257812, 0.07618522644042969, 0.07953643798828125, 0.08288764953613281, 0.08623886108398438, 0.08959007263183594, 0.0929412841796875, 0.09629249572753906, 0.09964370727539062, 0.10299491882324219, 0.10634613037109375, 0.10969734191894531, 0.11304855346679688, 0.11639976501464844, 0.1197509765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 4.0, 6.0, 8.0, 6.0, 14.0, 25.0, 25.0, 37.0, 58.0, 90.0, 141.0, 232.0, 393.0, 695.0, 1366.0, 2880.0, 6638.0, 19475.0, 70948.0, 494011.0, 3190663.0, 325366.0, 54830.0, 15745.0, 5575.0, 2349.0, 1167.0, 604.0, 320.0, 200.0, 124.0, 84.0, 63.0, 37.0, 26.0, 19.0, 23.0, 6.0, 6.0, 8.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2332763671875, -0.22476768493652344, -0.21625900268554688, -0.2077503204345703, -0.19924163818359375, -0.1907329559326172, -0.18222427368164062, -0.17371559143066406, -0.1652069091796875, -0.15669822692871094, -0.14818954467773438, -0.1396808624267578, -0.13117218017578125, -0.12266349792480469, -0.11415481567382812, -0.10564613342285156, -0.097137451171875, -0.08862876892089844, -0.08012008666992188, -0.07161140441894531, -0.06310272216796875, -0.05459403991699219, -0.046085357666015625, -0.03757667541503906, -0.0290679931640625, -0.020559310913085938, -0.012050628662109375, -0.0035419464111328125, 0.00496673583984375, 0.013475418090820312, 0.021984100341796875, 0.030492782592773438, 0.03900146484375, 0.04751014709472656, 0.056018829345703125, 0.06452751159667969, 0.07303619384765625, 0.08154487609863281, 0.09005355834960938, 0.09856224060058594, 0.1070709228515625, 0.11557960510253906, 0.12408828735351562, 0.1325969696044922, 0.14110565185546875, 0.1496143341064453, 0.15812301635742188, 0.16663169860839844, 0.175140380859375, 0.18364906311035156, 0.19215774536132812, 0.2006664276123047, 0.20917510986328125, 0.2176837921142578, 0.22619247436523438, 0.23470115661621094, 0.2432098388671875, 0.25171852111816406, 0.2602272033691406, 0.2687358856201172, 0.27724456787109375, 0.2857532501220703, 0.2942619323730469, 0.30277061462402344, 0.311279296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 12.0, 12.0, 8.0, 17.0, 22.0, 30.0, 34.0, 74.0, 76.0, 127.0, 262.0, 427.0, 861.0, 862.0, 484.0, 277.0, 175.0, 79.0, 61.0, 40.0, 29.0, 24.0, 22.0, 16.0, 4.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34716796875, -0.3366851806640625, -0.326202392578125, -0.3157196044921875, -0.30523681640625, -0.2947540283203125, -0.284271240234375, -0.2737884521484375, -0.2633056640625, -0.2528228759765625, -0.242340087890625, -0.2318572998046875, -0.22137451171875, -0.2108917236328125, -0.200408935546875, -0.1899261474609375, -0.179443359375, -0.1689605712890625, -0.158477783203125, -0.1479949951171875, -0.13751220703125, -0.1270294189453125, -0.116546630859375, -0.1060638427734375, -0.0955810546875, -0.0850982666015625, -0.074615478515625, -0.0641326904296875, -0.05364990234375, -0.0431671142578125, -0.032684326171875, -0.0222015380859375, -0.01171875, -0.0012359619140625, 0.009246826171875, 0.0197296142578125, 0.03021240234375, 0.0406951904296875, 0.051177978515625, 0.0616607666015625, 0.0721435546875, 0.0826263427734375, 0.093109130859375, 0.1035919189453125, 0.11407470703125, 0.1245574951171875, 0.135040283203125, 0.1455230712890625, 0.156005859375, 0.1664886474609375, 0.176971435546875, 0.1874542236328125, 0.19793701171875, 0.2084197998046875, 0.218902587890625, 0.2293853759765625, 0.2398681640625, 0.2503509521484375, 0.260833740234375, 0.2713165283203125, 0.28179931640625, 0.2922821044921875, 0.302764892578125, 0.3132476806640625, 0.32373046875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 8.0, 23.0, 77.0, 168.0, 323.0, 271.0, 87.0, 18.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.902897834777832, -4.725628852844238, -4.5483598709106445, -4.371090888977051, -4.193821907043457, -4.0165534019470215, -3.8392844200134277, -3.662015438079834, -3.4847464561462402, -3.3074774742126465, -3.1302084922790527, -2.952939748764038, -2.7756707668304443, -2.5984017848968506, -2.421133041381836, -2.243864059448242, -2.0665950775146484, -1.8893260955810547, -1.7120572328567505, -1.5347883701324463, -1.3575193881988525, -1.1802504062652588, -1.0029815435409546, -0.8257126808166504, -0.6484436988830566, -0.47117477655410767, -0.2939058542251587, -0.11663693189620972, 0.06063199043273926, 0.23790091276168823, 0.4151698350906372, 0.5924386978149414, 0.7697076797485352, 0.9469766020774841, 1.124245524406433, 1.3015143871307373, 1.478783369064331, 1.6560523509979248, 1.833321213722229, 2.010590076446533, 2.187859058380127, 2.3651280403137207, 2.5423970222473145, 2.719665765762329, 2.896934747695923, 3.0742037296295166, 3.2514724731445312, 3.428741455078125, 3.6060104370117188, 3.7832794189453125, 3.9605484008789062, 4.1378173828125, 4.315086364746094, 4.492354869842529, 4.669623851776123, 4.846892833709717, 5.0241618156433105, 5.201430797576904, 5.378699779510498, 5.555968761444092, 5.733237266540527, 5.910506248474121, 6.087775230407715, 6.265044212341309, 6.442313194274902]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 1.0, 6.0, 4.0, 12.0, 7.0, 7.0, 12.0, 18.0, 17.0, 21.0, 31.0, 34.0, 35.0, 43.0, 41.0, 38.0, 49.0, 47.0, 51.0, 41.0, 48.0, 54.0, 44.0, 33.0, 37.0, 37.0, 24.0, 37.0, 19.0, 21.0, 23.0, 22.0, 17.0, 14.0, 14.0, 14.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5907424688339233, -1.5431251525878906, -1.4955079555511475, -1.4478906393051147, -1.400273323059082, -1.3526561260223389, -1.3050388097763062, -1.2574214935302734, -1.2098042964935303, -1.1621869802474976, -1.1145697832107544, -1.0669524669647217, -1.0193352699279785, -0.9717179536819458, -0.9241006374359131, -0.8764833807945251, -0.8288661241531372, -0.7812488675117493, -0.7336316108703613, -0.6860142946243286, -0.6383970379829407, -0.5907797813415527, -0.54316246509552, -0.4955452084541321, -0.44792795181274414, -0.4003106951713562, -0.3526934087276459, -0.30507612228393555, -0.2574588656425476, -0.20984159409999847, -0.16222432255744934, -0.11460703611373901, -0.06698989868164062, -0.01937262713909149, 0.02824464440345764, 0.07586191594600677, 0.12347918748855591, 0.17109645903110504, 0.21871373057365417, 0.2663310170173645, 0.31394827365875244, 0.3615655303001404, 0.4091828167438507, 0.45680010318756104, 0.504417359828949, 0.5520346164703369, 0.5996519327163696, 0.6472691893577576, 0.6948864459991455, 0.7425037026405334, 0.7901209592819214, 0.8377382755279541, 0.885355532169342, 0.93297278881073, 0.9805901050567627, 1.0282073020935059, 1.0758246183395386, 1.1234419345855713, 1.1710591316223145, 1.2186764478683472, 1.2662937641143799, 1.313910961151123, 1.3615282773971558, 1.4091455936431885, 1.4567627906799316]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 8.0, 5.0, 17.0, 14.0, 15.0, 28.0, 37.0, 62.0, 92.0, 130.0, 205.0, 268.0, 437.0, 631.0, 938.0, 1582.0, 2432.0, 3991.0, 6822.0, 11689.0, 20536.0, 38006.0, 78665.0, 199680.0, 360356.0, 171976.0, 69749.0, 34400.0, 18721.0, 10568.0, 6100.0, 3733.0, 2313.0, 1444.0, 959.0, 668.0, 423.0, 261.0, 190.0, 130.0, 84.0, 54.0, 37.0, 32.0, 19.0, 13.0, 11.0, 8.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1771240234375, -0.171661376953125, -0.16619873046875, -0.160736083984375, -0.1552734375, -0.149810791015625, -0.14434814453125, -0.138885498046875, -0.1334228515625, -0.127960205078125, -0.12249755859375, -0.117034912109375, -0.111572265625, -0.106109619140625, -0.10064697265625, -0.095184326171875, -0.0897216796875, -0.084259033203125, -0.07879638671875, -0.073333740234375, -0.06787109375, -0.062408447265625, -0.05694580078125, -0.051483154296875, -0.0460205078125, -0.040557861328125, -0.03509521484375, -0.029632568359375, -0.024169921875, -0.018707275390625, -0.01324462890625, -0.007781982421875, -0.0023193359375, 0.003143310546875, 0.00860595703125, 0.014068603515625, 0.01953125, 0.024993896484375, 0.03045654296875, 0.035919189453125, 0.0413818359375, 0.046844482421875, 0.05230712890625, 0.057769775390625, 0.063232421875, 0.068695068359375, 0.07415771484375, 0.079620361328125, 0.0850830078125, 0.090545654296875, 0.09600830078125, 0.101470947265625, 0.10693359375, 0.112396240234375, 0.11785888671875, 0.123321533203125, 0.1287841796875, 0.134246826171875, 0.13970947265625, 0.145172119140625, 0.150634765625, 0.156097412109375, 0.16156005859375, 0.167022705078125, 0.1724853515625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 9.0, 5.0, 8.0, 7.0, 17.0, 14.0, 7.0, 22.0, 22.0, 25.0, 20.0, 27.0, 34.0, 38.0, 48.0, 43.0, 38.0, 27.0, 64.0, 49.0, 46.0, 43.0, 37.0, 38.0, 40.0, 34.0, 25.0, 27.0, 22.0, 27.0, 23.0, 14.0, 13.0, 8.0, 14.0, 8.0, 6.0, 13.0, 12.0, 10.0, 2.0, 6.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0919189453125, -0.08893299102783203, -0.08594703674316406, -0.0829610824584961, -0.07997512817382812, -0.07698917388916016, -0.07400321960449219, -0.07101726531982422, -0.06803131103515625, -0.06504535675048828, -0.06205940246582031, -0.059073448181152344, -0.056087493896484375, -0.053101539611816406, -0.05011558532714844, -0.04712963104248047, -0.0441436767578125, -0.04115772247314453, -0.03817176818847656, -0.035185813903808594, -0.032199859619140625, -0.029213905334472656, -0.026227951049804688, -0.02324199676513672, -0.02025604248046875, -0.01727008819580078, -0.014284133911132812, -0.011298179626464844, -0.008312225341796875, -0.005326271057128906, -0.0023403167724609375, 0.0006456375122070312, 0.003631591796875, 0.006617546081542969, 0.009603500366210938, 0.012589454650878906, 0.015575408935546875, 0.018561363220214844, 0.021547317504882812, 0.02453327178955078, 0.02751922607421875, 0.03050518035888672, 0.03349113464355469, 0.036477088928222656, 0.039463043212890625, 0.042448997497558594, 0.04543495178222656, 0.04842090606689453, 0.0514068603515625, 0.05439281463623047, 0.05737876892089844, 0.060364723205566406, 0.06335067749023438, 0.06633663177490234, 0.06932258605957031, 0.07230854034423828, 0.07529449462890625, 0.07828044891357422, 0.08126640319824219, 0.08425235748291016, 0.08723831176757812, 0.0902242660522461, 0.09321022033691406, 0.09619617462158203, 0.09918212890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 6.0, 8.0, 13.0, 19.0, 25.0, 28.0, 37.0, 67.0, 78.0, 134.0, 226.0, 352.0, 599.0, 1198.0, 2632.0, 8148.0, 43927.0, 704815.0, 253012.0, 23533.0, 5306.0, 1967.0, 999.0, 498.0, 294.0, 201.0, 128.0, 77.0, 69.0, 36.0, 27.0, 34.0, 14.0, 9.0, 12.0, 3.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.50537109375, -0.488983154296875, -0.47259521484375, -0.456207275390625, -0.4398193359375, -0.423431396484375, -0.40704345703125, -0.390655517578125, -0.374267578125, -0.357879638671875, -0.34149169921875, -0.325103759765625, -0.3087158203125, -0.292327880859375, -0.27593994140625, -0.259552001953125, -0.2431640625, -0.226776123046875, -0.21038818359375, -0.194000244140625, -0.1776123046875, -0.161224365234375, -0.14483642578125, -0.128448486328125, -0.112060546875, -0.095672607421875, -0.07928466796875, -0.062896728515625, -0.0465087890625, -0.030120849609375, -0.01373291015625, 0.002655029296875, 0.01904296875, 0.035430908203125, 0.05181884765625, 0.068206787109375, 0.0845947265625, 0.100982666015625, 0.11737060546875, 0.133758544921875, 0.150146484375, 0.166534423828125, 0.18292236328125, 0.199310302734375, 0.2156982421875, 0.232086181640625, 0.24847412109375, 0.264862060546875, 0.28125, 0.297637939453125, 0.31402587890625, 0.330413818359375, 0.3468017578125, 0.363189697265625, 0.37957763671875, 0.395965576171875, 0.412353515625, 0.428741455078125, 0.44512939453125, 0.461517333984375, 0.4779052734375, 0.494293212890625, 0.51068115234375, 0.527069091796875, 0.54345703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 2.0, 6.0, 10.0, 7.0, 5.0, 6.0, 13.0, 20.0, 19.0, 28.0, 26.0, 33.0, 29.0, 42.0, 41.0, 32.0, 37.0, 41.0, 42.0, 39.0, 48.0, 42.0, 51.0, 44.0, 33.0, 30.0, 21.0, 30.0, 44.0, 29.0, 19.0, 21.0, 17.0, 17.0, 13.0, 12.0, 6.0, 8.0, 8.0, 6.0, 10.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.50146484375, -0.487396240234375, -0.47332763671875, -0.459259033203125, -0.4451904296875, -0.431121826171875, -0.41705322265625, -0.402984619140625, -0.388916015625, -0.374847412109375, -0.36077880859375, -0.346710205078125, -0.3326416015625, -0.318572998046875, -0.30450439453125, -0.290435791015625, -0.2763671875, -0.262298583984375, -0.24822998046875, -0.234161376953125, -0.2200927734375, -0.206024169921875, -0.19195556640625, -0.177886962890625, -0.163818359375, -0.149749755859375, -0.13568115234375, -0.121612548828125, -0.1075439453125, -0.093475341796875, -0.07940673828125, -0.065338134765625, -0.05126953125, -0.037200927734375, -0.02313232421875, -0.009063720703125, 0.0050048828125, 0.019073486328125, 0.03314208984375, 0.047210693359375, 0.061279296875, 0.075347900390625, 0.08941650390625, 0.103485107421875, 0.1175537109375, 0.131622314453125, 0.14569091796875, 0.159759521484375, 0.173828125, 0.187896728515625, 0.20196533203125, 0.216033935546875, 0.2301025390625, 0.244171142578125, 0.25823974609375, 0.272308349609375, 0.286376953125, 0.300445556640625, 0.31451416015625, 0.328582763671875, 0.3426513671875, 0.356719970703125, 0.37078857421875, 0.384857177734375, 0.39892578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 9.0, 16.0, 9.0, 27.0, 30.0, 39.0, 75.0, 94.0, 184.0, 273.0, 473.0, 941.0, 1818.0, 4130.0, 10735.0, 32882.0, 168411.0, 691524.0, 98437.0, 23762.0, 8054.0, 3215.0, 1476.0, 861.0, 385.0, 236.0, 147.0, 95.0, 63.0, 42.0, 31.0, 25.0, 9.0, 8.0, 14.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.14697265625, -0.1419677734375, -0.136962890625, -0.1319580078125, -0.126953125, -0.1219482421875, -0.116943359375, -0.1119384765625, -0.10693359375, -0.1019287109375, -0.096923828125, -0.0919189453125, -0.0869140625, -0.0819091796875, -0.076904296875, -0.0718994140625, -0.06689453125, -0.0618896484375, -0.056884765625, -0.0518798828125, -0.046875, -0.0418701171875, -0.036865234375, -0.0318603515625, -0.02685546875, -0.0218505859375, -0.016845703125, -0.0118408203125, -0.0068359375, -0.0018310546875, 0.003173828125, 0.0081787109375, 0.01318359375, 0.0181884765625, 0.023193359375, 0.0281982421875, 0.033203125, 0.0382080078125, 0.043212890625, 0.0482177734375, 0.05322265625, 0.0582275390625, 0.063232421875, 0.0682373046875, 0.0732421875, 0.0782470703125, 0.083251953125, 0.0882568359375, 0.09326171875, 0.0982666015625, 0.103271484375, 0.1082763671875, 0.11328125, 0.1182861328125, 0.123291015625, 0.1282958984375, 0.13330078125, 0.1383056640625, 0.143310546875, 0.1483154296875, 0.1533203125, 0.1583251953125, 0.163330078125, 0.1683349609375, 0.17333984375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 3.0, 8.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 5.0, 10.0, 7.0, 10.0, 14.0, 20.0, 20.0, 34.0, 41.0, 42.0, 54.0, 59.0, 70.0, 83.0, 90.0, 73.0, 62.0, 49.0, 27.0, 32.0, 26.0, 16.0, 19.0, 13.0, 13.0, 9.0, 8.0, 10.0, 6.0, 5.0, 12.0, 6.0, 3.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0], "bins": [-4.595518112182617e-05, -4.450324922800064e-05, -4.305131733417511e-05, -4.159938544034958e-05, -4.014745354652405e-05, -3.869552165269852e-05, -3.7243589758872986e-05, -3.5791657865047455e-05, -3.4339725971221924e-05, -3.288779407739639e-05, -3.143586218357086e-05, -2.998393028974533e-05, -2.85319983959198e-05, -2.708006650209427e-05, -2.5628134608268738e-05, -2.4176202714443207e-05, -2.2724270820617676e-05, -2.1272338926792145e-05, -1.9820407032966614e-05, -1.8368475139141083e-05, -1.6916543245315552e-05, -1.546461135149002e-05, -1.401267945766449e-05, -1.2560747563838959e-05, -1.1108815670013428e-05, -9.656883776187897e-06, -8.204951882362366e-06, -6.753019988536835e-06, -5.301088094711304e-06, -3.849156200885773e-06, -2.3972243070602417e-06, -9.452924132347107e-07, 5.066394805908203e-07, 1.9585713744163513e-06, 3.4105032682418823e-06, 4.862435162067413e-06, 6.314367055892944e-06, 7.766298949718475e-06, 9.218230843544006e-06, 1.0670162737369537e-05, 1.2122094631195068e-05, 1.35740265250206e-05, 1.502595841884613e-05, 1.647789031267166e-05, 1.7929822206497192e-05, 1.9381754100322723e-05, 2.0833685994148254e-05, 2.2285617887973785e-05, 2.3737549781799316e-05, 2.5189481675624847e-05, 2.664141356945038e-05, 2.809334546327591e-05, 2.954527735710144e-05, 3.099720925092697e-05, 3.24491411447525e-05, 3.3901073038578033e-05, 3.5353004932403564e-05, 3.6804936826229095e-05, 3.8256868720054626e-05, 3.970880061388016e-05, 4.116073250770569e-05, 4.261266440153122e-05, 4.406459629535675e-05, 4.551652818918228e-05, 4.696846008300781e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 8.0, 5.0, 18.0, 12.0, 22.0, 25.0, 40.0, 55.0, 88.0, 132.0, 186.0, 346.0, 616.0, 1138.0, 2497.0, 6173.0, 21691.0, 137523.0, 739509.0, 109359.0, 18741.0, 5507.0, 2242.0, 1076.0, 584.0, 331.0, 203.0, 114.0, 79.0, 55.0, 44.0, 21.0, 24.0, 19.0, 17.0, 9.0, 7.0, 12.0, 5.0, 2.0, 0.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1705322265625, -0.16510963439941406, -0.15968704223632812, -0.1542644500732422, -0.14884185791015625, -0.1434192657470703, -0.13799667358398438, -0.13257408142089844, -0.1271514892578125, -0.12172889709472656, -0.11630630493164062, -0.11088371276855469, -0.10546112060546875, -0.10003852844238281, -0.09461593627929688, -0.08919334411621094, -0.083770751953125, -0.07834815979003906, -0.07292556762695312, -0.06750297546386719, -0.06208038330078125, -0.05665779113769531, -0.051235198974609375, -0.04581260681152344, -0.0403900146484375, -0.03496742248535156, -0.029544830322265625, -0.024122238159179688, -0.01869964599609375, -0.013277053833007812, -0.007854461669921875, -0.0024318695068359375, 0.00299072265625, 0.008413314819335938, 0.013835906982421875, 0.019258499145507812, 0.02468109130859375, 0.030103683471679688, 0.035526275634765625, 0.04094886779785156, 0.0463714599609375, 0.05179405212402344, 0.057216644287109375, 0.06263923645019531, 0.06806182861328125, 0.07348442077636719, 0.07890701293945312, 0.08432960510253906, 0.089752197265625, 0.09517478942871094, 0.10059738159179688, 0.10601997375488281, 0.11144256591796875, 0.11686515808105469, 0.12228775024414062, 0.12771034240722656, 0.1331329345703125, 0.13855552673339844, 0.14397811889648438, 0.1494007110595703, 0.15482330322265625, 0.1602458953857422, 0.16566848754882812, 0.17109107971191406, 0.176513671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 8.0, 11.0, 19.0, 10.0, 23.0, 22.0, 16.0, 33.0, 54.0, 47.0, 60.0, 69.0, 74.0, 83.0, 74.0, 67.0, 59.0, 65.0, 31.0, 33.0, 30.0, 22.0, 15.0, 19.0, 6.0, 9.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1131591796875, -0.10870552062988281, -0.10425186157226562, -0.09979820251464844, -0.09534454345703125, -0.09089088439941406, -0.08643722534179688, -0.08198356628417969, -0.0775299072265625, -0.07307624816894531, -0.06862258911132812, -0.06416893005371094, -0.05971527099609375, -0.05526161193847656, -0.050807952880859375, -0.04635429382324219, -0.041900634765625, -0.03744697570800781, -0.032993316650390625, -0.028539657592773438, -0.02408599853515625, -0.019632339477539062, -0.015178680419921875, -0.010725021362304688, -0.0062713623046875, -0.0018177032470703125, 0.002635955810546875, 0.0070896148681640625, 0.01154327392578125, 0.015996932983398438, 0.020450592041015625, 0.024904251098632812, 0.02935791015625, 0.03381156921386719, 0.038265228271484375, 0.04271888732910156, 0.04717254638671875, 0.05162620544433594, 0.056079864501953125, 0.06053352355957031, 0.0649871826171875, 0.06944084167480469, 0.07389450073242188, 0.07834815979003906, 0.08280181884765625, 0.08725547790527344, 0.09170913696289062, 0.09616279602050781, 0.100616455078125, 0.10507011413574219, 0.10952377319335938, 0.11397743225097656, 0.11843109130859375, 0.12288475036621094, 0.12733840942382812, 0.1317920684814453, 0.1362457275390625, 0.1406993865966797, 0.14515304565429688, 0.14960670471191406, 0.15406036376953125, 0.15851402282714844, 0.16296768188476562, 0.1674213409423828, 0.171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 6.0, 5.0, 10.0, 11.0, 43.0, 63.0, 99.0, 149.0, 212.0, 165.0, 109.0, 53.0, 35.0, 10.0, 12.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.661623001098633, -2.5535011291503906, -2.4453794956207275, -2.3372576236724854, -2.2291359901428223, -2.12101411819458, -2.012892246246338, -1.9047706127166748, -1.7966487407684326, -1.68852698802948, -1.5804052352905273, -1.4722833633422852, -1.3641616106033325, -1.2560398578643799, -1.1479181051254272, -1.0397963523864746, -0.931674599647522, -0.8235528469085693, -0.7154310345649719, -0.6073092818260193, -0.49918749928474426, -0.39106571674346924, -0.2829439640045166, -0.1748221516609192, -0.06670039892196655, 0.041421376168727875, 0.1495431512594223, 0.25766491889953613, 0.36578670144081116, 0.4739084839820862, 0.5820302367210388, 0.6901520490646362, 0.7982738018035889, 0.9063955545425415, 1.0145173072814941, 1.1226391792297363, 1.230760931968689, 1.3388826847076416, 1.4470044374465942, 1.5551261901855469, 1.663248062133789, 1.7713698148727417, 1.8794915676116943, 1.9876134395599365, 2.0957350730895996, 2.203856945037842, 2.311978816986084, 2.420100450515747, 2.52822208404541, 2.6363439559936523, 2.7444655895233154, 2.8525874614715576, 2.9607090950012207, 3.068830966949463, 3.176952838897705, 3.285074472427368, 3.3931963443756104, 3.5013182163238525, 3.6094398498535156, 3.717561721801758, 3.825683355331421, 3.933805227279663, 4.041926860809326, 4.150048732757568, 4.2581706047058105]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 9.0, 3.0, 7.0, 4.0, 7.0, 14.0, 15.0, 14.0, 12.0, 17.0, 16.0, 32.0, 21.0, 25.0, 38.0, 44.0, 38.0, 36.0, 62.0, 56.0, 48.0, 45.0, 45.0, 49.0, 46.0, 30.0, 32.0, 35.0, 22.0, 35.0, 27.0, 23.0, 11.0, 13.0, 17.0, 6.0, 8.0, 7.0, 7.0, 1.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.1636312007904053, -2.1042208671569824, -2.0448105335235596, -1.9854000806808472, -1.9259897470474243, -1.8665794134140015, -1.8071690797805786, -1.7477586269378662, -1.6883482933044434, -1.6289379596710205, -1.5695276260375977, -1.5101171731948853, -1.4507068395614624, -1.3912965059280396, -1.3318861722946167, -1.2724757194519043, -1.2130653858184814, -1.1536550521850586, -1.0942447185516357, -1.0348342657089233, -0.9754239320755005, -0.9160135984420776, -0.8566032648086548, -0.7971928715705872, -0.7377825975418091, -0.6783722639083862, -0.6189618706703186, -0.5595515370368958, -0.5001411437988281, -0.4407308101654053, -0.38132044672966003, -0.3219100832939148, -0.26249969005584717, -0.20308932662010193, -0.1436789631843567, -0.08426861464977264, -0.024858251214027405, 0.03455209732055664, 0.09396246075630188, 0.15337282419204712, 0.21278318762779236, 0.2721935510635376, 0.33160391449928284, 0.3910142779350281, 0.4504246115684509, 0.5098350048065186, 0.5692453384399414, 0.6286556720733643, 0.6880660653114319, 0.7474763989448547, 0.8068867921829224, 0.8662971258163452, 0.9257075190544128, 0.9851178526878357, 1.0445282459259033, 1.1039385795593262, 1.163348913192749, 1.2227592468261719, 1.2821695804595947, 1.3415800333023071, 1.40099036693573, 1.4604007005691528, 1.5198110342025757, 1.579221487045288, 1.638631820678711]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 8.0, 4.0, 11.0, 14.0, 21.0, 24.0, 45.0, 54.0, 89.0, 172.0, 320.0, 728.0, 1696.0, 4621.0, 14819.0, 75555.0, 1213364.0, 2719962.0, 131114.0, 21756.0, 5965.0, 2074.0, 858.0, 419.0, 224.0, 98.0, 84.0, 43.0, 29.0, 28.0, 16.0, 13.0, 6.0, 7.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2625617980957031, -0.25412750244140625, -0.24569320678710938, -0.2372589111328125, -0.22882461547851562, -0.22039031982421875, -0.21195602416992188, -0.203521728515625, -0.19508743286132812, -0.18665313720703125, -0.17821884155273438, -0.1697845458984375, -0.16135025024414062, -0.15291595458984375, -0.14448165893554688, -0.13604736328125, -0.12761306762695312, -0.11917877197265625, -0.11074447631835938, -0.1023101806640625, -0.09387588500976562, -0.08544158935546875, -0.07700729370117188, -0.068572998046875, -0.060138702392578125, -0.05170440673828125, -0.043270111083984375, -0.0348358154296875, -0.026401519775390625, -0.01796722412109375, -0.009532928466796875, -0.0010986328125, 0.007335662841796875, 0.01576995849609375, 0.024204254150390625, 0.0326385498046875, 0.041072845458984375, 0.04950714111328125, 0.057941436767578125, 0.066375732421875, 0.07481002807617188, 0.08324432373046875, 0.09167861938476562, 0.1001129150390625, 0.10854721069335938, 0.11698150634765625, 0.12541580200195312, 0.13385009765625, 0.14228439331054688, 0.15071868896484375, 0.15915298461914062, 0.1675872802734375, 0.17602157592773438, 0.18445587158203125, 0.19289016723632812, 0.201324462890625, 0.20975875854492188, 0.21819305419921875, 0.22662734985351562, 0.2350616455078125, 0.24349594116210938, 0.25193023681640625, 0.2603645324707031, 0.268798828125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 9.0, 12.0, 18.0, 17.0, 29.0, 33.0, 46.0, 57.0, 43.0, 58.0, 80.0, 55.0, 68.0, 76.0, 73.0, 60.0, 52.0, 41.0, 38.0, 39.0, 16.0, 16.0, 14.0, 12.0, 6.0, 11.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148193359375, -0.14346694946289062, -0.13874053955078125, -0.13401412963867188, -0.1292877197265625, -0.12456130981445312, -0.11983489990234375, -0.11510848999023438, -0.110382080078125, -0.10565567016601562, -0.10092926025390625, -0.09620285034179688, -0.0914764404296875, -0.08675003051757812, -0.08202362060546875, -0.07729721069335938, -0.07257080078125, -0.06784439086914062, -0.06311798095703125, -0.058391571044921875, -0.0536651611328125, -0.048938751220703125, -0.04421234130859375, -0.039485931396484375, -0.034759521484375, -0.030033111572265625, -0.02530670166015625, -0.020580291748046875, -0.0158538818359375, -0.011127471923828125, -0.00640106201171875, -0.001674652099609375, 0.0030517578125, 0.007778167724609375, 0.01250457763671875, 0.017230987548828125, 0.0219573974609375, 0.026683807373046875, 0.03141021728515625, 0.036136627197265625, 0.040863037109375, 0.045589447021484375, 0.05031585693359375, 0.055042266845703125, 0.0597686767578125, 0.06449508666992188, 0.06922149658203125, 0.07394790649414062, 0.07867431640625, 0.08340072631835938, 0.08812713623046875, 0.09285354614257812, 0.0975799560546875, 0.10230636596679688, 0.10703277587890625, 0.11175918579101562, 0.116485595703125, 0.12121200561523438, 0.12593841552734375, 0.13066482543945312, 0.1353912353515625, 0.14011764526367188, 0.14484405517578125, 0.14957046508789062, 0.154296875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 5.0, 8.0, 18.0, 18.0, 34.0, 50.0, 99.0, 167.0, 250.0, 457.0, 796.0, 1556.0, 3315.0, 6806.0, 16530.0, 46498.0, 183244.0, 1551741.0, 2075879.0, 222980.0, 51840.0, 17943.0, 7180.0, 3278.0, 1552.0, 886.0, 421.0, 274.0, 180.0, 109.0, 57.0, 36.0, 28.0, 13.0, 12.0, 11.0, 5.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.24755859375, -0.2406940460205078, -0.23382949829101562, -0.22696495056152344, -0.22010040283203125, -0.21323585510253906, -0.20637130737304688, -0.1995067596435547, -0.1926422119140625, -0.1857776641845703, -0.17891311645507812, -0.17204856872558594, -0.16518402099609375, -0.15831947326660156, -0.15145492553710938, -0.1445903778076172, -0.137725830078125, -0.1308612823486328, -0.12399673461914062, -0.11713218688964844, -0.11026763916015625, -0.10340309143066406, -0.09653854370117188, -0.08967399597167969, -0.0828094482421875, -0.07594490051269531, -0.06908035278320312, -0.06221580505371094, -0.05535125732421875, -0.04848670959472656, -0.041622161865234375, -0.03475761413574219, -0.02789306640625, -0.021028518676757812, -0.014163970947265625, -0.0072994232177734375, -0.00043487548828125, 0.0064296722412109375, 0.013294219970703125, 0.020158767700195312, 0.0270233154296875, 0.03388786315917969, 0.040752410888671875, 0.04761695861816406, 0.05448150634765625, 0.06134605407714844, 0.06821060180664062, 0.07507514953613281, 0.081939697265625, 0.08880424499511719, 0.09566879272460938, 0.10253334045410156, 0.10939788818359375, 0.11626243591308594, 0.12312698364257812, 0.1299915313720703, 0.1368560791015625, 0.1437206268310547, 0.15058517456054688, 0.15744972229003906, 0.16431427001953125, 0.17117881774902344, 0.17804336547851562, 0.1849079132080078, 0.1917724609375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 5.0, 6.0, 11.0, 17.0, 12.0, 16.0, 21.0, 25.0, 36.0, 69.0, 91.0, 112.0, 174.0, 278.0, 435.0, 702.0, 728.0, 464.0, 331.0, 170.0, 101.0, 60.0, 48.0, 37.0, 28.0, 20.0, 12.0, 14.0, 11.0, 9.0, 6.0, 4.0, 2.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.284423828125, -0.2760581970214844, -0.26769256591796875, -0.2593269348144531, -0.2509613037109375, -0.24259567260742188, -0.23423004150390625, -0.22586441040039062, -0.217498779296875, -0.20913314819335938, -0.20076751708984375, -0.19240188598632812, -0.1840362548828125, -0.17567062377929688, -0.16730499267578125, -0.15893936157226562, -0.15057373046875, -0.14220809936523438, -0.13384246826171875, -0.12547683715820312, -0.1171112060546875, -0.10874557495117188, -0.10037994384765625, -0.09201431274414062, -0.083648681640625, -0.07528305053710938, -0.06691741943359375, -0.058551788330078125, -0.0501861572265625, -0.041820526123046875, -0.03345489501953125, -0.025089263916015625, -0.0167236328125, -0.008358001708984375, 7.62939453125e-06, 0.008373260498046875, 0.0167388916015625, 0.025104522705078125, 0.03347015380859375, 0.041835784912109375, 0.050201416015625, 0.058567047119140625, 0.06693267822265625, 0.07529830932617188, 0.0836639404296875, 0.09202957153320312, 0.10039520263671875, 0.10876083374023438, 0.11712646484375, 0.12549209594726562, 0.13385772705078125, 0.14222335815429688, 0.1505889892578125, 0.15895462036132812, 0.16732025146484375, 0.17568588256835938, 0.184051513671875, 0.19241714477539062, 0.20078277587890625, 0.20914840698242188, 0.2175140380859375, 0.22587966918945312, 0.23424530029296875, 0.24261093139648438, 0.2509765625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 6.0, 15.0, 17.0, 65.0, 119.0, 242.0, 246.0, 165.0, 66.0, 26.0, 10.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50014591217041, -5.373208999633789, -5.24627161026001, -5.1193342208862305, -4.992397308349609, -4.865460395812988, -4.738523006439209, -4.61158561706543, -4.484648704528809, -4.3577117919921875, -4.230774402618408, -4.103837013244629, -3.976900100708008, -3.8499629497528076, -3.7230257987976074, -3.5960886478424072, -3.469151496887207, -3.342214345932007, -3.2152771949768066, -3.0883400440216064, -2.9614028930664062, -2.834465742111206, -2.707528591156006, -2.5805914402008057, -2.4536542892456055, -2.3267171382904053, -2.199779987335205, -2.072842836380005, -1.9459056854248047, -1.8189685344696045, -1.6920313835144043, -1.565094232559204, -1.438157081604004, -1.3112199306488037, -1.1842827796936035, -1.0573456287384033, -0.9304084777832031, -0.8034713268280029, -0.6765341758728027, -0.5495970249176025, -0.42265987396240234, -0.29572272300720215, -0.16878557205200195, -0.04184842109680176, 0.08508872985839844, 0.21202588081359863, 0.33896303176879883, 0.465900182723999, 0.5928373336791992, 0.7197744846343994, 0.8467116355895996, 0.9736487865447998, 1.1005859375, 1.2275230884552002, 1.3544602394104004, 1.4813973903656006, 1.6083345413208008, 1.735271692276001, 1.8622088432312012, 1.9891459941864014, 2.1160831451416016, 2.2430202960968018, 2.369957447052002, 2.496894598007202, 2.6238317489624023]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 7.0, 10.0, 6.0, 14.0, 14.0, 25.0, 27.0, 22.0, 37.0, 42.0, 36.0, 46.0, 40.0, 52.0, 48.0, 62.0, 65.0, 57.0, 51.0, 55.0, 39.0, 38.0, 34.0, 29.0, 27.0, 23.0, 19.0, 15.0, 9.0, 12.0, 10.0, 4.0, 4.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5750240087509155, -1.5291730165481567, -1.4833221435546875, -1.4374711513519287, -1.39162015914917, -1.3457691669464111, -1.299918293952942, -1.254067301750183, -1.2082164287567139, -1.162365436553955, -1.1165145635604858, -1.070663571357727, -1.0248125791549683, -0.9789616465568542, -0.9331107139587402, -0.8872597217559814, -0.8414087295532227, -0.7955577969551086, -0.7497068047523499, -0.7038558721542358, -0.658004879951477, -0.612153947353363, -0.566303014755249, -0.5204520225524902, -0.4746010899543762, -0.4287501275539398, -0.3828991651535034, -0.3370482325553894, -0.291197270154953, -0.2453463077545166, -0.1994953751564026, -0.1536444127559662, -0.10779345035552979, -0.06194249540567398, -0.016091540455818176, 0.02975940704345703, 0.07561036944389343, 0.12146133184432983, 0.16731226444244385, 0.21316322684288025, 0.25901418924331665, 0.30486515164375305, 0.35071611404418945, 0.39656704664230347, 0.44241800904273987, 0.48826897144317627, 0.5341199040412903, 0.5799708366394043, 0.6258218288421631, 0.6716727614402771, 0.7175237536430359, 0.7633746862411499, 0.8092256784439087, 0.8550766110420227, 0.9009275436401367, 0.9467785358428955, 0.9926294684410095, 1.0384804010391235, 1.0843313932418823, 1.1301822662353516, 1.1760332584381104, 1.2218842506408691, 1.267735242843628, 1.3135861158370972, 1.359437108039856]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 5.0, 12.0, 15.0, 17.0, 27.0, 41.0, 61.0, 99.0, 136.0, 198.0, 386.0, 574.0, 856.0, 1383.0, 2257.0, 3690.0, 6558.0, 12295.0, 22965.0, 49836.0, 131136.0, 349574.0, 284315.0, 98631.0, 39669.0, 19256.0, 10178.0, 5664.0, 3282.0, 2040.0, 1219.0, 732.0, 500.0, 336.0, 202.0, 134.0, 93.0, 62.0, 49.0, 24.0, 13.0, 7.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.1807861328125, -0.17528533935546875, -0.1697845458984375, -0.16428375244140625, -0.158782958984375, -0.15328216552734375, -0.1477813720703125, -0.14228057861328125, -0.13677978515625, -0.13127899169921875, -0.1257781982421875, -0.12027740478515625, -0.114776611328125, -0.10927581787109375, -0.1037750244140625, -0.09827423095703125, -0.0927734375, -0.08727264404296875, -0.0817718505859375, -0.07627105712890625, -0.070770263671875, -0.06526947021484375, -0.0597686767578125, -0.05426788330078125, -0.04876708984375, -0.04326629638671875, -0.0377655029296875, -0.03226470947265625, -0.026763916015625, -0.02126312255859375, -0.0157623291015625, -0.01026153564453125, -0.0047607421875, 0.00074005126953125, 0.0062408447265625, 0.01174163818359375, 0.017242431640625, 0.02274322509765625, 0.0282440185546875, 0.03374481201171875, 0.03924560546875, 0.04474639892578125, 0.0502471923828125, 0.05574798583984375, 0.061248779296875, 0.06674957275390625, 0.0722503662109375, 0.07775115966796875, 0.083251953125, 0.08875274658203125, 0.0942535400390625, 0.09975433349609375, 0.105255126953125, 0.11075592041015625, 0.1162567138671875, 0.12175750732421875, 0.12725830078125, 0.13275909423828125, 0.1382598876953125, 0.14376068115234375, 0.149261474609375, 0.15476226806640625, 0.1602630615234375, 0.16576385498046875, 0.1712646484375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 6.0, 9.0, 5.0, 11.0, 12.0, 19.0, 15.0, 26.0, 29.0, 22.0, 35.0, 28.0, 36.0, 45.0, 40.0, 50.0, 38.0, 38.0, 53.0, 49.0, 43.0, 40.0, 35.0, 35.0, 32.0, 39.0, 34.0, 23.0, 22.0, 24.0, 25.0, 11.0, 14.0, 12.0, 6.0, 5.0, 8.0, 6.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.10479736328125, -0.10155773162841797, -0.09831809997558594, -0.0950784683227539, -0.09183883666992188, -0.08859920501708984, -0.08535957336425781, -0.08211994171142578, -0.07888031005859375, -0.07564067840576172, -0.07240104675292969, -0.06916141510009766, -0.06592178344726562, -0.0626821517944336, -0.05944252014160156, -0.05620288848876953, -0.0529632568359375, -0.04972362518310547, -0.04648399353027344, -0.043244361877441406, -0.040004730224609375, -0.036765098571777344, -0.03352546691894531, -0.03028583526611328, -0.02704620361328125, -0.02380657196044922, -0.020566940307617188, -0.017327308654785156, -0.014087677001953125, -0.010848045349121094, -0.0076084136962890625, -0.004368782043457031, -0.001129150390625, 0.0021104812622070312, 0.0053501129150390625, 0.008589744567871094, 0.011829376220703125, 0.015069007873535156, 0.018308639526367188, 0.02154827117919922, 0.02478790283203125, 0.02802753448486328, 0.03126716613769531, 0.034506797790527344, 0.037746429443359375, 0.040986061096191406, 0.04422569274902344, 0.04746532440185547, 0.0507049560546875, 0.05394458770751953, 0.05718421936035156, 0.060423851013183594, 0.06366348266601562, 0.06690311431884766, 0.07014274597167969, 0.07338237762451172, 0.07662200927734375, 0.07986164093017578, 0.08310127258300781, 0.08634090423583984, 0.08958053588867188, 0.0928201675415039, 0.09605979919433594, 0.09929943084716797, 0.1025390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 10.0, 11.0, 9.0, 25.0, 28.0, 31.0, 40.0, 64.0, 123.0, 158.0, 331.0, 613.0, 1243.0, 2882.0, 9557.0, 48180.0, 694315.0, 254192.0, 26207.0, 6330.0, 2100.0, 890.0, 502.0, 258.0, 160.0, 96.0, 69.0, 35.0, 25.0, 19.0, 17.0, 16.0, 8.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.438720703125, -0.4240150451660156, -0.40930938720703125, -0.3946037292480469, -0.3798980712890625, -0.3651924133300781, -0.35048675537109375, -0.3357810974121094, -0.321075439453125, -0.3063697814941406, -0.29166412353515625, -0.2769584655761719, -0.2622528076171875, -0.24754714965820312, -0.23284149169921875, -0.21813583374023438, -0.20343017578125, -0.18872451782226562, -0.17401885986328125, -0.15931320190429688, -0.1446075439453125, -0.12990188598632812, -0.11519622802734375, -0.10049057006835938, -0.085784912109375, -0.07107925415039062, -0.05637359619140625, -0.041667938232421875, -0.0269622802734375, -0.012256622314453125, 0.00244903564453125, 0.017154693603515625, 0.0318603515625, 0.046566009521484375, 0.06127166748046875, 0.07597732543945312, 0.0906829833984375, 0.10538864135742188, 0.12009429931640625, 0.13479995727539062, 0.149505615234375, 0.16421127319335938, 0.17891693115234375, 0.19362258911132812, 0.2083282470703125, 0.22303390502929688, 0.23773956298828125, 0.2524452209472656, 0.26715087890625, 0.2818565368652344, 0.29656219482421875, 0.3112678527832031, 0.3259735107421875, 0.3406791687011719, 0.35538482666015625, 0.3700904846191406, 0.384796142578125, 0.3995018005371094, 0.41420745849609375, 0.4289131164550781, 0.4436187744140625, 0.4583244323730469, 0.47303009033203125, 0.4877357482910156, 0.50244140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 9.0, 3.0, 6.0, 4.0, 12.0, 16.0, 23.0, 21.0, 28.0, 38.0, 31.0, 44.0, 47.0, 53.0, 58.0, 54.0, 66.0, 59.0, 58.0, 44.0, 50.0, 48.0, 41.0, 30.0, 39.0, 21.0, 30.0, 17.0, 10.0, 8.0, 7.0, 8.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.57568359375, -0.5591812133789062, -0.5426788330078125, -0.5261764526367188, -0.509674072265625, -0.49317169189453125, -0.4766693115234375, -0.46016693115234375, -0.44366455078125, -0.42716217041015625, -0.4106597900390625, -0.39415740966796875, -0.377655029296875, -0.36115264892578125, -0.3446502685546875, -0.32814788818359375, -0.3116455078125, -0.29514312744140625, -0.2786407470703125, -0.26213836669921875, -0.245635986328125, -0.22913360595703125, -0.2126312255859375, -0.19612884521484375, -0.17962646484375, -0.16312408447265625, -0.1466217041015625, -0.13011932373046875, -0.113616943359375, -0.09711456298828125, -0.0806121826171875, -0.06410980224609375, -0.047607421875, -0.03110504150390625, -0.0146026611328125, 0.00189971923828125, 0.018402099609375, 0.03490447998046875, 0.0514068603515625, 0.06790924072265625, 0.08441162109375, 0.10091400146484375, 0.1174163818359375, 0.13391876220703125, 0.150421142578125, 0.16692352294921875, 0.1834259033203125, 0.19992828369140625, 0.2164306640625, 0.23293304443359375, 0.2494354248046875, 0.26593780517578125, 0.282440185546875, 0.29894256591796875, 0.3154449462890625, 0.33194732666015625, 0.34844970703125, 0.36495208740234375, 0.3814544677734375, 0.39795684814453125, 0.414459228515625, 0.43096160888671875, 0.4474639892578125, 0.46396636962890625, 0.48046875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 8.0, 3.0, 5.0, 11.0, 14.0, 27.0, 38.0, 65.0, 91.0, 125.0, 194.0, 451.0, 921.0, 2129.0, 6293.0, 23568.0, 159366.0, 729027.0, 100394.0, 17379.0, 4995.0, 1760.0, 716.0, 411.0, 185.0, 119.0, 73.0, 70.0, 26.0, 27.0, 18.0, 12.0, 6.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1754150390625, -0.16901206970214844, -0.16260910034179688, -0.1562061309814453, -0.14980316162109375, -0.1434001922607422, -0.13699722290039062, -0.13059425354003906, -0.1241912841796875, -0.11778831481933594, -0.11138534545898438, -0.10498237609863281, -0.09857940673828125, -0.09217643737792969, -0.08577346801757812, -0.07937049865722656, -0.072967529296875, -0.06656455993652344, -0.060161590576171875, -0.05375862121582031, -0.04735565185546875, -0.04095268249511719, -0.034549713134765625, -0.028146743774414062, -0.0217437744140625, -0.015340805053710938, -0.008937835693359375, -0.0025348663330078125, 0.00386810302734375, 0.010271072387695312, 0.016674041748046875, 0.023077011108398438, 0.02947998046875, 0.03588294982910156, 0.042285919189453125, 0.04868888854980469, 0.05509185791015625, 0.06149482727050781, 0.06789779663085938, 0.07430076599121094, 0.0807037353515625, 0.08710670471191406, 0.09350967407226562, 0.09991264343261719, 0.10631561279296875, 0.11271858215332031, 0.11912155151367188, 0.12552452087402344, 0.131927490234375, 0.13833045959472656, 0.14473342895507812, 0.1511363983154297, 0.15753936767578125, 0.1639423370361328, 0.17034530639648438, 0.17674827575683594, 0.1831512451171875, 0.18955421447753906, 0.19595718383789062, 0.2023601531982422, 0.20876312255859375, 0.2151660919189453, 0.22156906127929688, 0.22797203063964844, 0.234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 7.0, 11.0, 15.0, 11.0, 17.0, 17.0, 25.0, 26.0, 42.0, 51.0, 61.0, 70.0, 87.0, 112.0, 79.0, 72.0, 63.0, 58.0, 41.0, 26.0, 14.0, 10.0, 18.0, 10.0, 5.0, 5.0, 6.0, 6.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.513429641723633e-05, -5.342625081539154e-05, -5.171820521354675e-05, -5.0010159611701965e-05, -4.830211400985718e-05, -4.659406840801239e-05, -4.48860228061676e-05, -4.3177977204322815e-05, -4.146993160247803e-05, -3.976188600063324e-05, -3.805384039878845e-05, -3.6345794796943665e-05, -3.463774919509888e-05, -3.292970359325409e-05, -3.12216579914093e-05, -2.9513612389564514e-05, -2.7805566787719727e-05, -2.609752118587494e-05, -2.438947558403015e-05, -2.2681429982185364e-05, -2.0973384380340576e-05, -1.926533877849579e-05, -1.7557293176651e-05, -1.5849247574806213e-05, -1.4141201972961426e-05, -1.2433156371116638e-05, -1.072511076927185e-05, -9.017065167427063e-06, -7.309019565582275e-06, -5.600973963737488e-06, -3.8929283618927e-06, -2.1848827600479126e-06, -4.76837158203125e-07, 1.2312084436416626e-06, 2.93925404548645e-06, 4.647299647331238e-06, 6.355345249176025e-06, 8.063390851020813e-06, 9.7714364528656e-06, 1.1479482054710388e-05, 1.3187527656555176e-05, 1.4895573258399963e-05, 1.660361886024475e-05, 1.831166446208954e-05, 2.0019710063934326e-05, 2.1727755665779114e-05, 2.34358012676239e-05, 2.514384686946869e-05, 2.6851892471313477e-05, 2.8559938073158264e-05, 3.0267983675003052e-05, 3.197602927684784e-05, 3.368407487869263e-05, 3.5392120480537415e-05, 3.71001660823822e-05, 3.880821168422699e-05, 4.051625728607178e-05, 4.2224302887916565e-05, 4.393234848976135e-05, 4.564039409160614e-05, 4.734843969345093e-05, 4.9056485295295715e-05, 5.07645308971405e-05, 5.247257649898529e-05, 5.418062210083008e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 8.0, 9.0, 18.0, 21.0, 33.0, 58.0, 97.0, 178.0, 363.0, 764.0, 2064.0, 7410.0, 47481.0, 722429.0, 240396.0, 20374.0, 4337.0, 1391.0, 579.0, 238.0, 117.0, 79.0, 43.0, 27.0, 13.0, 10.0, 8.0, 3.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2454833984375, -0.23751258850097656, -0.22954177856445312, -0.2215709686279297, -0.21360015869140625, -0.2056293487548828, -0.19765853881835938, -0.18968772888183594, -0.1817169189453125, -0.17374610900878906, -0.16577529907226562, -0.1578044891357422, -0.14983367919921875, -0.1418628692626953, -0.13389205932617188, -0.12592124938964844, -0.117950439453125, -0.10997962951660156, -0.10200881958007812, -0.09403800964355469, -0.08606719970703125, -0.07809638977050781, -0.07012557983398438, -0.06215476989746094, -0.0541839599609375, -0.04621315002441406, -0.038242340087890625, -0.030271530151367188, -0.02230072021484375, -0.014329910278320312, -0.006359100341796875, 0.0016117095947265625, 0.00958251953125, 0.017553329467773438, 0.025524139404296875, 0.03349494934082031, 0.04146575927734375, 0.04943656921386719, 0.057407379150390625, 0.06537818908691406, 0.0733489990234375, 0.08131980895996094, 0.08929061889648438, 0.09726142883300781, 0.10523223876953125, 0.11320304870605469, 0.12117385864257812, 0.12914466857910156, 0.137115478515625, 0.14508628845214844, 0.15305709838867188, 0.1610279083251953, 0.16899871826171875, 0.1769695281982422, 0.18494033813476562, 0.19291114807128906, 0.2008819580078125, 0.20885276794433594, 0.21682357788085938, 0.2247943878173828, 0.23276519775390625, 0.2407360076904297, 0.24870681762695312, 0.25667762756347656, 0.2646484375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 14.0, 9.0, 13.0, 19.0, 22.0, 27.0, 46.0, 71.0, 75.0, 103.0, 118.0, 109.0, 84.0, 71.0, 58.0, 40.0, 26.0, 23.0, 17.0, 19.0, 8.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2354736328125, -0.2294139862060547, -0.22335433959960938, -0.21729469299316406, -0.21123504638671875, -0.20517539978027344, -0.19911575317382812, -0.1930561065673828, -0.1869964599609375, -0.1809368133544922, -0.17487716674804688, -0.16881752014160156, -0.16275787353515625, -0.15669822692871094, -0.15063858032226562, -0.1445789337158203, -0.138519287109375, -0.1324596405029297, -0.12639999389648438, -0.12034034729003906, -0.11428070068359375, -0.10822105407714844, -0.10216140747070312, -0.09610176086425781, -0.0900421142578125, -0.08398246765136719, -0.07792282104492188, -0.07186317443847656, -0.06580352783203125, -0.05974388122558594, -0.053684234619140625, -0.04762458801269531, -0.04156494140625, -0.03550529479980469, -0.029445648193359375, -0.023386001586914062, -0.01732635498046875, -0.011266708374023438, -0.005207061767578125, 0.0008525848388671875, 0.0069122314453125, 0.012971878051757812, 0.019031524658203125, 0.025091171264648438, 0.03115081787109375, 0.03721046447753906, 0.043270111083984375, 0.04932975769042969, 0.055389404296875, 0.06144905090332031, 0.06750869750976562, 0.07356834411621094, 0.07962799072265625, 0.08568763732910156, 0.09174728393554688, 0.09780693054199219, 0.1038665771484375, 0.10992622375488281, 0.11598587036132812, 0.12204551696777344, 0.12810516357421875, 0.13416481018066406, 0.14022445678710938, 0.1462841033935547, 0.15234375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 6.0, 15.0, 25.0, 61.0, 145.0, 250.0, 267.0, 131.0, 56.0, 25.0, 6.0, 4.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.136523723602295, -3.000941276550293, -2.865358829498291, -2.72977614402771, -2.594193696975708, -2.458611249923706, -2.323028564453125, -2.187446117401123, -2.051863670349121, -1.9162812232971191, -1.7806986570358276, -1.6451160907745361, -1.5095336437225342, -1.3739511966705322, -1.2383686304092407, -1.1027860641479492, -0.9672036170959473, -0.8316211104393005, -0.6960386037826538, -0.5604560971260071, -0.42487359046936035, -0.2892910838127136, -0.1537085771560669, -0.018126070499420166, 0.11745643615722656, 0.2530389428138733, 0.38862144947052, 0.5242039561271667, 0.6597864627838135, 0.7953689694404602, 0.9309514760971069, 1.0665340423583984, 1.2021164894104004, 1.3376989364624023, 1.4732815027236938, 1.6088640689849854, 1.7444465160369873, 1.8800289630889893, 2.0156116485595703, 2.1511940956115723, 2.286776542663574, 2.422358989715576, 2.557941436767578, 2.693524122238159, 2.829106569290161, 2.964689016342163, 3.100271701812744, 3.235854148864746, 3.371436595916748, 3.50701904296875, 3.642601490020752, 3.778184175491333, 3.913766622543335, 4.049349308013916, 4.184931755065918, 4.32051420211792, 4.456096649169922, 4.591679096221924, 4.727261543273926, 4.862843990325928, 4.99842643737793, 5.13400936126709, 5.269591808319092, 5.405174255371094, 5.540756702423096]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 12.0, 13.0, 20.0, 17.0, 13.0, 25.0, 29.0, 22.0, 38.0, 30.0, 33.0, 45.0, 49.0, 51.0, 50.0, 48.0, 61.0, 61.0, 54.0, 49.0, 41.0, 31.0, 35.0, 26.0, 22.0, 24.0, 20.0, 17.0, 8.0, 11.0, 4.0, 7.0, 6.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5769604444503784, -1.5185120105743408, -1.4600635766983032, -1.4016151428222656, -1.343166708946228, -1.2847182750701904, -1.2262698411941528, -1.1678214073181152, -1.1093729734420776, -1.05092453956604, -0.9924761056900024, -0.9340276718139648, -0.8755792379379272, -0.8171308040618896, -0.758682370185852, -0.7002339363098145, -0.6417855024337769, -0.5833370685577393, -0.5248886346817017, -0.46644020080566406, -0.40799176692962646, -0.34954333305358887, -0.29109489917755127, -0.23264646530151367, -0.17419803142547607, -0.11574959754943848, -0.05730116367340088, 0.0011472702026367188, 0.059595704078674316, 0.11804413795471191, 0.1764925718307495, 0.2349410057067871, 0.29338955879211426, 0.35183799266815186, 0.41028642654418945, 0.46873486042022705, 0.5271832942962646, 0.5856317281723022, 0.6440801620483398, 0.7025285959243774, 0.760977029800415, 0.8194254636764526, 0.8778738975524902, 0.9363223314285278, 0.9947707653045654, 1.053219199180603, 1.1116676330566406, 1.1701160669326782, 1.2285645008087158, 1.2870129346847534, 1.345461368560791, 1.4039098024368286, 1.4623582363128662, 1.5208066701889038, 1.5792551040649414, 1.637703537940979, 1.6961519718170166, 1.7546004056930542, 1.8130488395690918, 1.8714972734451294, 1.929945707321167, 1.9883941411972046, 2.046842575073242, 2.1052908897399902, 2.1637394428253174]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 8.0, 5.0, 2.0, 7.0, 11.0, 5.0, 15.0, 24.0, 23.0, 39.0, 52.0, 68.0, 104.0, 146.0, 253.0, 365.0, 625.0, 935.0, 1710.0, 3165.0, 5882.0, 11843.0, 25741.0, 62853.0, 182617.0, 659197.0, 1785870.0, 1024822.0, 273529.0, 87398.0, 34447.0, 15435.0, 7676.0, 3869.0, 2192.0, 1252.0, 801.0, 443.0, 281.0, 186.0, 136.0, 76.0, 60.0, 33.0, 21.0, 31.0, 12.0, 11.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.1337890625, -0.13003826141357422, -0.12628746032714844, -0.12253665924072266, -0.11878585815429688, -0.1150350570678711, -0.11128425598144531, -0.10753345489501953, -0.10378265380859375, -0.10003185272216797, -0.09628105163574219, -0.0925302505493164, -0.08877944946289062, -0.08502864837646484, -0.08127784729003906, -0.07752704620361328, -0.0737762451171875, -0.07002544403076172, -0.06627464294433594, -0.06252384185791016, -0.058773040771484375, -0.055022239685058594, -0.05127143859863281, -0.04752063751220703, -0.04376983642578125, -0.04001903533935547, -0.03626823425292969, -0.032517433166503906, -0.028766632080078125, -0.025015830993652344, -0.021265029907226562, -0.01751422882080078, -0.013763427734375, -0.010012626647949219, -0.0062618255615234375, -0.0025110244750976562, 0.001239776611328125, 0.004990577697753906, 0.008741378784179688, 0.012492179870605469, 0.01624298095703125, 0.01999378204345703, 0.023744583129882812, 0.027495384216308594, 0.031246185302734375, 0.034996986389160156, 0.03874778747558594, 0.04249858856201172, 0.0462493896484375, 0.05000019073486328, 0.05375099182128906, 0.057501792907714844, 0.061252593994140625, 0.0650033950805664, 0.06875419616699219, 0.07250499725341797, 0.07625579833984375, 0.08000659942626953, 0.08375740051269531, 0.0875082015991211, 0.09125900268554688, 0.09500980377197266, 0.09876060485839844, 0.10251140594482422, 0.10626220703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 11.0, 17.0, 17.0, 28.0, 36.0, 39.0, 42.0, 54.0, 62.0, 68.0, 57.0, 70.0, 68.0, 55.0, 70.0, 52.0, 50.0, 44.0, 40.0, 29.0, 17.0, 25.0, 17.0, 12.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1878662109375, -0.18338871002197266, -0.1789112091064453, -0.17443370819091797, -0.16995620727539062, -0.16547870635986328, -0.16100120544433594, -0.1565237045288086, -0.15204620361328125, -0.1475687026977539, -0.14309120178222656, -0.13861370086669922, -0.13413619995117188, -0.12965869903564453, -0.1251811981201172, -0.12070369720458984, -0.1162261962890625, -0.11174869537353516, -0.10727119445800781, -0.10279369354248047, -0.09831619262695312, -0.09383869171142578, -0.08936119079589844, -0.0848836898803711, -0.08040618896484375, -0.0759286880493164, -0.07145118713378906, -0.06697368621826172, -0.062496185302734375, -0.05801868438720703, -0.05354118347167969, -0.049063682556152344, -0.044586181640625, -0.040108680725097656, -0.03563117980957031, -0.03115367889404297, -0.026676177978515625, -0.02219867706298828, -0.017721176147460938, -0.013243675231933594, -0.00876617431640625, -0.004288673400878906, 0.0001888275146484375, 0.004666328430175781, 0.009143829345703125, 0.013621330261230469, 0.018098831176757812, 0.022576332092285156, 0.0270538330078125, 0.031531333923339844, 0.03600883483886719, 0.04048633575439453, 0.044963836669921875, 0.04944133758544922, 0.05391883850097656, 0.058396339416503906, 0.06287384033203125, 0.0673513412475586, 0.07182884216308594, 0.07630634307861328, 0.08078384399414062, 0.08526134490966797, 0.08973884582519531, 0.09421634674072266, 0.09869384765625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 23.0, 34.0, 55.0, 93.0, 192.0, 376.0, 796.0, 2085.0, 5852.0, 21323.0, 105633.0, 1117408.0, 2663998.0, 222047.0, 38343.0, 9975.0, 3284.0, 1401.0, 643.0, 317.0, 157.0, 103.0, 54.0, 23.0, 21.0, 15.0, 9.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3173828125, -0.3075218200683594, -0.29766082763671875, -0.2877998352050781, -0.2779388427734375, -0.2680778503417969, -0.25821685791015625, -0.24835586547851562, -0.238494873046875, -0.22863388061523438, -0.21877288818359375, -0.20891189575195312, -0.1990509033203125, -0.18918991088867188, -0.17932891845703125, -0.16946792602539062, -0.15960693359375, -0.14974594116210938, -0.13988494873046875, -0.13002395629882812, -0.1201629638671875, -0.11030197143554688, -0.10044097900390625, -0.09057998657226562, -0.080718994140625, -0.07085800170898438, -0.06099700927734375, -0.051136016845703125, -0.0412750244140625, -0.031414031982421875, -0.02155303955078125, -0.011692047119140625, -0.0018310546875, 0.008029937744140625, 0.01789093017578125, 0.027751922607421875, 0.0376129150390625, 0.047473907470703125, 0.05733489990234375, 0.06719589233398438, 0.077056884765625, 0.08691787719726562, 0.09677886962890625, 0.10663986206054688, 0.1165008544921875, 0.12636184692382812, 0.13622283935546875, 0.14608383178710938, 0.15594482421875, 0.16580581665039062, 0.17566680908203125, 0.18552780151367188, 0.1953887939453125, 0.20524978637695312, 0.21511077880859375, 0.22497177124023438, 0.234832763671875, 0.24469375610351562, 0.25455474853515625, 0.2644157409667969, 0.2742767333984375, 0.2841377258300781, 0.29399871826171875, 0.3038597106933594, 0.313720703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0, 11.0, 6.0, 14.0, 16.0, 20.0, 20.0, 35.0, 41.0, 55.0, 71.0, 91.0, 138.0, 185.0, 266.0, 331.0, 438.0, 491.0, 478.0, 356.0, 254.0, 154.0, 146.0, 100.0, 72.0, 56.0, 44.0, 36.0, 21.0, 21.0, 18.0, 14.0, 10.0, 9.0, 18.0, 3.0, 14.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.231201171875, -0.22312545776367188, -0.21504974365234375, -0.20697402954101562, -0.1988983154296875, -0.19082260131835938, -0.18274688720703125, -0.17467117309570312, -0.166595458984375, -0.15851974487304688, -0.15044403076171875, -0.14236831665039062, -0.1342926025390625, -0.12621688842773438, -0.11814117431640625, -0.11006546020507812, -0.10198974609375, -0.09391403198242188, -0.08583831787109375, -0.07776260375976562, -0.0696868896484375, -0.061611175537109375, -0.05353546142578125, -0.045459747314453125, -0.037384033203125, -0.029308319091796875, -0.02123260498046875, -0.013156890869140625, -0.0050811767578125, 0.002994537353515625, 0.01107025146484375, 0.019145965576171875, 0.0272216796875, 0.035297393798828125, 0.04337310791015625, 0.051448822021484375, 0.0595245361328125, 0.06760025024414062, 0.07567596435546875, 0.08375167846679688, 0.091827392578125, 0.09990310668945312, 0.10797882080078125, 0.11605453491210938, 0.1241302490234375, 0.13220596313476562, 0.14028167724609375, 0.14835739135742188, 0.15643310546875, 0.16450881958007812, 0.17258453369140625, 0.18066024780273438, 0.1887359619140625, 0.19681167602539062, 0.20488739013671875, 0.21296310424804688, 0.221038818359375, 0.22911453247070312, 0.23719024658203125, 0.24526596069335938, 0.2533416748046875, 0.2614173889160156, 0.26949310302734375, 0.2775688171386719, 0.28564453125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 13.0, 29.0, 100.0, 253.0, 358.0, 159.0, 48.0, 16.0, 10.0, 4.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.392030715942383, -8.187795639038086, -7.983559608459473, -7.779324054718018, -7.5750885009765625, -7.370852947235107, -7.166617393493652, -6.962381839752197, -6.758146286010742, -6.553910732269287, -6.349675178527832, -6.145439624786377, -5.941204071044922, -5.736968517303467, -5.532732963562012, -5.328497409820557, -5.124261856079102, -4.9200263023376465, -4.715790748596191, -4.511555194854736, -4.307319641113281, -4.103084087371826, -3.898848533630371, -3.694612979888916, -3.490377426147461, -3.286141872406006, -3.081906318664551, -2.8776707649230957, -2.6734352111816406, -2.4691996574401855, -2.2649641036987305, -2.0607285499572754, -1.8564934730529785, -1.6522579193115234, -1.4480223655700684, -1.2437868118286133, -1.0395512580871582, -0.8353157043457031, -0.631080150604248, -0.42684459686279297, -0.2226090431213379, -0.018373489379882812, 0.18586206436157227, 0.39009761810302734, 0.5943331718444824, 0.7985687255859375, 1.0028042793273926, 1.2070398330688477, 1.4112753868103027, 1.6155109405517578, 1.819746494293213, 2.023982048034668, 2.228217601776123, 2.432453155517578, 2.636688709259033, 2.8409242630004883, 3.0451598167419434, 3.2493953704833984, 3.4536309242248535, 3.6578664779663086, 3.8621020317077637, 4.066337585449219, 4.270573139190674, 4.474808692932129, 4.679044246673584]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 6.0, 1.0, 6.0, 9.0, 8.0, 14.0, 15.0, 10.0, 18.0, 20.0, 22.0, 27.0, 38.0, 35.0, 40.0, 43.0, 36.0, 43.0, 50.0, 40.0, 42.0, 44.0, 37.0, 47.0, 31.0, 37.0, 38.0, 30.0, 31.0, 32.0, 22.0, 20.0, 18.0, 20.0, 12.0, 16.0, 10.0, 3.0, 9.0, 9.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1628868579864502, -1.1204020977020264, -1.077917456626892, -1.0354326963424683, -0.9929479956626892, -0.9504632949829102, -0.9079785346984863, -0.8654938340187073, -0.8230091333389282, -0.7805244326591492, -0.7380396723747253, -0.6955549716949463, -0.6530702710151672, -0.6105855703353882, -0.5681008100509644, -0.5256161093711853, -0.4831313490867615, -0.44064661860466003, -0.398161917924881, -0.35567718744277954, -0.3131924867630005, -0.27070775628089905, -0.2282230257987976, -0.18573832511901855, -0.14325359463691711, -0.10076887905597687, -0.058284156024456024, -0.01579943299293518, 0.026685282588005066, 0.06916999816894531, 0.11165472865104675, 0.1541394293308258, 0.19662415981292725, 0.2391088753938675, 0.28159359097480774, 0.3240783214569092, 0.36656302213668823, 0.4090477526187897, 0.4515324831008911, 0.49401718378067017, 0.5365018844604492, 0.5789865851402283, 0.6214713454246521, 0.6639560461044312, 0.7064407467842102, 0.7489254474639893, 0.7914102077484131, 0.8338949084281921, 0.876379668712616, 0.918864369392395, 0.9613491296768188, 1.0038337707519531, 1.046318531036377, 1.0888032913208008, 1.1312880516052246, 1.1737726926803589, 1.2162574529647827, 1.2587422132492065, 1.3012268543243408, 1.3437116146087646, 1.3861963748931885, 1.4286810159683228, 1.4711657762527466, 1.5136504173278809, 1.5561351776123047]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 9.0, 18.0, 20.0, 35.0, 58.0, 86.0, 102.0, 162.0, 294.0, 447.0, 795.0, 1255.0, 2303.0, 4278.0, 7832.0, 15813.0, 32746.0, 69091.0, 162592.0, 346912.0, 226870.0, 92236.0, 41725.0, 20201.0, 10382.0, 5301.0, 2839.0, 1696.0, 970.0, 541.0, 343.0, 234.0, 109.0, 71.0, 62.0, 47.0, 22.0, 13.0, 10.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2041015625, -0.19765853881835938, -0.19121551513671875, -0.18477249145507812, -0.1783294677734375, -0.17188644409179688, -0.16544342041015625, -0.15900039672851562, -0.152557373046875, -0.14611434936523438, -0.13967132568359375, -0.13322830200195312, -0.1267852783203125, -0.12034225463867188, -0.11389923095703125, -0.10745620727539062, -0.10101318359375, -0.09457015991210938, -0.08812713623046875, -0.08168411254882812, -0.0752410888671875, -0.06879806518554688, -0.06235504150390625, -0.055912017822265625, -0.049468994140625, -0.043025970458984375, -0.03658294677734375, -0.030139923095703125, -0.0236968994140625, -0.017253875732421875, -0.01081085205078125, -0.004367828369140625, 0.0020751953125, 0.008518218994140625, 0.01496124267578125, 0.021404266357421875, 0.0278472900390625, 0.034290313720703125, 0.04073333740234375, 0.047176361083984375, 0.053619384765625, 0.060062408447265625, 0.06650543212890625, 0.07294845581054688, 0.0793914794921875, 0.08583450317382812, 0.09227752685546875, 0.09872055053710938, 0.10516357421875, 0.11160659790039062, 0.11804962158203125, 0.12449264526367188, 0.1309356689453125, 0.13737869262695312, 0.14382171630859375, 0.15026473999023438, 0.156707763671875, 0.16315078735351562, 0.16959381103515625, 0.17603683471679688, 0.1824798583984375, 0.18892288208007812, 0.19536590576171875, 0.20180892944335938, 0.208251953125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 9.0, 12.0, 14.0, 16.0, 17.0, 21.0, 17.0, 22.0, 28.0, 32.0, 31.0, 33.0, 45.0, 40.0, 55.0, 40.0, 52.0, 40.0, 39.0, 35.0, 38.0, 41.0, 40.0, 48.0, 28.0, 30.0, 39.0, 17.0, 23.0, 19.0, 8.0, 12.0, 14.0, 9.0, 6.0, 6.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10955810546875, -0.10635948181152344, -0.10316085815429688, -0.09996223449707031, -0.09676361083984375, -0.09356498718261719, -0.09036636352539062, -0.08716773986816406, -0.0839691162109375, -0.08077049255371094, -0.07757186889648438, -0.07437324523925781, -0.07117462158203125, -0.06797599792480469, -0.06477737426757812, -0.06157875061035156, -0.058380126953125, -0.05518150329589844, -0.051982879638671875, -0.04878425598144531, -0.04558563232421875, -0.04238700866699219, -0.039188385009765625, -0.03598976135253906, -0.0327911376953125, -0.029592514038085938, -0.026393890380859375, -0.023195266723632812, -0.01999664306640625, -0.016798019409179688, -0.013599395751953125, -0.010400772094726562, -0.0072021484375, -0.0040035247802734375, -0.000804901123046875, 0.0023937225341796875, 0.00559234619140625, 0.008790969848632812, 0.011989593505859375, 0.015188217163085938, 0.0183868408203125, 0.021585464477539062, 0.024784088134765625, 0.027982711791992188, 0.03118133544921875, 0.03437995910644531, 0.037578582763671875, 0.04077720642089844, 0.043975830078125, 0.04717445373535156, 0.050373077392578125, 0.05357170104980469, 0.05677032470703125, 0.05996894836425781, 0.06316757202148438, 0.06636619567871094, 0.0695648193359375, 0.07276344299316406, 0.07596206665039062, 0.07916069030761719, 0.08235931396484375, 0.08555793762207031, 0.08875656127929688, 0.09195518493652344, 0.09515380859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 7.0, 4.0, 11.0, 13.0, 15.0, 26.0, 37.0, 51.0, 87.0, 130.0, 201.0, 266.0, 408.0, 728.0, 1212.0, 2478.0, 6136.0, 24253.0, 201141.0, 736550.0, 56349.0, 10658.0, 3672.0, 1686.0, 950.0, 522.0, 311.0, 218.0, 150.0, 86.0, 53.0, 50.0, 29.0, 17.0, 17.0, 10.0, 8.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6083984375, -0.590087890625, -0.57177734375, -0.553466796875, -0.53515625, -0.516845703125, -0.49853515625, -0.480224609375, -0.4619140625, -0.443603515625, -0.42529296875, -0.406982421875, -0.388671875, -0.370361328125, -0.35205078125, -0.333740234375, -0.3154296875, -0.297119140625, -0.27880859375, -0.260498046875, -0.2421875, -0.223876953125, -0.20556640625, -0.187255859375, -0.1689453125, -0.150634765625, -0.13232421875, -0.114013671875, -0.095703125, -0.077392578125, -0.05908203125, -0.040771484375, -0.0224609375, -0.004150390625, 0.01416015625, 0.032470703125, 0.05078125, 0.069091796875, 0.08740234375, 0.105712890625, 0.1240234375, 0.142333984375, 0.16064453125, 0.178955078125, 0.197265625, 0.215576171875, 0.23388671875, 0.252197265625, 0.2705078125, 0.288818359375, 0.30712890625, 0.325439453125, 0.34375, 0.362060546875, 0.38037109375, 0.398681640625, 0.4169921875, 0.435302734375, 0.45361328125, 0.471923828125, 0.490234375, 0.508544921875, 0.52685546875, 0.545166015625, 0.5634765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 6.0, 5.0, 10.0, 18.0, 16.0, 19.0, 18.0, 29.0, 28.0, 37.0, 42.0, 42.0, 60.0, 50.0, 48.0, 47.0, 53.0, 43.0, 67.0, 58.0, 56.0, 38.0, 29.0, 34.0, 31.0, 20.0, 17.0, 12.0, 14.0, 9.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5222854614257812, -0.5040435791015625, -0.48580169677734375, -0.467559814453125, -0.44931793212890625, -0.4310760498046875, -0.41283416748046875, -0.39459228515625, -0.37635040283203125, -0.3581085205078125, -0.33986663818359375, -0.321624755859375, -0.30338287353515625, -0.2851409912109375, -0.26689910888671875, -0.2486572265625, -0.23041534423828125, -0.2121734619140625, -0.19393157958984375, -0.175689697265625, -0.15744781494140625, -0.1392059326171875, -0.12096405029296875, -0.10272216796875, -0.08448028564453125, -0.0662384033203125, -0.04799652099609375, -0.029754638671875, -0.01151275634765625, 0.0067291259765625, 0.02497100830078125, 0.043212890625, 0.06145477294921875, 0.0796966552734375, 0.09793853759765625, 0.116180419921875, 0.13442230224609375, 0.1526641845703125, 0.17090606689453125, 0.18914794921875, 0.20738983154296875, 0.2256317138671875, 0.24387359619140625, 0.262115478515625, 0.28035736083984375, 0.2985992431640625, 0.31684112548828125, 0.3350830078125, 0.35332489013671875, 0.3715667724609375, 0.38980865478515625, 0.408050537109375, 0.42629241943359375, 0.4445343017578125, 0.46277618408203125, 0.48101806640625, 0.49925994873046875, 0.5175018310546875, 0.5357437133789062, 0.553985595703125, 0.5722274780273438, 0.5904693603515625, 0.6087112426757812, 0.626953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 4.0, 6.0, 9.0, 19.0, 20.0, 30.0, 50.0, 92.0, 104.0, 235.0, 312.0, 596.0, 1101.0, 2209.0, 5225.0, 14661.0, 48318.0, 196828.0, 600233.0, 126519.0, 33682.0, 10377.0, 3972.0, 1713.0, 908.0, 466.0, 291.0, 188.0, 109.0, 69.0, 58.0, 47.0, 28.0, 28.0, 10.0, 8.0, 6.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1326904296875, -0.12845802307128906, -0.12422561645507812, -0.11999320983886719, -0.11576080322265625, -0.11152839660644531, -0.10729598999023438, -0.10306358337402344, -0.0988311767578125, -0.09459877014160156, -0.09036636352539062, -0.08613395690917969, -0.08190155029296875, -0.07766914367675781, -0.07343673706054688, -0.06920433044433594, -0.064971923828125, -0.06073951721191406, -0.056507110595703125, -0.05227470397949219, -0.04804229736328125, -0.04380989074707031, -0.039577484130859375, -0.03534507751464844, -0.0311126708984375, -0.026880264282226562, -0.022647857666015625, -0.018415451049804688, -0.01418304443359375, -0.009950637817382812, -0.005718231201171875, -0.0014858245849609375, 0.00274658203125, 0.0069789886474609375, 0.011211395263671875, 0.015443801879882812, 0.01967620849609375, 0.023908615112304688, 0.028141021728515625, 0.03237342834472656, 0.0366058349609375, 0.04083824157714844, 0.045070648193359375, 0.04930305480957031, 0.05353546142578125, 0.05776786804199219, 0.062000274658203125, 0.06623268127441406, 0.070465087890625, 0.07469749450683594, 0.07892990112304688, 0.08316230773925781, 0.08739471435546875, 0.09162712097167969, 0.09585952758789062, 0.10009193420410156, 0.1043243408203125, 0.10855674743652344, 0.11278915405273438, 0.11702156066894531, 0.12125396728515625, 0.1254863739013672, 0.12971878051757812, 0.13395118713378906, 0.13818359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 8.0, 11.0, 9.0, 5.0, 14.0, 15.0, 22.0, 20.0, 27.0, 29.0, 44.0, 53.0, 60.0, 71.0, 65.0, 73.0, 63.0, 65.0, 51.0, 42.0, 41.0, 33.0, 27.0, 24.0, 15.0, 17.0, 17.0, 14.0, 11.0, 6.0, 5.0, 8.0, 4.0, 9.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.155801773071289e-05, -4.990771412849426e-05, -4.8257410526275635e-05, -4.660710692405701e-05, -4.495680332183838e-05, -4.330649971961975e-05, -4.165619611740112e-05, -4.0005892515182495e-05, -3.835558891296387e-05, -3.670528531074524e-05, -3.505498170852661e-05, -3.3404678106307983e-05, -3.1754374504089355e-05, -3.0104070901870728e-05, -2.84537672996521e-05, -2.680346369743347e-05, -2.5153160095214844e-05, -2.3502856492996216e-05, -2.1852552890777588e-05, -2.020224928855896e-05, -1.8551945686340332e-05, -1.6901642084121704e-05, -1.5251338481903076e-05, -1.3601034879684448e-05, -1.195073127746582e-05, -1.0300427675247192e-05, -8.650124073028564e-06, -6.9998204708099365e-06, -5.349516868591309e-06, -3.6992132663726807e-06, -2.0489096641540527e-06, -3.986060619354248e-07, 1.2516975402832031e-06, 2.902001142501831e-06, 4.552304744720459e-06, 6.202608346939087e-06, 7.852911949157715e-06, 9.503215551376343e-06, 1.115351915359497e-05, 1.2803822755813599e-05, 1.4454126358032227e-05, 1.6104429960250854e-05, 1.7754733562469482e-05, 1.940503716468811e-05, 2.1055340766906738e-05, 2.2705644369125366e-05, 2.4355947971343994e-05, 2.6006251573562622e-05, 2.765655517578125e-05, 2.9306858777999878e-05, 3.0957162380218506e-05, 3.2607465982437134e-05, 3.425776958465576e-05, 3.590807318687439e-05, 3.755837678909302e-05, 3.9208680391311646e-05, 4.0858983993530273e-05, 4.25092875957489e-05, 4.415959119796753e-05, 4.580989480018616e-05, 4.7460198402404785e-05, 4.911050200462341e-05, 5.076080560684204e-05, 5.241110920906067e-05, 5.40614128112793e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 13.0, 20.0, 35.0, 54.0, 74.0, 125.0, 225.0, 337.0, 621.0, 1177.0, 2425.0, 5690.0, 19470.0, 119657.0, 716388.0, 147900.0, 22736.0, 6194.0, 2570.0, 1200.0, 645.0, 367.0, 195.0, 150.0, 96.0, 41.0, 39.0, 27.0, 15.0, 15.0, 7.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.175048828125, -0.16950035095214844, -0.16395187377929688, -0.1584033966064453, -0.15285491943359375, -0.1473064422607422, -0.14175796508789062, -0.13620948791503906, -0.1306610107421875, -0.12511253356933594, -0.11956405639648438, -0.11401557922363281, -0.10846710205078125, -0.10291862487792969, -0.09737014770507812, -0.09182167053222656, -0.086273193359375, -0.08072471618652344, -0.07517623901367188, -0.06962776184082031, -0.06407928466796875, -0.05853080749511719, -0.052982330322265625, -0.04743385314941406, -0.0418853759765625, -0.03633689880371094, -0.030788421630859375, -0.025239944458007812, -0.01969146728515625, -0.014142990112304688, -0.008594512939453125, -0.0030460357666015625, 0.00250244140625, 0.008050918579101562, 0.013599395751953125, 0.019147872924804688, 0.02469635009765625, 0.030244827270507812, 0.035793304443359375, 0.04134178161621094, 0.0468902587890625, 0.05243873596191406, 0.057987213134765625, 0.06353569030761719, 0.06908416748046875, 0.07463264465332031, 0.08018112182617188, 0.08572959899902344, 0.091278076171875, 0.09682655334472656, 0.10237503051757812, 0.10792350769042969, 0.11347198486328125, 0.11902046203613281, 0.12456893920898438, 0.13011741638183594, 0.1356658935546875, 0.14121437072753906, 0.14676284790039062, 0.1523113250732422, 0.15785980224609375, 0.1634082794189453, 0.16895675659179688, 0.17450523376464844, 0.1800537109375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 14.0, 13.0, 20.0, 20.0, 37.0, 41.0, 37.0, 37.0, 41.0, 66.0, 58.0, 64.0, 48.0, 56.0, 58.0, 73.0, 41.0, 42.0, 37.0, 26.0, 23.0, 26.0, 14.0, 19.0, 9.0, 8.0, 13.0, 10.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10552978515625, -0.1015329360961914, -0.09753608703613281, -0.09353923797607422, -0.08954238891601562, -0.08554553985595703, -0.08154869079589844, -0.07755184173583984, -0.07355499267578125, -0.06955814361572266, -0.06556129455566406, -0.06156444549560547, -0.057567596435546875, -0.05357074737548828, -0.04957389831542969, -0.045577049255371094, -0.0415802001953125, -0.037583351135253906, -0.03358650207519531, -0.02958965301513672, -0.025592803955078125, -0.02159595489501953, -0.017599105834960938, -0.013602256774902344, -0.00960540771484375, -0.005608558654785156, -0.0016117095947265625, 0.0023851394653320312, 0.006381988525390625, 0.010378837585449219, 0.014375686645507812, 0.018372535705566406, 0.022369384765625, 0.026366233825683594, 0.030363082885742188, 0.03435993194580078, 0.038356781005859375, 0.04235363006591797, 0.04635047912597656, 0.050347328186035156, 0.05434417724609375, 0.058341026306152344, 0.06233787536621094, 0.06633472442626953, 0.07033157348632812, 0.07432842254638672, 0.07832527160644531, 0.0823221206665039, 0.0863189697265625, 0.0903158187866211, 0.09431266784667969, 0.09830951690673828, 0.10230636596679688, 0.10630321502685547, 0.11030006408691406, 0.11429691314697266, 0.11829376220703125, 0.12229061126708984, 0.12628746032714844, 0.13028430938720703, 0.13428115844726562, 0.13827800750732422, 0.1422748565673828, 0.1462717056274414, 0.1502685546875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 14.0, 35.0, 129.0, 331.0, 286.0, 131.0, 45.0, 14.0, 5.0, 5.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.505383491516113, -8.30266284942627, -8.099943161010742, -7.897222995758057, -7.694502830505371, -7.4917826652526855, -7.2890625, -7.086341857910156, -6.883622169494629, -6.680902004241943, -6.478181838989258, -6.275461673736572, -6.072741508483887, -5.870021343231201, -5.667301177978516, -5.464580535888672, -5.261860370635986, -5.059140205383301, -4.856420040130615, -4.65369987487793, -4.450979709625244, -4.248259544372559, -4.045538902282715, -3.8428189754486084, -3.640098810195923, -3.4373786449432373, -3.2346584796905518, -3.031938076019287, -2.8292179107666016, -2.626497745513916, -2.4237775802612305, -2.221057415008545, -2.0183377265930176, -1.815617561340332, -1.6128973960876465, -1.4101771116256714, -1.2074569463729858, -1.0047367811203003, -0.8020164966583252, -0.5992963314056396, -0.3965761661529541, -0.19385597109794617, 0.008864223957061768, 0.2115844488143921, 0.41430461406707764, 0.6170247793197632, 0.8197450637817383, 1.0224652290344238, 1.2251853942871094, 1.427905559539795, 1.6306257247924805, 1.8333460092544556, 2.0360660552978516, 2.238786220550537, 2.4415066242218018, 2.6442267894744873, 2.846946954727173, 3.0496671199798584, 3.252387285232544, 3.4551076889038086, 3.657827854156494, 3.8605480194091797, 4.063268184661865, 4.265988349914551, 4.468708515167236]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 5.0, 5.0, 11.0, 11.0, 14.0, 15.0, 13.0, 21.0, 15.0, 22.0, 25.0, 26.0, 38.0, 46.0, 41.0, 45.0, 54.0, 61.0, 83.0, 76.0, 52.0, 40.0, 46.0, 33.0, 41.0, 31.0, 29.0, 20.0, 18.0, 17.0, 8.0, 15.0, 9.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3481132984161377, -2.279743194580078, -2.2113728523254395, -2.143002510070801, -2.074632406234741, -2.0062623023986816, -1.937891960144043, -1.8695217370986938, -1.8011515140533447, -1.7327812910079956, -1.6644110679626465, -1.5960408449172974, -1.5276706218719482, -1.4593003988265991, -1.39093017578125, -1.3225599527359009, -1.2541897296905518, -1.1858195066452026, -1.1174492835998535, -1.0490790605545044, -0.9807088375091553, -0.9123386144638062, -0.843968391418457, -0.7755981683731079, -0.7072279453277588, -0.6388577222824097, -0.5704874992370605, -0.5021172761917114, -0.4337470531463623, -0.3653768301010132, -0.29700660705566406, -0.22863638401031494, -0.16026592254638672, -0.0918956995010376, -0.023525476455688477, 0.044844746589660645, 0.11321496963500977, 0.1815851926803589, 0.249955415725708, 0.31832563877105713, 0.38669586181640625, 0.45506608486175537, 0.5234363079071045, 0.5918065309524536, 0.6601767539978027, 0.7285469770431519, 0.796917200088501, 0.8652874231338501, 0.9336576461791992, 1.0020278692245483, 1.0703980922698975, 1.1387683153152466, 1.2071385383605957, 1.2755087614059448, 1.343878984451294, 1.412249207496643, 1.4806194305419922, 1.5489896535873413, 1.6173598766326904, 1.6857300996780396, 1.7541003227233887, 1.8224705457687378, 1.890840768814087, 1.959210991859436, 2.027581214904785]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 10.0, 20.0, 27.0, 37.0, 71.0, 98.0, 181.0, 306.0, 622.0, 1258.0, 2763.0, 6842.0, 19419.0, 68575.0, 361072.0, 2166388.0, 1313465.0, 187781.0, 42647.0, 13385.0, 4985.0, 2133.0, 993.0, 500.0, 277.0, 172.0, 82.0, 56.0, 32.0, 24.0, 16.0, 12.0, 10.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.17930221557617188, -0.17366790771484375, -0.16803359985351562, -0.1623992919921875, -0.15676498413085938, -0.15113067626953125, -0.14549636840820312, -0.139862060546875, -0.13422775268554688, -0.12859344482421875, -0.12295913696289062, -0.1173248291015625, -0.11169052124023438, -0.10605621337890625, -0.10042190551757812, -0.09478759765625, -0.08915328979492188, -0.08351898193359375, -0.07788467407226562, -0.0722503662109375, -0.06661605834960938, -0.06098175048828125, -0.055347442626953125, -0.049713134765625, -0.044078826904296875, -0.03844451904296875, -0.032810211181640625, -0.0271759033203125, -0.021541595458984375, -0.01590728759765625, -0.010272979736328125, -0.004638671875, 0.000995635986328125, 0.00662994384765625, 0.012264251708984375, 0.0178985595703125, 0.023532867431640625, 0.02916717529296875, 0.034801483154296875, 0.040435791015625, 0.046070098876953125, 0.05170440673828125, 0.057338714599609375, 0.0629730224609375, 0.06860733032226562, 0.07424163818359375, 0.07987594604492188, 0.08551025390625, 0.09114456176757812, 0.09677886962890625, 0.10241317749023438, 0.1080474853515625, 0.11368179321289062, 0.11931610107421875, 0.12495040893554688, 0.130584716796875, 0.13621902465820312, 0.14185333251953125, 0.14748764038085938, 0.1531219482421875, 0.15875625610351562, 0.16439056396484375, 0.17002487182617188, 0.1756591796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 11.0, 4.0, 8.0, 12.0, 11.0, 15.0, 23.0, 27.0, 24.0, 41.0, 38.0, 34.0, 43.0, 48.0, 50.0, 51.0, 54.0, 44.0, 55.0, 57.0, 68.0, 38.0, 52.0, 34.0, 27.0, 36.0, 25.0, 9.0, 17.0, 14.0, 9.0, 9.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1497802734375, -0.14585590362548828, -0.14193153381347656, -0.13800716400146484, -0.13408279418945312, -0.1301584243774414, -0.1262340545654297, -0.12230968475341797, -0.11838531494140625, -0.11446094512939453, -0.11053657531738281, -0.1066122055053711, -0.10268783569335938, -0.09876346588134766, -0.09483909606933594, -0.09091472625732422, -0.0869903564453125, -0.08306598663330078, -0.07914161682128906, -0.07521724700927734, -0.07129287719726562, -0.0673685073852539, -0.06344413757324219, -0.05951976776123047, -0.05559539794921875, -0.05167102813720703, -0.04774665832519531, -0.043822288513183594, -0.039897918701171875, -0.035973548889160156, -0.03204917907714844, -0.02812480926513672, -0.024200439453125, -0.02027606964111328, -0.016351699829101562, -0.012427330017089844, -0.008502960205078125, -0.004578590393066406, -0.0006542205810546875, 0.0032701492309570312, 0.00719451904296875, 0.011118888854980469, 0.015043258666992188, 0.018967628479003906, 0.022891998291015625, 0.026816368103027344, 0.030740737915039062, 0.03466510772705078, 0.0385894775390625, 0.04251384735107422, 0.04643821716308594, 0.050362586975097656, 0.054286956787109375, 0.058211326599121094, 0.06213569641113281, 0.06606006622314453, 0.06998443603515625, 0.07390880584716797, 0.07783317565917969, 0.0817575454711914, 0.08568191528320312, 0.08960628509521484, 0.09353065490722656, 0.09745502471923828, 0.10137939453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 15.0, 11.0, 17.0, 26.0, 25.0, 53.0, 77.0, 116.0, 148.0, 264.0, 429.0, 716.0, 1432.0, 3168.0, 7208.0, 19921.0, 67401.0, 344770.0, 2585449.0, 976330.0, 133291.0, 33479.0, 11266.0, 4320.0, 1914.0, 1029.0, 488.0, 342.0, 191.0, 115.0, 67.0, 40.0, 49.0, 21.0, 29.0, 7.0, 16.0, 7.0, 6.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2403564453125, -0.2322711944580078, -0.22418594360351562, -0.21610069274902344, -0.20801544189453125, -0.19993019104003906, -0.19184494018554688, -0.1837596893310547, -0.1756744384765625, -0.1675891876220703, -0.15950393676757812, -0.15141868591308594, -0.14333343505859375, -0.13524818420410156, -0.12716293334960938, -0.11907768249511719, -0.110992431640625, -0.10290718078613281, -0.09482192993164062, -0.08673667907714844, -0.07865142822265625, -0.07056617736816406, -0.062480926513671875, -0.05439567565917969, -0.0463104248046875, -0.03822517395019531, -0.030139923095703125, -0.022054672241210938, -0.01396942138671875, -0.0058841705322265625, 0.002201080322265625, 0.010286331176757812, 0.01837158203125, 0.026456832885742188, 0.034542083740234375, 0.04262733459472656, 0.05071258544921875, 0.05879783630371094, 0.06688308715820312, 0.07496833801269531, 0.0830535888671875, 0.09113883972167969, 0.09922409057617188, 0.10730934143066406, 0.11539459228515625, 0.12347984313964844, 0.13156509399414062, 0.1396503448486328, 0.147735595703125, 0.1558208465576172, 0.16390609741210938, 0.17199134826660156, 0.18007659912109375, 0.18816184997558594, 0.19624710083007812, 0.2043323516845703, 0.2124176025390625, 0.2205028533935547, 0.22858810424804688, 0.23667335510253906, 0.24475860595703125, 0.25284385681152344, 0.2609291076660156, 0.2690143585205078, 0.277099609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 7.0, 5.0, 9.0, 3.0, 15.0, 20.0, 19.0, 31.0, 43.0, 58.0, 73.0, 116.0, 166.0, 250.0, 340.0, 517.0, 584.0, 549.0, 382.0, 273.0, 177.0, 119.0, 84.0, 50.0, 50.0, 29.0, 24.0, 23.0, 10.0, 10.0, 7.0, 3.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36279296875, -0.3525733947753906, -0.34235382080078125, -0.3321342468261719, -0.3219146728515625, -0.3116950988769531, -0.30147552490234375, -0.2912559509277344, -0.281036376953125, -0.2708168029785156, -0.26059722900390625, -0.2503776550292969, -0.2401580810546875, -0.22993850708007812, -0.21971893310546875, -0.20949935913085938, -0.19927978515625, -0.18906021118164062, -0.17884063720703125, -0.16862106323242188, -0.1584014892578125, -0.14818191528320312, -0.13796234130859375, -0.12774276733398438, -0.117523193359375, -0.10730361938476562, -0.09708404541015625, -0.08686447143554688, -0.0766448974609375, -0.06642532348632812, -0.05620574951171875, -0.045986175537109375, -0.0357666015625, -0.025547027587890625, -0.01532745361328125, -0.005107879638671875, 0.0051116943359375, 0.015331268310546875, 0.02555084228515625, 0.035770416259765625, 0.045989990234375, 0.056209564208984375, 0.06642913818359375, 0.07664871215820312, 0.0868682861328125, 0.09708786010742188, 0.10730743408203125, 0.11752700805664062, 0.12774658203125, 0.13796615600585938, 0.14818572998046875, 0.15840530395507812, 0.1686248779296875, 0.17884445190429688, 0.18906402587890625, 0.19928359985351562, 0.209503173828125, 0.21972274780273438, 0.22994232177734375, 0.24016189575195312, 0.2503814697265625, 0.2606010437011719, 0.27082061767578125, 0.2810401916503906, 0.291259765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 13.0, 20.0, 86.0, 276.0, 320.0, 188.0, 57.0, 13.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.473925590515137, -9.255084037780762, -9.036242485046387, -8.817400932312012, -8.598559379577637, -8.379717826843262, -8.16087532043457, -7.9420342445373535, -7.7231926918029785, -7.5043511390686035, -7.2855095863342285, -7.066667556762695, -6.84782600402832, -6.628984451293945, -6.41014289855957, -6.191301345825195, -5.97245979309082, -5.753618240356445, -5.53477668762207, -5.315935134887695, -5.097093105316162, -4.878251552581787, -4.659409999847412, -4.440568447113037, -4.221726417541504, -4.002884864807129, -3.784043073654175, -3.5652015209198, -3.346359968185425, -3.1275181770324707, -2.9086766242980957, -2.6898350715637207, -2.4709935188293457, -2.2521519660949707, -2.0333101749420166, -1.8144686222076416, -1.5956270694732666, -1.376785397529602, -1.1579437255859375, -0.9391021728515625, -0.720260500907898, -0.5014188885688782, -0.282577246427536, -0.06373560428619385, 0.15510600805282593, 0.3739476203918457, 0.5927892923355103, 0.8116308450698853, 1.0304725170135498, 1.2493141889572144, 1.4681557416915894, 1.686997413635254, 1.905838966369629, 2.124680519104004, 2.343522310256958, 2.562363862991333, 2.781205654144287, 3.000047206878662, 3.218888998031616, 3.437730550765991, 3.656572103500366, 3.8754138946533203, 4.094255447387695, 4.31309700012207, 4.531938552856445]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 7.0, 9.0, 2.0, 11.0, 8.0, 19.0, 18.0, 23.0, 25.0, 28.0, 25.0, 40.0, 43.0, 38.0, 45.0, 39.0, 40.0, 43.0, 54.0, 54.0, 49.0, 51.0, 41.0, 44.0, 33.0, 33.0, 30.0, 23.0, 30.0, 21.0, 16.0, 11.0, 15.0, 7.0, 9.0, 7.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7584247589111328, -1.7045485973358154, -1.6506723165512085, -1.5967961549758911, -1.5429198741912842, -1.4890437126159668, -1.4351675510406494, -1.3812912702560425, -1.3274149894714355, -1.2735388278961182, -1.2196625471115112, -1.1657863855361938, -1.111910104751587, -1.0580339431762695, -1.0041577816009521, -0.9502815008163452, -0.8964053392410278, -0.8425291180610657, -0.7886528968811035, -0.7347767353057861, -0.6809004545211792, -0.6270242929458618, -0.5731480717658997, -0.5192718505859375, -0.46539562940597534, -0.4115194082260132, -0.357643187046051, -0.30376699566841125, -0.2498907744884491, -0.19601455330848694, -0.14213836193084717, -0.08826214075088501, -0.03438591957092285, 0.01949029415845871, 0.07336650788784027, 0.12724271416664124, 0.1811189353466034, 0.23499515652656555, 0.2888713479042053, 0.3427475690841675, 0.39662379026412964, 0.4505000114440918, 0.504376232624054, 0.5582524538040161, 0.6121286153793335, 0.6660048961639404, 0.7198810577392578, 0.77375727891922, 0.8276335000991821, 0.8815097212791443, 0.9353859424591064, 0.9892621040344238, 1.0431383848190308, 1.0970145463943481, 1.150890827178955, 1.2047669887542725, 1.2586431503295898, 1.3125193119049072, 1.3663955926895142, 1.4202717542648315, 1.4741480350494385, 1.5280241966247559, 1.5819003582000732, 1.6357766389846802, 1.689652919769287]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 9.0, 13.0, 16.0, 17.0, 25.0, 52.0, 70.0, 98.0, 178.0, 278.0, 446.0, 714.0, 1167.0, 2028.0, 3697.0, 6842.0, 13964.0, 31560.0, 87727.0, 328798.0, 392624.0, 108090.0, 36748.0, 15802.0, 7745.0, 4171.0, 2322.0, 1267.0, 773.0, 496.0, 308.0, 180.0, 136.0, 72.0, 46.0, 32.0, 13.0, 16.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.2666015625, -0.259002685546875, -0.25140380859375, -0.243804931640625, -0.2362060546875, -0.228607177734375, -0.22100830078125, -0.213409423828125, -0.205810546875, -0.198211669921875, -0.19061279296875, -0.183013916015625, -0.1754150390625, -0.167816162109375, -0.16021728515625, -0.152618408203125, -0.14501953125, -0.137420654296875, -0.12982177734375, -0.122222900390625, -0.1146240234375, -0.107025146484375, -0.09942626953125, -0.091827392578125, -0.084228515625, -0.076629638671875, -0.06903076171875, -0.061431884765625, -0.0538330078125, -0.046234130859375, -0.03863525390625, -0.031036376953125, -0.0234375, -0.015838623046875, -0.00823974609375, -0.000640869140625, 0.0069580078125, 0.014556884765625, 0.02215576171875, 0.029754638671875, 0.037353515625, 0.044952392578125, 0.05255126953125, 0.060150146484375, 0.0677490234375, 0.075347900390625, 0.08294677734375, 0.090545654296875, 0.09814453125, 0.105743408203125, 0.11334228515625, 0.120941162109375, 0.1285400390625, 0.136138916015625, 0.14373779296875, 0.151336669921875, 0.158935546875, 0.166534423828125, 0.17413330078125, 0.181732177734375, 0.1893310546875, 0.196929931640625, 0.20452880859375, 0.212127685546875, 0.2197265625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 13.0, 12.0, 7.0, 12.0, 13.0, 18.0, 18.0, 20.0, 36.0, 31.0, 37.0, 28.0, 36.0, 52.0, 54.0, 46.0, 46.0, 41.0, 41.0, 47.0, 45.0, 44.0, 36.0, 30.0, 40.0, 30.0, 31.0, 30.0, 24.0, 20.0, 15.0, 6.0, 9.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.131591796875, -0.12789249420166016, -0.12419319152832031, -0.12049388885498047, -0.11679458618164062, -0.11309528350830078, -0.10939598083496094, -0.1056966781616211, -0.10199737548828125, -0.0982980728149414, -0.09459877014160156, -0.09089946746826172, -0.08720016479492188, -0.08350086212158203, -0.07980155944824219, -0.07610225677490234, -0.0724029541015625, -0.06870365142822266, -0.06500434875488281, -0.06130504608154297, -0.057605743408203125, -0.05390644073486328, -0.05020713806152344, -0.046507835388183594, -0.04280853271484375, -0.039109230041503906, -0.03540992736816406, -0.03171062469482422, -0.028011322021484375, -0.02431201934814453, -0.020612716674804688, -0.016913414001464844, -0.013214111328125, -0.009514808654785156, -0.0058155059814453125, -0.0021162033081054688, 0.001583099365234375, 0.005282402038574219, 0.008981704711914062, 0.012681007385253906, 0.01638031005859375, 0.020079612731933594, 0.023778915405273438, 0.02747821807861328, 0.031177520751953125, 0.03487682342529297, 0.03857612609863281, 0.042275428771972656, 0.0459747314453125, 0.049674034118652344, 0.05337333679199219, 0.05707263946533203, 0.060771942138671875, 0.06447124481201172, 0.06817054748535156, 0.0718698501586914, 0.07556915283203125, 0.0792684555053711, 0.08296775817871094, 0.08666706085205078, 0.09036636352539062, 0.09406566619873047, 0.09776496887207031, 0.10146427154541016, 0.10516357421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 4.0, 10.0, 9.0, 14.0, 25.0, 36.0, 48.0, 63.0, 87.0, 112.0, 172.0, 308.0, 535.0, 853.0, 1669.0, 4409.0, 14917.0, 88223.0, 808526.0, 103413.0, 16345.0, 4643.0, 1767.0, 860.0, 509.0, 307.0, 221.0, 143.0, 85.0, 64.0, 44.0, 36.0, 37.0, 22.0, 12.0, 5.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55517578125, -0.5386199951171875, -0.522064208984375, -0.5055084228515625, -0.48895263671875, -0.4723968505859375, -0.455841064453125, -0.4392852783203125, -0.4227294921875, -0.4061737060546875, -0.389617919921875, -0.3730621337890625, -0.35650634765625, -0.3399505615234375, -0.323394775390625, -0.3068389892578125, -0.290283203125, -0.2737274169921875, -0.257171630859375, -0.2406158447265625, -0.22406005859375, -0.2075042724609375, -0.190948486328125, -0.1743927001953125, -0.1578369140625, -0.1412811279296875, -0.124725341796875, -0.1081695556640625, -0.09161376953125, -0.0750579833984375, -0.058502197265625, -0.0419464111328125, -0.025390625, -0.0088348388671875, 0.007720947265625, 0.0242767333984375, 0.04083251953125, 0.0573883056640625, 0.073944091796875, 0.0904998779296875, 0.1070556640625, 0.1236114501953125, 0.140167236328125, 0.1567230224609375, 0.17327880859375, 0.1898345947265625, 0.206390380859375, 0.2229461669921875, 0.239501953125, 0.2560577392578125, 0.272613525390625, 0.2891693115234375, 0.30572509765625, 0.3222808837890625, 0.338836669921875, 0.3553924560546875, 0.3719482421875, 0.3885040283203125, 0.405059814453125, 0.4216156005859375, 0.43817138671875, 0.4547271728515625, 0.471282958984375, 0.4878387451171875, 0.50439453125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 7.0, 11.0, 7.0, 14.0, 14.0, 16.0, 15.0, 26.0, 22.0, 26.0, 38.0, 38.0, 42.0, 42.0, 45.0, 55.0, 42.0, 45.0, 49.0, 43.0, 38.0, 49.0, 44.0, 34.0, 29.0, 25.0, 29.0, 24.0, 23.0, 18.0, 7.0, 15.0, 3.0, 12.0, 7.0, 4.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.50537109375, -0.4907646179199219, -0.47615814208984375, -0.4615516662597656, -0.4469451904296875, -0.4323387145996094, -0.41773223876953125, -0.4031257629394531, -0.388519287109375, -0.3739128112792969, -0.35930633544921875, -0.3446998596191406, -0.3300933837890625, -0.3154869079589844, -0.30088043212890625, -0.2862739562988281, -0.27166748046875, -0.2570610046386719, -0.24245452880859375, -0.22784805297851562, -0.2132415771484375, -0.19863510131835938, -0.18402862548828125, -0.16942214965820312, -0.154815673828125, -0.14020919799804688, -0.12560272216796875, -0.11099624633789062, -0.0963897705078125, -0.08178329467773438, -0.06717681884765625, -0.052570343017578125, -0.0379638671875, -0.023357391357421875, -0.00875091552734375, 0.005855560302734375, 0.0204620361328125, 0.035068511962890625, 0.04967498779296875, 0.06428146362304688, 0.078887939453125, 0.09349441528320312, 0.10810089111328125, 0.12270736694335938, 0.1373138427734375, 0.15192031860351562, 0.16652679443359375, 0.18113327026367188, 0.19573974609375, 0.21034622192382812, 0.22495269775390625, 0.23955917358398438, 0.2541656494140625, 0.2687721252441406, 0.28337860107421875, 0.2979850769042969, 0.312591552734375, 0.3271980285644531, 0.34180450439453125, 0.3564109802246094, 0.3710174560546875, 0.3856239318847656, 0.40023040771484375, 0.4148368835449219, 0.429443359375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 2.0, 3.0, 2.0, 10.0, 7.0, 6.0, 17.0, 22.0, 34.0, 62.0, 87.0, 138.0, 248.0, 391.0, 680.0, 1188.0, 2440.0, 5728.0, 15442.0, 56370.0, 288585.0, 562250.0, 80696.0, 20724.0, 7268.0, 2925.0, 1356.0, 750.0, 409.0, 239.0, 161.0, 104.0, 46.0, 31.0, 33.0, 31.0, 16.0, 15.0, 5.0, 6.0, 10.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.1475830078125, -0.1429882049560547, -0.13839340209960938, -0.13379859924316406, -0.12920379638671875, -0.12460899353027344, -0.12001419067382812, -0.11541938781738281, -0.1108245849609375, -0.10622978210449219, -0.10163497924804688, -0.09704017639160156, -0.09244537353515625, -0.08785057067871094, -0.08325576782226562, -0.07866096496582031, -0.074066162109375, -0.06947135925292969, -0.06487655639648438, -0.06028175354003906, -0.05568695068359375, -0.05109214782714844, -0.046497344970703125, -0.04190254211425781, -0.0373077392578125, -0.03271293640136719, -0.028118133544921875, -0.023523330688476562, -0.01892852783203125, -0.014333724975585938, -0.009738922119140625, -0.0051441192626953125, -0.00054931640625, 0.0040454864501953125, 0.008640289306640625, 0.013235092163085938, 0.01782989501953125, 0.022424697875976562, 0.027019500732421875, 0.03161430358886719, 0.0362091064453125, 0.04080390930175781, 0.045398712158203125, 0.04999351501464844, 0.05458831787109375, 0.05918312072753906, 0.06377792358398438, 0.06837272644042969, 0.072967529296875, 0.07756233215332031, 0.08215713500976562, 0.08675193786621094, 0.09134674072265625, 0.09594154357910156, 0.10053634643554688, 0.10513114929199219, 0.1097259521484375, 0.11432075500488281, 0.11891555786132812, 0.12351036071777344, 0.12810516357421875, 0.13269996643066406, 0.13729476928710938, 0.1418895721435547, 0.146484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 6.0, 12.0, 11.0, 16.0, 26.0, 26.0, 26.0, 34.0, 32.0, 64.0, 57.0, 105.0, 84.0, 90.0, 76.0, 72.0, 52.0, 34.0, 38.0, 25.0, 23.0, 15.0, 16.0, 13.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.358457565307617e-05, -5.1723793148994446e-05, -4.986301064491272e-05, -4.8002228140830994e-05, -4.614144563674927e-05, -4.428066313266754e-05, -4.2419880628585815e-05, -4.055909812450409e-05, -3.869831562042236e-05, -3.683753311634064e-05, -3.497675061225891e-05, -3.3115968108177185e-05, -3.125518560409546e-05, -2.9394403100013733e-05, -2.7533620595932007e-05, -2.567283809185028e-05, -2.3812055587768555e-05, -2.195127308368683e-05, -2.0090490579605103e-05, -1.8229708075523376e-05, -1.636892557144165e-05, -1.4508143067359924e-05, -1.2647360563278198e-05, -1.0786578059196472e-05, -8.925795555114746e-06, -7.06501305103302e-06, -5.204230546951294e-06, -3.343448042869568e-06, -1.4826655387878418e-06, 3.781169652938843e-07, 2.2388994693756104e-06, 4.0996819734573364e-06, 5.9604644775390625e-06, 7.821246981620789e-06, 9.682029485702515e-06, 1.154281198978424e-05, 1.3403594493865967e-05, 1.5264376997947693e-05, 1.712515950202942e-05, 1.8985942006111145e-05, 2.084672451019287e-05, 2.2707507014274597e-05, 2.4568289518356323e-05, 2.642907202243805e-05, 2.8289854526519775e-05, 3.01506370306015e-05, 3.201141953468323e-05, 3.3872202038764954e-05, 3.573298454284668e-05, 3.7593767046928406e-05, 3.945454955101013e-05, 4.131533205509186e-05, 4.3176114559173584e-05, 4.503689706325531e-05, 4.6897679567337036e-05, 4.875846207141876e-05, 5.061924457550049e-05, 5.2480027079582214e-05, 5.434080958366394e-05, 5.6201592087745667e-05, 5.806237459182739e-05, 5.992315709590912e-05, 6.178393959999084e-05, 6.364472210407257e-05, 6.55055046081543e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 16.0, 17.0, 22.0, 42.0, 41.0, 61.0, 60.0, 84.0, 133.0, 187.0, 313.0, 467.0, 786.0, 1330.0, 2435.0, 5431.0, 14079.0, 48888.0, 226883.0, 598864.0, 105635.0, 25937.0, 8553.0, 3586.0, 1808.0, 1012.0, 608.0, 375.0, 269.0, 168.0, 111.0, 87.0, 73.0, 43.0, 35.0, 20.0, 15.0, 14.0, 9.0, 13.0, 4.0, 5.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12408256530761719, -0.12011337280273438, -0.11614418029785156, -0.11217498779296875, -0.10820579528808594, -0.10423660278320312, -0.10026741027832031, -0.0962982177734375, -0.09232902526855469, -0.08835983276367188, -0.08439064025878906, -0.08042144775390625, -0.07645225524902344, -0.07248306274414062, -0.06851387023925781, -0.064544677734375, -0.06057548522949219, -0.056606292724609375, -0.05263710021972656, -0.04866790771484375, -0.04469871520996094, -0.040729522705078125, -0.03676033020019531, -0.0327911376953125, -0.028821945190429688, -0.024852752685546875, -0.020883560180664062, -0.01691436767578125, -0.012945175170898438, -0.008975982666015625, -0.0050067901611328125, -0.00103759765625, 0.0029315948486328125, 0.006900787353515625, 0.010869979858398438, 0.01483917236328125, 0.018808364868164062, 0.022777557373046875, 0.026746749877929688, 0.0307159423828125, 0.03468513488769531, 0.038654327392578125, 0.04262351989746094, 0.04659271240234375, 0.05056190490722656, 0.054531097412109375, 0.05850028991699219, 0.062469482421875, 0.06643867492675781, 0.07040786743164062, 0.07437705993652344, 0.07834625244140625, 0.08231544494628906, 0.08628463745117188, 0.09025382995605469, 0.0942230224609375, 0.09819221496582031, 0.10216140747070312, 0.10613059997558594, 0.11009979248046875, 0.11406898498535156, 0.11803817749023438, 0.12200736999511719, 0.1259765625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 5.0, 8.0, 4.0, 9.0, 6.0, 13.0, 22.0, 25.0, 15.0, 31.0, 45.0, 59.0, 46.0, 62.0, 69.0, 67.0, 71.0, 72.0, 65.0, 51.0, 47.0, 47.0, 30.0, 25.0, 28.0, 20.0, 11.0, 7.0, 7.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.12371826171875, -0.1200723648071289, -0.11642646789550781, -0.11278057098388672, -0.10913467407226562, -0.10548877716064453, -0.10184288024902344, -0.09819698333740234, -0.09455108642578125, -0.09090518951416016, -0.08725929260253906, -0.08361339569091797, -0.07996749877929688, -0.07632160186767578, -0.07267570495605469, -0.0690298080444336, -0.0653839111328125, -0.061738014221191406, -0.05809211730957031, -0.05444622039794922, -0.050800323486328125, -0.04715442657470703, -0.04350852966308594, -0.039862632751464844, -0.03621673583984375, -0.032570838928222656, -0.028924942016601562, -0.02527904510498047, -0.021633148193359375, -0.01798725128173828, -0.014341354370117188, -0.010695457458496094, -0.007049560546875, -0.0034036636352539062, 0.0002422332763671875, 0.0038881301879882812, 0.007534027099609375, 0.011179924011230469, 0.014825820922851562, 0.018471717834472656, 0.02211761474609375, 0.025763511657714844, 0.029409408569335938, 0.03305530548095703, 0.036701202392578125, 0.04034709930419922, 0.04399299621582031, 0.047638893127441406, 0.0512847900390625, 0.054930686950683594, 0.05857658386230469, 0.06222248077392578, 0.06586837768554688, 0.06951427459716797, 0.07316017150878906, 0.07680606842041016, 0.08045196533203125, 0.08409786224365234, 0.08774375915527344, 0.09138965606689453, 0.09503555297851562, 0.09868144989013672, 0.10232734680175781, 0.1059732437133789, 0.109619140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 3.0, 8.0, 18.0, 41.0, 104.0, 269.0, 332.0, 134.0, 42.0, 20.0, 9.0, 4.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.369033813476562, -8.191421508789062, -8.013809204101562, -7.836196422576904, -7.658584117889404, -7.480971813201904, -7.303359031677246, -7.125746726989746, -6.948134422302246, -6.770522117614746, -6.592909812927246, -6.415297031402588, -6.237684726715088, -6.060072422027588, -5.88245964050293, -5.70484733581543, -5.52723503112793, -5.34962272644043, -5.17201042175293, -4.9943976402282715, -4.8167853355407715, -4.6391730308532715, -4.461560249328613, -4.283947944641113, -4.106335639953613, -3.9287233352661133, -3.751110792160034, -3.573498249053955, -3.395885944366455, -3.218273639678955, -3.040661096572876, -2.863048553466797, -2.685436725616455, -2.507824420928955, -2.330211877822876, -2.152599334716797, -1.9749870300292969, -1.7973746061325073, -1.6197621822357178, -1.4421497583389282, -1.2645373344421387, -1.0869249105453491, -0.9093124866485596, -0.73170006275177, -0.5540876388549805, -0.3764752149581909, -0.19886279106140137, -0.021250367164611816, 0.15636205673217773, 0.3339744806289673, 0.5115869045257568, 0.6891993284225464, 0.8668117523193359, 1.0444241762161255, 1.222036600112915, 1.3996490240097046, 1.5772614479064941, 1.7548738718032837, 1.9324862957000732, 2.1100988388061523, 2.2877111434936523, 2.4653234481811523, 2.6429359912872314, 2.8205485343933105, 2.9981608390808105]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 14.0, 15.0, 17.0, 18.0, 27.0, 30.0, 33.0, 33.0, 35.0, 43.0, 68.0, 84.0, 78.0, 82.0, 70.0, 52.0, 48.0, 33.0, 50.0, 30.0, 14.0, 21.0, 24.0, 21.0, 14.0, 7.0, 10.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4731509685516357, -2.3982748985290527, -2.3233985900878906, -2.2485225200653076, -2.1736464500427246, -2.0987701416015625, -2.0238940715789795, -1.9490180015563965, -1.874141812324524, -1.7992656230926514, -1.7243895530700684, -1.6495133638381958, -1.5746371746063232, -1.4997611045837402, -1.4248849153518677, -1.3500087261199951, -1.275132656097412, -1.2002564668655396, -1.1253803968429565, -1.050504207611084, -0.9756280779838562, -0.9007519483566284, -0.8258757591247559, -0.7509996294975281, -0.6761234998703003, -0.6012473702430725, -0.5263712406158447, -0.45149505138397217, -0.3766189217567444, -0.3017427921295166, -0.22686663269996643, -0.15199047327041626, -0.07711410522460938, -0.002237960696220398, 0.07263818383216858, 0.14751432836055756, 0.22239047288894653, 0.2972666025161743, 0.3721427619457245, 0.44701892137527466, 0.5218950510025024, 0.5967711806297302, 0.671647310256958, 0.7465234994888306, 0.8213996291160583, 0.8962757587432861, 0.9711519479751587, 1.0460281372070312, 1.1209042072296143, 1.1957803964614868, 1.2706564664840698, 1.3455326557159424, 1.4204087257385254, 1.495284914970398, 1.5701611042022705, 1.6450371742248535, 1.719913363456726, 1.7947895526885986, 1.8696656227111816, 1.9445418119430542, 2.0194180011749268, 2.0942940711975098, 2.1691701412200928, 2.244046449661255, 2.318922519683838]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 10.0, 33.0, 31.0, 49.0, 77.0, 109.0, 191.0, 281.0, 573.0, 1061.0, 2460.0, 5292.0, 13562.0, 40813.0, 179739.0, 1252908.0, 2221355.0, 373127.0, 68679.0, 19827.0, 7492.0, 3203.0, 1526.0, 773.0, 440.0, 237.0, 137.0, 77.0, 52.0, 33.0, 28.0, 20.0, 19.0, 10.0, 8.0, 8.0, 9.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1661376953125, -0.1609783172607422, -0.15581893920898438, -0.15065956115722656, -0.14550018310546875, -0.14034080505371094, -0.13518142700195312, -0.1300220489501953, -0.1248626708984375, -0.11970329284667969, -0.11454391479492188, -0.10938453674316406, -0.10422515869140625, -0.09906578063964844, -0.09390640258789062, -0.08874702453613281, -0.083587646484375, -0.07842826843261719, -0.07326889038085938, -0.06810951232910156, -0.06295013427734375, -0.05779075622558594, -0.052631378173828125, -0.04747200012207031, -0.0423126220703125, -0.03715324401855469, -0.031993865966796875, -0.026834487915039062, -0.02167510986328125, -0.016515731811523438, -0.011356353759765625, -0.0061969757080078125, -0.00103759765625, 0.0041217803955078125, 0.009281158447265625, 0.014440536499023438, 0.01959991455078125, 0.024759292602539062, 0.029918670654296875, 0.03507804870605469, 0.0402374267578125, 0.04539680480957031, 0.050556182861328125, 0.05571556091308594, 0.06087493896484375, 0.06603431701660156, 0.07119369506835938, 0.07635307312011719, 0.081512451171875, 0.08667182922363281, 0.09183120727539062, 0.09699058532714844, 0.10214996337890625, 0.10730934143066406, 0.11246871948242188, 0.11762809753417969, 0.1227874755859375, 0.1279468536376953, 0.13310623168945312, 0.13826560974121094, 0.14342498779296875, 0.14858436584472656, 0.15374374389648438, 0.1589031219482422, 0.1640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 5.0, 10.0, 14.0, 10.0, 10.0, 16.0, 12.0, 20.0, 18.0, 23.0, 27.0, 25.0, 31.0, 34.0, 34.0, 49.0, 47.0, 43.0, 41.0, 25.0, 45.0, 43.0, 35.0, 47.0, 32.0, 34.0, 43.0, 35.0, 34.0, 23.0, 27.0, 24.0, 12.0, 8.0, 8.0, 11.0, 9.0, 8.0, 7.0, 5.0, 6.0, 7.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.091064453125, -0.0878896713256836, -0.08471488952636719, -0.08154010772705078, -0.07836532592773438, -0.07519054412841797, -0.07201576232910156, -0.06884098052978516, -0.06566619873046875, -0.062491416931152344, -0.05931663513183594, -0.05614185333251953, -0.052967071533203125, -0.04979228973388672, -0.04661750793457031, -0.043442726135253906, -0.0402679443359375, -0.037093162536621094, -0.03391838073730469, -0.03074359893798828, -0.027568817138671875, -0.02439403533935547, -0.021219253540039062, -0.018044471740722656, -0.01486968994140625, -0.011694908142089844, -0.008520126342773438, -0.005345344543457031, -0.002170562744140625, 0.0010042190551757812, 0.0041790008544921875, 0.007353782653808594, 0.010528564453125, 0.013703346252441406, 0.016878128051757812, 0.02005290985107422, 0.023227691650390625, 0.02640247344970703, 0.029577255249023438, 0.032752037048339844, 0.03592681884765625, 0.039101600646972656, 0.04227638244628906, 0.04545116424560547, 0.048625946044921875, 0.05180072784423828, 0.05497550964355469, 0.058150291442871094, 0.0613250732421875, 0.0644998550415039, 0.06767463684082031, 0.07084941864013672, 0.07402420043945312, 0.07719898223876953, 0.08037376403808594, 0.08354854583740234, 0.08672332763671875, 0.08989810943603516, 0.09307289123535156, 0.09624767303466797, 0.09942245483398438, 0.10259723663330078, 0.10577201843261719, 0.1089468002319336, 0.11212158203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 3.0, 7.0, 15.0, 19.0, 28.0, 59.0, 151.0, 384.0, 1319.0, 6478.0, 59933.0, 3209393.0, 882666.0, 28467.0, 3847.0, 934.0, 305.0, 130.0, 61.0, 27.0, 23.0, 14.0, 5.0, 5.0, 4.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.71484375, -0.6977615356445312, -0.6806793212890625, -0.6635971069335938, -0.646514892578125, -0.6294326782226562, -0.6123504638671875, -0.5952682495117188, -0.57818603515625, -0.5611038208007812, -0.5440216064453125, -0.5269393920898438, -0.509857177734375, -0.49277496337890625, -0.4756927490234375, -0.45861053466796875, -0.4415283203125, -0.42444610595703125, -0.4073638916015625, -0.39028167724609375, -0.373199462890625, -0.35611724853515625, -0.3390350341796875, -0.32195281982421875, -0.30487060546875, -0.28778839111328125, -0.2707061767578125, -0.25362396240234375, -0.236541748046875, -0.21945953369140625, -0.2023773193359375, -0.18529510498046875, -0.168212890625, -0.15113067626953125, -0.1340484619140625, -0.11696624755859375, -0.099884033203125, -0.08280181884765625, -0.0657196044921875, -0.04863739013671875, -0.03155517578125, -0.01447296142578125, 0.0026092529296875, 0.01969146728515625, 0.036773681640625, 0.05385589599609375, 0.0709381103515625, 0.08802032470703125, 0.1051025390625, 0.12218475341796875, 0.1392669677734375, 0.15634918212890625, 0.173431396484375, 0.19051361083984375, 0.2075958251953125, 0.22467803955078125, 0.24176025390625, 0.25884246826171875, 0.2759246826171875, 0.29300689697265625, 0.310089111328125, 0.32717132568359375, 0.3442535400390625, 0.36133575439453125, 0.37841796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 10.0, 15.0, 17.0, 30.0, 41.0, 95.0, 116.0, 244.0, 472.0, 851.0, 900.0, 566.0, 288.0, 163.0, 94.0, 52.0, 40.0, 19.0, 16.0, 18.0, 8.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376953125, -0.36353302001953125, -0.3501129150390625, -0.33669281005859375, -0.323272705078125, -0.30985260009765625, -0.2964324951171875, -0.28301239013671875, -0.26959228515625, -0.25617218017578125, -0.2427520751953125, -0.22933197021484375, -0.215911865234375, -0.20249176025390625, -0.1890716552734375, -0.17565155029296875, -0.1622314453125, -0.14881134033203125, -0.1353912353515625, -0.12197113037109375, -0.108551025390625, -0.09513092041015625, -0.0817108154296875, -0.06829071044921875, -0.05487060546875, -0.04145050048828125, -0.0280303955078125, -0.01461029052734375, -0.001190185546875, 0.01222991943359375, 0.0256500244140625, 0.03907012939453125, 0.052490234375, 0.06591033935546875, 0.0793304443359375, 0.09275054931640625, 0.106170654296875, 0.11959075927734375, 0.1330108642578125, 0.14643096923828125, 0.15985107421875, 0.17327117919921875, 0.1866912841796875, 0.20011138916015625, 0.213531494140625, 0.22695159912109375, 0.2403717041015625, 0.25379180908203125, 0.2672119140625, 0.28063201904296875, 0.2940521240234375, 0.30747222900390625, 0.320892333984375, 0.33431243896484375, 0.3477325439453125, 0.36115264892578125, 0.37457275390625, 0.38799285888671875, 0.4014129638671875, 0.41483306884765625, 0.428253173828125, 0.44167327880859375, 0.4550933837890625, 0.46851348876953125, 0.48193359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 9.0, 4.0, 11.0, 42.0, 88.0, 240.0, 266.0, 184.0, 81.0, 36.0, 15.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.497735977172852, -5.35775089263916, -5.217765808105469, -5.0777812004089355, -4.937796115875244, -4.797811031341553, -4.657825946807861, -4.51784086227417, -4.377856254577637, -4.237871170043945, -4.097886085510254, -3.9579012393951416, -3.8179163932800293, -3.677931308746338, -3.5379462242126465, -3.397961139678955, -3.2579760551452637, -3.1179909706115723, -2.97800612449646, -2.8380210399627686, -2.6980361938476562, -2.558051109313965, -2.4180660247802734, -2.278080940246582, -2.1380960941314697, -1.9981111288070679, -1.858126163482666, -1.7181410789489746, -1.5781561136245728, -1.438171148300171, -1.2981860637664795, -1.1582010984420776, -1.0182161331176758, -0.8782311677932739, -0.7382461428642273, -0.5982611179351807, -0.4582761526107788, -0.31829118728637695, -0.17830616235733032, -0.03832113742828369, 0.10166382789611816, 0.2416488230228424, 0.38163381814956665, 0.5216188430786133, 0.6616038084030151, 0.801588773727417, 0.9415737986564636, 1.0815588235855103, 1.221543788909912, 1.361528754234314, 1.5015137195587158, 1.6414988040924072, 1.781483769416809, 1.921468734741211, 2.0614538192749023, 2.2014389038085938, 2.341423749923706, 2.4814088344573975, 2.6213936805725098, 2.761378765106201, 2.9013638496398926, 3.041348695755005, 3.1813337802886963, 3.3213186264038086, 3.4613037109375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 17.0, 14.0, 23.0, 27.0, 36.0, 36.0, 41.0, 49.0, 45.0, 68.0, 62.0, 72.0, 72.0, 58.0, 50.0, 60.0, 52.0, 35.0, 38.0, 30.0, 25.0, 18.0, 13.0, 13.0, 8.0, 8.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.732755184173584, -1.6779906749725342, -1.6232261657714844, -1.5684616565704346, -1.5136971473693848, -1.458932638168335, -1.4041681289672852, -1.349403738975525, -1.294639229774475, -1.2398747205734253, -1.1851102113723755, -1.1303457021713257, -1.0755811929702759, -1.0208168029785156, -0.966052234172821, -0.911287784576416, -0.8565232157707214, -0.8017587065696716, -0.7469941973686218, -0.6922297477722168, -0.637465238571167, -0.5827007293701172, -0.5279362201690674, -0.47317174077033997, -0.41840723156929016, -0.36364272236824036, -0.30887824296951294, -0.25411373376846313, -0.19934923946857452, -0.1445847451686859, -0.08982023596763611, -0.03505575656890869, 0.019708752632141113, 0.07447324693202972, 0.12923774123191833, 0.18400225043296814, 0.23876674473285675, 0.29353123903274536, 0.34829574823379517, 0.4030602276325226, 0.4578247368335724, 0.5125892162322998, 0.5673537254333496, 0.6221182346343994, 0.6768827438354492, 0.731647253036499, 0.7864117622375488, 0.8411762118339539, 0.8959407210350037, 0.9507052302360535, 1.0054696798324585, 1.0602341890335083, 1.114998698234558, 1.169763207435608, 1.2245277166366577, 1.2792922258377075, 1.3340567350387573, 1.3888212442398071, 1.443585753440857, 1.4983502626419067, 1.5531147718429565, 1.6078791618347168, 1.6626436710357666, 1.7174081802368164, 1.7721726894378662]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 5.0, 12.0, 18.0, 16.0, 27.0, 26.0, 46.0, 72.0, 87.0, 112.0, 154.0, 271.0, 404.0, 555.0, 913.0, 1471.0, 2527.0, 4439.0, 8414.0, 18729.0, 49721.0, 158918.0, 377455.0, 275115.0, 91186.0, 30715.0, 12538.0, 6007.0, 3307.0, 1863.0, 1179.0, 749.0, 494.0, 307.0, 209.0, 142.0, 99.0, 62.0, 57.0, 41.0, 31.0, 18.0, 12.0, 7.0, 7.0, 4.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.165283203125, -0.16023826599121094, -0.15519332885742188, -0.1501483917236328, -0.14510345458984375, -0.1400585174560547, -0.13501358032226562, -0.12996864318847656, -0.1249237060546875, -0.11987876892089844, -0.11483383178710938, -0.10978889465332031, -0.10474395751953125, -0.09969902038574219, -0.09465408325195312, -0.08960914611816406, -0.084564208984375, -0.07951927185058594, -0.07447433471679688, -0.06942939758300781, -0.06438446044921875, -0.05933952331542969, -0.054294586181640625, -0.04924964904785156, -0.0442047119140625, -0.03915977478027344, -0.034114837646484375, -0.029069900512695312, -0.02402496337890625, -0.018980026245117188, -0.013935089111328125, -0.008890151977539062, -0.00384521484375, 0.0011997222900390625, 0.006244659423828125, 0.011289596557617188, 0.01633453369140625, 0.021379470825195312, 0.026424407958984375, 0.03146934509277344, 0.0365142822265625, 0.04155921936035156, 0.046604156494140625, 0.05164909362792969, 0.05669403076171875, 0.06173896789550781, 0.06678390502929688, 0.07182884216308594, 0.076873779296875, 0.08191871643066406, 0.08696365356445312, 0.09200859069824219, 0.09705352783203125, 0.10209846496582031, 0.10714340209960938, 0.11218833923339844, 0.1172332763671875, 0.12227821350097656, 0.12732315063476562, 0.1323680877685547, 0.13741302490234375, 0.1424579620361328, 0.14750289916992188, 0.15254783630371094, 0.1575927734375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 5.0, 11.0, 8.0, 12.0, 18.0, 7.0, 20.0, 23.0, 25.0, 16.0, 23.0, 31.0, 39.0, 35.0, 38.0, 37.0, 45.0, 47.0, 37.0, 42.0, 44.0, 39.0, 51.0, 39.0, 42.0, 38.0, 35.0, 27.0, 25.0, 22.0, 22.0, 16.0, 14.0, 9.0, 12.0, 11.0, 9.0, 3.0, 7.0, 9.0, 2.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11248779296875, -0.10889911651611328, -0.10531044006347656, -0.10172176361083984, -0.09813308715820312, -0.0945444107055664, -0.09095573425292969, -0.08736705780029297, -0.08377838134765625, -0.08018970489501953, -0.07660102844238281, -0.0730123519897461, -0.06942367553710938, -0.06583499908447266, -0.06224632263183594, -0.05865764617919922, -0.0550689697265625, -0.05148029327392578, -0.04789161682128906, -0.044302940368652344, -0.040714263916015625, -0.037125587463378906, -0.03353691101074219, -0.02994823455810547, -0.02635955810546875, -0.02277088165283203, -0.019182205200195312, -0.015593528747558594, -0.012004852294921875, -0.008416175842285156, -0.0048274993896484375, -0.0012388229370117188, 0.002349853515625, 0.005938529968261719, 0.009527206420898438, 0.013115882873535156, 0.016704559326171875, 0.020293235778808594, 0.023881912231445312, 0.02747058868408203, 0.03105926513671875, 0.03464794158935547, 0.03823661804199219, 0.041825294494628906, 0.045413970947265625, 0.049002647399902344, 0.05259132385253906, 0.05618000030517578, 0.0597686767578125, 0.06335735321044922, 0.06694602966308594, 0.07053470611572266, 0.07412338256835938, 0.0777120590209961, 0.08130073547363281, 0.08488941192626953, 0.08847808837890625, 0.09206676483154297, 0.09565544128417969, 0.0992441177368164, 0.10283279418945312, 0.10642147064208984, 0.11001014709472656, 0.11359882354736328, 0.1171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 14.0, 23.0, 35.0, 40.0, 54.0, 106.0, 153.0, 305.0, 749.0, 1972.0, 6954.0, 46463.0, 780002.0, 190601.0, 15388.0, 3467.0, 1159.0, 476.0, 217.0, 127.0, 69.0, 54.0, 28.0, 25.0, 10.0, 10.0, 8.0, 7.0, 6.0, 2.0, 5.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.402587890625, -0.3890533447265625, -0.375518798828125, -0.3619842529296875, -0.34844970703125, -0.3349151611328125, -0.321380615234375, -0.3078460693359375, -0.2943115234375, -0.2807769775390625, -0.267242431640625, -0.2537078857421875, -0.24017333984375, -0.2266387939453125, -0.213104248046875, -0.1995697021484375, -0.18603515625, -0.1725006103515625, -0.158966064453125, -0.1454315185546875, -0.13189697265625, -0.1183624267578125, -0.104827880859375, -0.0912933349609375, -0.0777587890625, -0.0642242431640625, -0.050689697265625, -0.0371551513671875, -0.02362060546875, -0.0100860595703125, 0.003448486328125, 0.0169830322265625, 0.030517578125, 0.0440521240234375, 0.057586669921875, 0.0711212158203125, 0.08465576171875, 0.0981903076171875, 0.111724853515625, 0.1252593994140625, 0.1387939453125, 0.1523284912109375, 0.165863037109375, 0.1793975830078125, 0.19293212890625, 0.2064666748046875, 0.220001220703125, 0.2335357666015625, 0.2470703125, 0.2606048583984375, 0.274139404296875, 0.2876739501953125, 0.30120849609375, 0.3147430419921875, 0.328277587890625, 0.3418121337890625, 0.3553466796875, 0.3688812255859375, 0.382415771484375, 0.3959503173828125, 0.40948486328125, 0.4230194091796875, 0.436553955078125, 0.4500885009765625, 0.463623046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 8.0, 2.0, 2.0, 10.0, 10.0, 10.0, 25.0, 16.0, 27.0, 23.0, 44.0, 31.0, 49.0, 65.0, 67.0, 64.0, 63.0, 84.0, 78.0, 57.0, 46.0, 60.0, 35.0, 24.0, 28.0, 20.0, 15.0, 14.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.5228958129882812, -0.5037994384765625, -0.48470306396484375, -0.465606689453125, -0.44651031494140625, -0.4274139404296875, -0.40831756591796875, -0.38922119140625, -0.37012481689453125, -0.3510284423828125, -0.33193206787109375, -0.312835693359375, -0.29373931884765625, -0.2746429443359375, -0.25554656982421875, -0.2364501953125, -0.21735382080078125, -0.1982574462890625, -0.17916107177734375, -0.160064697265625, -0.14096832275390625, -0.1218719482421875, -0.10277557373046875, -0.08367919921875, -0.06458282470703125, -0.0454864501953125, -0.02639007568359375, -0.007293701171875, 0.01180267333984375, 0.0308990478515625, 0.04999542236328125, 0.069091796875, 0.08818817138671875, 0.1072845458984375, 0.12638092041015625, 0.145477294921875, 0.16457366943359375, 0.1836700439453125, 0.20276641845703125, 0.22186279296875, 0.24095916748046875, 0.2600555419921875, 0.27915191650390625, 0.298248291015625, 0.31734466552734375, 0.3364410400390625, 0.35553741455078125, 0.3746337890625, 0.39373016357421875, 0.4128265380859375, 0.43192291259765625, 0.451019287109375, 0.47011566162109375, 0.4892120361328125, 0.5083084106445312, 0.52740478515625, 0.5465011596679688, 0.5655975341796875, 0.5846939086914062, 0.603790283203125, 0.6228866577148438, 0.6419830322265625, 0.6610794067382812, 0.68017578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 3.0, 3.0, 4.0, 9.0, 14.0, 20.0, 35.0, 42.0, 91.0, 171.0, 379.0, 755.0, 1933.0, 5547.0, 19890.0, 104822.0, 698566.0, 174689.0, 29481.0, 7749.0, 2449.0, 941.0, 443.0, 204.0, 123.0, 71.0, 40.0, 31.0, 11.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1837158203125, -0.17908000946044922, -0.17444419860839844, -0.16980838775634766, -0.16517257690429688, -0.1605367660522461, -0.1559009552001953, -0.15126514434814453, -0.14662933349609375, -0.14199352264404297, -0.1373577117919922, -0.1327219009399414, -0.12808609008789062, -0.12345027923583984, -0.11881446838378906, -0.11417865753173828, -0.1095428466796875, -0.10490703582763672, -0.10027122497558594, -0.09563541412353516, -0.09099960327148438, -0.0863637924194336, -0.08172798156738281, -0.07709217071533203, -0.07245635986328125, -0.06782054901123047, -0.06318473815917969, -0.058548927307128906, -0.053913116455078125, -0.049277305603027344, -0.04464149475097656, -0.04000568389892578, -0.035369873046875, -0.03073406219482422, -0.026098251342773438, -0.021462440490722656, -0.016826629638671875, -0.012190818786621094, -0.0075550079345703125, -0.0029191970825195312, 0.00171661376953125, 0.006352424621582031, 0.010988235473632812, 0.015624046325683594, 0.020259857177734375, 0.024895668029785156, 0.029531478881835938, 0.03416728973388672, 0.0388031005859375, 0.04343891143798828, 0.04807472229003906, 0.052710533142089844, 0.057346343994140625, 0.061982154846191406, 0.06661796569824219, 0.07125377655029297, 0.07588958740234375, 0.08052539825439453, 0.08516120910644531, 0.0897970199584961, 0.09443283081054688, 0.09906864166259766, 0.10370445251464844, 0.10834026336669922, 0.11297607421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 7.0, 7.0, 5.0, 7.0, 9.0, 10.0, 15.0, 16.0, 25.0, 32.0, 43.0, 45.0, 56.0, 62.0, 70.0, 83.0, 66.0, 69.0, 68.0, 68.0, 56.0, 35.0, 27.0, 23.0, 25.0, 14.0, 8.0, 6.0, 6.0, 7.0, 2.0, 2.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.4868717193603516e-05, -3.3629126846790314e-05, -3.238953649997711e-05, -3.114994615316391e-05, -2.9910355806350708e-05, -2.8670765459537506e-05, -2.7431175112724304e-05, -2.6191584765911102e-05, -2.49519944190979e-05, -2.37124040722847e-05, -2.2472813725471497e-05, -2.1233223378658295e-05, -1.9993633031845093e-05, -1.875404268503189e-05, -1.751445233821869e-05, -1.6274861991405487e-05, -1.5035271644592285e-05, -1.3795681297779083e-05, -1.2556090950965881e-05, -1.131650060415268e-05, -1.0076910257339478e-05, -8.837319910526276e-06, -7.597729563713074e-06, -6.358139216899872e-06, -5.11854887008667e-06, -3.878958523273468e-06, -2.639368176460266e-06, -1.3997778296470642e-06, -1.601874828338623e-07, 1.0794028639793396e-06, 2.3189932107925415e-06, 3.5585835576057434e-06, 4.798173904418945e-06, 6.037764251232147e-06, 7.277354598045349e-06, 8.516944944858551e-06, 9.756535291671753e-06, 1.0996125638484955e-05, 1.2235715985298157e-05, 1.3475306332111359e-05, 1.471489667892456e-05, 1.5954487025737762e-05, 1.7194077372550964e-05, 1.8433667719364166e-05, 1.9673258066177368e-05, 2.091284841299057e-05, 2.2152438759803772e-05, 2.3392029106616974e-05, 2.4631619453430176e-05, 2.5871209800243378e-05, 2.711080014705658e-05, 2.835039049386978e-05, 2.9589980840682983e-05, 3.0829571187496185e-05, 3.206916153430939e-05, 3.330875188112259e-05, 3.454834222793579e-05, 3.578793257474899e-05, 3.7027522921562195e-05, 3.82671132683754e-05, 3.95067036151886e-05, 4.07462939620018e-05, 4.1985884308815e-05, 4.3225474655628204e-05, 4.4465065002441406e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 6.0, 4.0, 16.0, 16.0, 15.0, 33.0, 51.0, 62.0, 153.0, 274.0, 585.0, 1293.0, 3791.0, 14833.0, 92487.0, 725559.0, 176661.0, 24051.0, 5397.0, 1751.0, 744.0, 315.0, 183.0, 102.0, 64.0, 36.0, 27.0, 14.0, 13.0, 7.0, 4.0, 7.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13134765625, -0.12601852416992188, -0.12068939208984375, -0.11536026000976562, -0.1100311279296875, -0.10470199584960938, -0.09937286376953125, -0.09404373168945312, -0.088714599609375, -0.08338546752929688, -0.07805633544921875, -0.07272720336914062, -0.0673980712890625, -0.062068939208984375, -0.05673980712890625, -0.051410675048828125, -0.04608154296875, -0.040752410888671875, -0.03542327880859375, -0.030094146728515625, -0.0247650146484375, -0.019435882568359375, -0.01410675048828125, -0.008777618408203125, -0.003448486328125, 0.001880645751953125, 0.00720977783203125, 0.012538909912109375, 0.0178680419921875, 0.023197174072265625, 0.02852630615234375, 0.033855438232421875, 0.0391845703125, 0.044513702392578125, 0.04984283447265625, 0.055171966552734375, 0.0605010986328125, 0.06583023071289062, 0.07115936279296875, 0.07648849487304688, 0.081817626953125, 0.08714675903320312, 0.09247589111328125, 0.09780502319335938, 0.1031341552734375, 0.10846328735351562, 0.11379241943359375, 0.11912155151367188, 0.12445068359375, 0.12977981567382812, 0.13510894775390625, 0.14043807983398438, 0.1457672119140625, 0.15109634399414062, 0.15642547607421875, 0.16175460815429688, 0.167083740234375, 0.17241287231445312, 0.17774200439453125, 0.18307113647460938, 0.1884002685546875, 0.19372940063476562, 0.19905853271484375, 0.20438766479492188, 0.209716796875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 9.0, 3.0, 19.0, 13.0, 13.0, 35.0, 46.0, 48.0, 71.0, 81.0, 88.0, 95.0, 91.0, 112.0, 70.0, 48.0, 39.0, 34.0, 21.0, 24.0, 10.0, 6.0, 4.0, 5.0, 2.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.123291015625, -0.11867713928222656, -0.11406326293945312, -0.10944938659667969, -0.10483551025390625, -0.10022163391113281, -0.09560775756835938, -0.09099388122558594, -0.0863800048828125, -0.08176612854003906, -0.07715225219726562, -0.07253837585449219, -0.06792449951171875, -0.06331062316894531, -0.058696746826171875, -0.05408287048339844, -0.049468994140625, -0.04485511779785156, -0.040241241455078125, -0.03562736511230469, -0.03101348876953125, -0.026399612426757812, -0.021785736083984375, -0.017171859741210938, -0.0125579833984375, -0.007944107055664062, -0.003330230712890625, 0.0012836456298828125, 0.00589752197265625, 0.010511398315429688, 0.015125274658203125, 0.019739151000976562, 0.02435302734375, 0.028966903686523438, 0.033580780029296875, 0.03819465637207031, 0.04280853271484375, 0.04742240905761719, 0.052036285400390625, 0.05665016174316406, 0.0612640380859375, 0.06587791442871094, 0.07049179077148438, 0.07510566711425781, 0.07971954345703125, 0.08433341979980469, 0.08894729614257812, 0.09356117248535156, 0.098175048828125, 0.10278892517089844, 0.10740280151367188, 0.11201667785644531, 0.11663055419921875, 0.12124443054199219, 0.12585830688476562, 0.13047218322753906, 0.1350860595703125, 0.13969993591308594, 0.14431381225585938, 0.1489276885986328, 0.15354156494140625, 0.1581554412841797, 0.16276931762695312, 0.16738319396972656, 0.1719970703125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 8.0, 24.0, 55.0, 93.0, 169.0, 288.0, 137.0, 90.0, 50.0, 26.0, 16.0, 7.0, 12.0, 5.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021078586578369, -1.9377696514129639, -1.8544608354568481, -1.7711519002914429, -1.6878430843353271, -1.6045341491699219, -1.5212252140045166, -1.4379163980484009, -1.3546075820922852, -1.2712986469268799, -1.1879898309707642, -1.1046808958053589, -1.0213720798492432, -0.9380631446838379, -0.8547542691230774, -0.7714453935623169, -0.6881364583969116, -0.6048275828361511, -0.5215187072753906, -0.43820980191230774, -0.35490092635154724, -0.27159205079078674, -0.18828314542770386, -0.10497426986694336, -0.02166539430618286, 0.061643488705158234, 0.14495237171649933, 0.22826126217842102, 0.3115701377391815, 0.394879013299942, 0.4781879186630249, 0.5614967942237854, 0.6448056697845459, 0.7281145453453064, 0.8114234209060669, 0.8947323560714722, 0.9780411720275879, 1.0613501071929932, 1.1446590423583984, 1.2279678583145142, 1.3112766742706299, 1.3945856094360352, 1.4778944253921509, 1.5612033605575562, 1.6445121765136719, 1.7278211116790771, 1.8111300468444824, 1.8944388628005981, 1.9777477979660034, 2.061056613922119, 2.1443655490875244, 2.2276744842529297, 2.310983419418335, 2.394292116165161, 2.4776010513305664, 2.5609099864959717, 2.644218921661377, 2.7275278568267822, 2.8108367919921875, 2.8941454887390137, 2.977454423904419, 3.060763359069824, 3.1440722942352295, 3.2273812294006348, 3.310689926147461]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 6.0, 5.0, 4.0, 6.0, 10.0, 8.0, 9.0, 18.0, 25.0, 21.0, 20.0, 30.0, 34.0, 34.0, 55.0, 44.0, 79.0, 84.0, 100.0, 71.0, 64.0, 30.0, 42.0, 40.0, 28.0, 22.0, 28.0, 21.0, 12.0, 12.0, 10.0, 9.0, 6.0, 5.0, 7.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.5481157302856445, -2.479661226272583, -2.4112067222595215, -2.34275221824646, -2.2742977142333984, -2.205843448638916, -2.1373889446258545, -2.068934440612793, -2.0004799365997314, -1.93202543258667, -1.8635709285736084, -1.7951165437698364, -1.726662039756775, -1.6582075357437134, -1.5897531509399414, -1.5212986469268799, -1.4528441429138184, -1.3843896389007568, -1.3159351348876953, -1.2474807500839233, -1.1790262460708618, -1.1105717420578003, -1.0421173572540283, -0.9736628532409668, -0.9052083492279053, -0.8367538452148438, -0.768299400806427, -0.6998449563980103, -0.6313904523849487, -0.5629359483718872, -0.49448150396347046, -0.4260270297527313, -0.3575727939605713, -0.28911831974983215, -0.22066384553909302, -0.15220937132835388, -0.08375489711761475, -0.01530042290687561, 0.053154051303863525, 0.12160852551460266, 0.1900629997253418, 0.25851747393608093, 0.32697194814682007, 0.3954264223575592, 0.46388089656829834, 0.5323354005813599, 0.6007898449897766, 0.6692442893981934, 0.7376987934112549, 0.8061532974243164, 0.8746077418327332, 0.9430621862411499, 1.0115166902542114, 1.079971194267273, 1.148425579071045, 1.2168800830841064, 1.285334587097168, 1.3537890911102295, 1.422243595123291, 1.490697979927063, 1.5591524839401245, 1.627606987953186, 1.696061372756958, 1.7645158767700195, 1.832970380783081]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 13.0, 8.0, 13.0, 21.0, 18.0, 34.0, 47.0, 73.0, 93.0, 138.0, 304.0, 478.0, 825.0, 1603.0, 3170.0, 7134.0, 19490.0, 73770.0, 418065.0, 2278868.0, 1160617.0, 172508.0, 35938.0, 11567.0, 4588.0, 2200.0, 1112.0, 585.0, 345.0, 229.0, 124.0, 86.0, 50.0, 51.0, 34.0, 21.0, 23.0, 13.0, 6.0, 3.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1309814453125, -0.12608718872070312, -0.12119293212890625, -0.11629867553710938, -0.1114044189453125, -0.10651016235351562, -0.10161590576171875, -0.09672164916992188, -0.091827392578125, -0.08693313598632812, -0.08203887939453125, -0.07714462280273438, -0.0722503662109375, -0.06735610961914062, -0.06246185302734375, -0.057567596435546875, -0.05267333984375, -0.047779083251953125, -0.04288482666015625, -0.037990570068359375, -0.0330963134765625, -0.028202056884765625, -0.02330780029296875, -0.018413543701171875, -0.013519287109375, -0.008625030517578125, -0.00373077392578125, 0.001163482666015625, 0.0060577392578125, 0.010951995849609375, 0.01584625244140625, 0.020740509033203125, 0.025634765625, 0.030529022216796875, 0.03542327880859375, 0.040317535400390625, 0.0452117919921875, 0.050106048583984375, 0.05500030517578125, 0.059894561767578125, 0.064788818359375, 0.06968307495117188, 0.07457733154296875, 0.07947158813476562, 0.0843658447265625, 0.08926010131835938, 0.09415435791015625, 0.09904861450195312, 0.10394287109375, 0.10883712768554688, 0.11373138427734375, 0.11862564086914062, 0.1235198974609375, 0.12841415405273438, 0.13330841064453125, 0.13820266723632812, 0.143096923828125, 0.14799118041992188, 0.15288543701171875, 0.15777969360351562, 0.1626739501953125, 0.16756820678710938, 0.17246246337890625, 0.17735671997070312, 0.1822509765625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 8.0, 10.0, 7.0, 7.0, 11.0, 13.0, 20.0, 13.0, 23.0, 25.0, 18.0, 19.0, 28.0, 34.0, 30.0, 38.0, 41.0, 37.0, 52.0, 45.0, 36.0, 32.0, 38.0, 41.0, 50.0, 42.0, 31.0, 30.0, 23.0, 20.0, 26.0, 16.0, 33.0, 16.0, 15.0, 9.0, 6.0, 9.0, 12.0, 9.0, 4.0, 1.0, 4.0, 5.0, 7.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1064453125, -0.10318946838378906, -0.09993362426757812, -0.09667778015136719, -0.09342193603515625, -0.09016609191894531, -0.08691024780273438, -0.08365440368652344, -0.0803985595703125, -0.07714271545410156, -0.07388687133789062, -0.07063102722167969, -0.06737518310546875, -0.06411933898925781, -0.060863494873046875, -0.05760765075683594, -0.054351806640625, -0.05109596252441406, -0.047840118408203125, -0.04458427429199219, -0.04132843017578125, -0.03807258605957031, -0.034816741943359375, -0.03156089782714844, -0.0283050537109375, -0.025049209594726562, -0.021793365478515625, -0.018537521362304688, -0.01528167724609375, -0.012025833129882812, -0.008769989013671875, -0.0055141448974609375, -0.00225830078125, 0.0009975433349609375, 0.004253387451171875, 0.0075092315673828125, 0.01076507568359375, 0.014020919799804688, 0.017276763916015625, 0.020532608032226562, 0.0237884521484375, 0.027044296264648438, 0.030300140380859375, 0.03355598449707031, 0.03681182861328125, 0.04006767272949219, 0.043323516845703125, 0.04657936096191406, 0.049835205078125, 0.05309104919433594, 0.056346893310546875, 0.05960273742675781, 0.06285858154296875, 0.06611442565917969, 0.06937026977539062, 0.07262611389160156, 0.0758819580078125, 0.07913780212402344, 0.08239364624023438, 0.08564949035644531, 0.08890533447265625, 0.09216117858886719, 0.09541702270507812, 0.09867286682128906, 0.1019287109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 9.0, 7.0, 12.0, 13.0, 42.0, 48.0, 71.0, 121.0, 257.0, 590.0, 1647.0, 5637.0, 29773.0, 356561.0, 3566164.0, 204520.0, 21795.0, 4554.0, 1376.0, 507.0, 221.0, 119.0, 76.0, 44.0, 33.0, 21.0, 21.0, 4.0, 12.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40869140625, -0.3968162536621094, -0.38494110107421875, -0.3730659484863281, -0.3611907958984375, -0.3493156433105469, -0.33744049072265625, -0.3255653381347656, -0.313690185546875, -0.3018150329589844, -0.28993988037109375, -0.2780647277832031, -0.2661895751953125, -0.2543144226074219, -0.24243927001953125, -0.23056411743164062, -0.21868896484375, -0.20681381225585938, -0.19493865966796875, -0.18306350708007812, -0.1711883544921875, -0.15931320190429688, -0.14743804931640625, -0.13556289672851562, -0.123687744140625, -0.11181259155273438, -0.09993743896484375, -0.08806228637695312, -0.0761871337890625, -0.06431198120117188, -0.05243682861328125, -0.040561676025390625, -0.0286865234375, -0.016811370849609375, -0.00493621826171875, 0.006938934326171875, 0.0188140869140625, 0.030689239501953125, 0.04256439208984375, 0.054439544677734375, 0.066314697265625, 0.07818984985351562, 0.09006500244140625, 0.10194015502929688, 0.1138153076171875, 0.12569046020507812, 0.13756561279296875, 0.14944076538085938, 0.16131591796875, 0.17319107055664062, 0.18506622314453125, 0.19694137573242188, 0.2088165283203125, 0.22069168090820312, 0.23256683349609375, 0.24444198608398438, 0.256317138671875, 0.2681922912597656, 0.28006744384765625, 0.2919425964355469, 0.3038177490234375, 0.3156929016113281, 0.32756805419921875, 0.3394432067871094, 0.351318359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 9.0, 11.0, 16.0, 21.0, 26.0, 33.0, 53.0, 67.0, 139.0, 196.0, 340.0, 554.0, 789.0, 684.0, 401.0, 264.0, 159.0, 88.0, 62.0, 34.0, 33.0, 24.0, 21.0, 18.0, 8.0, 3.0, 2.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30810546875, -0.29840087890625, -0.2886962890625, -0.27899169921875, -0.269287109375, -0.25958251953125, -0.2498779296875, -0.24017333984375, -0.23046875, -0.22076416015625, -0.2110595703125, -0.20135498046875, -0.191650390625, -0.18194580078125, -0.1722412109375, -0.16253662109375, -0.15283203125, -0.14312744140625, -0.1334228515625, -0.12371826171875, -0.114013671875, -0.10430908203125, -0.0946044921875, -0.08489990234375, -0.0751953125, -0.06549072265625, -0.0557861328125, -0.04608154296875, -0.036376953125, -0.02667236328125, -0.0169677734375, -0.00726318359375, 0.00244140625, 0.01214599609375, 0.0218505859375, 0.03155517578125, 0.041259765625, 0.05096435546875, 0.0606689453125, 0.07037353515625, 0.080078125, 0.08978271484375, 0.0994873046875, 0.10919189453125, 0.118896484375, 0.12860107421875, 0.1383056640625, 0.14801025390625, 0.15771484375, 0.16741943359375, 0.1771240234375, 0.18682861328125, 0.196533203125, 0.20623779296875, 0.2159423828125, 0.22564697265625, 0.2353515625, 0.24505615234375, 0.2547607421875, 0.26446533203125, 0.274169921875, 0.28387451171875, 0.2935791015625, 0.30328369140625, 0.31298828125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 6.0, 9.0, 10.0, 18.0, 34.0, 107.0, 206.0, 225.0, 197.0, 118.0, 44.0, 15.0, 6.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9273905754089355, -3.8071742057800293, -3.686957597732544, -3.5667412281036377, -3.4465246200561523, -3.326308250427246, -3.2060916423797607, -3.0858752727508545, -2.965658664703369, -2.845442295074463, -2.7252256870269775, -2.6050093173980713, -2.484792709350586, -2.3645763397216797, -2.2443597316741943, -2.124143362045288, -2.0039267539978027, -1.883710265159607, -1.7634937763214111, -1.6432772874832153, -1.5230607986450195, -1.4028444290161133, -1.282627820968628, -1.1624114513397217, -1.0421950817108154, -0.9219785928726196, -0.8017621040344238, -0.681545615196228, -0.5613291263580322, -0.4411126971244812, -0.3208962082862854, -0.2006797194480896, -0.08046317100524902, 0.03975331038236618, 0.15996979176998138, 0.280186265707016, 0.4004027545452118, 0.5206192135810852, 0.640835702419281, 0.7610521912574768, 0.8812686800956726, 1.0014851093292236, 1.1217015981674194, 1.2419180870056152, 1.362134575843811, 1.4823510646820068, 1.6025675535202026, 1.7227840423583984, 1.8430005311965942, 1.96321702003479, 2.0834333896636963, 2.2036499977111816, 2.323866367340088, 2.4440829753875732, 2.5642993450164795, 2.684515953063965, 2.804732322692871, 2.9249486923217773, 3.0451653003692627, 3.165381669998169, 3.2855982780456543, 3.4058146476745605, 3.526031255722046, 3.646247625350952, 3.7664642333984375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 12.0, 10.0, 9.0, 15.0, 11.0, 16.0, 23.0, 29.0, 21.0, 24.0, 29.0, 42.0, 38.0, 48.0, 35.0, 54.0, 41.0, 47.0, 40.0, 33.0, 39.0, 43.0, 44.0, 48.0, 31.0, 37.0, 25.0, 24.0, 21.0, 19.0, 14.0, 16.0, 7.0, 12.0, 11.0, 11.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.117948293685913, -1.0799614191055298, -1.0419745445251465, -1.0039876699447632, -0.9660007953643799, -0.9280139207839966, -0.8900269865989685, -0.8520401120185852, -0.8140532374382019, -0.7760663628578186, -0.7380794882774353, -0.700092613697052, -0.6621056795120239, -0.6241188049316406, -0.5861319303512573, -0.548145055770874, -0.5101581811904907, -0.4721713066101074, -0.4341844320297241, -0.39619752764701843, -0.35821065306663513, -0.32022377848625183, -0.28223687410354614, -0.24424999952316284, -0.20626312494277954, -0.16827625036239624, -0.13028936088085175, -0.09230247884988785, -0.05431559681892395, -0.01632872223854065, 0.021658167243003845, 0.05964505672454834, 0.09763193130493164, 0.13561880588531494, 0.17360569536685944, 0.21159258484840393, 0.24957945942878723, 0.28756633400917053, 0.3255532383918762, 0.3635401129722595, 0.4015269875526428, 0.4395138621330261, 0.4775007367134094, 0.5154876112937927, 0.5534745454788208, 0.5914614200592041, 0.6294482946395874, 0.6674351692199707, 0.705422043800354, 0.7434089183807373, 0.7813957929611206, 0.8193826675415039, 0.8573695421218872, 0.8953564167022705, 0.9333433508872986, 0.9713302254676819, 1.00931715965271, 1.0473040342330933, 1.0852909088134766, 1.1232777833938599, 1.1612646579742432, 1.1992515325546265, 1.2372384071350098, 1.2752254009246826, 1.3132121562957764]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 17.0, 14.0, 21.0, 34.0, 61.0, 64.0, 103.0, 161.0, 226.0, 369.0, 600.0, 1063.0, 2035.0, 4293.0, 10553.0, 32026.0, 134745.0, 494091.0, 278270.0, 59961.0, 17188.0, 6313.0, 2830.0, 1417.0, 751.0, 464.0, 267.0, 195.0, 140.0, 71.0, 61.0, 39.0, 32.0, 20.0, 14.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2095947265625, -0.2029895782470703, -0.19638442993164062, -0.18977928161621094, -0.18317413330078125, -0.17656898498535156, -0.16996383666992188, -0.1633586883544922, -0.1567535400390625, -0.1501483917236328, -0.14354324340820312, -0.13693809509277344, -0.13033294677734375, -0.12372779846191406, -0.11712265014648438, -0.11051750183105469, -0.103912353515625, -0.09730720520019531, -0.09070205688476562, -0.08409690856933594, -0.07749176025390625, -0.07088661193847656, -0.06428146362304688, -0.05767631530761719, -0.0510711669921875, -0.04446601867675781, -0.037860870361328125, -0.03125572204589844, -0.02465057373046875, -0.018045425415039062, -0.011440277099609375, -0.0048351287841796875, 0.00177001953125, 0.008375167846679688, 0.014980316162109375, 0.021585464477539062, 0.02819061279296875, 0.03479576110839844, 0.041400909423828125, 0.04800605773925781, 0.0546112060546875, 0.06121635437011719, 0.06782150268554688, 0.07442665100097656, 0.08103179931640625, 0.08763694763183594, 0.09424209594726562, 0.10084724426269531, 0.107452392578125, 0.11405754089355469, 0.12066268920898438, 0.12726783752441406, 0.13387298583984375, 0.14047813415527344, 0.14708328247070312, 0.1536884307861328, 0.1602935791015625, 0.1668987274169922, 0.17350387573242188, 0.18010902404785156, 0.18671417236328125, 0.19331932067871094, 0.19992446899414062, 0.2065296173095703, 0.213134765625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 4.0, 5.0, 8.0, 11.0, 12.0, 18.0, 16.0, 25.0, 20.0, 24.0, 30.0, 34.0, 36.0, 39.0, 28.0, 40.0, 43.0, 59.0, 36.0, 55.0, 49.0, 40.0, 37.0, 52.0, 40.0, 30.0, 27.0, 17.0, 27.0, 20.0, 17.0, 12.0, 15.0, 18.0, 11.0, 12.0, 5.0, 4.0, 6.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11529541015625, -0.11155891418457031, -0.10782241821289062, -0.10408592224121094, -0.10034942626953125, -0.09661293029785156, -0.09287643432617188, -0.08913993835449219, -0.0854034423828125, -0.08166694641113281, -0.07793045043945312, -0.07419395446777344, -0.07045745849609375, -0.06672096252441406, -0.06298446655273438, -0.05924797058105469, -0.055511474609375, -0.05177497863769531, -0.048038482666015625, -0.04430198669433594, -0.04056549072265625, -0.03682899475097656, -0.033092498779296875, -0.029356002807617188, -0.0256195068359375, -0.021883010864257812, -0.018146514892578125, -0.014410018920898438, -0.01067352294921875, -0.0069370269775390625, -0.003200531005859375, 0.0005359649658203125, 0.0042724609375, 0.008008956909179688, 0.011745452880859375, 0.015481948852539062, 0.01921844482421875, 0.022954940795898438, 0.026691436767578125, 0.030427932739257812, 0.0341644287109375, 0.03790092468261719, 0.041637420654296875, 0.04537391662597656, 0.04911041259765625, 0.05284690856933594, 0.056583404541015625, 0.06031990051269531, 0.064056396484375, 0.06779289245605469, 0.07152938842773438, 0.07526588439941406, 0.07900238037109375, 0.08273887634277344, 0.08647537231445312, 0.09021186828613281, 0.0939483642578125, 0.09768486022949219, 0.10142135620117188, 0.10515785217285156, 0.10889434814453125, 0.11263084411621094, 0.11636734008789062, 0.12010383605957031, 0.12384033203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 2.0, 6.0, 6.0, 10.0, 7.0, 11.0, 17.0, 26.0, 34.0, 43.0, 50.0, 64.0, 99.0, 123.0, 190.0, 279.0, 493.0, 940.0, 1938.0, 4956.0, 18751.0, 133671.0, 762224.0, 100904.0, 15310.0, 4301.0, 1734.0, 858.0, 473.0, 299.0, 216.0, 127.0, 94.0, 57.0, 55.0, 56.0, 35.0, 21.0, 16.0, 16.0, 11.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.334716796875, -0.3252716064453125, -0.315826416015625, -0.3063812255859375, -0.29693603515625, -0.2874908447265625, -0.278045654296875, -0.2686004638671875, -0.2591552734375, -0.2497100830078125, -0.240264892578125, -0.2308197021484375, -0.22137451171875, -0.2119293212890625, -0.202484130859375, -0.1930389404296875, -0.18359375, -0.1741485595703125, -0.164703369140625, -0.1552581787109375, -0.14581298828125, -0.1363677978515625, -0.126922607421875, -0.1174774169921875, -0.1080322265625, -0.0985870361328125, -0.089141845703125, -0.0796966552734375, -0.07025146484375, -0.0608062744140625, -0.051361083984375, -0.0419158935546875, -0.032470703125, -0.0230255126953125, -0.013580322265625, -0.0041351318359375, 0.00531005859375, 0.0147552490234375, 0.024200439453125, 0.0336456298828125, 0.0430908203125, 0.0525360107421875, 0.061981201171875, 0.0714263916015625, 0.08087158203125, 0.0903167724609375, 0.099761962890625, 0.1092071533203125, 0.11865234375, 0.1280975341796875, 0.137542724609375, 0.1469879150390625, 0.15643310546875, 0.1658782958984375, 0.175323486328125, 0.1847686767578125, 0.1942138671875, 0.2036590576171875, 0.213104248046875, 0.2225494384765625, 0.23199462890625, 0.2414398193359375, 0.250885009765625, 0.2603302001953125, 0.269775390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 3.0, 8.0, 11.0, 12.0, 8.0, 17.0, 24.0, 35.0, 32.0, 63.0, 55.0, 66.0, 65.0, 59.0, 71.0, 61.0, 68.0, 62.0, 59.0, 42.0, 30.0, 26.0, 26.0, 20.0, 11.0, 14.0, 19.0, 8.0, 9.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59765625, -0.5797653198242188, -0.5618743896484375, -0.5439834594726562, -0.526092529296875, -0.5082015991210938, -0.4903106689453125, -0.47241973876953125, -0.45452880859375, -0.43663787841796875, -0.4187469482421875, -0.40085601806640625, -0.382965087890625, -0.36507415771484375, -0.3471832275390625, -0.32929229736328125, -0.3114013671875, -0.29351043701171875, -0.2756195068359375, -0.25772857666015625, -0.239837646484375, -0.22194671630859375, -0.2040557861328125, -0.18616485595703125, -0.16827392578125, -0.15038299560546875, -0.1324920654296875, -0.11460113525390625, -0.096710205078125, -0.07881927490234375, -0.0609283447265625, -0.04303741455078125, -0.025146484375, -0.00725555419921875, 0.0106353759765625, 0.02852630615234375, 0.046417236328125, 0.06430816650390625, 0.0821990966796875, 0.10009002685546875, 0.11798095703125, 0.13587188720703125, 0.1537628173828125, 0.17165374755859375, 0.189544677734375, 0.20743560791015625, 0.2253265380859375, 0.24321746826171875, 0.2611083984375, 0.27899932861328125, 0.2968902587890625, 0.31478118896484375, 0.332672119140625, 0.35056304931640625, 0.3684539794921875, 0.38634490966796875, 0.40423583984375, 0.42212677001953125, 0.4400177001953125, 0.45790863037109375, 0.475799560546875, 0.49369049072265625, 0.5115814208984375, 0.5294723510742188, 0.54736328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 7.0, 12.0, 16.0, 16.0, 11.0, 18.0, 27.0, 28.0, 45.0, 50.0, 113.0, 121.0, 197.0, 280.0, 485.0, 777.0, 1349.0, 2467.0, 4758.0, 9456.0, 21701.0, 57711.0, 201066.0, 573704.0, 108826.0, 35663.0, 14656.0, 6955.0, 3481.0, 1766.0, 1023.0, 618.0, 385.0, 247.0, 153.0, 104.0, 77.0, 47.0, 41.0, 26.0, 18.0, 21.0, 13.0, 5.0, 7.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.0733642578125, -0.0710906982421875, -0.068817138671875, -0.0665435791015625, -0.06427001953125, -0.0619964599609375, -0.059722900390625, -0.0574493408203125, -0.05517578125, -0.0529022216796875, -0.050628662109375, -0.0483551025390625, -0.04608154296875, -0.0438079833984375, -0.041534423828125, -0.0392608642578125, -0.0369873046875, -0.0347137451171875, -0.032440185546875, -0.0301666259765625, -0.02789306640625, -0.0256195068359375, -0.023345947265625, -0.0210723876953125, -0.018798828125, -0.0165252685546875, -0.014251708984375, -0.0119781494140625, -0.00970458984375, -0.0074310302734375, -0.005157470703125, -0.0028839111328125, -0.0006103515625, 0.0016632080078125, 0.003936767578125, 0.0062103271484375, 0.00848388671875, 0.0107574462890625, 0.013031005859375, 0.0153045654296875, 0.017578125, 0.0198516845703125, 0.022125244140625, 0.0243988037109375, 0.02667236328125, 0.0289459228515625, 0.031219482421875, 0.0334930419921875, 0.0357666015625, 0.0380401611328125, 0.040313720703125, 0.0425872802734375, 0.04486083984375, 0.0471343994140625, 0.049407958984375, 0.0516815185546875, 0.053955078125, 0.0562286376953125, 0.058502197265625, 0.0607757568359375, 0.06304931640625, 0.0653228759765625, 0.067596435546875, 0.0698699951171875, 0.0721435546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 9.0, 3.0, 7.0, 10.0, 14.0, 12.0, 23.0, 21.0, 29.0, 44.0, 55.0, 45.0, 70.0, 72.0, 77.0, 72.0, 70.0, 68.0, 54.0, 41.0, 46.0, 26.0, 17.0, 21.0, 12.0, 8.0, 9.0, 7.0, 7.0, 7.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0], "bins": [-3.7550926208496094e-05, -3.6495737731456757e-05, -3.544054925441742e-05, -3.438536077737808e-05, -3.3330172300338745e-05, -3.227498382329941e-05, -3.121979534626007e-05, -3.0164606869220734e-05, -2.9109418392181396e-05, -2.805422991514206e-05, -2.6999041438102722e-05, -2.5943852961063385e-05, -2.4888664484024048e-05, -2.383347600698471e-05, -2.2778287529945374e-05, -2.1723099052906036e-05, -2.06679105758667e-05, -1.9612722098827362e-05, -1.8557533621788025e-05, -1.7502345144748688e-05, -1.644715666770935e-05, -1.5391968190670013e-05, -1.4336779713630676e-05, -1.3281591236591339e-05, -1.2226402759552002e-05, -1.1171214282512665e-05, -1.0116025805473328e-05, -9.06083732843399e-06, -8.005648851394653e-06, -6.950460374355316e-06, -5.895271897315979e-06, -4.840083420276642e-06, -3.7848949432373047e-06, -2.7297064661979675e-06, -1.6745179891586304e-06, -6.193295121192932e-07, 4.3585896492004395e-07, 1.491047441959381e-06, 2.5462359189987183e-06, 3.6014243960380554e-06, 4.656612873077393e-06, 5.71180135011673e-06, 6.766989827156067e-06, 7.822178304195404e-06, 8.877366781234741e-06, 9.932555258274078e-06, 1.0987743735313416e-05, 1.2042932212352753e-05, 1.309812068939209e-05, 1.4153309166431427e-05, 1.5208497643470764e-05, 1.62636861205101e-05, 1.731887459754944e-05, 1.8374063074588776e-05, 1.9429251551628113e-05, 2.048444002866745e-05, 2.1539628505706787e-05, 2.2594816982746124e-05, 2.365000545978546e-05, 2.47051939368248e-05, 2.5760382413864136e-05, 2.6815570890903473e-05, 2.787075936794281e-05, 2.8925947844982147e-05, 2.9981136322021484e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 9.0, 7.0, 11.0, 30.0, 23.0, 41.0, 63.0, 119.0, 187.0, 313.0, 594.0, 1202.0, 2590.0, 7228.0, 23952.0, 123938.0, 734041.0, 118745.0, 23332.0, 7019.0, 2600.0, 1122.0, 556.0, 300.0, 174.0, 116.0, 78.0, 59.0, 29.0, 22.0, 13.0, 10.0, 8.0, 7.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12335205078125, -0.11955547332763672, -0.11575889587402344, -0.11196231842041016, -0.10816574096679688, -0.1043691635131836, -0.10057258605957031, -0.09677600860595703, -0.09297943115234375, -0.08918285369873047, -0.08538627624511719, -0.0815896987915039, -0.07779312133789062, -0.07399654388427734, -0.07019996643066406, -0.06640338897705078, -0.0626068115234375, -0.05881023406982422, -0.05501365661621094, -0.051217079162597656, -0.047420501708984375, -0.043623924255371094, -0.03982734680175781, -0.03603076934814453, -0.03223419189453125, -0.02843761444091797, -0.024641036987304688, -0.020844459533691406, -0.017047882080078125, -0.013251304626464844, -0.009454727172851562, -0.005658149719238281, -0.001861572265625, 0.0019350051879882812, 0.0057315826416015625, 0.009528160095214844, 0.013324737548828125, 0.017121315002441406, 0.020917892456054688, 0.02471446990966797, 0.02851104736328125, 0.03230762481689453, 0.03610420227050781, 0.039900779724121094, 0.043697357177734375, 0.047493934631347656, 0.05129051208496094, 0.05508708953857422, 0.0588836669921875, 0.06268024444580078, 0.06647682189941406, 0.07027339935302734, 0.07406997680664062, 0.0778665542602539, 0.08166313171386719, 0.08545970916748047, 0.08925628662109375, 0.09305286407470703, 0.09684944152832031, 0.1006460189819336, 0.10444259643554688, 0.10823917388916016, 0.11203575134277344, 0.11583232879638672, 0.11962890625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 10.0, 4.0, 8.0, 8.0, 14.0, 29.0, 42.0, 39.0, 80.0, 110.0, 106.0, 109.0, 112.0, 84.0, 63.0, 53.0, 38.0, 29.0, 13.0, 23.0, 14.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.17626953125, -0.1721038818359375, -0.167938232421875, -0.1637725830078125, -0.15960693359375, -0.1554412841796875, -0.151275634765625, -0.1471099853515625, -0.1429443359375, -0.1387786865234375, -0.134613037109375, -0.1304473876953125, -0.12628173828125, -0.1221160888671875, -0.117950439453125, -0.1137847900390625, -0.109619140625, -0.1054534912109375, -0.101287841796875, -0.0971221923828125, -0.09295654296875, -0.0887908935546875, -0.084625244140625, -0.0804595947265625, -0.0762939453125, -0.0721282958984375, -0.067962646484375, -0.0637969970703125, -0.05963134765625, -0.0554656982421875, -0.051300048828125, -0.0471343994140625, -0.04296875, -0.0388031005859375, -0.034637451171875, -0.0304718017578125, -0.02630615234375, -0.0221405029296875, -0.017974853515625, -0.0138092041015625, -0.0096435546875, -0.0054779052734375, -0.001312255859375, 0.0028533935546875, 0.00701904296875, 0.0111846923828125, 0.015350341796875, 0.0195159912109375, 0.023681640625, 0.0278472900390625, 0.032012939453125, 0.0361785888671875, 0.04034423828125, 0.0445098876953125, 0.048675537109375, 0.0528411865234375, 0.0570068359375, 0.0611724853515625, 0.065338134765625, 0.0695037841796875, 0.07366943359375, 0.0778350830078125, 0.082000732421875, 0.0861663818359375, 0.09033203125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 15.0, 4.0, 18.0, 31.0, 77.0, 107.0, 232.0, 246.0, 106.0, 58.0, 34.0, 16.0, 16.0, 9.0, 5.0, 7.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.111006021499634, -3.0370190143585205, -2.963031768798828, -2.889044761657715, -2.8150575160980225, -2.741070508956909, -2.667083263397217, -2.5930962562561035, -2.519109010696411, -2.445122003555298, -2.3711347579956055, -2.297147750854492, -2.2231605052948, -2.1491734981536865, -2.075186252593994, -2.001199245452881, -1.927212119102478, -1.8532249927520752, -1.7792378664016724, -1.7052507400512695, -1.6312636137008667, -1.5572764873504639, -1.4832894802093506, -1.4093022346496582, -1.335315227508545, -1.261328101158142, -1.1873409748077393, -1.1133538484573364, -1.0393667221069336, -0.9653795957565308, -0.8913925290107727, -0.8174054026603699, -0.7434182167053223, -0.6694310903549194, -0.5954439640045166, -0.5214568376541138, -0.4474697411060333, -0.3734826147556305, -0.29949551820755005, -0.22550839185714722, -0.15152126550674438, -0.07753414660692215, -0.0035470277070999146, 0.07044008374214172, 0.14442721009254456, 0.2184143364429474, 0.29240143299102783, 0.36638855934143066, 0.4403756856918335, 0.5143628120422363, 0.5883499383926392, 0.662337064743042, 0.7363241910934448, 0.8103113174438477, 0.8842983841896057, 0.9582855105400085, 1.0322725772857666, 1.1062597036361694, 1.1802468299865723, 1.254233956336975, 1.328221082687378, 1.4022082090377808, 1.4761953353881836, 1.5501823425292969, 1.6241695880889893]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 11.0, 15.0, 10.0, 8.0, 13.0, 6.0, 16.0, 24.0, 30.0, 29.0, 23.0, 29.0, 20.0, 42.0, 41.0, 54.0, 75.0, 70.0, 81.0, 57.0, 41.0, 37.0, 26.0, 28.0, 23.0, 32.0, 19.0, 11.0, 14.0, 21.0, 10.0, 6.0, 9.0, 12.0, 7.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.3790278434753418, -1.3324027061462402, -1.2857776880264282, -1.2391525506973267, -1.192527413368225, -1.1459022760391235, -1.0992772579193115, -1.05265212059021, -1.0060269832611084, -0.9594019055366516, -0.91277676820755, -0.8661516904830933, -0.8195265531539917, -0.7729014754295349, -0.7262763977050781, -0.6796512603759766, -0.6330261826515198, -0.586401104927063, -0.5397759675979614, -0.49315088987350464, -0.4465257525444031, -0.3999006748199463, -0.3532755672931671, -0.30665045976638794, -0.26002535223960876, -0.2134002447128296, -0.16677513718605042, -0.12015004456043243, -0.07352493703365326, -0.026899829506874084, 0.019725263118743896, 0.06635037064552307, 0.11297547817230225, 0.15960058569908142, 0.2062256932258606, 0.2528507709503174, 0.29947590827941895, 0.34610098600387573, 0.3927260935306549, 0.4393512010574341, 0.48597630858421326, 0.5326014161109924, 0.5792264938354492, 0.6258516311645508, 0.6724767088890076, 0.7191018462181091, 0.7657269239425659, 0.8123520612716675, 0.8589771389961243, 0.905602216720581, 0.9522273540496826, 0.9988524317741394, 1.0454775094985962, 1.0921026468276978, 1.1387277841567993, 1.1853528022766113, 1.231977939605713, 1.2786030769348145, 1.3252280950546265, 1.371853232383728, 1.4184783697128296, 1.4651035070419312, 1.5117285251617432, 1.5583536624908447, 1.6049787998199463]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 9.0, 8.0, 10.0, 11.0, 17.0, 18.0, 36.0, 63.0, 99.0, 123.0, 266.0, 499.0, 865.0, 1824.0, 3897.0, 10196.0, 33266.0, 153906.0, 981703.0, 2357448.0, 527707.0, 87842.0, 21315.0, 7126.0, 3006.0, 1304.0, 700.0, 379.0, 235.0, 143.0, 80.0, 62.0, 30.0, 34.0, 15.0, 8.0, 6.0, 8.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1868896484375, -0.18160057067871094, -0.17631149291992188, -0.1710224151611328, -0.16573333740234375, -0.1604442596435547, -0.15515518188476562, -0.14986610412597656, -0.1445770263671875, -0.13928794860839844, -0.13399887084960938, -0.1287097930908203, -0.12342071533203125, -0.11813163757324219, -0.11284255981445312, -0.10755348205566406, -0.102264404296875, -0.09697532653808594, -0.09168624877929688, -0.08639717102050781, -0.08110809326171875, -0.07581901550292969, -0.07052993774414062, -0.06524085998535156, -0.0599517822265625, -0.05466270446777344, -0.049373626708984375, -0.04408454895019531, -0.03879547119140625, -0.03350639343261719, -0.028217315673828125, -0.022928237915039062, -0.01763916015625, -0.012350082397460938, -0.007061004638671875, -0.0017719268798828125, 0.00351715087890625, 0.008806228637695312, 0.014095306396484375, 0.019384384155273438, 0.0246734619140625, 0.029962539672851562, 0.035251617431640625, 0.04054069519042969, 0.04582977294921875, 0.05111885070800781, 0.056407928466796875, 0.06169700622558594, 0.066986083984375, 0.07227516174316406, 0.07756423950195312, 0.08285331726074219, 0.08814239501953125, 0.09343147277832031, 0.09872055053710938, 0.10400962829589844, 0.1092987060546875, 0.11458778381347656, 0.11987686157226562, 0.1251659393310547, 0.13045501708984375, 0.1357440948486328, 0.14103317260742188, 0.14632225036621094, 0.151611328125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 9.0, 9.0, 14.0, 7.0, 14.0, 15.0, 23.0, 19.0, 22.0, 32.0, 28.0, 35.0, 30.0, 28.0, 33.0, 32.0, 33.0, 38.0, 33.0, 47.0, 39.0, 30.0, 39.0, 42.0, 33.0, 36.0, 30.0, 29.0, 28.0, 20.0, 20.0, 21.0, 18.0, 11.0, 19.0, 10.0, 16.0, 6.0, 9.0, 7.0, 4.0, 7.0, 10.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09674072265625, -0.09358024597167969, -0.09041976928710938, -0.08725929260253906, -0.08409881591796875, -0.08093833923339844, -0.07777786254882812, -0.07461738586425781, -0.0714569091796875, -0.06829643249511719, -0.06513595581054688, -0.06197547912597656, -0.05881500244140625, -0.05565452575683594, -0.052494049072265625, -0.04933357238769531, -0.046173095703125, -0.04301261901855469, -0.039852142333984375, -0.03669166564941406, -0.03353118896484375, -0.030370712280273438, -0.027210235595703125, -0.024049758911132812, -0.0208892822265625, -0.017728805541992188, -0.014568328857421875, -0.011407852172851562, -0.00824737548828125, -0.0050868988037109375, -0.001926422119140625, 0.0012340545654296875, 0.00439453125, 0.0075550079345703125, 0.010715484619140625, 0.013875961303710938, 0.01703643798828125, 0.020196914672851562, 0.023357391357421875, 0.026517868041992188, 0.0296783447265625, 0.03283882141113281, 0.035999298095703125, 0.03915977478027344, 0.04232025146484375, 0.04548072814941406, 0.048641204833984375, 0.05180168151855469, 0.054962158203125, 0.05812263488769531, 0.061283111572265625, 0.06444358825683594, 0.06760406494140625, 0.07076454162597656, 0.07392501831054688, 0.07708549499511719, 0.0802459716796875, 0.08340644836425781, 0.08656692504882812, 0.08972740173339844, 0.09288787841796875, 0.09604835510253906, 0.09920883178710938, 0.10236930847167969, 0.10552978515625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 2.0, 11.0, 14.0, 16.0, 22.0, 46.0, 57.0, 80.0, 164.0, 290.0, 722.0, 2207.0, 9794.0, 76444.0, 2255857.0, 1771199.0, 64800.0, 8844.0, 2189.0, 758.0, 331.0, 161.0, 83.0, 51.0, 37.0, 31.0, 13.0, 9.0, 13.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.363037109375, -0.3516807556152344, -0.34032440185546875, -0.3289680480957031, -0.3176116943359375, -0.3062553405761719, -0.29489898681640625, -0.2835426330566406, -0.272186279296875, -0.2608299255371094, -0.24947357177734375, -0.23811721801757812, -0.2267608642578125, -0.21540451049804688, -0.20404815673828125, -0.19269180297851562, -0.18133544921875, -0.16997909545898438, -0.15862274169921875, -0.14726638793945312, -0.1359100341796875, -0.12455368041992188, -0.11319732666015625, -0.10184097290039062, -0.090484619140625, -0.07912826538085938, -0.06777191162109375, -0.056415557861328125, -0.0450592041015625, -0.033702850341796875, -0.02234649658203125, -0.010990142822265625, 0.0003662109375, 0.011722564697265625, 0.02307891845703125, 0.034435272216796875, 0.0457916259765625, 0.057147979736328125, 0.06850433349609375, 0.07986068725585938, 0.091217041015625, 0.10257339477539062, 0.11392974853515625, 0.12528610229492188, 0.1366424560546875, 0.14799880981445312, 0.15935516357421875, 0.17071151733398438, 0.18206787109375, 0.19342422485351562, 0.20478057861328125, 0.21613693237304688, 0.2274932861328125, 0.23884963989257812, 0.25020599365234375, 0.2615623474121094, 0.272918701171875, 0.2842750549316406, 0.29563140869140625, 0.3069877624511719, 0.3183441162109375, 0.3297004699707031, 0.34105682373046875, 0.3524131774902344, 0.36376953125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 14.0, 17.0, 33.0, 33.0, 41.0, 60.0, 74.0, 121.0, 155.0, 250.0, 398.0, 580.0, 630.0, 552.0, 353.0, 239.0, 148.0, 99.0, 77.0, 56.0, 42.0, 23.0, 11.0, 13.0, 12.0, 8.0, 9.0, 2.0, 6.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2025146484375, -0.1938915252685547, -0.18526840209960938, -0.17664527893066406, -0.16802215576171875, -0.15939903259277344, -0.15077590942382812, -0.1421527862548828, -0.1335296630859375, -0.12490653991699219, -0.11628341674804688, -0.10766029357910156, -0.09903717041015625, -0.09041404724121094, -0.08179092407226562, -0.07316780090332031, -0.064544677734375, -0.05592155456542969, -0.047298431396484375, -0.03867530822753906, -0.03005218505859375, -0.021429061889648438, -0.012805938720703125, -0.0041828155517578125, 0.0044403076171875, 0.013063430786132812, 0.021686553955078125, 0.030309677124023438, 0.03893280029296875, 0.04755592346191406, 0.056179046630859375, 0.06480216979980469, 0.07342529296875, 0.08204841613769531, 0.09067153930664062, 0.09929466247558594, 0.10791778564453125, 0.11654090881347656, 0.12516403198242188, 0.1337871551513672, 0.1424102783203125, 0.1510334014892578, 0.15965652465820312, 0.16827964782714844, 0.17690277099609375, 0.18552589416503906, 0.19414901733398438, 0.2027721405029297, 0.211395263671875, 0.2200183868408203, 0.22864151000976562, 0.23726463317871094, 0.24588775634765625, 0.25451087951660156, 0.2631340026855469, 0.2717571258544922, 0.2803802490234375, 0.2890033721923828, 0.2976264953613281, 0.30624961853027344, 0.31487274169921875, 0.32349586486816406, 0.3321189880371094, 0.3407421112060547, 0.349365234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 5.0, 6.0, 8.0, 28.0, 38.0, 58.0, 88.0, 105.0, 154.0, 123.0, 127.0, 90.0, 59.0, 35.0, 25.0, 12.0, 7.0, 3.0, 4.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2555696964263916, -2.1898317337036133, -2.124093532562256, -2.0583555698394775, -1.9926173686981201, -1.9268792867660522, -1.8611412048339844, -1.795403242111206, -1.7296650409698486, -1.6639269590377808, -1.598188877105713, -1.532450795173645, -1.4667127132415771, -1.4009746313095093, -1.3352365493774414, -1.269498586654663, -1.2037605047225952, -1.1380224227905273, -1.0722843408584595, -1.0065462589263916, -0.9408081769943237, -0.8750700950622559, -0.8093320727348328, -0.7435939908027649, -0.677855908870697, -0.6121178269386292, -0.5463797450065613, -0.4806416928768158, -0.4149036109447479, -0.34916552901268005, -0.28342747688293457, -0.2176893949508667, -0.15195119380950928, -0.086213119328022, -0.02047504484653473, 0.04526302218437195, 0.11100110411643982, 0.1767391860485077, 0.24247723817825317, 0.30821532011032104, 0.3739534020423889, 0.4396914839744568, 0.5054295659065247, 0.5711675882339478, 0.6369056701660156, 0.7026437520980835, 0.7683818340301514, 0.8341199159622192, 0.8998579978942871, 0.965596079826355, 1.0313341617584229, 1.0970722436904907, 1.1628103256225586, 1.2285484075546265, 1.2942864894866943, 1.3600244522094727, 1.42576265335083, 1.491500735282898, 1.5572388172149658, 1.6229768991470337, 1.6887149810791016, 1.7544530630111694, 1.8201911449432373, 1.8859291076660156, 1.9516671895980835]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 8.0, 8.0, 20.0, 13.0, 37.0, 26.0, 37.0, 43.0, 55.0, 63.0, 57.0, 67.0, 58.0, 87.0, 65.0, 52.0, 56.0, 43.0, 49.0, 38.0, 27.0, 23.0, 16.0, 16.0, 12.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3563575744628906, -1.3047322034835815, -1.253106713294983, -1.2014813423156738, -1.1498559713363647, -1.0982306003570557, -1.046605110168457, -0.994979739189148, -0.9433543086051941, -0.8917288780212402, -0.8401035070419312, -0.7884780764579773, -0.7368526458740234, -0.6852272748947144, -0.6336018443107605, -0.5819764137268066, -0.5303510427474976, -0.4787256419658661, -0.4271002411842346, -0.37547481060028076, -0.3238494098186493, -0.2722240090370178, -0.22059857845306396, -0.1689731776714325, -0.11734777688980103, -0.06572236865758896, -0.014096960425376892, 0.03752845525741577, 0.08915385603904724, 0.1407792568206787, 0.19240468740463257, 0.24403008818626404, 0.2956554889678955, 0.347280889749527, 0.39890629053115845, 0.4505317211151123, 0.5021570920944214, 0.5537825226783752, 0.6054079532623291, 0.6570333242416382, 0.708658754825592, 0.7602841854095459, 0.811909556388855, 0.8635349869728088, 0.9151604175567627, 0.9667857885360718, 1.0184111595153809, 1.0700366497039795, 1.1216620206832886, 1.1732873916625977, 1.2249128818511963, 1.2765382528305054, 1.3281636238098145, 1.379789113998413, 1.4314144849777222, 1.4830398559570312, 1.5346653461456299, 1.586290717124939, 1.6379162073135376, 1.6895415782928467, 1.7411669492721558, 1.7927923202514648, 1.8444178104400635, 1.8960431814193726, 1.9476685523986816]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 5.0, 7.0, 6.0, 14.0, 14.0, 26.0, 32.0, 50.0, 55.0, 100.0, 121.0, 159.0, 295.0, 510.0, 714.0, 1224.0, 2232.0, 4188.0, 8322.0, 18460.0, 44435.0, 132203.0, 398092.0, 289317.0, 87478.0, 32535.0, 13706.0, 6495.0, 3249.0, 1676.0, 1019.0, 609.0, 389.0, 267.0, 173.0, 119.0, 75.0, 62.0, 38.0, 35.0, 18.0, 9.0, 7.0, 4.0, 4.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14699935913085938, -0.14189910888671875, -0.13679885864257812, -0.1316986083984375, -0.12659835815429688, -0.12149810791015625, -0.11639785766601562, -0.111297607421875, -0.10619735717773438, -0.10109710693359375, -0.09599685668945312, -0.0908966064453125, -0.08579635620117188, -0.08069610595703125, -0.07559585571289062, -0.07049560546875, -0.06539535522460938, -0.06029510498046875, -0.055194854736328125, -0.0500946044921875, -0.044994354248046875, -0.03989410400390625, -0.034793853759765625, -0.029693603515625, -0.024593353271484375, -0.01949310302734375, -0.014392852783203125, -0.0092926025390625, -0.004192352294921875, 0.00090789794921875, 0.006008148193359375, 0.0111083984375, 0.016208648681640625, 0.02130889892578125, 0.026409149169921875, 0.0315093994140625, 0.036609649658203125, 0.04170989990234375, 0.046810150146484375, 0.051910400390625, 0.057010650634765625, 0.06211090087890625, 0.06721115112304688, 0.0723114013671875, 0.07741165161132812, 0.08251190185546875, 0.08761215209960938, 0.09271240234375, 0.09781265258789062, 0.10291290283203125, 0.10801315307617188, 0.1131134033203125, 0.11821365356445312, 0.12331390380859375, 0.12841415405273438, 0.133514404296875, 0.13861465454101562, 0.14371490478515625, 0.14881515502929688, 0.1539154052734375, 0.15901565551757812, 0.16411590576171875, 0.16921615600585938, 0.17431640625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 6.0, 5.0, 7.0, 7.0, 7.0, 10.0, 20.0, 9.0, 15.0, 21.0, 22.0, 21.0, 25.0, 41.0, 41.0, 45.0, 37.0, 39.0, 45.0, 54.0, 47.0, 47.0, 53.0, 47.0, 34.0, 36.0, 32.0, 26.0, 32.0, 21.0, 26.0, 25.0, 15.0, 16.0, 15.0, 14.0, 11.0, 11.0, 5.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.12103271484375, -0.1172018051147461, -0.11337089538574219, -0.10953998565673828, -0.10570907592773438, -0.10187816619873047, -0.09804725646972656, -0.09421634674072266, -0.09038543701171875, -0.08655452728271484, -0.08272361755371094, -0.07889270782470703, -0.07506179809570312, -0.07123088836669922, -0.06739997863769531, -0.0635690689086914, -0.0597381591796875, -0.055907249450683594, -0.05207633972167969, -0.04824542999267578, -0.044414520263671875, -0.04058361053466797, -0.03675270080566406, -0.032921791076660156, -0.02909088134765625, -0.025259971618652344, -0.021429061889648438, -0.01759815216064453, -0.013767242431640625, -0.009936332702636719, -0.0061054229736328125, -0.0022745132446289062, 0.001556396484375, 0.005387306213378906, 0.009218215942382812, 0.013049125671386719, 0.016880035400390625, 0.02071094512939453, 0.024541854858398438, 0.028372764587402344, 0.03220367431640625, 0.036034584045410156, 0.03986549377441406, 0.04369640350341797, 0.047527313232421875, 0.05135822296142578, 0.05518913269042969, 0.059020042419433594, 0.0628509521484375, 0.0666818618774414, 0.07051277160644531, 0.07434368133544922, 0.07817459106445312, 0.08200550079345703, 0.08583641052246094, 0.08966732025146484, 0.09349822998046875, 0.09732913970947266, 0.10116004943847656, 0.10499095916748047, 0.10882186889648438, 0.11265277862548828, 0.11648368835449219, 0.1203145980834961, 0.1241455078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 8.0, 4.0, 4.0, 7.0, 17.0, 23.0, 45.0, 51.0, 83.0, 180.0, 290.0, 514.0, 1239.0, 3912.0, 23690.0, 757520.0, 241553.0, 14411.0, 2958.0, 959.0, 455.0, 237.0, 135.0, 89.0, 51.0, 44.0, 26.0, 17.0, 8.0, 11.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366943359375, -0.3515815734863281, -0.33621978759765625, -0.3208580017089844, -0.3054962158203125, -0.2901344299316406, -0.27477264404296875, -0.2594108581542969, -0.244049072265625, -0.22868728637695312, -0.21332550048828125, -0.19796371459960938, -0.1826019287109375, -0.16724014282226562, -0.15187835693359375, -0.13651657104492188, -0.12115478515625, -0.10579299926757812, -0.09043121337890625, -0.07506942749023438, -0.0597076416015625, -0.044345855712890625, -0.02898406982421875, -0.013622283935546875, 0.001739501953125, 0.017101287841796875, 0.03246307373046875, 0.047824859619140625, 0.0631866455078125, 0.07854843139648438, 0.09391021728515625, 0.10927200317382812, 0.1246337890625, 0.13999557495117188, 0.15535736083984375, 0.17071914672851562, 0.1860809326171875, 0.20144271850585938, 0.21680450439453125, 0.23216629028320312, 0.247528076171875, 0.2628898620605469, 0.27825164794921875, 0.2936134338378906, 0.3089752197265625, 0.3243370056152344, 0.33969879150390625, 0.3550605773925781, 0.37042236328125, 0.3857841491699219, 0.40114593505859375, 0.4165077209472656, 0.4318695068359375, 0.4472312927246094, 0.46259307861328125, 0.4779548645019531, 0.493316650390625, 0.5086784362792969, 0.5240402221679688, 0.5394020080566406, 0.5547637939453125, 0.5701255798339844, 0.5854873657226562, 0.6008491516113281, 0.6162109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 7.0, 7.0, 15.0, 17.0, 27.0, 28.0, 22.0, 47.0, 45.0, 52.0, 50.0, 57.0, 79.0, 64.0, 68.0, 67.0, 65.0, 63.0, 42.0, 37.0, 24.0, 22.0, 19.0, 17.0, 7.0, 10.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.488525390625, -0.4692726135253906, -0.45001983642578125, -0.4307670593261719, -0.4115142822265625, -0.3922615051269531, -0.37300872802734375, -0.3537559509277344, -0.334503173828125, -0.3152503967285156, -0.29599761962890625, -0.2767448425292969, -0.2574920654296875, -0.23823928833007812, -0.21898651123046875, -0.19973373413085938, -0.18048095703125, -0.16122817993164062, -0.14197540283203125, -0.12272262573242188, -0.1034698486328125, -0.08421707153320312, -0.06496429443359375, -0.045711517333984375, -0.026458740234375, -0.007205963134765625, 0.01204681396484375, 0.031299591064453125, 0.0505523681640625, 0.06980514526367188, 0.08905792236328125, 0.10831069946289062, 0.1275634765625, 0.14681625366210938, 0.16606903076171875, 0.18532180786132812, 0.2045745849609375, 0.22382736206054688, 0.24308013916015625, 0.2623329162597656, 0.281585693359375, 0.3008384704589844, 0.32009124755859375, 0.3393440246582031, 0.3585968017578125, 0.3778495788574219, 0.39710235595703125, 0.4163551330566406, 0.43560791015625, 0.4548606872558594, 0.47411346435546875, 0.4933662414550781, 0.5126190185546875, 0.5318717956542969, 0.5511245727539062, 0.5703773498535156, 0.589630126953125, 0.6088829040527344, 0.6281356811523438, 0.6473884582519531, 0.6666412353515625, 0.6858940124511719, 0.7051467895507812, 0.7243995666503906, 0.74365234375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 5.0, 3.0, 5.0, 15.0, 16.0, 22.0, 51.0, 69.0, 115.0, 147.0, 280.0, 534.0, 1097.0, 2373.0, 5997.0, 20126.0, 120246.0, 785243.0, 86480.0, 16494.0, 5191.0, 2049.0, 899.0, 467.0, 238.0, 140.0, 86.0, 67.0, 34.0, 23.0, 13.0, 9.0, 9.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1204833984375, -0.1172637939453125, -0.114044189453125, -0.1108245849609375, -0.10760498046875, -0.1043853759765625, -0.101165771484375, -0.0979461669921875, -0.0947265625, -0.0915069580078125, -0.088287353515625, -0.0850677490234375, -0.08184814453125, -0.0786285400390625, -0.075408935546875, -0.0721893310546875, -0.0689697265625, -0.0657501220703125, -0.062530517578125, -0.0593109130859375, -0.05609130859375, -0.0528717041015625, -0.049652099609375, -0.0464324951171875, -0.043212890625, -0.0399932861328125, -0.036773681640625, -0.0335540771484375, -0.03033447265625, -0.0271148681640625, -0.023895263671875, -0.0206756591796875, -0.0174560546875, -0.0142364501953125, -0.011016845703125, -0.0077972412109375, -0.00457763671875, -0.0013580322265625, 0.001861572265625, 0.0050811767578125, 0.00830078125, 0.0115203857421875, 0.014739990234375, 0.0179595947265625, 0.02117919921875, 0.0243988037109375, 0.027618408203125, 0.0308380126953125, 0.0340576171875, 0.0372772216796875, 0.040496826171875, 0.0437164306640625, 0.04693603515625, 0.0501556396484375, 0.053375244140625, 0.0565948486328125, 0.059814453125, 0.0630340576171875, 0.066253662109375, 0.0694732666015625, 0.07269287109375, 0.0759124755859375, 0.079132080078125, 0.0823516845703125, 0.0855712890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 8.0, 4.0, 3.0, 3.0, 5.0, 11.0, 13.0, 14.0, 15.0, 24.0, 29.0, 59.0, 84.0, 95.0, 105.0, 97.0, 103.0, 84.0, 57.0, 41.0, 33.0, 27.0, 12.0, 17.0, 17.0, 8.0, 6.0, 11.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.225969314575195e-05, -4.0903687477111816e-05, -3.954768180847168e-05, -3.819167613983154e-05, -3.6835670471191406e-05, -3.547966480255127e-05, -3.412365913391113e-05, -3.2767653465270996e-05, -3.141164779663086e-05, -3.0055642127990723e-05, -2.8699636459350586e-05, -2.734363079071045e-05, -2.5987625122070312e-05, -2.4631619453430176e-05, -2.327561378479004e-05, -2.1919608116149902e-05, -2.0563602447509766e-05, -1.920759677886963e-05, -1.7851591110229492e-05, -1.6495585441589355e-05, -1.5139579772949219e-05, -1.3783574104309082e-05, -1.2427568435668945e-05, -1.1071562767028809e-05, -9.715557098388672e-06, -8.359551429748535e-06, -7.0035457611083984e-06, -5.647540092468262e-06, -4.291534423828125e-06, -2.9355287551879883e-06, -1.5795230865478516e-06, -2.2351741790771484e-07, 1.1324882507324219e-06, 2.4884939193725586e-06, 3.844499588012695e-06, 5.200505256652832e-06, 6.556510925292969e-06, 7.912516593933105e-06, 9.268522262573242e-06, 1.0624527931213379e-05, 1.1980533599853516e-05, 1.3336539268493652e-05, 1.4692544937133789e-05, 1.6048550605773926e-05, 1.7404556274414062e-05, 1.87605619430542e-05, 2.0116567611694336e-05, 2.1472573280334473e-05, 2.282857894897461e-05, 2.4184584617614746e-05, 2.5540590286254883e-05, 2.689659595489502e-05, 2.8252601623535156e-05, 2.9608607292175293e-05, 3.096461296081543e-05, 3.2320618629455566e-05, 3.36766242980957e-05, 3.503262996673584e-05, 3.6388635635375977e-05, 3.774464130401611e-05, 3.910064697265625e-05, 4.045665264129639e-05, 4.1812658309936523e-05, 4.316866397857666e-05, 4.45246696472168e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 6.0, 10.0, 8.0, 11.0, 22.0, 24.0, 28.0, 44.0, 72.0, 108.0, 195.0, 325.0, 579.0, 1134.0, 2444.0, 5874.0, 19289.0, 83723.0, 697055.0, 185256.0, 35777.0, 9812.0, 3488.0, 1494.0, 703.0, 374.0, 256.0, 150.0, 89.0, 54.0, 36.0, 34.0, 21.0, 15.0, 6.0, 17.0, 4.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0810546875, -0.0782327651977539, -0.07541084289550781, -0.07258892059326172, -0.06976699829101562, -0.06694507598876953, -0.06412315368652344, -0.061301231384277344, -0.05847930908203125, -0.055657386779785156, -0.05283546447753906, -0.05001354217529297, -0.047191619873046875, -0.04436969757080078, -0.04154777526855469, -0.038725852966308594, -0.0359039306640625, -0.033082008361816406, -0.030260086059570312, -0.02743816375732422, -0.024616241455078125, -0.02179431915283203, -0.018972396850585938, -0.016150474548339844, -0.01332855224609375, -0.010506629943847656, -0.0076847076416015625, -0.004862785339355469, -0.002040863037109375, 0.0007810592651367188, 0.0036029815673828125, 0.006424903869628906, 0.009246826171875, 0.012068748474121094, 0.014890670776367188, 0.01771259307861328, 0.020534515380859375, 0.02335643768310547, 0.026178359985351562, 0.029000282287597656, 0.03182220458984375, 0.034644126892089844, 0.03746604919433594, 0.04028797149658203, 0.043109893798828125, 0.04593181610107422, 0.04875373840332031, 0.051575660705566406, 0.0543975830078125, 0.057219505310058594, 0.06004142761230469, 0.06286334991455078, 0.06568527221679688, 0.06850719451904297, 0.07132911682128906, 0.07415103912353516, 0.07697296142578125, 0.07979488372802734, 0.08261680603027344, 0.08543872833251953, 0.08826065063476562, 0.09108257293701172, 0.09390449523925781, 0.0967264175415039, 0.09954833984375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 7.0, 5.0, 5.0, 7.0, 11.0, 14.0, 11.0, 15.0, 17.0, 29.0, 22.0, 36.0, 51.0, 55.0, 65.0, 99.0, 92.0, 94.0, 73.0, 57.0, 51.0, 38.0, 20.0, 29.0, 13.0, 16.0, 15.0, 14.0, 10.0, 8.0, 5.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0838623046875, -0.0811929702758789, -0.07852363586425781, -0.07585430145263672, -0.07318496704101562, -0.07051563262939453, -0.06784629821777344, -0.06517696380615234, -0.06250762939453125, -0.059838294982910156, -0.05716896057128906, -0.05449962615966797, -0.051830291748046875, -0.04916095733642578, -0.04649162292480469, -0.043822288513183594, -0.0411529541015625, -0.038483619689941406, -0.03581428527832031, -0.03314495086669922, -0.030475616455078125, -0.02780628204345703, -0.025136947631835938, -0.022467613220214844, -0.01979827880859375, -0.017128944396972656, -0.014459609985351562, -0.011790275573730469, -0.009120941162109375, -0.006451606750488281, -0.0037822723388671875, -0.0011129379272460938, 0.001556396484375, 0.004225730895996094, 0.0068950653076171875, 0.009564399719238281, 0.012233734130859375, 0.014903068542480469, 0.017572402954101562, 0.020241737365722656, 0.02291107177734375, 0.025580406188964844, 0.028249740600585938, 0.03091907501220703, 0.033588409423828125, 0.03625774383544922, 0.03892707824707031, 0.041596412658691406, 0.0442657470703125, 0.046935081481933594, 0.04960441589355469, 0.05227375030517578, 0.054943084716796875, 0.05761241912841797, 0.06028175354003906, 0.06295108795166016, 0.06562042236328125, 0.06828975677490234, 0.07095909118652344, 0.07362842559814453, 0.07629776000976562, 0.07896709442138672, 0.08163642883300781, 0.0843057632446289, 0.08697509765625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 4.0, 5.0, 5.0, 22.0, 29.0, 119.0, 339.0, 325.0, 94.0, 31.0, 16.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.468199729919434, -4.3328423500061035, -4.197485446929932, -4.062128067016602, -3.9267709255218506, -3.7914137840270996, -3.6560564041137695, -3.5206992626190186, -3.3853421211242676, -3.2499849796295166, -3.1146275997161865, -2.9792704582214355, -2.8439133167266846, -2.7085561752319336, -2.5731987953186035, -2.4378416538238525, -2.3024842739105225, -2.1671271324157715, -2.0317697525024414, -1.8964126110076904, -1.7610554695129395, -1.625698208808899, -1.4903409481048584, -1.3549838066101074, -1.219626545906067, -1.0842692852020264, -0.9489121437072754, -0.8135548830032349, -0.6781976819038391, -0.5428404808044434, -0.40748322010040283, -0.2721260190010071, -0.13676881790161133, -0.0014116019010543823, 0.13394561409950256, 0.2693028450012207, 0.40466004610061646, 0.5400172472000122, 0.6753745079040527, 0.8107317090034485, 0.9460889101028442, 1.0814461708068848, 1.2168033123016357, 1.3521605730056763, 1.4875178337097168, 1.6228749752044678, 1.7582322359085083, 1.8935894966125488, 2.0289466381073, 2.164303779602051, 2.299661159515381, 2.435018301010132, 2.570375442504883, 2.705732822418213, 2.841089963912964, 2.976447105407715, 3.111804485321045, 3.247161626815796, 3.382519006729126, 3.517876148223877, 3.653233289718628, 3.788590431213379, 3.923947811126709, 4.059305191040039, 4.194662094116211]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 7.0, 9.0, 11.0, 9.0, 15.0, 16.0, 15.0, 10.0, 13.0, 23.0, 13.0, 40.0, 32.0, 26.0, 46.0, 48.0, 77.0, 98.0, 91.0, 78.0, 48.0, 19.0, 32.0, 23.0, 27.0, 27.0, 24.0, 13.0, 16.0, 9.0, 16.0, 13.0, 8.0, 5.0, 7.0, 8.0, 2.0, 7.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5876935720443726, -1.5325590372085571, -1.4774245023727417, -1.4222898483276367, -1.3671553134918213, -1.3120207786560059, -1.2568862438201904, -1.201751708984375, -1.1466171741485596, -1.0914826393127441, -1.0363481044769287, -0.9812135100364685, -0.9260789752006531, -0.8709443807601929, -0.8158098459243774, -0.760675311088562, -0.7055407166481018, -0.6504061818122864, -0.5952715873718262, -0.5401370525360107, -0.4850025177001953, -0.4298679530620575, -0.3747333884239197, -0.31959885358810425, -0.26446428894996643, -0.2093297392129898, -0.15419518947601318, -0.09906062483787537, -0.04392607510089874, 0.01120847463607788, 0.0663430392742157, 0.12147757411003113, 0.17661213874816895, 0.23174668848514557, 0.2868812382221222, 0.34201580286026, 0.39715033769607544, 0.45228490233421326, 0.5074194669723511, 0.5625540018081665, 0.6176885366439819, 0.6728230714797974, 0.7279576659202576, 0.783092200756073, 0.8382267355918884, 0.8933613300323486, 0.9484958648681641, 1.0036303997039795, 1.058764934539795, 1.1138994693756104, 1.1690340042114258, 1.2241685390472412, 1.2793031930923462, 1.3344377279281616, 1.389572262763977, 1.4447067975997925, 1.4998414516448975, 1.554975986480713, 1.6101105213165283, 1.6652450561523438, 1.7203797101974487, 1.7755142450332642, 1.8306487798690796, 1.885783314704895, 1.9409178495407104]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 4.0, 4.0, 12.0, 9.0, 22.0, 28.0, 38.0, 49.0, 111.0, 135.0, 228.0, 337.0, 578.0, 922.0, 1526.0, 2530.0, 4625.0, 8723.0, 17166.0, 38454.0, 95556.0, 267121.0, 755823.0, 1514931.0, 945798.0, 335102.0, 115847.0, 45779.0, 20246.0, 9859.0, 5173.0, 2876.0, 1678.0, 1076.0, 685.0, 427.0, 283.0, 163.0, 101.0, 77.0, 54.0, 42.0, 31.0, 20.0, 3.0, 6.0, 14.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1583251953125, -0.15346908569335938, -0.14861297607421875, -0.14375686645507812, -0.1389007568359375, -0.13404464721679688, -0.12918853759765625, -0.12433242797851562, -0.119476318359375, -0.11462020874023438, -0.10976409912109375, -0.10490798950195312, -0.1000518798828125, -0.09519577026367188, -0.09033966064453125, -0.08548355102539062, -0.08062744140625, -0.07577133178710938, -0.07091522216796875, -0.06605911254882812, -0.0612030029296875, -0.056346893310546875, -0.05149078369140625, -0.046634674072265625, -0.041778564453125, -0.036922454833984375, -0.03206634521484375, -0.027210235595703125, -0.0223541259765625, -0.017498016357421875, -0.01264190673828125, -0.007785797119140625, -0.0029296875, 0.001926422119140625, 0.00678253173828125, 0.011638641357421875, 0.0164947509765625, 0.021350860595703125, 0.02620697021484375, 0.031063079833984375, 0.035919189453125, 0.040775299072265625, 0.04563140869140625, 0.050487518310546875, 0.0553436279296875, 0.060199737548828125, 0.06505584716796875, 0.06991195678710938, 0.07476806640625, 0.07962417602539062, 0.08448028564453125, 0.08933639526367188, 0.0941925048828125, 0.09904861450195312, 0.10390472412109375, 0.10876083374023438, 0.113616943359375, 0.11847305297851562, 0.12332916259765625, 0.12818527221679688, 0.1330413818359375, 0.13789749145507812, 0.14275360107421875, 0.14760971069335938, 0.1524658203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 7.0, 3.0, 4.0, 13.0, 11.0, 17.0, 16.0, 19.0, 17.0, 34.0, 21.0, 31.0, 33.0, 28.0, 32.0, 42.0, 44.0, 52.0, 49.0, 41.0, 46.0, 58.0, 41.0, 34.0, 32.0, 40.0, 30.0, 28.0, 31.0, 28.0, 14.0, 18.0, 19.0, 9.0, 11.0, 13.0, 8.0, 11.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11981201171875, -0.11605548858642578, -0.11229896545410156, -0.10854244232177734, -0.10478591918945312, -0.1010293960571289, -0.09727287292480469, -0.09351634979248047, -0.08975982666015625, -0.08600330352783203, -0.08224678039550781, -0.0784902572631836, -0.07473373413085938, -0.07097721099853516, -0.06722068786621094, -0.06346416473388672, -0.0597076416015625, -0.05595111846923828, -0.05219459533691406, -0.048438072204589844, -0.044681549072265625, -0.040925025939941406, -0.03716850280761719, -0.03341197967529297, -0.02965545654296875, -0.02589893341064453, -0.022142410278320312, -0.018385887145996094, -0.014629364013671875, -0.010872840881347656, -0.0071163177490234375, -0.0033597946166992188, 0.000396728515625, 0.004153251647949219, 0.007909774780273438, 0.011666297912597656, 0.015422821044921875, 0.019179344177246094, 0.022935867309570312, 0.02669239044189453, 0.03044891357421875, 0.03420543670654297, 0.03796195983886719, 0.041718482971191406, 0.045475006103515625, 0.049231529235839844, 0.05298805236816406, 0.05674457550048828, 0.0605010986328125, 0.06425762176513672, 0.06801414489746094, 0.07177066802978516, 0.07552719116210938, 0.0792837142944336, 0.08304023742675781, 0.08679676055908203, 0.09055328369140625, 0.09430980682373047, 0.09806632995605469, 0.1018228530883789, 0.10557937622070312, 0.10933589935302734, 0.11309242248535156, 0.11684894561767578, 0.12060546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 8.0, 4.0, 10.0, 14.0, 12.0, 19.0, 44.0, 57.0, 88.0, 116.0, 199.0, 353.0, 661.0, 1634.0, 6828.0, 106835.0, 3953655.0, 113626.0, 6763.0, 1736.0, 696.0, 365.0, 194.0, 124.0, 68.0, 55.0, 33.0, 24.0, 17.0, 9.0, 7.0, 10.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.892578125, -0.8642501831054688, -0.8359222412109375, -0.8075942993164062, -0.779266357421875, -0.7509384155273438, -0.7226104736328125, -0.6942825317382812, -0.66595458984375, -0.6376266479492188, -0.6092987060546875, -0.5809707641601562, -0.552642822265625, -0.5243148803710938, -0.4959869384765625, -0.46765899658203125, -0.4393310546875, -0.41100311279296875, -0.3826751708984375, -0.35434722900390625, -0.326019287109375, -0.29769134521484375, -0.2693634033203125, -0.24103546142578125, -0.21270751953125, -0.18437957763671875, -0.1560516357421875, -0.12772369384765625, -0.099395751953125, -0.07106781005859375, -0.0427398681640625, -0.01441192626953125, 0.013916015625, 0.04224395751953125, 0.0705718994140625, 0.09889984130859375, 0.127227783203125, 0.15555572509765625, 0.1838836669921875, 0.21221160888671875, 0.24053955078125, 0.26886749267578125, 0.2971954345703125, 0.32552337646484375, 0.353851318359375, 0.38217926025390625, 0.4105072021484375, 0.43883514404296875, 0.4671630859375, 0.49549102783203125, 0.5238189697265625, 0.5521469116210938, 0.580474853515625, 0.6088027954101562, 0.6371307373046875, 0.6654586791992188, 0.69378662109375, 0.7221145629882812, 0.7504425048828125, 0.7787704467773438, 0.807098388671875, 0.8354263305664062, 0.8637542724609375, 0.8920822143554688, 0.92041015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 7.0, 11.0, 13.0, 16.0, 16.0, 33.0, 46.0, 62.0, 85.0, 110.0, 152.0, 230.0, 317.0, 441.0, 575.0, 588.0, 383.0, 289.0, 196.0, 152.0, 96.0, 77.0, 51.0, 25.0, 23.0, 20.0, 9.0, 11.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40869140625, -0.3945655822753906, -0.38043975830078125, -0.3663139343261719, -0.3521881103515625, -0.3380622863769531, -0.32393646240234375, -0.3098106384277344, -0.295684814453125, -0.2815589904785156, -0.26743316650390625, -0.2533073425292969, -0.2391815185546875, -0.22505569458007812, -0.21092987060546875, -0.19680404663085938, -0.18267822265625, -0.16855239868164062, -0.15442657470703125, -0.14030075073242188, -0.1261749267578125, -0.11204910278320312, -0.09792327880859375, -0.08379745483398438, -0.069671630859375, -0.055545806884765625, -0.04141998291015625, -0.027294158935546875, -0.0131683349609375, 0.000957489013671875, 0.01508331298828125, 0.029209136962890625, 0.0433349609375, 0.057460784912109375, 0.07158660888671875, 0.08571243286132812, 0.0998382568359375, 0.11396408081054688, 0.12808990478515625, 0.14221572875976562, 0.156341552734375, 0.17046737670898438, 0.18459320068359375, 0.19871902465820312, 0.2128448486328125, 0.22697067260742188, 0.24109649658203125, 0.2552223205566406, 0.26934814453125, 0.2834739685058594, 0.29759979248046875, 0.3117256164550781, 0.3258514404296875, 0.3399772644042969, 0.35410308837890625, 0.3682289123535156, 0.382354736328125, 0.3964805603027344, 0.41060638427734375, 0.4247322082519531, 0.4388580322265625, 0.4529838562011719, 0.46710968017578125, 0.4812355041503906, 0.495361328125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 9.0, 16.0, 26.0, 22.0, 52.0, 85.0, 139.0, 162.0, 157.0, 127.0, 85.0, 44.0, 27.0, 12.0, 4.0, 13.0, 5.0, 1.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5635986328125, -6.395124912261963, -6.226650714874268, -6.0581769943237305, -5.889702796936035, -5.721229076385498, -5.552755355834961, -5.384281158447266, -5.2158074378967285, -5.047333717346191, -4.878859519958496, -4.710385799407959, -4.541912078857422, -4.373437881469727, -4.2049641609191895, -4.036490440368652, -3.868016242980957, -3.699542284011841, -3.5310683250427246, -3.3625946044921875, -3.1941206455230713, -3.025646686553955, -2.857172966003418, -2.6886990070343018, -2.5202250480651855, -2.3517510890960693, -2.183277130126953, -2.014803409576416, -1.8463294506072998, -1.6778554916381836, -1.509381651878357, -1.3409078121185303, -1.172433853149414, -1.0039598941802979, -0.8354860544204712, -0.6670121550559998, -0.4985382556915283, -0.3300643563270569, -0.16159045696258545, 0.006883382797241211, 0.17535734176635742, 0.34383124113082886, 0.5123051404953003, 0.6807790398597717, 0.8492529392242432, 1.0177268981933594, 1.186200737953186, 1.3546745777130127, 1.523148536682129, 1.6916224956512451, 1.8600963354110718, 2.0285701751708984, 2.1970441341400146, 2.365518093109131, 2.533991813659668, 2.702465772628784, 2.8709397315979004, 3.0394136905670166, 3.207887649536133, 3.37636137008667, 3.544835329055786, 3.7133092880249023, 3.8817830085754395, 4.050256729125977, 4.218730926513672]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 2.0, 5.0, 5.0, 8.0, 5.0, 9.0, 15.0, 14.0, 10.0, 21.0, 23.0, 15.0, 27.0, 26.0, 29.0, 33.0, 36.0, 35.0, 23.0, 31.0, 54.0, 42.0, 40.0, 48.0, 45.0, 36.0, 33.0, 36.0, 27.0, 26.0, 23.0, 23.0, 23.0, 25.0, 14.0, 24.0, 15.0, 13.0, 16.0, 7.0, 10.0, 12.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.9179359674453735, -1.856309413909912, -1.7946829795837402, -1.7330564260482788, -1.6714298725128174, -1.6098034381866455, -1.548176884651184, -1.4865503311157227, -1.4249238967895508, -1.3632973432540894, -1.3016709089279175, -1.240044355392456, -1.1784179210662842, -1.1167913675308228, -1.0551648139953613, -0.9935383200645447, -0.931911826133728, -0.8702853322029114, -0.8086588382720947, -0.7470322847366333, -0.6854057908058167, -0.623779296875, -0.5621527433395386, -0.5005262494087219, -0.4388997554779053, -0.3772732615470886, -0.3156467378139496, -0.25402021408081055, -0.1923937201499939, -0.13076722621917725, -0.06914070248603821, -0.00751417875289917, 0.05411243438720703, 0.11573894321918488, 0.17736545205116272, 0.23899196088314056, 0.3006184697151184, 0.36224496364593506, 0.4238714873790741, 0.48549801111221313, 0.5471245050430298, 0.6087509989738464, 0.6703774929046631, 0.7320040464401245, 0.7936305403709412, 0.8552570343017578, 0.9168835878372192, 0.9785100817680359, 1.0401365756988525, 1.101763129234314, 1.1633895635604858, 1.2250161170959473, 1.2866425514221191, 1.3482691049575806, 1.409895658493042, 1.4715220928192139, 1.5331486463546753, 1.5947751998901367, 1.6564016342163086, 1.71802818775177, 1.7796547412872314, 1.8412811756134033, 1.9029077291488647, 1.9645342826843262, 2.026160717010498]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 11.0, 12.0, 9.0, 18.0, 27.0, 53.0, 77.0, 136.0, 232.0, 433.0, 716.0, 1474.0, 2799.0, 6116.0, 15735.0, 49248.0, 223800.0, 588728.0, 110668.0, 28949.0, 10368.0, 4352.0, 2042.0, 1126.0, 568.0, 329.0, 189.0, 112.0, 85.0, 49.0, 31.0, 15.0, 8.0, 13.0, 4.0, 7.0, 4.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.1764507293701172, -0.16918563842773438, -0.16192054748535156, -0.15465545654296875, -0.14739036560058594, -0.14012527465820312, -0.1328601837158203, -0.1255950927734375, -0.11833000183105469, -0.11106491088867188, -0.10379981994628906, -0.09653472900390625, -0.08926963806152344, -0.08200454711914062, -0.07473945617675781, -0.067474365234375, -0.06020927429199219, -0.052944183349609375, -0.04567909240722656, -0.03841400146484375, -0.031148910522460938, -0.023883819580078125, -0.016618728637695312, -0.0093536376953125, -0.0020885467529296875, 0.005176544189453125, 0.012441635131835938, 0.01970672607421875, 0.026971817016601562, 0.034236907958984375, 0.04150199890136719, 0.04876708984375, 0.05603218078613281, 0.06329727172851562, 0.07056236267089844, 0.07782745361328125, 0.08509254455566406, 0.09235763549804688, 0.09962272644042969, 0.1068878173828125, 0.11415290832519531, 0.12141799926757812, 0.12868309020996094, 0.13594818115234375, 0.14321327209472656, 0.15047836303710938, 0.1577434539794922, 0.165008544921875, 0.1722736358642578, 0.17953872680664062, 0.18680381774902344, 0.19406890869140625, 0.20133399963378906, 0.20859909057617188, 0.2158641815185547, 0.2231292724609375, 0.2303943634033203, 0.23765945434570312, 0.24492454528808594, 0.25218963623046875, 0.25945472717285156, 0.2667198181152344, 0.2739849090576172, 0.28125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 7.0, 4.0, 4.0, 6.0, 13.0, 13.0, 20.0, 20.0, 34.0, 38.0, 44.0, 61.0, 55.0, 61.0, 84.0, 71.0, 80.0, 57.0, 54.0, 57.0, 45.0, 49.0, 31.0, 27.0, 20.0, 16.0, 7.0, 15.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.15665817260742188, -0.14827728271484375, -0.13989639282226562, -0.1315155029296875, -0.12313461303710938, -0.11475372314453125, -0.10637283325195312, -0.097991943359375, -0.08961105346679688, -0.08123016357421875, -0.07284927368164062, -0.0644683837890625, -0.056087493896484375, -0.04770660400390625, -0.039325714111328125, -0.03094482421875, -0.022563934326171875, -0.01418304443359375, -0.005802154541015625, 0.0025787353515625, 0.010959625244140625, 0.01934051513671875, 0.027721405029296875, 0.036102294921875, 0.044483184814453125, 0.05286407470703125, 0.061244964599609375, 0.0696258544921875, 0.07800674438476562, 0.08638763427734375, 0.09476852416992188, 0.1031494140625, 0.11153030395507812, 0.11991119384765625, 0.12829208374023438, 0.1366729736328125, 0.14505386352539062, 0.15343475341796875, 0.16181564331054688, 0.170196533203125, 0.17857742309570312, 0.18695831298828125, 0.19533920288085938, 0.2037200927734375, 0.21210098266601562, 0.22048187255859375, 0.22886276245117188, 0.23724365234375, 0.24562454223632812, 0.25400543212890625, 0.2623863220214844, 0.2707672119140625, 0.2791481018066406, 0.28752899169921875, 0.2959098815917969, 0.304290771484375, 0.3126716613769531, 0.32105255126953125, 0.3294334411621094, 0.3378143310546875, 0.3461952209472656, 0.35457611083984375, 0.3629570007324219, 0.371337890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 6.0, 2.0, 14.0, 12.0, 42.0, 54.0, 75.0, 111.0, 235.0, 641.0, 2246.0, 14532.0, 804249.0, 212356.0, 10811.0, 1878.0, 678.0, 275.0, 134.0, 74.0, 38.0, 19.0, 23.0, 14.0, 9.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.4615020751953125, -0.444976806640625, -0.4284515380859375, -0.41192626953125, -0.3954010009765625, -0.378875732421875, -0.3623504638671875, -0.3458251953125, -0.3292999267578125, -0.312774658203125, -0.2962493896484375, -0.27972412109375, -0.2631988525390625, -0.246673583984375, -0.2301483154296875, -0.213623046875, -0.1970977783203125, -0.180572509765625, -0.1640472412109375, -0.14752197265625, -0.1309967041015625, -0.114471435546875, -0.0979461669921875, -0.0814208984375, -0.0648956298828125, -0.048370361328125, -0.0318450927734375, -0.01531982421875, 0.0012054443359375, 0.017730712890625, 0.0342559814453125, 0.05078125, 0.0673065185546875, 0.083831787109375, 0.1003570556640625, 0.11688232421875, 0.1334075927734375, 0.149932861328125, 0.1664581298828125, 0.1829833984375, 0.1995086669921875, 0.216033935546875, 0.2325592041015625, 0.24908447265625, 0.2656097412109375, 0.282135009765625, 0.2986602783203125, 0.315185546875, 0.3317108154296875, 0.348236083984375, 0.3647613525390625, 0.38128662109375, 0.3978118896484375, 0.414337158203125, 0.4308624267578125, 0.4473876953125, 0.4639129638671875, 0.480438232421875, 0.4969635009765625, 0.51348876953125, 0.5300140380859375, 0.546539306640625, 0.5630645751953125, 0.57958984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 0.0, 9.0, 2.0, 3.0, 3.0, 7.0, 10.0, 10.0, 8.0, 23.0, 16.0, 19.0, 23.0, 26.0, 34.0, 28.0, 33.0, 66.0, 67.0, 68.0, 91.0, 75.0, 62.0, 56.0, 43.0, 30.0, 34.0, 28.0, 21.0, 17.0, 16.0, 11.0, 10.0, 10.0, 10.0, 13.0, 8.0, 8.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6016921997070312, -0.5759429931640625, -0.5501937866210938, -0.524444580078125, -0.49869537353515625, -0.4729461669921875, -0.44719696044921875, -0.42144775390625, -0.39569854736328125, -0.3699493408203125, -0.34420013427734375, -0.318450927734375, -0.29270172119140625, -0.2669525146484375, -0.24120330810546875, -0.2154541015625, -0.18970489501953125, -0.1639556884765625, -0.13820648193359375, -0.112457275390625, -0.08670806884765625, -0.0609588623046875, -0.03520965576171875, -0.00946044921875, 0.01628875732421875, 0.0420379638671875, 0.06778717041015625, 0.093536376953125, 0.11928558349609375, 0.1450347900390625, 0.17078399658203125, 0.196533203125, 0.22228240966796875, 0.2480316162109375, 0.27378082275390625, 0.299530029296875, 0.32527923583984375, 0.3510284423828125, 0.37677764892578125, 0.40252685546875, 0.42827606201171875, 0.4540252685546875, 0.47977447509765625, 0.505523681640625, 0.5312728881835938, 0.5570220947265625, 0.5827713012695312, 0.6085205078125, 0.6342697143554688, 0.6600189208984375, 0.6857681274414062, 0.711517333984375, 0.7372665405273438, 0.7630157470703125, 0.7887649536132812, 0.81451416015625, 0.8402633666992188, 0.8660125732421875, 0.8917617797851562, 0.917510986328125, 0.9432601928710938, 0.9690093994140625, 0.9947586059570312, 1.0205078125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 1.0, 3.0, 12.0, 16.0, 27.0, 37.0, 70.0, 138.0, 261.0, 570.0, 1468.0, 5054.0, 25902.0, 759245.0, 228451.0, 20632.0, 4283.0, 1327.0, 538.0, 250.0, 110.0, 53.0, 35.0, 22.0, 16.0, 17.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09747314453125, -0.09476089477539062, -0.09204864501953125, -0.08933639526367188, -0.0866241455078125, -0.08391189575195312, -0.08119964599609375, -0.07848739624023438, -0.075775146484375, -0.07306289672851562, -0.07035064697265625, -0.06763839721679688, -0.0649261474609375, -0.062213897705078125, -0.05950164794921875, -0.056789398193359375, -0.0540771484375, -0.051364898681640625, -0.04865264892578125, -0.045940399169921875, -0.0432281494140625, -0.040515899658203125, -0.03780364990234375, -0.035091400146484375, -0.032379150390625, -0.029666900634765625, -0.02695465087890625, -0.024242401123046875, -0.0215301513671875, -0.018817901611328125, -0.01610565185546875, -0.013393402099609375, -0.01068115234375, -0.007968902587890625, -0.00525665283203125, -0.002544403076171875, 0.0001678466796875, 0.002880096435546875, 0.00559234619140625, 0.008304595947265625, 0.011016845703125, 0.013729095458984375, 0.01644134521484375, 0.019153594970703125, 0.0218658447265625, 0.024578094482421875, 0.02729034423828125, 0.030002593994140625, 0.03271484375, 0.035427093505859375, 0.03813934326171875, 0.040851593017578125, 0.0435638427734375, 0.046276092529296875, 0.04898834228515625, 0.051700592041015625, 0.054412841796875, 0.057125091552734375, 0.05983734130859375, 0.06254959106445312, 0.0652618408203125, 0.06797409057617188, 0.07068634033203125, 0.07339859008789062, 0.07611083984375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 7.0, 3.0, 8.0, 7.0, 10.0, 15.0, 7.0, 16.0, 11.0, 20.0, 35.0, 20.0, 31.0, 41.0, 55.0, 72.0, 77.0, 69.0, 88.0, 80.0, 49.0, 52.0, 44.0, 27.0, 27.0, 22.0, 22.0, 11.0, 14.0, 8.0, 10.0, 5.0, 8.0, 12.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.5212764739990234e-05, -2.436712384223938e-05, -2.3521482944488525e-05, -2.267584204673767e-05, -2.1830201148986816e-05, -2.0984560251235962e-05, -2.0138919353485107e-05, -1.9293278455734253e-05, -1.84476375579834e-05, -1.7601996660232544e-05, -1.675635576248169e-05, -1.5910714864730835e-05, -1.506507396697998e-05, -1.4219433069229126e-05, -1.3373792171478271e-05, -1.2528151273727417e-05, -1.1682510375976562e-05, -1.0836869478225708e-05, -9.991228580474854e-06, -9.145587682723999e-06, -8.299946784973145e-06, -7.45430588722229e-06, -6.6086649894714355e-06, -5.763024091720581e-06, -4.9173831939697266e-06, -4.071742296218872e-06, -3.2261013984680176e-06, -2.380460500717163e-06, -1.5348196029663086e-06, -6.891787052154541e-07, 1.564621925354004e-07, 1.0021030902862549e-06, 1.8477439880371094e-06, 2.693384885787964e-06, 3.5390257835388184e-06, 4.384666681289673e-06, 5.230307579040527e-06, 6.075948476791382e-06, 6.921589374542236e-06, 7.76723027229309e-06, 8.612871170043945e-06, 9.4585120677948e-06, 1.0304152965545654e-05, 1.1149793863296509e-05, 1.1995434761047363e-05, 1.2841075658798218e-05, 1.3686716556549072e-05, 1.4532357454299927e-05, 1.537799835205078e-05, 1.6223639249801636e-05, 1.706928014755249e-05, 1.7914921045303345e-05, 1.87605619430542e-05, 1.9606202840805054e-05, 2.0451843738555908e-05, 2.1297484636306763e-05, 2.2143125534057617e-05, 2.298876643180847e-05, 2.3834407329559326e-05, 2.468004822731018e-05, 2.5525689125061035e-05, 2.637133002281189e-05, 2.7216970920562744e-05, 2.80626118183136e-05, 2.8908252716064453e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 7.0, 5.0, 8.0, 13.0, 14.0, 23.0, 38.0, 42.0, 97.0, 127.0, 213.0, 458.0, 730.0, 1563.0, 3663.0, 8922.0, 25886.0, 113294.0, 791761.0, 69819.0, 19138.0, 6948.0, 2877.0, 1382.0, 691.0, 317.0, 196.0, 115.0, 68.0, 46.0, 28.0, 17.0, 13.0, 5.0, 9.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05816650390625, -0.05618572235107422, -0.05420494079589844, -0.052224159240722656, -0.050243377685546875, -0.048262596130371094, -0.04628181457519531, -0.04430103302001953, -0.04232025146484375, -0.04033946990966797, -0.03835868835449219, -0.036377906799316406, -0.034397125244140625, -0.032416343688964844, -0.030435562133789062, -0.02845478057861328, -0.0264739990234375, -0.02449321746826172, -0.022512435913085938, -0.020531654357910156, -0.018550872802734375, -0.016570091247558594, -0.014589309692382812, -0.012608528137207031, -0.01062774658203125, -0.008646965026855469, -0.0066661834716796875, -0.004685401916503906, -0.002704620361328125, -0.0007238388061523438, 0.0012569427490234375, 0.0032377243041992188, 0.005218505859375, 0.007199287414550781, 0.009180068969726562, 0.011160850524902344, 0.013141632080078125, 0.015122413635253906, 0.017103195190429688, 0.01908397674560547, 0.02106475830078125, 0.02304553985595703, 0.025026321411132812, 0.027007102966308594, 0.028987884521484375, 0.030968666076660156, 0.03294944763183594, 0.03493022918701172, 0.0369110107421875, 0.03889179229736328, 0.04087257385253906, 0.042853355407714844, 0.044834136962890625, 0.046814918518066406, 0.04879570007324219, 0.05077648162841797, 0.05275726318359375, 0.05473804473876953, 0.05671882629394531, 0.058699607849121094, 0.060680389404296875, 0.06266117095947266, 0.06464195251464844, 0.06662273406982422, 0.068603515625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 4.0, 4.0, 7.0, 15.0, 12.0, 14.0, 15.0, 18.0, 20.0, 26.0, 51.0, 59.0, 77.0, 92.0, 100.0, 85.0, 87.0, 77.0, 58.0, 35.0, 24.0, 25.0, 22.0, 13.0, 11.0, 7.0, 4.0, 8.0, 6.0, 3.0, 4.0, 6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.088134765625, -0.08552742004394531, -0.08292007446289062, -0.08031272888183594, -0.07770538330078125, -0.07509803771972656, -0.07249069213867188, -0.06988334655761719, -0.0672760009765625, -0.06466865539550781, -0.062061309814453125, -0.05945396423339844, -0.05684661865234375, -0.05423927307128906, -0.051631927490234375, -0.04902458190917969, -0.046417236328125, -0.04380989074707031, -0.041202545166015625, -0.03859519958496094, -0.03598785400390625, -0.03338050842285156, -0.030773162841796875, -0.028165817260742188, -0.0255584716796875, -0.022951126098632812, -0.020343780517578125, -0.017736434936523438, -0.01512908935546875, -0.012521743774414062, -0.009914398193359375, -0.0073070526123046875, -0.00469970703125, -0.0020923614501953125, 0.000514984130859375, 0.0031223297119140625, 0.00572967529296875, 0.008337020874023438, 0.010944366455078125, 0.013551712036132812, 0.0161590576171875, 0.018766403198242188, 0.021373748779296875, 0.023981094360351562, 0.02658843994140625, 0.029195785522460938, 0.031803131103515625, 0.03441047668457031, 0.037017822265625, 0.03962516784667969, 0.042232513427734375, 0.04483985900878906, 0.04744720458984375, 0.05005455017089844, 0.052661895751953125, 0.05526924133300781, 0.0578765869140625, 0.06048393249511719, 0.06309127807617188, 0.06569862365722656, 0.06830596923828125, 0.07091331481933594, 0.07352066040039062, 0.07612800598144531, 0.0787353515625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 6.0, 14.0, 27.0, 43.0, 78.0, 183.0, 356.0, 131.0, 69.0, 35.0, 17.0, 12.0, 12.0, 6.0, 5.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9888582229614258, -0.8926008343696594, -0.7963434457778931, -0.7000859975814819, -0.6038286685943604, -0.5075712203979492, -0.41131383180618286, -0.3150564432144165, -0.21879905462265015, -0.12254165858030319, -0.026284262537956238, 0.06997314095497131, 0.16623052954673767, 0.26248791813850403, 0.3587453365325928, 0.45500272512435913, 0.5512601137161255, 0.6475175023078918, 0.7437748908996582, 0.8400323390960693, 0.9362896680831909, 1.032547116279602, 1.1288044452667236, 1.2250618934631348, 1.321319341659546, 1.417576789855957, 1.5138341188430786, 1.6100915670394897, 1.7063488960266113, 1.8026063442230225, 1.8988637924194336, 1.9951211214065552, 2.0913784503936768, 2.187635898590088, 2.283893346786499, 2.380150556564331, 2.476408004760742, 2.5726654529571533, 2.6689229011535645, 2.7651801109313965, 2.8614375591278076, 2.9576950073242188, 3.05395245552063, 3.150209665298462, 3.246467113494873, 3.342724561691284, 3.4389820098876953, 3.5352392196655273, 3.6314969062805176, 3.7277543544769287, 3.82401180267334, 3.920269012451172, 4.016526699066162, 4.112783908843994, 4.209041118621826, 4.305298805236816, 4.401556015014648, 4.4978132247924805, 4.594070911407471, 4.690328121185303, 4.786585807800293, 4.882843017578125, 4.979100227355957, 5.075357913970947, 5.171615123748779]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 9.0, 6.0, 6.0, 6.0, 6.0, 13.0, 5.0, 22.0, 15.0, 19.0, 23.0, 19.0, 33.0, 34.0, 57.0, 71.0, 123.0, 132.0, 108.0, 67.0, 38.0, 28.0, 25.0, 18.0, 24.0, 13.0, 12.0, 10.0, 11.0, 9.0, 12.0, 6.0, 8.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.556845188140869, -2.4864301681518555, -2.416015386581421, -2.3456003665924072, -2.2751855850219727, -2.204770565032959, -2.1343557834625244, -2.0639407634735107, -1.9935258626937866, -1.9231109619140625, -1.8526960611343384, -1.7822811603546143, -1.7118661403656006, -1.641451358795166, -1.5710363388061523, -1.5006214380264282, -1.430206537246704, -1.35979163646698, -1.2893767356872559, -1.2189618349075317, -1.1485469341278076, -1.078131914138794, -1.0077170133590698, -0.9373021125793457, -0.8668872117996216, -0.7964723110198975, -0.7260574102401733, -0.6556424498558044, -0.5852275490760803, -0.5148126482963562, -0.4443977177143097, -0.3739827871322632, -0.30356764793395996, -0.23315273225307465, -0.16273781657218933, -0.09232290089130402, -0.0219079852104187, 0.04850691556930542, 0.11892184615135193, 0.18933677673339844, 0.25975167751312256, 0.3301665782928467, 0.4005815088748932, 0.4709964394569397, 0.5414113402366638, 0.6118262410163879, 0.6822412014007568, 0.752656102180481, 0.8230710029602051, 0.8934859037399292, 0.9639008045196533, 1.0343157052993774, 1.1047306060791016, 1.1751456260681152, 1.2455605268478394, 1.3159754276275635, 1.3863903284072876, 1.4568052291870117, 1.5272201299667358, 1.59763503074646, 1.6680500507354736, 1.7384648323059082, 1.8088798522949219, 1.879294753074646, 1.9497096538543701]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 2.0, 5.0, 11.0, 10.0, 11.0, 14.0, 14.0, 18.0, 24.0, 23.0, 35.0, 23.0, 22.0, 28.0, 48.0, 64.0, 170.0, 118.0, 59.0, 40.0, 31.0, 25.0, 26.0, 18.0, 21.0, 16.0, 24.0, 12.0, 11.0, 17.0, 10.0, 10.0, 7.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159423828125, -0.15387916564941406, -0.14833450317382812, -0.1427898406982422, -0.13724517822265625, -0.1317005157470703, -0.12615585327148438, -0.12061119079589844, -0.1150665283203125, -0.10952186584472656, -0.10397720336914062, -0.09843254089355469, -0.09288787841796875, -0.08734321594238281, -0.08179855346679688, -0.07625389099121094, -0.070709228515625, -0.06516456604003906, -0.059619903564453125, -0.05407524108886719, -0.04853057861328125, -0.04298591613769531, -0.037441253662109375, -0.03189659118652344, -0.0263519287109375, -0.020807266235351562, -0.015262603759765625, -0.009717941284179688, -0.00417327880859375, 0.0013713836669921875, 0.006916046142578125, 0.012460708618164062, 0.01800537109375, 0.023550033569335938, 0.029094696044921875, 0.03463935852050781, 0.04018402099609375, 0.04572868347167969, 0.051273345947265625, 0.05681800842285156, 0.0623626708984375, 0.06790733337402344, 0.07345199584960938, 0.07899665832519531, 0.08454132080078125, 0.09008598327636719, 0.09563064575195312, 0.10117530822753906, 0.106719970703125, 0.11226463317871094, 0.11780929565429688, 0.12335395812988281, 0.12889862060546875, 0.1344432830810547, 0.13998794555664062, 0.14553260803222656, 0.1510772705078125, 0.15662193298339844, 0.16216659545898438, 0.1677112579345703, 0.17325592041015625, 0.1788005828857422, 0.18434524536132812, 0.18988990783691406, 0.1954345703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 4.0, 2.0, 7.0, 9.0, 8.0, 14.0, 24.0, 32.0, 35.0, 42.0, 57.0, 99.0, 166.0, 370.0, 765.0, 2104.0, 6993.0, 63964.0, 8294026.0, 14207.0, 3358.0, 1198.0, 493.0, 231.0, 114.0, 57.0, 45.0, 39.0, 18.0, 9.0, 16.0, 19.0, 10.0, 7.0, 7.0, 7.0, 4.0, 4.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.2476420402526855, -1.2122299671173096, -1.1768180131912231, -1.1414059400558472, -1.1059939861297607, -1.0705819129943848, -1.0351698398590088, -0.9997578263282776, -0.9643458127975464, -0.9289337992668152, -0.893521785736084, -0.858109712600708, -0.8226976990699768, -0.7872856855392456, -0.7518736124038696, -0.7164615988731384, -0.6810495853424072, -0.645637571811676, -0.6102255582809448, -0.5748134851455688, -0.5394014716148376, -0.5039894580841064, -0.46857741475105286, -0.43316537141799927, -0.39775335788726807, -0.36234134435653687, -0.3269293010234833, -0.2915172576904297, -0.2561052441596985, -0.2206932157278061, -0.1852811872959137, -0.1498691588640213, -0.1144571304321289, -0.07904510200023651, -0.043633073568344116, -0.008221045136451721, 0.027190983295440674, 0.06260301172733307, 0.09801504015922546, 0.13342706859111786, 0.16883909702301025, 0.20425112545490265, 0.23966315388679504, 0.27507519721984863, 0.31048721075057983, 0.34589922428131104, 0.3813112676143646, 0.4167233109474182, 0.4521353244781494, 0.4875473380088806, 0.5229593515396118, 0.5583714246749878, 0.593783438205719, 0.6291954517364502, 0.6646075248718262, 0.7000195384025574, 0.7354315519332886, 0.7708435654640198, 0.806255578994751, 0.841667652130127, 0.8770796656608582, 0.9124916791915894, 0.9479037523269653, 0.9833157658576965, 1.0187277793884277]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 7.0, 2.0, 7.0, 9.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 1.0, 5.0, 2.0, 2.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.232407569885254, -1.183804988861084, -1.135202407836914, -1.0865998268127441, -1.0379972457885742, -0.9893946647644043, -0.9407920241355896, -0.8921894431114197, -0.8435868620872498, -0.7949842810630798, -0.7463817000389099, -0.6977790594100952, -0.6491764783859253, -0.6005738973617554, -0.5519713163375854, -0.5033687353134155, -0.4547661542892456, -0.4061635732650757, -0.35756099224090576, -0.30895838141441345, -0.26035580039024353, -0.2117532193660736, -0.1631506085395813, -0.11454802751541138, -0.06594544649124146, -0.017342858016490936, 0.03125973045825958, 0.0798623263835907, 0.12846490740776062, 0.17706748843193054, 0.22567009925842285, 0.2742726802825928, 0.32287514209747314, 0.37147772312164307, 0.420080304145813, 0.4686829149723053, 0.5172854661941528, 0.5658880472183228, 0.6144906878471375, 0.6630932688713074, 0.7116958498954773, 0.7602984309196472, 0.8089010119438171, 0.8575036525726318, 0.9061062335968018, 0.9547088146209717, 1.0033113956451416, 1.0519139766693115, 1.1005165576934814, 1.1491191387176514, 1.1977217197418213, 1.2463243007659912, 1.2949268817901611, 1.343529462814331, 1.392132043838501, 1.440734624862671, 1.4893372058868408, 1.5379397869110107, 1.5865423679351807, 1.6351449489593506, 1.6837475299835205, 1.7323501110076904, 1.7809526920318604, 1.8295552730560303, 1.8781579732894897]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 5.0, 5.0, 8.0, 6.0, 12.0, 10.0, 12.0, 13.0, 27.0, 16.0, 21.0, 31.0, 28.0, 48.0, 63.0, 59.0, 57.0, 66.0, 70.0, 52.0, 63.0, 41.0, 40.0, 41.0, 42.0, 29.0, 25.0, 25.0, 18.0, 17.0, 11.0, 8.0, 11.0, 5.0, 8.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1424560546875, -0.13739967346191406, -0.13234329223632812, -0.1272869110107422, -0.12223052978515625, -0.11717414855957031, -0.11211776733398438, -0.10706138610839844, -0.1020050048828125, -0.09694862365722656, -0.09189224243164062, -0.08683586120605469, -0.08177947998046875, -0.07672309875488281, -0.07166671752929688, -0.06661033630371094, -0.061553955078125, -0.05649757385253906, -0.051441192626953125, -0.04638481140136719, -0.04132843017578125, -0.03627204895019531, -0.031215667724609375, -0.026159286499023438, -0.0211029052734375, -0.016046524047851562, -0.010990142822265625, -0.0059337615966796875, -0.00087738037109375, 0.0041790008544921875, 0.009235382080078125, 0.014291763305664062, 0.01934814453125, 0.024404525756835938, 0.029460906982421875, 0.03451728820800781, 0.03957366943359375, 0.04463005065917969, 0.049686431884765625, 0.05474281311035156, 0.0597991943359375, 0.06485557556152344, 0.06991195678710938, 0.07496833801269531, 0.08002471923828125, 0.08508110046386719, 0.09013748168945312, 0.09519386291503906, 0.100250244140625, 0.10530662536621094, 0.11036300659179688, 0.11541938781738281, 0.12047576904296875, 0.1255321502685547, 0.13058853149414062, 0.13564491271972656, 0.1407012939453125, 0.14575767517089844, 0.15081405639648438, 0.1558704376220703, 0.16092681884765625, 0.1659832000732422, 0.17103958129882812, 0.17609596252441406, 0.18115234375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 8.0, 13.0, 21.0, 25.0, 33.0, 73.0, 107.0, 195.0, 296.0, 611.0, 1350.0, 2774.0, 6783.0, 16844.0, 45559.0, 116810.0, 178288.0, 93744.0, 36044.0, 13952.0, 5693.0, 2527.0, 1155.0, 581.0, 322.0, 182.0, 109.0, 60.0, 38.0, 28.0, 11.0, 6.0, 7.0, 1.0, 5.0, 3.0, 0.0, 1.0], "bins": [-1.365234375, -1.3330230712890625, -1.300811767578125, -1.2686004638671875, -1.23638916015625, -1.2041778564453125, -1.171966552734375, -1.1397552490234375, -1.1075439453125, -1.0753326416015625, -1.043121337890625, -1.0109100341796875, -0.97869873046875, -0.9464874267578125, -0.914276123046875, -0.8820648193359375, -0.849853515625, -0.8176422119140625, -0.785430908203125, -0.7532196044921875, -0.72100830078125, -0.6887969970703125, -0.656585693359375, -0.6243743896484375, -0.5921630859375, -0.5599517822265625, -0.527740478515625, -0.4955291748046875, -0.46331787109375, -0.4311065673828125, -0.398895263671875, -0.3666839599609375, -0.33447265625, -0.3022613525390625, -0.270050048828125, -0.2378387451171875, -0.20562744140625, -0.1734161376953125, -0.141204833984375, -0.1089935302734375, -0.0767822265625, -0.0445709228515625, -0.012359619140625, 0.0198516845703125, 0.05206298828125, 0.0842742919921875, 0.116485595703125, 0.1486968994140625, 0.180908203125, 0.2131195068359375, 0.245330810546875, 0.2775421142578125, 0.30975341796875, 0.3419647216796875, 0.374176025390625, 0.4063873291015625, 0.4385986328125, 0.4708099365234375, 0.503021240234375, 0.5352325439453125, 0.56744384765625, 0.5996551513671875, 0.631866455078125, 0.6640777587890625, 0.6962890625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 5.0, 7.0, 8.0, 8.0, 7.0, 16.0, 17.0, 16.0, 20.0, 16.0, 30.0, 39.0, 41.0, 31.0, 58.0, 65.0, 50.0, 60.0, 56.0, 50.0, 54.0, 45.0, 40.0, 38.0, 39.0, 26.0, 24.0, 25.0, 21.0, 11.0, 12.0, 14.0, 8.0, 5.0, 8.0, 4.0, 4.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.178466796875, -0.17332077026367188, -0.16817474365234375, -0.16302871704101562, -0.1578826904296875, -0.15273666381835938, -0.14759063720703125, -0.14244461059570312, -0.137298583984375, -0.13215255737304688, -0.12700653076171875, -0.12186050415039062, -0.1167144775390625, -0.11156845092773438, -0.10642242431640625, -0.10127639770507812, -0.09613037109375, -0.09098434448242188, -0.08583831787109375, -0.08069229125976562, -0.0755462646484375, -0.07040023803710938, -0.06525421142578125, -0.060108184814453125, -0.054962158203125, -0.049816131591796875, -0.04467010498046875, -0.039524078369140625, -0.0343780517578125, -0.029232025146484375, -0.02408599853515625, -0.018939971923828125, -0.0137939453125, -0.008647918701171875, -0.00350189208984375, 0.001644134521484375, 0.0067901611328125, 0.011936187744140625, 0.01708221435546875, 0.022228240966796875, 0.027374267578125, 0.032520294189453125, 0.03766632080078125, 0.042812347412109375, 0.0479583740234375, 0.053104400634765625, 0.05825042724609375, 0.06339645385742188, 0.06854248046875, 0.07368850708007812, 0.07883453369140625, 0.08398056030273438, 0.0891265869140625, 0.09427261352539062, 0.09941864013671875, 0.10456466674804688, 0.109710693359375, 0.11485671997070312, 0.12000274658203125, 0.12514877319335938, 0.1302947998046875, 0.13544082641601562, 0.14058685302734375, 0.14573287963867188, 0.15087890625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 6.0, 3.0, 5.0, 7.0, 7.0, 28.0, 54.0, 124.0, 119.0, 66.0, 26.0, 10.0, 9.0, 2.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3505499362945557, -2.2932605743408203, -2.235971212387085, -2.1786818504333496, -2.1213927268981934, -2.064103364944458, -2.0068140029907227, -1.9495246410369873, -1.892235279083252, -1.8349459171295166, -1.7776566743850708, -1.7203673124313354, -1.6630779504776, -1.6057887077331543, -1.548499345779419, -1.4912099838256836, -1.4339206218719482, -1.376631259918213, -1.319342017173767, -1.2620526552200317, -1.2047632932662964, -1.1474740505218506, -1.0901846885681152, -1.0328953266143799, -0.9756060838699341, -0.9183167815208435, -0.8610274195671082, -0.8037381172180176, -0.7464487552642822, -0.6891594529151917, -0.6318701505661011, -0.5745807886123657, -0.5172914266586304, -0.4600020945072174, -0.40271276235580444, -0.34542346000671387, -0.2881340980529785, -0.23084479570388794, -0.17355546355247498, -0.11626613140106201, -0.05897679924964905, -0.0016874708235263824, 0.05560185760259628, 0.11289118230342865, 0.1701805144548416, 0.22746983170509338, 0.28475916385650635, 0.3420484960079193, 0.3993378281593323, 0.45662716031074524, 0.5139164924621582, 0.5712057948112488, 0.6284951567649841, 0.6857844591140747, 0.7430738210678101, 0.8003631234169006, 0.8576524257659912, 0.9149417281150818, 0.9722310900688171, 1.0295203924179077, 1.086809754371643, 1.1440989971160889, 1.2013883590698242, 1.2586777210235596, 1.315967082977295]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 9.0, 13.0, 23.0, 49.0, 54.0, 78.0, 82.0, 49.0, 33.0, 12.0, 7.0, 7.0, 4.0, 8.0, 1.0, 5.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9270635843276978, -0.8975524306297302, -0.8680412173271179, -0.8385300636291504, -0.8090188503265381, -0.7795076966285706, -0.749996542930603, -0.7204853296279907, -0.6909741759300232, -0.6614630222320557, -0.6319518089294434, -0.6024406552314758, -0.5729295015335083, -0.543418288230896, -0.5139071345329285, -0.48439595103263855, -0.45488476753234863, -0.4253735840320587, -0.3958624005317688, -0.36635124683380127, -0.33684006333351135, -0.30732887983322144, -0.2778177261352539, -0.248306542634964, -0.21879535913467407, -0.18928417563438416, -0.15977300703525543, -0.1302618384361267, -0.10075065493583679, -0.07123947143554688, -0.04172830283641815, -0.012217134237289429, 0.017294108867645264, 0.046805284917354584, 0.0763164609670639, 0.10582763701677322, 0.13533881306648254, 0.16484999656677246, 0.19436116516590118, 0.2238723337650299, 0.2533835172653198, 0.28289470076560974, 0.31240588426589966, 0.3419170379638672, 0.3714282214641571, 0.400939404964447, 0.43045055866241455, 0.45996174216270447, 0.4894729256629944, 0.5189840793609619, 0.5484952926635742, 0.5780064463615417, 0.6075176000595093, 0.6370288133621216, 0.6665399670600891, 0.6960511207580566, 0.725562334060669, 0.7550734877586365, 0.7845847010612488, 0.8140958547592163, 0.8436070680618286, 0.8731182217597961, 0.9026293754577637, 0.932140588760376, 0.9616517424583435]}, "eval/loss": 0.35239124298095703, "eval/wer": 0.10420468068226894, "eval/runtime": 326.5742, "eval/samples_per_second": 8.09, "eval/steps_per_second": 0.508} \ No newline at end of file +{"train/loss": 0.0308, "train/learning_rate": 1.4754098360655737e-06, "train/epoch": 10.0, "train/global_step": 1110, "_runtime": 25890, "_timestamp": 1648512792, "_step": 1112, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 34.0, 74.0, 168.0, 333.0, 235.0, 100.0, 43.0, 9.0, 5.0, 2.0, 0.0, 2.0], "bins": [-4.376101493835449, -4.297544956207275, -4.21898889541626, -4.140432357788086, -4.06187629699707, -3.9833199977874756, -3.904763698577881, -3.826207399368286, -3.7476511001586914, -3.6690948009490967, -3.590538501739502, -3.5119822025299072, -3.4334259033203125, -3.3548696041107178, -3.276313304901123, -3.1977570056915283, -3.1192007064819336, -3.040644407272339, -2.962088108062744, -2.8835318088531494, -2.8049755096435547, -2.72641921043396, -2.6478629112243652, -2.5693066120147705, -2.4907500743865967, -2.412193775177002, -2.3336374759674072, -2.2550811767578125, -2.1765248775482178, -2.097968578338623, -2.0194122791290283, -1.9408559799194336, -1.8622997999191284, -1.7837435007095337, -1.705187201499939, -1.6266309022903442, -1.5480746030807495, -1.4695183038711548, -1.3909618854522705, -1.3124055862426758, -1.233849287033081, -1.1552929878234863, -1.0767366886138916, -0.9981803894042969, -0.9196240901947021, -0.8410677909851074, -0.7625114321708679, -0.6839551329612732, -0.6053988933563232, -0.5268425941467285, -0.4482862949371338, -0.3697299659252167, -0.29117366671562195, -0.21261736750602722, -0.1340610384941101, -0.05550473928451538, 0.023051559925079346, 0.10160786658525467, 0.18016417324543, 0.2587204873561859, 0.33727678656578064, 0.41583308577537537, 0.4943894147872925, 0.5729457139968872, 0.6515020132064819]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 10.0, 7.0, 14.0, 13.0, 15.0, 14.0, 25.0, 35.0, 27.0, 29.0, 39.0, 34.0, 39.0, 40.0, 42.0, 46.0, 33.0, 54.0, 46.0, 39.0, 44.0, 57.0, 32.0, 45.0, 33.0, 27.0, 25.0, 27.0, 18.0, 16.0, 19.0, 14.0, 8.0, 12.0, 1.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5758266448974609, -0.5571876764297485, -0.5385486483573914, -0.519909679889679, -0.5012706518173218, -0.4826316833496094, -0.4639926850795746, -0.4453536868095398, -0.426714688539505, -0.4080756902694702, -0.3894366919994354, -0.37079769372940063, -0.35215872526168823, -0.33351969718933105, -0.31488072872161865, -0.29624173045158386, -0.2776027321815491, -0.2589637339115143, -0.2403247356414795, -0.2216857522726059, -0.2030467540025711, -0.18440775573253632, -0.16576877236366272, -0.14712977409362793, -0.12849077582359314, -0.10985177755355835, -0.09121278673410416, -0.07257379591464996, -0.05393479764461517, -0.03529579937458038, -0.01665680855512619, 0.001982182264328003, 0.020621120929718018, 0.03926011547446251, 0.057899110019207, 0.0765381008386612, 0.09517709910869598, 0.11381609737873077, 0.13245508074760437, 0.15109407901763916, 0.16973307728767395, 0.18837207555770874, 0.20701107382774353, 0.22565005719661713, 0.24428905546665192, 0.2629280686378479, 0.2815670371055603, 0.3002060353755951, 0.3188450336456299, 0.3374840319156647, 0.35612303018569946, 0.37476202845573425, 0.39340102672576904, 0.41203999519348145, 0.43067899346351624, 0.449317991733551, 0.4679569900035858, 0.4865959882736206, 0.505234956741333, 0.5238739848136902, 0.5425129532814026, 0.5611519813537598, 0.5797909498214722, 0.5984299182891846, 0.6170689463615417]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 7.0, 14.0, 13.0, 25.0, 37.0, 70.0, 78.0, 92.0, 158.0, 186.0, 328.0, 447.0, 763.0, 1228.0, 2196.0, 3983.0, 7429.0, 16140.0, 60534.0, 567329.0, 2653480.0, 762211.0, 79108.0, 18380.0, 8465.0, 4572.0, 2706.0, 1542.0, 919.0, 600.0, 388.0, 236.0, 149.0, 126.0, 99.0, 69.0, 48.0, 33.0, 29.0, 9.0, 15.0, 12.0, 11.0, 4.0, 8.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7685546875, -1.7087554931640625, -1.648956298828125, -1.5891571044921875, -1.52935791015625, -1.4695587158203125, -1.409759521484375, -1.3499603271484375, -1.2901611328125, -1.2303619384765625, -1.170562744140625, -1.1107635498046875, -1.05096435546875, -0.9911651611328125, -0.931365966796875, -0.8715667724609375, -0.811767578125, -0.7519683837890625, -0.692169189453125, -0.6323699951171875, -0.57257080078125, -0.5127716064453125, -0.452972412109375, -0.3931732177734375, -0.3333740234375, -0.2735748291015625, -0.213775634765625, -0.1539764404296875, -0.09417724609375, -0.0343780517578125, 0.025421142578125, 0.0852203369140625, 0.14501953125, 0.2048187255859375, 0.264617919921875, 0.3244171142578125, 0.38421630859375, 0.4440155029296875, 0.503814697265625, 0.5636138916015625, 0.6234130859375, 0.6832122802734375, 0.743011474609375, 0.8028106689453125, 0.86260986328125, 0.9224090576171875, 0.982208251953125, 1.0420074462890625, 1.101806640625, 1.1616058349609375, 1.221405029296875, 1.2812042236328125, 1.34100341796875, 1.4008026123046875, 1.460601806640625, 1.5204010009765625, 1.5802001953125, 1.6399993896484375, 1.699798583984375, 1.7595977783203125, 1.81939697265625, 1.8791961669921875, 1.938995361328125, 1.9987945556640625, 2.05859375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 6.0, 12.0, 6.0, 10.0, 8.0, 9.0, 13.0, 14.0, 23.0, 32.0, 29.0, 38.0, 38.0, 29.0, 32.0, 44.0, 41.0, 45.0, 45.0, 37.0, 38.0, 44.0, 36.0, 45.0, 49.0, 35.0, 33.0, 25.0, 29.0, 22.0, 23.0, 22.0, 11.0, 16.0, 16.0, 11.0, 2.0, 7.0, 4.0, 10.0, 1.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.998046875, -0.966156005859375, -0.93426513671875, -0.902374267578125, -0.8704833984375, -0.838592529296875, -0.80670166015625, -0.774810791015625, -0.742919921875, -0.711029052734375, -0.67913818359375, -0.647247314453125, -0.6153564453125, -0.583465576171875, -0.55157470703125, -0.519683837890625, -0.48779296875, -0.455902099609375, -0.42401123046875, -0.392120361328125, -0.3602294921875, -0.328338623046875, -0.29644775390625, -0.264556884765625, -0.232666015625, -0.200775146484375, -0.16888427734375, -0.136993408203125, -0.1051025390625, -0.073211669921875, -0.04132080078125, -0.009429931640625, 0.0224609375, 0.054351806640625, 0.08624267578125, 0.118133544921875, 0.1500244140625, 0.181915283203125, 0.21380615234375, 0.245697021484375, 0.277587890625, 0.309478759765625, 0.34136962890625, 0.373260498046875, 0.4051513671875, 0.437042236328125, 0.46893310546875, 0.500823974609375, 0.53271484375, 0.564605712890625, 0.59649658203125, 0.628387451171875, 0.6602783203125, 0.692169189453125, 0.72406005859375, 0.755950927734375, 0.787841796875, 0.819732666015625, 0.85162353515625, 0.883514404296875, 0.9154052734375, 0.947296142578125, 0.97918701171875, 1.011077880859375, 1.04296875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 12.0, 8.0, 14.0, 29.0, 44.0, 69.0, 153.0, 684.0, 8936.0, 4174470.0, 8802.0, 687.0, 168.0, 77.0, 39.0, 30.0, 17.0, 9.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.609375, -16.1414794921875, -15.673583984375, -15.2056884765625, -14.73779296875, -14.2698974609375, -13.802001953125, -13.3341064453125, -12.8662109375, -12.3983154296875, -11.930419921875, -11.4625244140625, -10.99462890625, -10.5267333984375, -10.058837890625, -9.5909423828125, -9.123046875, -8.6551513671875, -8.187255859375, -7.7193603515625, -7.25146484375, -6.7835693359375, -6.315673828125, -5.8477783203125, -5.3798828125, -4.9119873046875, -4.444091796875, -3.9761962890625, -3.50830078125, -3.0404052734375, -2.572509765625, -2.1046142578125, -1.63671875, -1.1688232421875, -0.700927734375, -0.2330322265625, 0.23486328125, 0.7027587890625, 1.170654296875, 1.6385498046875, 2.1064453125, 2.5743408203125, 3.042236328125, 3.5101318359375, 3.97802734375, 4.4459228515625, 4.913818359375, 5.3817138671875, 5.849609375, 6.3175048828125, 6.785400390625, 7.2532958984375, 7.72119140625, 8.1890869140625, 8.656982421875, 9.1248779296875, 9.5927734375, 10.0606689453125, 10.528564453125, 10.9964599609375, 11.46435546875, 11.9322509765625, 12.400146484375, 12.8680419921875, 13.3359375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 8.0, 11.0, 17.0, 18.0, 35.0, 59.0, 105.0, 199.0, 638.0, 1652.0, 804.0, 228.0, 111.0, 63.0, 37.0, 23.0, 20.0, 13.0, 11.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74560546875, -0.7175369262695312, -0.6894683837890625, -0.6613998413085938, -0.633331298828125, -0.6052627563476562, -0.5771942138671875, -0.5491256713867188, -0.52105712890625, -0.49298858642578125, -0.4649200439453125, -0.43685150146484375, -0.408782958984375, -0.38071441650390625, -0.3526458740234375, -0.32457733154296875, -0.2965087890625, -0.26844024658203125, -0.2403717041015625, -0.21230316162109375, -0.184234619140625, -0.15616607666015625, -0.1280975341796875, -0.10002899169921875, -0.07196044921875, -0.04389190673828125, -0.0158233642578125, 0.01224517822265625, 0.040313720703125, 0.06838226318359375, 0.0964508056640625, 0.12451934814453125, 0.152587890625, 0.18065643310546875, 0.2087249755859375, 0.23679351806640625, 0.264862060546875, 0.29293060302734375, 0.3209991455078125, 0.34906768798828125, 0.37713623046875, 0.40520477294921875, 0.4332733154296875, 0.46134185791015625, 0.489410400390625, 0.5174789428710938, 0.5455474853515625, 0.5736160278320312, 0.6016845703125, 0.6297531127929688, 0.6578216552734375, 0.6858901977539062, 0.713958740234375, 0.7420272827148438, 0.7700958251953125, 0.7981643676757812, 0.82623291015625, 0.8543014526367188, 0.8823699951171875, 0.9104385375976562, 0.938507080078125, 0.9665756225585938, 0.9946441650390625, 1.0227127075195312, 1.05078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 4.0, 7.0, 13.0, 15.0, 16.0, 27.0, 36.0, 37.0, 52.0, 50.0, 70.0, 82.0, 99.0, 87.0, 72.0, 74.0, 60.0, 43.0, 35.0, 26.0, 23.0, 11.0, 11.0, 6.0, 7.0, 6.0, 4.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5493606328964233, -1.5017366409301758, -1.4541127681732178, -1.4064887762069702, -1.3588649034500122, -1.3112409114837646, -1.2636170387268066, -1.215993046760559, -1.1683690547943115, -1.120745062828064, -1.073121190071106, -1.0254971981048584, -0.9778733253479004, -0.9302493333816528, -0.88262540102005, -0.8350014686584473, -0.7873775959014893, -0.7397536635398865, -0.6921297311782837, -0.6445057392120361, -0.5968818664550781, -0.5492578744888306, -0.5016339421272278, -0.454010009765625, -0.4063860774040222, -0.35876214504241943, -0.31113821268081665, -0.2635142505168915, -0.2158903181552887, -0.1682663857936859, -0.12064242362976074, -0.07301849126815796, -0.025394439697265625, 0.022229500114917755, 0.06985343992710114, 0.11747738718986511, 0.1651013195514679, 0.21272525191307068, 0.26034921407699585, 0.30797314643859863, 0.3555970788002014, 0.4032210111618042, 0.450844943523407, 0.49846890568733215, 0.5460928678512573, 0.5937167406082153, 0.6413407325744629, 0.6889646649360657, 0.7365885972976685, 0.7842125296592712, 0.831836462020874, 0.8794604539871216, 0.9270843267440796, 0.9747083187103271, 1.0223321914672852, 1.0699561834335327, 1.1175801753997803, 1.1652041673660278, 1.2128280401229858, 1.2604520320892334, 1.3080759048461914, 1.355699896812439, 1.4033238887786865, 1.4509477615356445, 1.4985716342926025]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 10.0, 2.0, 8.0, 12.0, 20.0, 10.0, 17.0, 18.0, 26.0, 25.0, 25.0, 28.0, 33.0, 41.0, 38.0, 39.0, 36.0, 41.0, 35.0, 39.0, 46.0, 43.0, 28.0, 46.0, 33.0, 40.0, 38.0, 30.0, 29.0, 17.0, 15.0, 25.0, 8.0, 22.0, 15.0, 15.0, 7.0, 6.0, 7.0, 4.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9994038939476013, -0.9701382517814636, -0.9408726692199707, -0.911607027053833, -0.8823413848876953, -0.8530758023262024, -0.8238101601600647, -0.7945445775985718, -0.7652789354324341, -0.7360132932662964, -0.7067477107048035, -0.6774820685386658, -0.6482164263725281, -0.6189508438110352, -0.5896852016448975, -0.5604195594787598, -0.5311539173126221, -0.5018882751464844, -0.47262266278266907, -0.44335705041885376, -0.41409143805503845, -0.38482582569122314, -0.35556018352508545, -0.32629457116127014, -0.29702895879745483, -0.2677633464336395, -0.23849771916866302, -0.20923209190368652, -0.17996647953987122, -0.15070085227489471, -0.12143522500991821, -0.0921696126461029, -0.0629040002822876, -0.03363838046789169, -0.00437275692820549, 0.024892866611480713, 0.05415848642587662, 0.08342410624027252, 0.11268973350524902, 0.14195534586906433, 0.17122097313404083, 0.20048660039901733, 0.22975221276283264, 0.25901782512664795, 0.28828346729278564, 0.31754907965660095, 0.34681469202041626, 0.37608033418655396, 0.40534594655036926, 0.43461155891418457, 0.46387720108032227, 0.4931428134441376, 0.5224084258079529, 0.5516740679740906, 0.5809396505355835, 0.6102052927017212, 0.6394709348678589, 0.6687365770339966, 0.6980021595954895, 0.7272678017616272, 0.7565334439277649, 0.7857990264892578, 0.8150646686553955, 0.8443303108215332, 0.8735958933830261]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 6.0, 6.0, 9.0, 20.0, 28.0, 43.0, 69.0, 84.0, 124.0, 205.0, 310.0, 467.0, 788.0, 1255.0, 2086.0, 3416.0, 5622.0, 9460.0, 16580.0, 29324.0, 54762.0, 105941.0, 209747.0, 280857.0, 153086.0, 78141.0, 41614.0, 22626.0, 12912.0, 7396.0, 4483.0, 2701.0, 1649.0, 1037.0, 602.0, 406.0, 247.0, 127.0, 107.0, 67.0, 55.0, 33.0, 9.0, 20.0, 9.0, 8.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.4306640625, -0.4177207946777344, -0.40477752685546875, -0.3918342590332031, -0.3788909912109375, -0.3659477233886719, -0.35300445556640625, -0.3400611877441406, -0.327117919921875, -0.3141746520996094, -0.30123138427734375, -0.2882881164550781, -0.2753448486328125, -0.2624015808105469, -0.24945831298828125, -0.23651504516601562, -0.22357177734375, -0.21062850952148438, -0.19768524169921875, -0.18474197387695312, -0.1717987060546875, -0.15885543823242188, -0.14591217041015625, -0.13296890258789062, -0.120025634765625, -0.10708236694335938, -0.09413909912109375, -0.08119583129882812, -0.0682525634765625, -0.055309295654296875, -0.04236602783203125, -0.029422760009765625, -0.0164794921875, -0.003536224365234375, 0.00940704345703125, 0.022350311279296875, 0.0352935791015625, 0.048236846923828125, 0.06118011474609375, 0.07412338256835938, 0.087066650390625, 0.10000991821289062, 0.11295318603515625, 0.12589645385742188, 0.1388397216796875, 0.15178298950195312, 0.16472625732421875, 0.17766952514648438, 0.19061279296875, 0.20355606079101562, 0.21649932861328125, 0.22944259643554688, 0.2423858642578125, 0.2553291320800781, 0.26827239990234375, 0.2812156677246094, 0.294158935546875, 0.3071022033691406, 0.32004547119140625, 0.3329887390136719, 0.3459320068359375, 0.3588752746582031, 0.37181854248046875, 0.3847618103027344, 0.397705078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 5.0, 4.0, 3.0, 6.0, 13.0, 12.0, 16.0, 14.0, 24.0, 26.0, 17.0, 36.0, 33.0, 33.0, 44.0, 45.0, 35.0, 40.0, 41.0, 43.0, 43.0, 63.0, 39.0, 51.0, 40.0, 40.0, 31.0, 39.0, 25.0, 15.0, 13.0, 14.0, 13.0, 15.0, 16.0, 13.0, 8.0, 9.0, 3.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.71728515625, -0.6948699951171875, -0.672454833984375, -0.6500396728515625, -0.62762451171875, -0.6052093505859375, -0.582794189453125, -0.5603790283203125, -0.5379638671875, -0.5155487060546875, -0.493133544921875, -0.4707183837890625, -0.44830322265625, -0.4258880615234375, -0.403472900390625, -0.3810577392578125, -0.358642578125, -0.3362274169921875, -0.313812255859375, -0.2913970947265625, -0.26898193359375, -0.2465667724609375, -0.224151611328125, -0.2017364501953125, -0.1793212890625, -0.1569061279296875, -0.134490966796875, -0.1120758056640625, -0.08966064453125, -0.0672454833984375, -0.044830322265625, -0.0224151611328125, 0.0, 0.0224151611328125, 0.044830322265625, 0.0672454833984375, 0.08966064453125, 0.1120758056640625, 0.134490966796875, 0.1569061279296875, 0.1793212890625, 0.2017364501953125, 0.224151611328125, 0.2465667724609375, 0.26898193359375, 0.2913970947265625, 0.313812255859375, 0.3362274169921875, 0.358642578125, 0.3810577392578125, 0.403472900390625, 0.4258880615234375, 0.44830322265625, 0.4707183837890625, 0.493133544921875, 0.5155487060546875, 0.5379638671875, 0.5603790283203125, 0.582794189453125, 0.6052093505859375, 0.62762451171875, 0.6500396728515625, 0.672454833984375, 0.6948699951171875, 0.71728515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 21.0, 27.0, 34.0, 50.0, 82.0, 100.0, 156.0, 258.0, 403.0, 678.0, 1243.0, 2598.0, 5867.0, 15841.0, 48934.0, 169517.0, 475092.0, 229292.0, 64182.0, 20272.0, 7335.0, 3096.0, 1504.0, 765.0, 445.0, 246.0, 172.0, 95.0, 69.0, 52.0, 24.0, 24.0, 19.0, 16.0, 4.0, 10.0, 2.0, 5.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6103515625, -0.5904159545898438, -0.5704803466796875, -0.5505447387695312, -0.530609130859375, -0.5106735229492188, -0.4907379150390625, -0.47080230712890625, -0.45086669921875, -0.43093109130859375, -0.4109954833984375, -0.39105987548828125, -0.371124267578125, -0.35118865966796875, -0.3312530517578125, -0.31131744384765625, -0.2913818359375, -0.27144622802734375, -0.2515106201171875, -0.23157501220703125, -0.211639404296875, -0.19170379638671875, -0.1717681884765625, -0.15183258056640625, -0.13189697265625, -0.11196136474609375, -0.0920257568359375, -0.07209014892578125, -0.052154541015625, -0.03221893310546875, -0.0122833251953125, 0.00765228271484375, 0.027587890625, 0.04752349853515625, 0.0674591064453125, 0.08739471435546875, 0.107330322265625, 0.12726593017578125, 0.1472015380859375, 0.16713714599609375, 0.18707275390625, 0.20700836181640625, 0.2269439697265625, 0.24687957763671875, 0.266815185546875, 0.28675079345703125, 0.3066864013671875, 0.32662200927734375, 0.3465576171875, 0.36649322509765625, 0.3864288330078125, 0.40636444091796875, 0.426300048828125, 0.44623565673828125, 0.4661712646484375, 0.48610687255859375, 0.50604248046875, 0.5259780883789062, 0.5459136962890625, 0.5658493041992188, 0.585784912109375, 0.6057205200195312, 0.6256561279296875, 0.6455917358398438, 0.66552734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 5.0, 8.0, 14.0, 9.0, 12.0, 18.0, 18.0, 23.0, 31.0, 35.0, 32.0, 35.0, 42.0, 50.0, 51.0, 50.0, 55.0, 55.0, 44.0, 38.0, 42.0, 34.0, 34.0, 37.0, 39.0, 29.0, 25.0, 32.0, 20.0, 25.0, 14.0, 4.0, 7.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.583984375, -1.5337371826171875, -1.483489990234375, -1.4332427978515625, -1.38299560546875, -1.3327484130859375, -1.282501220703125, -1.2322540283203125, -1.1820068359375, -1.1317596435546875, -1.081512451171875, -1.0312652587890625, -0.98101806640625, -0.9307708740234375, -0.880523681640625, -0.8302764892578125, -0.780029296875, -0.7297821044921875, -0.679534912109375, -0.6292877197265625, -0.57904052734375, -0.5287933349609375, -0.478546142578125, -0.4282989501953125, -0.3780517578125, -0.3278045654296875, -0.277557373046875, -0.2273101806640625, -0.17706298828125, -0.1268157958984375, -0.076568603515625, -0.0263214111328125, 0.02392578125, 0.0741729736328125, 0.124420166015625, 0.1746673583984375, 0.22491455078125, 0.2751617431640625, 0.325408935546875, 0.3756561279296875, 0.4259033203125, 0.4761505126953125, 0.526397705078125, 0.5766448974609375, 0.62689208984375, 0.6771392822265625, 0.727386474609375, 0.7776336669921875, 0.827880859375, 0.8781280517578125, 0.928375244140625, 0.9786224365234375, 1.02886962890625, 1.0791168212890625, 1.129364013671875, 1.1796112060546875, 1.2298583984375, 1.2801055908203125, 1.330352783203125, 1.3805999755859375, 1.43084716796875, 1.4810943603515625, 1.531341552734375, 1.5815887451171875, 1.6318359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 10.0, 9.0, 11.0, 31.0, 31.0, 42.0, 73.0, 73.0, 121.0, 204.0, 271.0, 459.0, 747.0, 1351.0, 2339.0, 4663.0, 10122.0, 23346.0, 64980.0, 235714.0, 476161.0, 148383.0, 45838.0, 17196.0, 7663.0, 3814.0, 1962.0, 1129.0, 645.0, 395.0, 265.0, 170.0, 108.0, 61.0, 44.0, 38.0, 15.0, 23.0, 10.0, 12.0, 10.0, 9.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1422119140625, -0.13781356811523438, -0.13341522216796875, -0.12901687622070312, -0.1246185302734375, -0.12022018432617188, -0.11582183837890625, -0.11142349243164062, -0.107025146484375, -0.10262680053710938, -0.09822845458984375, -0.09383010864257812, -0.0894317626953125, -0.08503341674804688, -0.08063507080078125, -0.07623672485351562, -0.07183837890625, -0.06744003295898438, -0.06304168701171875, -0.058643341064453125, -0.0542449951171875, -0.049846649169921875, -0.04544830322265625, -0.041049957275390625, -0.036651611328125, -0.032253265380859375, -0.02785491943359375, -0.023456573486328125, -0.0190582275390625, -0.014659881591796875, -0.01026153564453125, -0.005863189697265625, -0.00146484375, 0.002933502197265625, 0.00733184814453125, 0.011730194091796875, 0.0161285400390625, 0.020526885986328125, 0.02492523193359375, 0.029323577880859375, 0.033721923828125, 0.038120269775390625, 0.04251861572265625, 0.046916961669921875, 0.0513153076171875, 0.055713653564453125, 0.06011199951171875, 0.06451034545898438, 0.06890869140625, 0.07330703735351562, 0.07770538330078125, 0.08210372924804688, 0.0865020751953125, 0.09090042114257812, 0.09529876708984375, 0.09969711303710938, 0.104095458984375, 0.10849380493164062, 0.11289215087890625, 0.11729049682617188, 0.1216888427734375, 0.12608718872070312, 0.13048553466796875, 0.13488388061523438, 0.1392822265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 6.0, 5.0, 5.0, 11.0, 10.0, 23.0, 17.0, 29.0, 32.0, 60.0, 94.0, 135.0, 181.0, 100.0, 73.0, 51.0, 39.0, 36.0, 17.0, 18.0, 14.0, 13.0, 6.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013494491577148438, -0.00013016164302825928, -0.00012537837028503418, -0.00012059509754180908, -0.00011581182479858398, -0.00011102855205535889, -0.00010624527931213379, -0.00010146200656890869, -9.66787338256836e-05, -9.18954610824585e-05, -8.71121883392334e-05, -8.23289155960083e-05, -7.75456428527832e-05, -7.27623701095581e-05, -6.797909736633301e-05, -6.319582462310791e-05, -5.841255187988281e-05, -5.3629279136657715e-05, -4.884600639343262e-05, -4.406273365020752e-05, -3.927946090698242e-05, -3.4496188163757324e-05, -2.9712915420532227e-05, -2.492964267730713e-05, -2.014636993408203e-05, -1.5363097190856934e-05, -1.0579824447631836e-05, -5.796551704406738e-06, -1.0132789611816406e-06, 3.769993782043457e-06, 8.553266525268555e-06, 1.3336539268493652e-05, 1.811981201171875e-05, 2.2903084754943848e-05, 2.7686357498168945e-05, 3.246963024139404e-05, 3.725290298461914e-05, 4.203617572784424e-05, 4.6819448471069336e-05, 5.1602721214294434e-05, 5.638599395751953e-05, 6.116926670074463e-05, 6.595253944396973e-05, 7.073581218719482e-05, 7.551908493041992e-05, 8.030235767364502e-05, 8.508563041687012e-05, 8.986890316009521e-05, 9.465217590332031e-05, 9.943544864654541e-05, 0.00010421872138977051, 0.0001090019941329956, 0.0001137852668762207, 0.0001185685396194458, 0.0001233518123626709, 0.000128135085105896, 0.0001329183578491211, 0.0001377016305923462, 0.0001424849033355713, 0.0001472681760787964, 0.00015205144882202148, 0.00015683472156524658, 0.00016161799430847168, 0.00016640126705169678, 0.00017118453979492188]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 2.0, 8.0, 13.0, 8.0, 6.0, 14.0, 17.0, 33.0, 62.0, 117.0, 186.0, 440.0, 1051.0, 3239.0, 13769.0, 103624.0, 760750.0, 141917.0, 17167.0, 3898.0, 1234.0, 485.0, 232.0, 101.0, 49.0, 40.0, 20.0, 12.0, 9.0, 11.0, 7.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.386962890625, -0.3771820068359375, -0.367401123046875, -0.3576202392578125, -0.34783935546875, -0.3380584716796875, -0.328277587890625, -0.3184967041015625, -0.3087158203125, -0.2989349365234375, -0.289154052734375, -0.2793731689453125, -0.26959228515625, -0.2598114013671875, -0.250030517578125, -0.2402496337890625, -0.23046875, -0.2206878662109375, -0.210906982421875, -0.2011260986328125, -0.19134521484375, -0.1815643310546875, -0.171783447265625, -0.1620025634765625, -0.1522216796875, -0.1424407958984375, -0.132659912109375, -0.1228790283203125, -0.11309814453125, -0.1033172607421875, -0.093536376953125, -0.0837554931640625, -0.073974609375, -0.0641937255859375, -0.054412841796875, -0.0446319580078125, -0.03485107421875, -0.0250701904296875, -0.015289306640625, -0.0055084228515625, 0.0042724609375, 0.0140533447265625, 0.023834228515625, 0.0336151123046875, 0.04339599609375, 0.0531768798828125, 0.062957763671875, 0.0727386474609375, 0.08251953125, 0.0923004150390625, 0.102081298828125, 0.1118621826171875, 0.12164306640625, 0.1314239501953125, 0.141204833984375, 0.1509857177734375, 0.1607666015625, 0.1705474853515625, 0.180328369140625, 0.1901092529296875, 0.19989013671875, 0.2096710205078125, 0.219451904296875, 0.2292327880859375, 0.239013671875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 10.0, 5.0, 8.0, 6.0, 11.0, 13.0, 24.0, 20.0, 28.0, 41.0, 52.0, 55.0, 66.0, 72.0, 91.0, 77.0, 87.0, 57.0, 53.0, 41.0, 32.0, 28.0, 25.0, 13.0, 20.0, 12.0, 9.0, 7.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.06622314453125, -0.06446170806884766, -0.06270027160644531, -0.06093883514404297, -0.059177398681640625, -0.05741596221923828, -0.05565452575683594, -0.053893089294433594, -0.05213165283203125, -0.050370216369628906, -0.04860877990722656, -0.04684734344482422, -0.045085906982421875, -0.04332447052001953, -0.04156303405761719, -0.039801597595214844, -0.0380401611328125, -0.036278724670410156, -0.03451728820800781, -0.03275585174560547, -0.030994415283203125, -0.02923297882080078, -0.027471542358398438, -0.025710105895996094, -0.02394866943359375, -0.022187232971191406, -0.020425796508789062, -0.01866436004638672, -0.016902923583984375, -0.015141487121582031, -0.013380050659179688, -0.011618614196777344, -0.009857177734375, -0.008095741271972656, -0.0063343048095703125, -0.004572868347167969, -0.002811431884765625, -0.0010499954223632812, 0.0007114410400390625, 0.0024728775024414062, 0.00423431396484375, 0.005995750427246094, 0.0077571868896484375, 0.009518623352050781, 0.011280059814453125, 0.013041496276855469, 0.014802932739257812, 0.016564369201660156, 0.0183258056640625, 0.020087242126464844, 0.021848678588867188, 0.02361011505126953, 0.025371551513671875, 0.02713298797607422, 0.028894424438476562, 0.030655860900878906, 0.03241729736328125, 0.034178733825683594, 0.03594017028808594, 0.03770160675048828, 0.039463043212890625, 0.04122447967529297, 0.04298591613769531, 0.044747352600097656, 0.0465087890625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 13.0, 29.0, 45.0, 108.0, 186.0, 268.0, 169.0, 99.0, 58.0, 19.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6685404777526855, -2.583641767501831, -2.4987430572509766, -2.413844108581543, -2.3289453983306885, -2.244046688079834, -2.1591479778289795, -2.074249267578125, -1.989350438117981, -1.9044517278671265, -1.8195528984069824, -1.734654188156128, -1.6497554779052734, -1.5648566484451294, -1.479957938194275, -1.3950591087341309, -1.3101603984832764, -1.2252616882324219, -1.1403628587722778, -1.0554641485214233, -0.9705653786659241, -0.8856666088104248, -0.8007678985595703, -0.715869128704071, -0.6309703588485718, -0.5460715889930725, -0.46117284893989563, -0.37627410888671875, -0.2913753390312195, -0.20647656917572021, -0.12157785892486572, -0.036679089069366455, 0.04821968078613281, 0.1331184357404709, 0.21801719069480896, 0.30291593074798584, 0.3878147006034851, 0.4727134704589844, 0.5576121807098389, 0.6425109505653381, 0.7274097204208374, 0.8123084902763367, 0.8972072601318359, 0.9821059703826904, 1.067004680633545, 1.151903510093689, 1.2368022203445435, 1.3217010498046875, 1.406599760055542, 1.4914984703063965, 1.5763972997665405, 1.661296010017395, 1.746194839477539, 1.8310935497283936, 1.915992259979248, 2.0008909702301025, 2.085789680480957, 2.1706883907318115, 2.255587100982666, 2.3404860496520996, 2.425384759902954, 2.5102834701538086, 2.595182180404663, 2.6800808906555176, 2.764979839324951]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 1.0, 9.0, 8.0, 6.0, 9.0, 9.0, 22.0, 8.0, 16.0, 22.0, 15.0, 17.0, 28.0, 28.0, 36.0, 36.0, 36.0, 45.0, 23.0, 38.0, 33.0, 46.0, 38.0, 40.0, 42.0, 32.0, 33.0, 44.0, 26.0, 28.0, 27.0, 27.0, 25.0, 21.0, 20.0, 11.0, 17.0, 12.0, 10.0, 12.0, 8.0, 6.0, 5.0, 5.0, 9.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5722605586051941, -0.5532446503639221, -0.5342288017272949, -0.515212893486023, -0.49619701504707336, -0.4771811366081238, -0.4581652283668518, -0.4391493499279022, -0.42013347148895264, -0.40111759305000305, -0.3821016848087311, -0.3630858063697815, -0.3440699279308319, -0.3250540494918823, -0.30603814125061035, -0.28702226281166077, -0.2680063545703888, -0.24899046123027802, -0.22997458279132843, -0.21095868945121765, -0.19194281101226807, -0.1729269176721573, -0.1539110243320465, -0.13489514589309692, -0.11587925255298615, -0.09686336666345596, -0.07784748077392578, -0.058831587433815, -0.03981570154428482, -0.02079981565475464, -0.0017839223146438599, 0.017231956124305725, 0.036247849464416504, 0.055263735353946686, 0.07427962124347687, 0.09329551458358765, 0.11231140047311783, 0.131327286362648, 0.1503431797027588, 0.16935905814170837, 0.18837495148181915, 0.20739084482192993, 0.22640672326087952, 0.2454226166009903, 0.2644385099411011, 0.28345438838005066, 0.30247026681900024, 0.3214861750602722, 0.3405020534992218, 0.3595179319381714, 0.37853384017944336, 0.39754971861839294, 0.41656559705734253, 0.4355815052986145, 0.4545973837375641, 0.47361326217651367, 0.49262917041778564, 0.5116450786590576, 0.5306609272956848, 0.5496768355369568, 0.5686927437782288, 0.587708592414856, 0.6067245006561279, 0.6257404088973999, 0.6447562575340271]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 10.0, 11.0, 9.0, 35.0, 29.0, 50.0, 91.0, 133.0, 220.0, 285.0, 417.0, 678.0, 1131.0, 1914.0, 3648.0, 7258.0, 16128.0, 47153.0, 227644.0, 602791.0, 90321.0, 26761.0, 10152.0, 5090.0, 2687.0, 1441.0, 866.0, 559.0, 338.0, 212.0, 162.0, 117.0, 62.0, 51.0, 31.0, 17.0, 14.0, 11.0, 5.0, 7.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.935546875, -0.9065322875976562, -0.8775177001953125, -0.8485031127929688, -0.819488525390625, -0.7904739379882812, -0.7614593505859375, -0.7324447631835938, -0.70343017578125, -0.6744155883789062, -0.6454010009765625, -0.6163864135742188, -0.587371826171875, -0.5583572387695312, -0.5293426513671875, -0.5003280639648438, -0.4713134765625, -0.44229888916015625, -0.4132843017578125, -0.38426971435546875, -0.355255126953125, -0.32624053955078125, -0.2972259521484375, -0.26821136474609375, -0.23919677734375, -0.21018218994140625, -0.1811676025390625, -0.15215301513671875, -0.123138427734375, -0.09412384033203125, -0.0651092529296875, -0.03609466552734375, -0.007080078125, 0.02193450927734375, 0.0509490966796875, 0.07996368408203125, 0.108978271484375, 0.13799285888671875, 0.1670074462890625, 0.19602203369140625, 0.22503662109375, 0.25405120849609375, 0.2830657958984375, 0.31208038330078125, 0.341094970703125, 0.37010955810546875, 0.3991241455078125, 0.42813873291015625, 0.4571533203125, 0.48616790771484375, 0.5151824951171875, 0.5441970825195312, 0.573211669921875, 0.6022262573242188, 0.6312408447265625, 0.6602554321289062, 0.68927001953125, 0.7182846069335938, 0.7472991943359375, 0.7763137817382812, 0.805328369140625, 0.8343429565429688, 0.8633575439453125, 0.8923721313476562, 0.92138671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 7.0, 11.0, 9.0, 7.0, 9.0, 12.0, 12.0, 21.0, 17.0, 12.0, 23.0, 32.0, 29.0, 31.0, 42.0, 41.0, 46.0, 47.0, 61.0, 62.0, 62.0, 49.0, 39.0, 46.0, 44.0, 25.0, 30.0, 24.0, 36.0, 13.0, 15.0, 15.0, 10.0, 11.0, 8.0, 6.0, 5.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.36328125, -4.2236328125, -4.083984375, -3.9443359375, -3.8046875, -3.6650390625, -3.525390625, -3.3857421875, -3.24609375, -3.1064453125, -2.966796875, -2.8271484375, -2.6875, -2.5478515625, -2.408203125, -2.2685546875, -2.12890625, -1.9892578125, -1.849609375, -1.7099609375, -1.5703125, -1.4306640625, -1.291015625, -1.1513671875, -1.01171875, -0.8720703125, -0.732421875, -0.5927734375, -0.453125, -0.3134765625, -0.173828125, -0.0341796875, 0.10546875, 0.2451171875, 0.384765625, 0.5244140625, 0.6640625, 0.8037109375, 0.943359375, 1.0830078125, 1.22265625, 1.3623046875, 1.501953125, 1.6416015625, 1.78125, 1.9208984375, 2.060546875, 2.2001953125, 2.33984375, 2.4794921875, 2.619140625, 2.7587890625, 2.8984375, 3.0380859375, 3.177734375, 3.3173828125, 3.45703125, 3.5966796875, 3.736328125, 3.8759765625, 4.015625, 4.1552734375, 4.294921875, 4.4345703125, 4.57421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 9.0, 8.0, 7.0, 7.0, 6.0, 16.0, 19.0, 19.0, 20.0, 22.0, 35.0, 38.0, 49.0, 66.0, 93.0, 109.0, 215.0, 468.0, 1372.0, 5561.0, 42980.0, 895651.0, 89831.0, 8674.0, 1753.0, 591.0, 263.0, 155.0, 103.0, 75.0, 64.0, 47.0, 43.0, 34.0, 25.0, 19.0, 18.0, 19.0, 12.0, 10.0, 8.0, 6.0, 4.0, 8.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2421875, -2.168975830078125, -2.09576416015625, -2.022552490234375, -1.9493408203125, -1.876129150390625, -1.80291748046875, -1.729705810546875, -1.656494140625, -1.583282470703125, -1.51007080078125, -1.436859130859375, -1.3636474609375, -1.290435791015625, -1.21722412109375, -1.144012451171875, -1.07080078125, -0.997589111328125, -0.92437744140625, -0.851165771484375, -0.7779541015625, -0.704742431640625, -0.63153076171875, -0.558319091796875, -0.485107421875, -0.411895751953125, -0.33868408203125, -0.265472412109375, -0.1922607421875, -0.119049072265625, -0.04583740234375, 0.027374267578125, 0.1005859375, 0.173797607421875, 0.24700927734375, 0.320220947265625, 0.3934326171875, 0.466644287109375, 0.53985595703125, 0.613067626953125, 0.686279296875, 0.759490966796875, 0.83270263671875, 0.905914306640625, 0.9791259765625, 1.052337646484375, 1.12554931640625, 1.198760986328125, 1.27197265625, 1.345184326171875, 1.41839599609375, 1.491607666015625, 1.5648193359375, 1.638031005859375, 1.71124267578125, 1.784454345703125, 1.857666015625, 1.930877685546875, 2.00408935546875, 2.077301025390625, 2.1505126953125, 2.223724365234375, 2.29693603515625, 2.370147705078125, 2.443359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 6.0, 6.0, 6.0, 5.0, 4.0, 13.0, 12.0, 14.0, 9.0, 13.0, 22.0, 19.0, 22.0, 26.0, 33.0, 33.0, 39.0, 40.0, 50.0, 47.0, 44.0, 50.0, 41.0, 41.0, 37.0, 40.0, 27.0, 35.0, 29.0, 25.0, 26.0, 24.0, 26.0, 22.0, 18.0, 14.0, 14.0, 10.0, 4.0, 9.0, 7.0, 7.0, 3.0, 5.0, 4.0, 7.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.59375, -3.476409912109375, -3.35906982421875, -3.241729736328125, -3.1243896484375, -3.007049560546875, -2.88970947265625, -2.772369384765625, -2.655029296875, -2.537689208984375, -2.42034912109375, -2.303009033203125, -2.1856689453125, -2.068328857421875, -1.95098876953125, -1.833648681640625, -1.71630859375, -1.598968505859375, -1.48162841796875, -1.364288330078125, -1.2469482421875, -1.129608154296875, -1.01226806640625, -0.894927978515625, -0.777587890625, -0.660247802734375, -0.54290771484375, -0.425567626953125, -0.3082275390625, -0.190887451171875, -0.07354736328125, 0.043792724609375, 0.1611328125, 0.278472900390625, 0.39581298828125, 0.513153076171875, 0.6304931640625, 0.747833251953125, 0.86517333984375, 0.982513427734375, 1.099853515625, 1.217193603515625, 1.33453369140625, 1.451873779296875, 1.5692138671875, 1.686553955078125, 1.80389404296875, 1.921234130859375, 2.03857421875, 2.155914306640625, 2.27325439453125, 2.390594482421875, 2.5079345703125, 2.625274658203125, 2.74261474609375, 2.859954833984375, 2.977294921875, 3.094635009765625, 3.21197509765625, 3.329315185546875, 3.4466552734375, 3.563995361328125, 3.68133544921875, 3.798675537109375, 3.916015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 8.0, 7.0, 9.0, 16.0, 27.0, 43.0, 64.0, 85.0, 159.0, 257.0, 535.0, 1128.0, 2568.0, 7233.0, 57368.0, 944491.0, 25461.0, 5174.0, 1964.0, 877.0, 459.0, 223.0, 135.0, 97.0, 56.0, 32.0, 13.0, 14.0, 14.0, 10.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54638671875, -0.5304832458496094, -0.5145797729492188, -0.4986763000488281, -0.4827728271484375, -0.4668693542480469, -0.45096588134765625, -0.4350624084472656, -0.419158935546875, -0.4032554626464844, -0.38735198974609375, -0.3714485168457031, -0.3555450439453125, -0.3396415710449219, -0.32373809814453125, -0.3078346252441406, -0.29193115234375, -0.2760276794433594, -0.26012420654296875, -0.24422073364257812, -0.2283172607421875, -0.21241378784179688, -0.19651031494140625, -0.18060684204101562, -0.164703369140625, -0.14879989624023438, -0.13289642333984375, -0.11699295043945312, -0.1010894775390625, -0.08518600463867188, -0.06928253173828125, -0.053379058837890625, -0.0374755859375, -0.021572113037109375, -0.00566864013671875, 0.010234832763671875, 0.0261383056640625, 0.042041778564453125, 0.05794525146484375, 0.07384872436523438, 0.089752197265625, 0.10565567016601562, 0.12155914306640625, 0.13746261596679688, 0.1533660888671875, 0.16926956176757812, 0.18517303466796875, 0.20107650756835938, 0.21697998046875, 0.23288345336914062, 0.24878692626953125, 0.2646903991699219, 0.2805938720703125, 0.2964973449707031, 0.31240081787109375, 0.3283042907714844, 0.344207763671875, 0.3601112365722656, 0.37601470947265625, 0.3919181823730469, 0.4078216552734375, 0.4237251281738281, 0.43962860107421875, 0.4555320739746094, 0.471435546875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 11.0, 12.0, 19.0, 58.0, 132.0, 567.0, 112.0, 34.0, 15.0, 13.0, 8.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.587671279907227e-05, -7.338542491197586e-05, -7.089413702487946e-05, -6.840284913778305e-05, -6.591156125068665e-05, -6.342027336359024e-05, -6.0928985476493835e-05, -5.843769758939743e-05, -5.5946409702301025e-05, -5.345512181520462e-05, -5.0963833928108215e-05, -4.847254604101181e-05, -4.5981258153915405e-05, -4.3489970266819e-05, -4.0998682379722595e-05, -3.850739449262619e-05, -3.6016106605529785e-05, -3.352481871843338e-05, -3.1033530831336975e-05, -2.854224294424057e-05, -2.6050955057144165e-05, -2.355966717004776e-05, -2.1068379282951355e-05, -1.857709139585495e-05, -1.6085803508758545e-05, -1.359451562166214e-05, -1.1103227734565735e-05, -8.61193984746933e-06, -6.120651960372925e-06, -3.6293640732765198e-06, -1.1380761861801147e-06, 1.3532117009162903e-06, 3.844499588012695e-06, 6.3357874751091e-06, 8.827075362205505e-06, 1.131836324930191e-05, 1.3809651136398315e-05, 1.630093902349472e-05, 1.8792226910591125e-05, 2.128351479768753e-05, 2.3774802684783936e-05, 2.626609057188034e-05, 2.8757378458976746e-05, 3.124866634607315e-05, 3.3739954233169556e-05, 3.623124212026596e-05, 3.8722530007362366e-05, 4.121381789445877e-05, 4.3705105781555176e-05, 4.619639366865158e-05, 4.8687681555747986e-05, 5.117896944284439e-05, 5.3670257329940796e-05, 5.61615452170372e-05, 5.8652833104133606e-05, 6.114412099123001e-05, 6.363540887832642e-05, 6.612669676542282e-05, 6.861798465251923e-05, 7.110927253961563e-05, 7.360056042671204e-05, 7.609184831380844e-05, 7.858313620090485e-05, 8.107442408800125e-05, 8.356571197509766e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 17.0, 26.0, 40.0, 72.0, 105.0, 217.0, 374.0, 843.0, 2119.0, 7977.0, 410545.0, 614332.0, 8082.0, 2016.0, 806.0, 412.0, 214.0, 117.0, 87.0, 46.0, 27.0, 15.0, 18.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.685546875, -0.6653900146484375, -0.645233154296875, -0.6250762939453125, -0.60491943359375, -0.5847625732421875, -0.564605712890625, -0.5444488525390625, -0.5242919921875, -0.5041351318359375, -0.483978271484375, -0.4638214111328125, -0.44366455078125, -0.4235076904296875, -0.403350830078125, -0.3831939697265625, -0.363037109375, -0.3428802490234375, -0.322723388671875, -0.3025665283203125, -0.28240966796875, -0.2622528076171875, -0.242095947265625, -0.2219390869140625, -0.2017822265625, -0.1816253662109375, -0.161468505859375, -0.1413116455078125, -0.12115478515625, -0.1009979248046875, -0.080841064453125, -0.0606842041015625, -0.04052734375, -0.0203704833984375, -0.000213623046875, 0.0199432373046875, 0.04010009765625, 0.0602569580078125, 0.080413818359375, 0.1005706787109375, 0.1207275390625, 0.1408843994140625, 0.161041259765625, 0.1811981201171875, 0.20135498046875, 0.2215118408203125, 0.241668701171875, 0.2618255615234375, 0.281982421875, 0.3021392822265625, 0.322296142578125, 0.3424530029296875, 0.36260986328125, 0.3827667236328125, 0.402923583984375, 0.4230804443359375, 0.4432373046875, 0.4633941650390625, 0.483551025390625, 0.5037078857421875, 0.52386474609375, 0.5440216064453125, 0.564178466796875, 0.5843353271484375, 0.6044921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 11.0, 7.0, 21.0, 38.0, 69.0, 475.0, 247.0, 54.0, 39.0, 17.0, 7.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232421875, -0.22464752197265625, -0.2168731689453125, -0.20909881591796875, -0.201324462890625, -0.19355010986328125, -0.1857757568359375, -0.17800140380859375, -0.17022705078125, -0.16245269775390625, -0.1546783447265625, -0.14690399169921875, -0.139129638671875, -0.13135528564453125, -0.1235809326171875, -0.11580657958984375, -0.1080322265625, -0.10025787353515625, -0.0924835205078125, -0.08470916748046875, -0.076934814453125, -0.06916046142578125, -0.0613861083984375, -0.05361175537109375, -0.04583740234375, -0.03806304931640625, -0.0302886962890625, -0.02251434326171875, -0.014739990234375, -0.00696563720703125, 0.0008087158203125, 0.00858306884765625, 0.016357421875, 0.02413177490234375, 0.0319061279296875, 0.03968048095703125, 0.047454833984375, 0.05522918701171875, 0.0630035400390625, 0.07077789306640625, 0.07855224609375, 0.08632659912109375, 0.0941009521484375, 0.10187530517578125, 0.109649658203125, 0.11742401123046875, 0.1251983642578125, 0.13297271728515625, 0.1407470703125, 0.14852142333984375, 0.1562957763671875, 0.16407012939453125, 0.171844482421875, 0.17961883544921875, 0.1873931884765625, 0.19516754150390625, 0.20294189453125, 0.21071624755859375, 0.2184906005859375, 0.22626495361328125, 0.234039306640625, 0.24181365966796875, 0.2495880126953125, 0.25736236572265625, 0.26513671875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 20.0, 95.0, 338.0, 409.0, 130.0, 20.0, 3.0, 2.0], "bins": [-17.6982421875, -17.39818572998047, -17.098129272460938, -16.79807472229004, -16.498018264770508, -16.197961807250977, -15.897905349731445, -15.59784984588623, -15.2977933883667, -14.997736930847168, -14.697681427001953, -14.397624969482422, -14.097569465637207, -13.797513008117676, -13.497457504272461, -13.19740104675293, -12.897344589233398, -12.597288131713867, -12.297232627868652, -11.997176170349121, -11.697120666503906, -11.397064208984375, -11.097007751464844, -10.796952247619629, -10.496896743774414, -10.196840286254883, -9.896784782409668, -9.596728324890137, -9.296672821044922, -8.99661636352539, -8.69655990600586, -8.396504402160645, -8.096447944641113, -7.79639196395874, -7.496335983276367, -7.196279525756836, -6.896223545074463, -6.59616756439209, -6.296111583709717, -5.996055603027344, -5.6959991455078125, -5.3959431648254395, -5.095887184143066, -4.795830726623535, -4.495774745941162, -4.195718765258789, -3.895662784576416, -3.595606565475464, -3.2955503463745117, -2.9954943656921387, -2.6954381465911865, -2.3953821659088135, -2.0953259468078613, -1.7952699661254883, -1.4952139854431152, -1.195157766342163, -0.8951019048690796, -0.595045804977417, -0.29498976469039917, 0.005066275596618652, 0.30512237548828125, 0.6051784753799438, 0.9052344560623169, 1.205290675163269, 1.505346655845642]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 3.0, 6.0, 8.0, 8.0, 11.0, 18.0, 11.0, 22.0, 21.0, 27.0, 24.0, 23.0, 29.0, 33.0, 44.0, 23.0, 40.0, 43.0, 38.0, 53.0, 53.0, 44.0, 41.0, 49.0, 41.0, 30.0, 39.0, 38.0, 25.0, 24.0, 21.0, 15.0, 14.0, 12.0, 11.0, 16.0, 9.0, 5.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.079907417297363, -6.875357151031494, -6.670806884765625, -6.466256141662598, -6.2617058753967285, -6.057155609130859, -5.85260534286499, -5.648055076599121, -5.443504333496094, -5.238954067230225, -5.0344038009643555, -4.829853057861328, -4.625302791595459, -4.42075252532959, -4.216202259063721, -4.011651992797852, -3.8071017265319824, -3.6025514602661133, -3.398000955581665, -3.193450689315796, -2.9889001846313477, -2.7843499183654785, -2.5797996520996094, -2.3752493858337402, -2.170698881149292, -1.9661484956741333, -1.7615981101989746, -1.5570478439331055, -1.3524974584579468, -1.147947072982788, -0.943396806716919, -0.7388464212417603, -0.5342965126037598, -0.32974615693092346, -0.12519580125808716, 0.07935452461242676, 0.28390491008758545, 0.48845529556274414, 0.6930055618286133, 0.897555947303772, 1.1021063327789307, 1.3066567182540894, 1.511207103729248, 1.7157573699951172, 1.9203077554702759, 2.1248581409454346, 2.3294084072113037, 2.533958911895752, 2.738509178161621, 2.9430594444274902, 3.1476099491119385, 3.3521602153778076, 3.556710720062256, 3.761260986328125, 3.965811252593994, 4.170361518859863, 4.374912261962891, 4.57946252822876, 4.784012794494629, 4.988563537597656, 5.193113803863525, 5.3976640701293945, 5.602214336395264, 5.806764602661133, 6.011314868927002]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 10.0, 4.0, 8.0, 13.0, 10.0, 25.0, 23.0, 33.0, 65.0, 83.0, 162.0, 310.0, 606.0, 1253.0, 2667.0, 5957.0, 17282.0, 134652.0, 2299903.0, 1626333.0, 79241.0, 14458.0, 5626.0, 2707.0, 1247.0, 697.0, 357.0, 191.0, 122.0, 91.0, 42.0, 23.0, 14.0, 12.0, 22.0, 8.0, 6.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8447265625, -1.79034423828125, -1.7359619140625, -1.68157958984375, -1.627197265625, -1.57281494140625, -1.5184326171875, -1.46405029296875, -1.40966796875, -1.35528564453125, -1.3009033203125, -1.24652099609375, -1.192138671875, -1.13775634765625, -1.0833740234375, -1.02899169921875, -0.974609375, -0.92022705078125, -0.8658447265625, -0.81146240234375, -0.757080078125, -0.70269775390625, -0.6483154296875, -0.59393310546875, -0.53955078125, -0.48516845703125, -0.4307861328125, -0.37640380859375, -0.322021484375, -0.26763916015625, -0.2132568359375, -0.15887451171875, -0.1044921875, -0.05010986328125, 0.0042724609375, 0.05865478515625, 0.113037109375, 0.16741943359375, 0.2218017578125, 0.27618408203125, 0.33056640625, 0.38494873046875, 0.4393310546875, 0.49371337890625, 0.548095703125, 0.60247802734375, 0.6568603515625, 0.71124267578125, 0.765625, 0.82000732421875, 0.8743896484375, 0.92877197265625, 0.983154296875, 1.03753662109375, 1.0919189453125, 1.14630126953125, 1.20068359375, 1.25506591796875, 1.3094482421875, 1.36383056640625, 1.418212890625, 1.47259521484375, 1.5269775390625, 1.58135986328125, 1.6357421875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 0.0, 4.0, 3.0, 3.0, 11.0, 8.0, 15.0, 15.0, 9.0, 24.0, 18.0, 24.0, 24.0, 39.0, 45.0, 35.0, 45.0, 48.0, 45.0, 38.0, 44.0, 60.0, 44.0, 56.0, 35.0, 37.0, 38.0, 27.0, 37.0, 27.0, 23.0, 16.0, 22.0, 23.0, 11.0, 9.0, 13.0, 3.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7587890625, -0.7324447631835938, -0.7061004638671875, -0.6797561645507812, -0.653411865234375, -0.6270675659179688, -0.6007232666015625, -0.5743789672851562, -0.54803466796875, -0.5216903686523438, -0.4953460693359375, -0.46900177001953125, -0.442657470703125, -0.41631317138671875, -0.3899688720703125, -0.36362457275390625, -0.3372802734375, -0.31093597412109375, -0.2845916748046875, -0.25824737548828125, -0.231903076171875, -0.20555877685546875, -0.1792144775390625, -0.15287017822265625, -0.12652587890625, -0.10018157958984375, -0.0738372802734375, -0.04749298095703125, -0.021148681640625, 0.00519561767578125, 0.0315399169921875, 0.05788421630859375, 0.084228515625, 0.11057281494140625, 0.1369171142578125, 0.16326141357421875, 0.189605712890625, 0.21595001220703125, 0.2422943115234375, 0.26863861083984375, 0.29498291015625, 0.32132720947265625, 0.3476715087890625, 0.37401580810546875, 0.400360107421875, 0.42670440673828125, 0.4530487060546875, 0.47939300537109375, 0.5057373046875, 0.5320816040039062, 0.5584259033203125, 0.5847702026367188, 0.611114501953125, 0.6374588012695312, 0.6638031005859375, 0.6901473999023438, 0.71649169921875, 0.7428359985351562, 0.7691802978515625, 0.7955245971679688, 0.821868896484375, 0.8482131958007812, 0.8745574951171875, 0.9009017944335938, 0.92724609375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 11.0, 6.0, 9.0, 14.0, 41.0, 112.0, 1255.0, 4192232.0, 422.0, 82.0, 32.0, 13.0, 12.0, 9.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -17.783447265625, -16.98876953125, -16.194091796875, -15.3994140625, -14.604736328125, -13.81005859375, -13.015380859375, -12.220703125, -11.426025390625, -10.63134765625, -9.836669921875, -9.0419921875, -8.247314453125, -7.45263671875, -6.657958984375, -5.86328125, -5.068603515625, -4.27392578125, -3.479248046875, -2.6845703125, -1.889892578125, -1.09521484375, -0.300537109375, 0.494140625, 1.288818359375, 2.08349609375, 2.878173828125, 3.6728515625, 4.467529296875, 5.26220703125, 6.056884765625, 6.8515625, 7.646240234375, 8.44091796875, 9.235595703125, 10.0302734375, 10.824951171875, 11.61962890625, 12.414306640625, 13.208984375, 14.003662109375, 14.79833984375, 15.593017578125, 16.3876953125, 17.182373046875, 17.97705078125, 18.771728515625, 19.56640625, 20.361083984375, 21.15576171875, 21.950439453125, 22.7451171875, 23.539794921875, 24.33447265625, 25.129150390625, 25.923828125, 26.718505859375, 27.51318359375, 28.307861328125, 29.1025390625, 29.897216796875, 30.69189453125, 31.486572265625, 32.28125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 9.0, 7.0, 14.0, 17.0, 29.0, 31.0, 49.0, 79.0, 142.0, 304.0, 734.0, 1134.0, 736.0, 333.0, 148.0, 86.0, 65.0, 41.0, 24.0, 26.0, 10.0, 11.0, 4.0, 7.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.578125, -0.5627288818359375, -0.547332763671875, -0.5319366455078125, -0.51654052734375, -0.5011444091796875, -0.485748291015625, -0.4703521728515625, -0.4549560546875, -0.4395599365234375, -0.424163818359375, -0.4087677001953125, -0.39337158203125, -0.3779754638671875, -0.362579345703125, -0.3471832275390625, -0.331787109375, -0.3163909912109375, -0.300994873046875, -0.2855987548828125, -0.27020263671875, -0.2548065185546875, -0.239410400390625, -0.2240142822265625, -0.2086181640625, -0.1932220458984375, -0.177825927734375, -0.1624298095703125, -0.14703369140625, -0.1316375732421875, -0.116241455078125, -0.1008453369140625, -0.08544921875, -0.0700531005859375, -0.054656982421875, -0.0392608642578125, -0.02386474609375, -0.0084686279296875, 0.006927490234375, 0.0223236083984375, 0.0377197265625, 0.0531158447265625, 0.068511962890625, 0.0839080810546875, 0.09930419921875, 0.1147003173828125, 0.130096435546875, 0.1454925537109375, 0.160888671875, 0.1762847900390625, 0.191680908203125, 0.2070770263671875, 0.22247314453125, 0.2378692626953125, 0.253265380859375, 0.2686614990234375, 0.2840576171875, 0.2994537353515625, 0.314849853515625, 0.3302459716796875, 0.34564208984375, 0.3610382080078125, 0.376434326171875, 0.3918304443359375, 0.4072265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 5.0, 6.0, 11.0, 15.0, 12.0, 22.0, 23.0, 21.0, 39.0, 51.0, 64.0, 73.0, 83.0, 80.0, 105.0, 74.0, 64.0, 54.0, 37.0, 28.0, 25.0, 26.0, 19.0, 19.0, 9.0, 4.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.18211829662323, -1.1478058099746704, -1.1134932041168213, -1.0791807174682617, -1.0448682308197021, -1.0105557441711426, -0.9762431979179382, -0.9419306516647339, -0.9076181650161743, -0.8733056783676147, -0.8389931321144104, -0.804680585861206, -0.7703680992126465, -0.7360556125640869, -0.7017430663108826, -0.6674305200576782, -0.6331180334091187, -0.5988055467605591, -0.5644930005073547, -0.5301804542541504, -0.4958679676055908, -0.46155545115470886, -0.4272429347038269, -0.39293041825294495, -0.358617901802063, -0.32430538535118103, -0.2899928689002991, -0.2556803524494171, -0.22136783599853516, -0.1870553195476532, -0.15274280309677124, -0.11843028664588928, -0.08411788940429688, -0.04980537295341492, -0.015492856502532959, 0.018819659948349, 0.05313217639923096, 0.08744469285011292, 0.12175720930099487, 0.15606972575187683, 0.1903822422027588, 0.22469475865364075, 0.2590072751045227, 0.29331979155540466, 0.3276323080062866, 0.3619448244571686, 0.39625734090805054, 0.4305698573589325, 0.46488237380981445, 0.4991948902606964, 0.5335074067115784, 0.5678199529647827, 0.6021324396133423, 0.6364449262619019, 0.6707574725151062, 0.7050700187683105, 0.7393825054168701, 0.7736949920654297, 0.808007538318634, 0.8423200845718384, 0.876632571220398, 0.9109450578689575, 0.9452576041221619, 0.9795701503753662, 1.0138826370239258]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 1.0, 6.0, 6.0, 7.0, 11.0, 19.0, 15.0, 18.0, 15.0, 17.0, 28.0, 29.0, 39.0, 40.0, 40.0, 34.0, 31.0, 42.0, 38.0, 56.0, 55.0, 52.0, 44.0, 46.0, 39.0, 31.0, 31.0, 34.0, 31.0, 27.0, 19.0, 16.0, 17.0, 15.0, 12.0, 10.0, 10.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9027748107910156, -0.8754429221153259, -0.8481109738349915, -0.8207790851593018, -0.7934471964836121, -0.7661153078079224, -0.7387833595275879, -0.7114514708518982, -0.6841195821762085, -0.6567876935005188, -0.6294557452201843, -0.6021238565444946, -0.5747919678688049, -0.5474600791931152, -0.5201281309127808, -0.49279624223709106, -0.465464323759079, -0.4381324052810669, -0.4108005166053772, -0.3834685981273651, -0.3561367094516754, -0.32880479097366333, -0.30147290229797363, -0.27414098381996155, -0.24680908024311066, -0.21947717666625977, -0.19214527308940887, -0.16481336951255798, -0.1374814510345459, -0.11014954745769501, -0.08281764388084412, -0.055485740303993225, -0.028153836727142334, -0.0008219312876462936, 0.026509974151849747, 0.053841881453990936, 0.08117378503084183, 0.10850569605827332, 0.1358375996351242, 0.1631695032119751, 0.190501406788826, 0.21783331036567688, 0.24516521394252777, 0.27249711751937866, 0.29982903599739075, 0.32716095447540283, 0.35449284315109253, 0.3818247318267822, 0.4091566503047943, 0.4364885687828064, 0.4638204574584961, 0.4911523759365082, 0.5184842944145203, 0.54581618309021, 0.5731480717658997, 0.6004799604415894, 0.6278119087219238, 0.6551437973976135, 0.682475745677948, 0.7098076343536377, 0.7371395230293274, 0.7644714117050171, 0.7918033599853516, 0.8191352486610413, 0.846467137336731]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 20.0, 16.0, 26.0, 38.0, 62.0, 95.0, 142.0, 226.0, 423.0, 645.0, 995.0, 1615.0, 2716.0, 4771.0, 9139.0, 19271.0, 45571.0, 119927.0, 335140.0, 314787.0, 111633.0, 43090.0, 18149.0, 8658.0, 4555.0, 2687.0, 1615.0, 910.0, 597.0, 366.0, 239.0, 164.0, 87.0, 68.0, 44.0, 24.0, 15.0, 5.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.38330078125, -0.3709220886230469, -0.35854339599609375, -0.3461647033691406, -0.3337860107421875, -0.3214073181152344, -0.30902862548828125, -0.2966499328613281, -0.284271240234375, -0.2718925476074219, -0.25951385498046875, -0.24713516235351562, -0.2347564697265625, -0.22237777709960938, -0.20999908447265625, -0.19762039184570312, -0.18524169921875, -0.17286300659179688, -0.16048431396484375, -0.14810562133789062, -0.1357269287109375, -0.12334823608398438, -0.11096954345703125, -0.09859085083007812, -0.086212158203125, -0.07383346557617188, -0.06145477294921875, -0.049076080322265625, -0.0366973876953125, -0.024318695068359375, -0.01194000244140625, 0.000438690185546875, 0.0128173828125, 0.025196075439453125, 0.03757476806640625, 0.049953460693359375, 0.0623321533203125, 0.07471084594726562, 0.08708953857421875, 0.09946823120117188, 0.111846923828125, 0.12422561645507812, 0.13660430908203125, 0.14898300170898438, 0.1613616943359375, 0.17374038696289062, 0.18611907958984375, 0.19849777221679688, 0.21087646484375, 0.22325515747070312, 0.23563385009765625, 0.24801254272460938, 0.2603912353515625, 0.2727699279785156, 0.28514862060546875, 0.2975273132324219, 0.309906005859375, 0.3222846984863281, 0.33466339111328125, 0.3470420837402344, 0.3594207763671875, 0.3717994689941406, 0.38417816162109375, 0.3965568542480469, 0.408935546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 16.0, 13.0, 18.0, 15.0, 23.0, 27.0, 38.0, 33.0, 43.0, 42.0, 41.0, 64.0, 41.0, 50.0, 77.0, 72.0, 38.0, 51.0, 31.0, 39.0, 41.0, 31.0, 25.0, 22.0, 21.0, 12.0, 17.0, 7.0, 13.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.572021484375, -0.55078125, -0.529541015625, -0.50830078125, -0.487060546875, -0.4658203125, -0.444580078125, -0.42333984375, -0.402099609375, -0.380859375, -0.359619140625, -0.33837890625, -0.317138671875, -0.2958984375, -0.274658203125, -0.25341796875, -0.232177734375, -0.2109375, -0.189697265625, -0.16845703125, -0.147216796875, -0.1259765625, -0.104736328125, -0.08349609375, -0.062255859375, -0.041015625, -0.019775390625, 0.00146484375, 0.022705078125, 0.0439453125, 0.065185546875, 0.08642578125, 0.107666015625, 0.12890625, 0.150146484375, 0.17138671875, 0.192626953125, 0.2138671875, 0.235107421875, 0.25634765625, 0.277587890625, 0.298828125, 0.320068359375, 0.34130859375, 0.362548828125, 0.3837890625, 0.405029296875, 0.42626953125, 0.447509765625, 0.46875, 0.489990234375, 0.51123046875, 0.532470703125, 0.5537109375, 0.574951171875, 0.59619140625, 0.617431640625, 0.638671875, 0.659912109375, 0.68115234375, 0.702392578125, 0.7236328125, 0.744873046875, 0.76611328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 4.0, 7.0, 5.0, 4.0, 4.0, 14.0, 14.0, 17.0, 28.0, 43.0, 41.0, 69.0, 106.0, 198.0, 292.0, 513.0, 960.0, 1886.0, 4221.0, 10768.0, 31842.0, 112604.0, 415984.0, 339779.0, 87531.0, 25491.0, 8856.0, 3541.0, 1629.0, 840.0, 482.0, 264.0, 176.0, 103.0, 81.0, 58.0, 21.0, 21.0, 23.0, 9.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.362548828125, -0.3485527038574219, -0.33455657958984375, -0.3205604553222656, -0.3065643310546875, -0.2925682067871094, -0.27857208251953125, -0.2645759582519531, -0.250579833984375, -0.23658370971679688, -0.22258758544921875, -0.20859146118164062, -0.1945953369140625, -0.18059921264648438, -0.16660308837890625, -0.15260696411132812, -0.13861083984375, -0.12461471557617188, -0.11061859130859375, -0.09662246704101562, -0.0826263427734375, -0.06863021850585938, -0.05463409423828125, -0.040637969970703125, -0.026641845703125, -0.012645721435546875, 0.00135040283203125, 0.015346527099609375, 0.0293426513671875, 0.043338775634765625, 0.05733489990234375, 0.07133102416992188, 0.0853271484375, 0.09932327270507812, 0.11331939697265625, 0.12731552124023438, 0.1413116455078125, 0.15530776977539062, 0.16930389404296875, 0.18330001831054688, 0.197296142578125, 0.21129226684570312, 0.22528839111328125, 0.23928451538085938, 0.2532806396484375, 0.2672767639160156, 0.28127288818359375, 0.2952690124511719, 0.30926513671875, 0.3232612609863281, 0.33725738525390625, 0.3512535095214844, 0.3652496337890625, 0.3792457580566406, 0.39324188232421875, 0.4072380065917969, 0.421234130859375, 0.4352302551269531, 0.44922637939453125, 0.4632225036621094, 0.4772186279296875, 0.4912147521972656, 0.5052108764648438, 0.5192070007324219, 0.533203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 9.0, 9.0, 11.0, 13.0, 17.0, 19.0, 22.0, 24.0, 34.0, 14.0, 38.0, 37.0, 44.0, 36.0, 39.0, 52.0, 43.0, 42.0, 54.0, 53.0, 51.0, 42.0, 42.0, 35.0, 31.0, 24.0, 27.0, 23.0, 16.0, 15.0, 17.0, 14.0, 12.0, 8.0, 4.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.203125, -1.1669769287109375, -1.130828857421875, -1.0946807861328125, -1.05853271484375, -1.0223846435546875, -0.986236572265625, -0.9500885009765625, -0.9139404296875, -0.8777923583984375, -0.841644287109375, -0.8054962158203125, -0.76934814453125, -0.7332000732421875, -0.697052001953125, -0.6609039306640625, -0.624755859375, -0.5886077880859375, -0.552459716796875, -0.5163116455078125, -0.48016357421875, -0.4440155029296875, -0.407867431640625, -0.3717193603515625, -0.3355712890625, -0.2994232177734375, -0.263275146484375, -0.2271270751953125, -0.19097900390625, -0.1548309326171875, -0.118682861328125, -0.0825347900390625, -0.04638671875, -0.0102386474609375, 0.025909423828125, 0.0620574951171875, 0.09820556640625, 0.1343536376953125, 0.170501708984375, 0.2066497802734375, 0.2427978515625, 0.2789459228515625, 0.315093994140625, 0.3512420654296875, 0.38739013671875, 0.4235382080078125, 0.459686279296875, 0.4958343505859375, 0.531982421875, 0.5681304931640625, 0.604278564453125, 0.6404266357421875, 0.67657470703125, 0.7127227783203125, 0.748870849609375, 0.7850189208984375, 0.8211669921875, 0.8573150634765625, 0.893463134765625, 0.9296112060546875, 0.96575927734375, 1.0019073486328125, 1.038055419921875, 1.0742034912109375, 1.1103515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 13.0, 15.0, 31.0, 42.0, 72.0, 99.0, 129.0, 240.0, 400.0, 580.0, 1064.0, 1947.0, 4093.0, 8964.0, 23950.0, 89336.0, 517381.0, 312763.0, 56466.0, 17051.0, 6676.0, 3186.0, 1697.0, 896.0, 531.0, 346.0, 165.0, 114.0, 98.0, 76.0, 25.0, 25.0, 18.0, 16.0, 11.0, 10.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.136962890625, -0.13303184509277344, -0.12910079956054688, -0.1251697540283203, -0.12123870849609375, -0.11730766296386719, -0.11337661743164062, -0.10944557189941406, -0.1055145263671875, -0.10158348083496094, -0.09765243530273438, -0.09372138977050781, -0.08979034423828125, -0.08585929870605469, -0.08192825317382812, -0.07799720764160156, -0.074066162109375, -0.07013511657714844, -0.06620407104492188, -0.06227302551269531, -0.05834197998046875, -0.05441093444824219, -0.050479888916015625, -0.04654884338378906, -0.0426177978515625, -0.03868675231933594, -0.034755706787109375, -0.030824661254882812, -0.02689361572265625, -0.022962570190429688, -0.019031524658203125, -0.015100479125976562, -0.01116943359375, -0.0072383880615234375, -0.003307342529296875, 0.0006237030029296875, 0.00455474853515625, 0.008485794067382812, 0.012416839599609375, 0.016347885131835938, 0.0202789306640625, 0.024209976196289062, 0.028141021728515625, 0.03207206726074219, 0.03600311279296875, 0.03993415832519531, 0.043865203857421875, 0.04779624938964844, 0.051727294921875, 0.05565834045410156, 0.059589385986328125, 0.06352043151855469, 0.06745147705078125, 0.07138252258300781, 0.07531356811523438, 0.07924461364746094, 0.0831756591796875, 0.08710670471191406, 0.09103775024414062, 0.09496879577636719, 0.09889984130859375, 0.10283088684082031, 0.10676193237304688, 0.11069297790527344, 0.1146240234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 10.0, 10.0, 19.0, 36.0, 57.0, 87.0, 206.0, 222.0, 139.0, 67.0, 44.0, 28.0, 22.0, 11.0, 8.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014293193817138672, -0.00013820268213748932, -0.00013347342610359192, -0.00012874417006969452, -0.00012401491403579712, -0.00011928565800189972, -0.00011455640196800232, -0.00010982714593410492, -0.00010509788990020752, -0.00010036863386631012, -9.563937783241272e-05, -9.091012179851532e-05, -8.618086576461792e-05, -8.145160973072052e-05, -7.672235369682312e-05, -7.199309766292572e-05, -6.726384162902832e-05, -6.253458559513092e-05, -5.780532956123352e-05, -5.307607352733612e-05, -4.834681749343872e-05, -4.361756145954132e-05, -3.888830542564392e-05, -3.415904939174652e-05, -2.942979335784912e-05, -2.470053732395172e-05, -1.997128129005432e-05, -1.5242025256156921e-05, -1.0512769222259521e-05, -5.783513188362122e-06, -1.0542571544647217e-06, 3.6749988794326782e-06, 8.404254913330078e-06, 1.3133510947227478e-05, 1.7862766981124878e-05, 2.2592023015022278e-05, 2.7321279048919678e-05, 3.205053508281708e-05, 3.677979111671448e-05, 4.150904715061188e-05, 4.623830318450928e-05, 5.096755921840668e-05, 5.569681525230408e-05, 6.042607128620148e-05, 6.515532732009888e-05, 6.988458335399628e-05, 7.461383938789368e-05, 7.934309542179108e-05, 8.407235145568848e-05, 8.880160748958588e-05, 9.353086352348328e-05, 9.826011955738068e-05, 0.00010298937559127808, 0.00010771863162517548, 0.00011244788765907288, 0.00011717714369297028, 0.00012190639972686768, 0.00012663565576076508, 0.00013136491179466248, 0.00013609416782855988, 0.00014082342386245728, 0.00014555267989635468, 0.00015028193593025208, 0.00015501119196414948, 0.00015974044799804688]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 0.0, 6.0, 4.0, 6.0, 11.0, 15.0, 25.0, 36.0, 95.0, 378.0, 3778.0, 362844.0, 675811.0, 4887.0, 457.0, 104.0, 41.0, 17.0, 10.0, 5.0, 5.0, 3.0, 7.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57666015625, -0.5606613159179688, -0.5446624755859375, -0.5286636352539062, -0.512664794921875, -0.49666595458984375, -0.4806671142578125, -0.46466827392578125, -0.44866943359375, -0.43267059326171875, -0.4166717529296875, -0.40067291259765625, -0.384674072265625, -0.36867523193359375, -0.3526763916015625, -0.33667755126953125, -0.3206787109375, -0.30467987060546875, -0.2886810302734375, -0.27268218994140625, -0.256683349609375, -0.24068450927734375, -0.2246856689453125, -0.20868682861328125, -0.19268798828125, -0.17668914794921875, -0.1606903076171875, -0.14469146728515625, -0.128692626953125, -0.11269378662109375, -0.0966949462890625, -0.08069610595703125, -0.064697265625, -0.04869842529296875, -0.0326995849609375, -0.01670074462890625, -0.000701904296875, 0.01529693603515625, 0.0312957763671875, 0.04729461669921875, 0.06329345703125, 0.07929229736328125, 0.0952911376953125, 0.11128997802734375, 0.127288818359375, 0.14328765869140625, 0.1592864990234375, 0.17528533935546875, 0.1912841796875, 0.20728302001953125, 0.2232818603515625, 0.23928070068359375, 0.255279541015625, 0.27127838134765625, 0.2872772216796875, 0.30327606201171875, 0.31927490234375, 0.33527374267578125, 0.3512725830078125, 0.36727142333984375, 0.383270263671875, 0.39926910400390625, 0.4152679443359375, 0.43126678466796875, 0.447265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 3.0, 9.0, 11.0, 13.0, 11.0, 17.0, 26.0, 28.0, 31.0, 56.0, 57.0, 72.0, 95.0, 103.0, 101.0, 82.0, 68.0, 44.0, 39.0, 30.0, 29.0, 17.0, 12.0, 11.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.038238525390625, -0.03713035583496094, -0.036022186279296875, -0.03491401672363281, -0.03380584716796875, -0.03269767761230469, -0.031589508056640625, -0.030481338500976562, -0.0293731689453125, -0.028264999389648438, -0.027156829833984375, -0.026048660278320312, -0.02494049072265625, -0.023832321166992188, -0.022724151611328125, -0.021615982055664062, -0.0205078125, -0.019399642944335938, -0.018291473388671875, -0.017183303833007812, -0.01607513427734375, -0.014966964721679688, -0.013858795166015625, -0.012750625610351562, -0.0116424560546875, -0.010534286499023438, -0.009426116943359375, -0.008317947387695312, -0.00720977783203125, -0.0061016082763671875, -0.004993438720703125, -0.0038852691650390625, -0.002777099609375, -0.0016689300537109375, -0.000560760498046875, 0.0005474090576171875, 0.00165557861328125, 0.0027637481689453125, 0.003871917724609375, 0.0049800872802734375, 0.0060882568359375, 0.0071964263916015625, 0.008304595947265625, 0.009412765502929688, 0.01052093505859375, 0.011629104614257812, 0.012737274169921875, 0.013845443725585938, 0.01495361328125, 0.016061782836914062, 0.017169952392578125, 0.018278121948242188, 0.01938629150390625, 0.020494461059570312, 0.021602630615234375, 0.022710800170898438, 0.0238189697265625, 0.024927139282226562, 0.026035308837890625, 0.027143478393554688, 0.02825164794921875, 0.029359817504882812, 0.030467987060546875, 0.03157615661621094, 0.032684326171875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 5.0, 4.0, 8.0, 12.0, 15.0, 28.0, 22.0, 49.0, 64.0, 110.0, 118.0, 134.0, 144.0, 104.0, 54.0, 34.0, 33.0, 14.0, 12.0, 9.0, 13.0, 9.0, 0.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.387607455253601, -1.3575772047042847, -1.3275469541549683, -1.2975167036056519, -1.2674864530563354, -1.2374560832977295, -1.207425832748413, -1.1773955821990967, -1.1473653316497803, -1.1173350811004639, -1.0873048305511475, -1.057274580001831, -1.0272443294525146, -0.9972140192985535, -0.9671837687492371, -0.9371535181999207, -0.9071232676506042, -0.8770930171012878, -0.8470627665519714, -0.8170324563980103, -0.7870022058486938, -0.7569719552993774, -0.726941704750061, -0.6969114542007446, -0.6668812036514282, -0.6368509531021118, -0.6068207025527954, -0.576790452003479, -0.5467601418495178, -0.5167298913002014, -0.486699640750885, -0.4566693902015686, -0.4266391396522522, -0.3966088891029358, -0.366578608751297, -0.3365483582019806, -0.3065180778503418, -0.2764878273010254, -0.24645757675170898, -0.21642731130123138, -0.18639704585075378, -0.15636678040027618, -0.12633651494979858, -0.09630626440048218, -0.06627599895000458, -0.03624573349952698, -0.006215482950210571, 0.02381478250026703, 0.05384504795074463, 0.08387531340122223, 0.11390557140111923, 0.14393582940101624, 0.17396609485149384, 0.20399636030197144, 0.23402661085128784, 0.26405686140060425, 0.29408714175224304, 0.32411739230155945, 0.35414767265319824, 0.38417792320251465, 0.41420817375183105, 0.44423845410346985, 0.47426870465278625, 0.504298985004425, 0.5343292355537415]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 9.0, 8.0, 9.0, 12.0, 24.0, 22.0, 24.0, 44.0, 32.0, 61.0, 54.0, 54.0, 58.0, 67.0, 77.0, 62.0, 76.0, 48.0, 47.0, 41.0, 44.0, 32.0, 23.0, 24.0, 17.0, 14.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5779840350151062, -0.5522323846817017, -0.5264807343482971, -0.5007290840148926, -0.47497737407684326, -0.4492257237434387, -0.4234740734100342, -0.39772242307662964, -0.3719707429409027, -0.34621909260749817, -0.32046741247177124, -0.2947157621383667, -0.26896411180496216, -0.24321243166923523, -0.2174607813358307, -0.19170911610126495, -0.16595745086669922, -0.14020578563213348, -0.11445412784814835, -0.08870247006416321, -0.06295080482959747, -0.03719913959503174, -0.011447489261627197, 0.014304175972938538, 0.04005584120750427, 0.06580750644207001, 0.09155916422605515, 0.11731082201004028, 0.14306248724460602, 0.16881415247917175, 0.1945658028125763, 0.22031746804714203, 0.246069073677063, 0.27182072401046753, 0.29757240414619446, 0.323324054479599, 0.3490757346153259, 0.37482738494873047, 0.400579035282135, 0.42633068561553955, 0.4520823657512665, 0.477834016084671, 0.503585696220398, 0.5293373465538025, 0.555088996887207, 0.5808407068252563, 0.6065922975540161, 0.6323440074920654, 0.65809565782547, 0.6838473081588745, 0.709598958492279, 0.7353506088256836, 0.7611023187637329, 0.7868539690971375, 0.812605619430542, 0.8383572697639465, 0.8641089200973511, 0.8898605704307556, 0.9156122207641602, 0.9413639307022095, 0.967115581035614, 0.9928672313690186, 1.0186188220977783, 1.0443705320358276, 1.070122241973877]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 6.0, 7.0, 17.0, 16.0, 19.0, 37.0, 32.0, 43.0, 90.0, 131.0, 242.0, 393.0, 714.0, 1396.0, 2914.0, 6897.0, 19594.0, 92511.0, 713508.0, 166407.0, 27210.0, 8936.0, 3634.0, 1701.0, 884.0, 466.0, 269.0, 145.0, 107.0, 68.0, 42.0, 32.0, 16.0, 16.0, 19.0, 8.0, 9.0, 1.0, 2.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.630859375, -0.60882568359375, -0.5867919921875, -0.56475830078125, -0.542724609375, -0.52069091796875, -0.4986572265625, -0.47662353515625, -0.45458984375, -0.43255615234375, -0.4105224609375, -0.38848876953125, -0.366455078125, -0.34442138671875, -0.3223876953125, -0.30035400390625, -0.2783203125, -0.25628662109375, -0.2342529296875, -0.21221923828125, -0.190185546875, -0.16815185546875, -0.1461181640625, -0.12408447265625, -0.10205078125, -0.08001708984375, -0.0579833984375, -0.03594970703125, -0.013916015625, 0.00811767578125, 0.0301513671875, 0.05218505859375, 0.07421875, 0.09625244140625, 0.1182861328125, 0.14031982421875, 0.162353515625, 0.18438720703125, 0.2064208984375, 0.22845458984375, 0.25048828125, 0.27252197265625, 0.2945556640625, 0.31658935546875, 0.338623046875, 0.36065673828125, 0.3826904296875, 0.40472412109375, 0.4267578125, 0.44879150390625, 0.4708251953125, 0.49285888671875, 0.514892578125, 0.53692626953125, 0.5589599609375, 0.58099365234375, 0.60302734375, 0.62506103515625, 0.6470947265625, 0.66912841796875, 0.691162109375, 0.71319580078125, 0.7352294921875, 0.75726318359375, 0.779296875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 6.0, 6.0, 6.0, 10.0, 17.0, 17.0, 12.0, 21.0, 26.0, 23.0, 37.0, 41.0, 41.0, 45.0, 51.0, 57.0, 60.0, 62.0, 65.0, 59.0, 52.0, 55.0, 37.0, 34.0, 24.0, 31.0, 16.0, 22.0, 17.0, 15.0, 8.0, 6.0, 6.0, 7.0, 6.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7099609375, -1.6418609619140625, -1.573760986328125, -1.5056610107421875, -1.43756103515625, -1.3694610595703125, -1.301361083984375, -1.2332611083984375, -1.1651611328125, -1.0970611572265625, -1.028961181640625, -0.9608612060546875, -0.89276123046875, -0.8246612548828125, -0.756561279296875, -0.6884613037109375, -0.620361328125, -0.5522613525390625, -0.484161376953125, -0.4160614013671875, -0.34796142578125, -0.2798614501953125, -0.211761474609375, -0.1436614990234375, -0.0755615234375, -0.0074615478515625, 0.060638427734375, 0.1287384033203125, 0.19683837890625, 0.2649383544921875, 0.333038330078125, 0.4011383056640625, 0.46923828125, 0.5373382568359375, 0.605438232421875, 0.6735382080078125, 0.74163818359375, 0.8097381591796875, 0.877838134765625, 0.9459381103515625, 1.0140380859375, 1.0821380615234375, 1.150238037109375, 1.2183380126953125, 1.28643798828125, 1.3545379638671875, 1.422637939453125, 1.4907379150390625, 1.558837890625, 1.6269378662109375, 1.695037841796875, 1.7631378173828125, 1.83123779296875, 1.8993377685546875, 1.967437744140625, 2.0355377197265625, 2.1036376953125, 2.1717376708984375, 2.239837646484375, 2.3079376220703125, 2.37603759765625, 2.4441375732421875, 2.512237548828125, 2.5803375244140625, 2.6484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 3.0, 8.0, 7.0, 7.0, 8.0, 10.0, 12.0, 19.0, 25.0, 33.0, 27.0, 47.0, 54.0, 60.0, 86.0, 153.0, 679.0, 1016858.0, 29690.0, 296.0, 114.0, 80.0, 62.0, 37.0, 41.0, 27.0, 22.0, 14.0, 21.0, 10.0, 11.0, 6.0, 12.0, 3.0, 1.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.7421875, -6.54290771484375, -6.3436279296875, -6.14434814453125, -5.945068359375, -5.74578857421875, -5.5465087890625, -5.34722900390625, -5.14794921875, -4.94866943359375, -4.7493896484375, -4.55010986328125, -4.350830078125, -4.15155029296875, -3.9522705078125, -3.75299072265625, -3.5537109375, -3.35443115234375, -3.1551513671875, -2.95587158203125, -2.756591796875, -2.55731201171875, -2.3580322265625, -2.15875244140625, -1.95947265625, -1.76019287109375, -1.5609130859375, -1.36163330078125, -1.162353515625, -0.96307373046875, -0.7637939453125, -0.56451416015625, -0.365234375, -0.16595458984375, 0.0333251953125, 0.23260498046875, 0.431884765625, 0.63116455078125, 0.8304443359375, 1.02972412109375, 1.22900390625, 1.42828369140625, 1.6275634765625, 1.82684326171875, 2.026123046875, 2.22540283203125, 2.4246826171875, 2.62396240234375, 2.8232421875, 3.02252197265625, 3.2218017578125, 3.42108154296875, 3.620361328125, 3.81964111328125, 4.0189208984375, 4.21820068359375, 4.41748046875, 4.61676025390625, 4.8160400390625, 5.01531982421875, 5.214599609375, 5.41387939453125, 5.6131591796875, 5.81243896484375, 6.01171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 5.0, 12.0, 12.0, 13.0, 18.0, 20.0, 31.0, 33.0, 40.0, 36.0, 47.0, 63.0, 44.0, 70.0, 70.0, 54.0, 58.0, 51.0, 55.0, 40.0, 34.0, 35.0, 25.0, 22.0, 17.0, 20.0, 14.0, 7.0, 11.0, 8.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.654296875, -2.5758056640625, -2.497314453125, -2.4188232421875, -2.34033203125, -2.2618408203125, -2.183349609375, -2.1048583984375, -2.0263671875, -1.9478759765625, -1.869384765625, -1.7908935546875, -1.71240234375, -1.6339111328125, -1.555419921875, -1.4769287109375, -1.3984375, -1.3199462890625, -1.241455078125, -1.1629638671875, -1.08447265625, -1.0059814453125, -0.927490234375, -0.8489990234375, -0.7705078125, -0.6920166015625, -0.613525390625, -0.5350341796875, -0.45654296875, -0.3780517578125, -0.299560546875, -0.2210693359375, -0.142578125, -0.0640869140625, 0.014404296875, 0.0928955078125, 0.17138671875, 0.2498779296875, 0.328369140625, 0.4068603515625, 0.4853515625, 0.5638427734375, 0.642333984375, 0.7208251953125, 0.79931640625, 0.8778076171875, 0.956298828125, 1.0347900390625, 1.11328125, 1.1917724609375, 1.270263671875, 1.3487548828125, 1.42724609375, 1.5057373046875, 1.584228515625, 1.6627197265625, 1.7412109375, 1.8197021484375, 1.898193359375, 1.9766845703125, 2.05517578125, 2.1336669921875, 2.212158203125, 2.2906494140625, 2.369140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 2.0, 3.0, 12.0, 18.0, 24.0, 34.0, 75.0, 210.0, 510.0, 1650.0, 8389.0, 263164.0, 761856.0, 9779.0, 1839.0, 565.0, 218.0, 84.0, 35.0, 21.0, 9.0, 7.0, 8.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.4296875, -1.38641357421875, -1.3431396484375, -1.29986572265625, -1.256591796875, -1.21331787109375, -1.1700439453125, -1.12677001953125, -1.08349609375, -1.04022216796875, -0.9969482421875, -0.95367431640625, -0.910400390625, -0.86712646484375, -0.8238525390625, -0.78057861328125, -0.7373046875, -0.69403076171875, -0.6507568359375, -0.60748291015625, -0.564208984375, -0.52093505859375, -0.4776611328125, -0.43438720703125, -0.39111328125, -0.34783935546875, -0.3045654296875, -0.26129150390625, -0.218017578125, -0.17474365234375, -0.1314697265625, -0.08819580078125, -0.044921875, -0.00164794921875, 0.0416259765625, 0.08489990234375, 0.128173828125, 0.17144775390625, 0.2147216796875, 0.25799560546875, 0.30126953125, 0.34454345703125, 0.3878173828125, 0.43109130859375, 0.474365234375, 0.51763916015625, 0.5609130859375, 0.60418701171875, 0.6474609375, 0.69073486328125, 0.7340087890625, 0.77728271484375, 0.820556640625, 0.86383056640625, 0.9071044921875, 0.95037841796875, 0.99365234375, 1.03692626953125, 1.0802001953125, 1.12347412109375, 1.166748046875, 1.21002197265625, 1.2532958984375, 1.29656982421875, 1.33984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 16.0, 20.0, 39.0, 76.0, 447.0, 251.0, 36.0, 35.0, 18.0, 16.0, 6.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.572505950927734e-05, -9.153783321380615e-05, -8.735060691833496e-05, -8.316338062286377e-05, -7.897615432739258e-05, -7.478892803192139e-05, -7.06017017364502e-05, -6.6414475440979e-05, -6.222724914550781e-05, -5.804002285003662e-05, -5.385279655456543e-05, -4.966557025909424e-05, -4.547834396362305e-05, -4.1291117668151855e-05, -3.7103891372680664e-05, -3.291666507720947e-05, -2.872943878173828e-05, -2.454221248626709e-05, -2.03549861907959e-05, -1.6167759895324707e-05, -1.1980533599853516e-05, -7.793307304382324e-06, -3.606081008911133e-06, 5.811452865600586e-07, 4.76837158203125e-06, 8.955597877502441e-06, 1.3142824172973633e-05, 1.7330050468444824e-05, 2.1517276763916016e-05, 2.5704503059387207e-05, 2.98917293548584e-05, 3.407895565032959e-05, 3.826618194580078e-05, 4.245340824127197e-05, 4.6640634536743164e-05, 5.0827860832214355e-05, 5.501508712768555e-05, 5.920231342315674e-05, 6.338953971862793e-05, 6.757676601409912e-05, 7.176399230957031e-05, 7.59512186050415e-05, 8.01384449005127e-05, 8.432567119598389e-05, 8.851289749145508e-05, 9.270012378692627e-05, 9.688735008239746e-05, 0.00010107457637786865, 0.00010526180267333984, 0.00010944902896881104, 0.00011363625526428223, 0.00011782348155975342, 0.00012201070785522461, 0.0001261979341506958, 0.000130385160446167, 0.00013457238674163818, 0.00013875961303710938, 0.00014294683933258057, 0.00014713406562805176, 0.00015132129192352295, 0.00015550851821899414, 0.00015969574451446533, 0.00016388297080993652, 0.00016807019710540771, 0.0001722574234008789]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 2.0, 4.0, 6.0, 7.0, 12.0, 14.0, 12.0, 20.0, 34.0, 101.0, 511.0, 5873.0, 975877.0, 63523.0, 2058.0, 300.0, 77.0, 23.0, 15.0, 20.0, 10.0, 6.0, 6.0, 8.0, 6.0, 6.0, 6.0, 2.0, 8.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.287109375, -2.22662353515625, -2.1661376953125, -2.10565185546875, -2.045166015625, -1.98468017578125, -1.9241943359375, -1.86370849609375, -1.80322265625, -1.74273681640625, -1.6822509765625, -1.62176513671875, -1.561279296875, -1.50079345703125, -1.4403076171875, -1.37982177734375, -1.3193359375, -1.25885009765625, -1.1983642578125, -1.13787841796875, -1.077392578125, -1.01690673828125, -0.9564208984375, -0.89593505859375, -0.83544921875, -0.77496337890625, -0.7144775390625, -0.65399169921875, -0.593505859375, -0.53302001953125, -0.4725341796875, -0.41204833984375, -0.3515625, -0.29107666015625, -0.2305908203125, -0.17010498046875, -0.109619140625, -0.04913330078125, 0.0113525390625, 0.07183837890625, 0.13232421875, 0.19281005859375, 0.2532958984375, 0.31378173828125, 0.374267578125, 0.43475341796875, 0.4952392578125, 0.55572509765625, 0.6162109375, 0.67669677734375, 0.7371826171875, 0.79766845703125, 0.858154296875, 0.91864013671875, 0.9791259765625, 1.03961181640625, 1.10009765625, 1.16058349609375, 1.2210693359375, 1.28155517578125, 1.342041015625, 1.40252685546875, 1.4630126953125, 1.52349853515625, 1.583984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 8.0, 5.0, 6.0, 7.0, 4.0, 6.0, 11.0, 11.0, 15.0, 12.0, 12.0, 29.0, 57.0, 99.0, 264.0, 206.0, 96.0, 43.0, 19.0, 20.0, 14.0, 10.0, 8.0, 13.0, 7.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1787109375, -0.17230224609375, -0.1658935546875, -0.15948486328125, -0.153076171875, -0.14666748046875, -0.1402587890625, -0.13385009765625, -0.12744140625, -0.12103271484375, -0.1146240234375, -0.10821533203125, -0.101806640625, -0.09539794921875, -0.0889892578125, -0.08258056640625, -0.076171875, -0.06976318359375, -0.0633544921875, -0.05694580078125, -0.050537109375, -0.04412841796875, -0.0377197265625, -0.03131103515625, -0.02490234375, -0.01849365234375, -0.0120849609375, -0.00567626953125, 0.000732421875, 0.00714111328125, 0.0135498046875, 0.01995849609375, 0.0263671875, 0.03277587890625, 0.0391845703125, 0.04559326171875, 0.052001953125, 0.05841064453125, 0.0648193359375, 0.07122802734375, 0.07763671875, 0.08404541015625, 0.0904541015625, 0.09686279296875, 0.103271484375, 0.10968017578125, 0.1160888671875, 0.12249755859375, 0.12890625, 0.13531494140625, 0.1417236328125, 0.14813232421875, 0.154541015625, 0.16094970703125, 0.1673583984375, 0.17376708984375, 0.18017578125, 0.18658447265625, 0.1929931640625, 0.19940185546875, 0.205810546875, 0.21221923828125, 0.2186279296875, 0.22503662109375, 0.2314453125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 10.0, 46.0, 122.0, 449.0, 287.0, 74.0, 20.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5340017080307007, -1.306362271308899, -1.0787227153778076, -0.8510832786560059, -0.6234438419342041, -0.39580440521240234, -0.16816484928131104, 0.05947458744049072, 0.2871140241622925, 0.5147534608840942, 0.7423929572105408, 0.9700324535369873, 1.197671890258789, 1.4253113269805908, 1.6529508829116821, 1.8805903196334839, 2.108229637145996, 2.335869073867798, 2.5635085105895996, 2.7911481857299805, 3.018787384033203, 3.246427059173584, 3.4740664958953857, 3.7017059326171875, 3.9293456077575684, 4.156985282897949, 4.384624481201172, 4.612264156341553, 4.839903354644775, 5.067543029785156, 5.295182228088379, 5.52282190322876, 5.750461578369141, 5.9781012535095215, 6.205740451812744, 6.433380126953125, 6.661019325256348, 6.8886590003967285, 7.116298675537109, 7.343937873840332, 7.571577072143555, 7.7992167472839355, 8.026856422424316, 8.254495620727539, 8.482134819030762, 8.709774017333984, 8.937414169311523, 9.165053367614746, 9.392692565917969, 9.620331764221191, 9.84797191619873, 10.075611114501953, 10.303250312805176, 10.530889511108398, 10.758529663085938, 10.98616886138916, 11.2138090133667, 11.441448211669922, 11.669088363647461, 11.896727561950684, 12.124366760253906, 12.352005958557129, 12.579646110534668, 12.80728530883789, 13.034924507141113]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 9.0, 15.0, 13.0, 17.0, 13.0, 16.0, 17.0, 18.0, 19.0, 25.0, 27.0, 26.0, 29.0, 30.0, 31.0, 41.0, 38.0, 44.0, 40.0, 36.0, 38.0, 37.0, 41.0, 45.0, 36.0, 37.0, 34.0, 28.0, 35.0, 21.0, 22.0, 13.0, 16.0, 17.0, 3.0, 12.0, 6.0, 10.0, 6.0, 7.0, 7.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.6897172927856445, -2.6114749908447266, -2.5332324504852295, -2.4549901485443115, -2.3767476081848145, -2.2985053062438965, -2.2202630043029785, -2.1420204639434814, -2.0637781620025635, -1.985535740852356, -1.9072933197021484, -1.8290510177612305, -1.750808596611023, -1.6725661754608154, -1.594323754310608, -1.5160813331604004, -1.4378389120101929, -1.3595964908599854, -1.2813540697097778, -1.2031116485595703, -1.1248693466186523, -1.0466269254684448, -0.9683845043182373, -0.8901421427726746, -0.811899721622467, -0.7336573004722595, -0.6554149389266968, -0.5771725177764893, -0.4989301264286041, -0.420687735080719, -0.3424453139305115, -0.26420295238494873, -0.1859605312347412, -0.10771813243627548, -0.029475733637809753, 0.04876667261123657, 0.1270090639591217, 0.20525145530700684, 0.28349387645721436, 0.3617362380027771, 0.4399786591529846, 0.5182210803031921, 0.5964634418487549, 0.6747058629989624, 0.7529482841491699, 0.8311906456947327, 0.9094330668449402, 0.9876754283905029, 1.0659178495407104, 1.144160270690918, 1.2224026918411255, 1.300645112991333, 1.378887414932251, 1.4571298360824585, 1.535372257232666, 1.613614559173584, 1.691857099533081, 1.7700995206832886, 1.848341941833496, 1.926584243774414, 2.004826784133911, 2.083069086074829, 2.161311626434326, 2.239553928375244, 2.317796230316162]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 6.0, 16.0, 26.0, 25.0, 35.0, 62.0, 145.0, 318.0, 1354.0, 10124.0, 1093963.0, 3069249.0, 16108.0, 2001.0, 428.0, 152.0, 87.0, 51.0, 33.0, 28.0, 20.0, 9.0, 15.0, 5.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.66796875, -4.53863525390625, -4.4093017578125, -4.27996826171875, -4.150634765625, -4.02130126953125, -3.8919677734375, -3.76263427734375, -3.63330078125, -3.50396728515625, -3.3746337890625, -3.24530029296875, -3.115966796875, -2.98663330078125, -2.8572998046875, -2.72796630859375, -2.5986328125, -2.46929931640625, -2.3399658203125, -2.21063232421875, -2.081298828125, -1.95196533203125, -1.8226318359375, -1.69329833984375, -1.56396484375, -1.43463134765625, -1.3052978515625, -1.17596435546875, -1.046630859375, -0.91729736328125, -0.7879638671875, -0.65863037109375, -0.529296875, -0.39996337890625, -0.2706298828125, -0.14129638671875, -0.011962890625, 0.11737060546875, 0.2467041015625, 0.37603759765625, 0.50537109375, 0.63470458984375, 0.7640380859375, 0.89337158203125, 1.022705078125, 1.15203857421875, 1.2813720703125, 1.41070556640625, 1.5400390625, 1.66937255859375, 1.7987060546875, 1.92803955078125, 2.057373046875, 2.18670654296875, 2.3160400390625, 2.44537353515625, 2.57470703125, 2.70404052734375, 2.8333740234375, 2.96270751953125, 3.092041015625, 3.22137451171875, 3.3507080078125, 3.48004150390625, 3.609375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 6.0, 4.0, 8.0, 7.0, 7.0, 17.0, 14.0, 25.0, 17.0, 21.0, 32.0, 30.0, 33.0, 40.0, 42.0, 42.0, 32.0, 50.0, 48.0, 46.0, 50.0, 44.0, 38.0, 33.0, 35.0, 34.0, 27.0, 44.0, 31.0, 28.0, 20.0, 13.0, 16.0, 19.0, 12.0, 11.0, 5.0, 7.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6240234375, -0.6037979125976562, -0.5835723876953125, -0.5633468627929688, -0.543121337890625, -0.5228958129882812, -0.5026702880859375, -0.48244476318359375, -0.46221923828125, -0.44199371337890625, -0.4217681884765625, -0.40154266357421875, -0.381317138671875, -0.36109161376953125, -0.3408660888671875, -0.32064056396484375, -0.3004150390625, -0.28018951416015625, -0.2599639892578125, -0.23973846435546875, -0.219512939453125, -0.19928741455078125, -0.1790618896484375, -0.15883636474609375, -0.13861083984375, -0.11838531494140625, -0.0981597900390625, -0.07793426513671875, -0.057708740234375, -0.03748321533203125, -0.0172576904296875, 0.00296783447265625, 0.023193359375, 0.04341888427734375, 0.0636444091796875, 0.08386993408203125, 0.104095458984375, 0.12432098388671875, 0.1445465087890625, 0.16477203369140625, 0.18499755859375, 0.20522308349609375, 0.2254486083984375, 0.24567413330078125, 0.265899658203125, 0.28612518310546875, 0.3063507080078125, 0.32657623291015625, 0.3468017578125, 0.36702728271484375, 0.3872528076171875, 0.40747833251953125, 0.427703857421875, 0.44792938232421875, 0.4681549072265625, 0.48838043212890625, 0.50860595703125, 0.5288314819335938, 0.5490570068359375, 0.5692825317382812, 0.589508056640625, 0.6097335815429688, 0.6299591064453125, 0.6501846313476562, 0.67041015625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 7.0, 8.0, 19.0, 29.0, 101.0, 307.0, 3158.0, 4175546.0, 14403.0, 502.0, 123.0, 48.0, 21.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.69427490234375, -14.3651123046875, -14.03594970703125, -13.706787109375, -13.37762451171875, -13.0484619140625, -12.71929931640625, -12.39013671875, -12.06097412109375, -11.7318115234375, -11.40264892578125, -11.073486328125, -10.74432373046875, -10.4151611328125, -10.08599853515625, -9.7568359375, -9.42767333984375, -9.0985107421875, -8.76934814453125, -8.440185546875, -8.11102294921875, -7.7818603515625, -7.45269775390625, -7.12353515625, -6.79437255859375, -6.4652099609375, -6.13604736328125, -5.806884765625, -5.47772216796875, -5.1485595703125, -4.81939697265625, -4.490234375, -4.16107177734375, -3.8319091796875, -3.50274658203125, -3.173583984375, -2.84442138671875, -2.5152587890625, -2.18609619140625, -1.85693359375, -1.52777099609375, -1.1986083984375, -0.86944580078125, -0.540283203125, -0.21112060546875, 0.1180419921875, 0.44720458984375, 0.7763671875, 1.10552978515625, 1.4346923828125, 1.76385498046875, 2.093017578125, 2.42218017578125, 2.7513427734375, 3.08050537109375, 3.40966796875, 3.73883056640625, 4.0679931640625, 4.39715576171875, 4.726318359375, 5.05548095703125, 5.3846435546875, 5.71380615234375, 6.04296875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 7.0, 5.0, 9.0, 12.0, 9.0, 15.0, 13.0, 27.0, 32.0, 24.0, 54.0, 75.0, 84.0, 146.0, 240.0, 334.0, 514.0, 670.0, 554.0, 435.0, 249.0, 144.0, 85.0, 69.0, 50.0, 44.0, 26.0, 19.0, 17.0, 15.0, 15.0, 13.0, 10.0, 5.0, 6.0, 7.0, 4.0, 5.0, 2.0, 3.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27783203125, -0.2681465148925781, -0.25846099853515625, -0.24877548217773438, -0.2390899658203125, -0.22940444946289062, -0.21971893310546875, -0.21003341674804688, -0.200347900390625, -0.19066238403320312, -0.18097686767578125, -0.17129135131835938, -0.1616058349609375, -0.15192031860351562, -0.14223480224609375, -0.13254928588867188, -0.12286376953125, -0.11317825317382812, -0.10349273681640625, -0.09380722045898438, -0.0841217041015625, -0.07443618774414062, -0.06475067138671875, -0.055065155029296875, -0.045379638671875, -0.035694122314453125, -0.02600860595703125, -0.016323089599609375, -0.0066375732421875, 0.003047943115234375, 0.01273345947265625, 0.022418975830078125, 0.0321044921875, 0.041790008544921875, 0.05147552490234375, 0.061161041259765625, 0.0708465576171875, 0.08053207397460938, 0.09021759033203125, 0.09990310668945312, 0.109588623046875, 0.11927413940429688, 0.12895965576171875, 0.13864517211914062, 0.1483306884765625, 0.15801620483398438, 0.16770172119140625, 0.17738723754882812, 0.18707275390625, 0.19675827026367188, 0.20644378662109375, 0.21612930297851562, 0.2258148193359375, 0.23550033569335938, 0.24518585205078125, 0.2548713684082031, 0.264556884765625, 0.2742424011230469, 0.28392791748046875, 0.2936134338378906, 0.3032989501953125, 0.3129844665527344, 0.32266998291015625, 0.3323554992675781, 0.342041015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 7.0, 3.0, 4.0, 5.0, 19.0, 18.0, 32.0, 23.0, 35.0, 41.0, 65.0, 76.0, 92.0, 116.0, 115.0, 81.0, 60.0, 44.0, 34.0, 36.0, 15.0, 16.0, 14.0, 10.0, 10.0, 5.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8767918348312378, -0.8426021933555603, -0.8084125518798828, -0.7742229104042053, -0.7400332689285278, -0.7058435678482056, -0.6716539263725281, -0.6374642848968506, -0.6032746434211731, -0.5690850019454956, -0.5348953604698181, -0.5007057189941406, -0.46651604771614075, -0.43232640624046326, -0.3981367349624634, -0.3639470934867859, -0.3297574520111084, -0.2955678105354309, -0.2613781690597534, -0.22718849778175354, -0.19299885630607605, -0.15880921483039856, -0.12461955845355988, -0.09042990207672119, -0.0562402606010437, -0.022050611674785614, 0.012139037251472473, 0.04632868617773056, 0.08051833510398865, 0.11470797657966614, 0.14889763295650482, 0.1830872893333435, 0.21727705001831055, 0.25146669149398804, 0.2856563329696655, 0.3198460042476654, 0.3540356457233429, 0.3882252871990204, 0.42241495847702026, 0.45660459995269775, 0.49079424142837524, 0.5249838829040527, 0.5591735243797302, 0.5933631658554077, 0.62755286693573, 0.6617424488067627, 0.695932149887085, 0.7301217913627625, 0.7643114328384399, 0.7985010743141174, 0.8326907157897949, 0.8668803572654724, 0.9010699987411499, 0.9352596998214722, 0.9694493412971497, 1.0036389827728271, 1.0378286838531494, 1.0720183849334717, 1.1062079668045044, 1.1403976678848267, 1.1745872497558594, 1.2087769508361816, 1.2429665327072144, 1.2771562337875366, 1.3113458156585693]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 2.0, 9.0, 8.0, 7.0, 8.0, 9.0, 11.0, 15.0, 15.0, 20.0, 23.0, 28.0, 40.0, 25.0, 31.0, 31.0, 34.0, 42.0, 37.0, 33.0, 37.0, 39.0, 35.0, 45.0, 42.0, 36.0, 46.0, 39.0, 32.0, 23.0, 25.0, 27.0, 16.0, 16.0, 17.0, 22.0, 17.0, 6.0, 13.0, 11.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6731864213943481, -0.6533223390579224, -0.6334582567214966, -0.6135942339897156, -0.5937301516532898, -0.573866069316864, -0.5540019869804382, -0.5341379046440125, -0.5142738819122314, -0.49440979957580566, -0.47454574704170227, -0.4546816647052765, -0.4348176121711731, -0.4149535298347473, -0.39508944749832153, -0.37522536516189575, -0.35536128282546997, -0.3354972004890442, -0.3156331479549408, -0.295769065618515, -0.2759050130844116, -0.25604093074798584, -0.23617684841156006, -0.21631278097629547, -0.19644871354103088, -0.1765846461057663, -0.1567205786705017, -0.13685649633407593, -0.11699242889881134, -0.09712836146354675, -0.07726428657770157, -0.057400211691856384, -0.03753608465194702, -0.017672013491392136, 0.0021920576691627502, 0.022056128829717636, 0.04192019999027252, 0.06178426742553711, 0.0816483423113823, 0.10151241719722748, 0.12137648463249207, 0.14124055206775665, 0.16110461950302124, 0.18096870183944702, 0.2008327692747116, 0.2206968367099762, 0.24056091904640198, 0.26042497158050537, 0.28028905391693115, 0.30015313625335693, 0.3200171887874603, 0.3398812711238861, 0.3597453236579895, 0.3796094059944153, 0.39947348833084106, 0.41933757066726685, 0.43920162320137024, 0.459065705537796, 0.4789297580718994, 0.4987938404083252, 0.518657922744751, 0.5385220050811768, 0.5583860278129578, 0.5782501101493835, 0.5981141924858093]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 7.0, 5.0, 2.0, 3.0, 8.0, 9.0, 5.0, 6.0, 19.0, 25.0, 38.0, 72.0, 185.0, 793.0, 4707.0, 42615.0, 815226.0, 170453.0, 12007.0, 1755.0, 333.0, 96.0, 41.0, 15.0, 22.0, 18.0, 15.0, 10.0, 11.0, 7.0, 10.0, 6.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95068359375, -0.9175949096679688, -0.8845062255859375, -0.8514175415039062, -0.818328857421875, -0.7852401733398438, -0.7521514892578125, -0.7190628051757812, -0.68597412109375, -0.6528854370117188, -0.6197967529296875, -0.5867080688476562, -0.553619384765625, -0.5205307006835938, -0.4874420166015625, -0.45435333251953125, -0.4212646484375, -0.38817596435546875, -0.3550872802734375, -0.32199859619140625, -0.288909912109375, -0.25582122802734375, -0.2227325439453125, -0.18964385986328125, -0.15655517578125, -0.12346649169921875, -0.0903778076171875, -0.05728912353515625, -0.024200439453125, 0.00888824462890625, 0.0419769287109375, 0.07506561279296875, 0.108154296875, 0.14124298095703125, 0.1743316650390625, 0.20742034912109375, 0.240509033203125, 0.27359771728515625, 0.3066864013671875, 0.33977508544921875, 0.37286376953125, 0.40595245361328125, 0.4390411376953125, 0.47212982177734375, 0.505218505859375, 0.5383071899414062, 0.5713958740234375, 0.6044845581054688, 0.6375732421875, 0.6706619262695312, 0.7037506103515625, 0.7368392944335938, 0.769927978515625, 0.8030166625976562, 0.8361053466796875, 0.8691940307617188, 0.90228271484375, 0.9353713989257812, 0.9684600830078125, 1.0015487670898438, 1.034637451171875, 1.0677261352539062, 1.1008148193359375, 1.1339035034179688, 1.1669921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 8.0, 11.0, 15.0, 27.0, 43.0, 57.0, 72.0, 75.0, 77.0, 86.0, 94.0, 90.0, 81.0, 72.0, 52.0, 35.0, 40.0, 23.0, 18.0, 12.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.22265625, -1.1961479187011719, -1.1696395874023438, -1.1431312561035156, -1.1166229248046875, -1.0901145935058594, -1.0636062622070312, -1.0370979309082031, -1.010589599609375, -0.9840812683105469, -0.9575729370117188, -0.9310646057128906, -0.9045562744140625, -0.8780479431152344, -0.8515396118164062, -0.8250312805175781, -0.79852294921875, -0.7720146179199219, -0.7455062866210938, -0.7189979553222656, -0.6924896240234375, -0.6659812927246094, -0.6394729614257812, -0.6129646301269531, -0.586456298828125, -0.5599479675292969, -0.5334396362304688, -0.5069313049316406, -0.4804229736328125, -0.4539146423339844, -0.42740631103515625, -0.4008979797363281, -0.3743896484375, -0.3478813171386719, -0.32137298583984375, -0.2948646545410156, -0.2683563232421875, -0.24184799194335938, -0.21533966064453125, -0.18883132934570312, -0.162322998046875, -0.13581466674804688, -0.10930633544921875, -0.08279800415039062, -0.0562896728515625, -0.029781341552734375, -0.00327301025390625, 0.023235321044921875, 0.04974365234375, 0.07625198364257812, 0.10276031494140625, 0.12926864624023438, 0.1557769775390625, 0.18228530883789062, 0.20879364013671875, 0.23530197143554688, 0.261810302734375, 0.2883186340332031, 0.31482696533203125, 0.3413352966308594, 0.3678436279296875, 0.3943519592285156, 0.42086029052734375, 0.4473686218261719, 0.473876953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 3.0, 12.0, 7.0, 8.0, 23.0, 27.0, 51.0, 103.0, 202.0, 368.0, 770.0, 1645.0, 3771.0, 10655.0, 36825.0, 196679.0, 633079.0, 123721.0, 26790.0, 8177.0, 3015.0, 1307.0, 651.0, 285.0, 146.0, 83.0, 50.0, 25.0, 20.0, 14.0, 13.0, 11.0, 5.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.45372772216796875, -0.4409027099609375, -0.42807769775390625, -0.415252685546875, -0.40242767333984375, -0.3896026611328125, -0.37677764892578125, -0.36395263671875, -0.35112762451171875, -0.3383026123046875, -0.32547760009765625, -0.312652587890625, -0.29982757568359375, -0.2870025634765625, -0.27417755126953125, -0.2613525390625, -0.24852752685546875, -0.2357025146484375, -0.22287750244140625, -0.210052490234375, -0.19722747802734375, -0.1844024658203125, -0.17157745361328125, -0.15875244140625, -0.14592742919921875, -0.1331024169921875, -0.12027740478515625, -0.107452392578125, -0.09462738037109375, -0.0818023681640625, -0.06897735595703125, -0.05615234375, -0.04332733154296875, -0.0305023193359375, -0.01767730712890625, -0.004852294921875, 0.00797271728515625, 0.0207977294921875, 0.03362274169921875, 0.04644775390625, 0.05927276611328125, 0.0720977783203125, 0.08492279052734375, 0.097747802734375, 0.11057281494140625, 0.1233978271484375, 0.13622283935546875, 0.1490478515625, 0.16187286376953125, 0.1746978759765625, 0.18752288818359375, 0.200347900390625, 0.21317291259765625, 0.2259979248046875, 0.23882293701171875, 0.25164794921875, 0.26447296142578125, 0.2772979736328125, 0.29012298583984375, 0.302947998046875, 0.31577301025390625, 0.3285980224609375, 0.34142303466796875, 0.354248046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 9.0, 10.0, 16.0, 12.0, 15.0, 23.0, 23.0, 33.0, 35.0, 24.0, 34.0, 63.0, 47.0, 42.0, 33.0, 37.0, 36.0, 47.0, 42.0, 47.0, 47.0, 38.0, 30.0, 32.0, 37.0, 28.0, 26.0, 20.0, 12.0, 21.0, 7.0, 12.0, 6.0, 8.0, 4.0, 6.0, 3.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.80419921875, -0.7798538208007812, -0.7555084228515625, -0.7311630249023438, -0.706817626953125, -0.6824722290039062, -0.6581268310546875, -0.6337814331054688, -0.60943603515625, -0.5850906372070312, -0.5607452392578125, -0.5363998413085938, -0.512054443359375, -0.48770904541015625, -0.4633636474609375, -0.43901824951171875, -0.4146728515625, -0.39032745361328125, -0.3659820556640625, -0.34163665771484375, -0.317291259765625, -0.29294586181640625, -0.2686004638671875, -0.24425506591796875, -0.21990966796875, -0.19556427001953125, -0.1712188720703125, -0.14687347412109375, -0.122528076171875, -0.09818267822265625, -0.0738372802734375, -0.04949188232421875, -0.025146484375, -0.00080108642578125, 0.0235443115234375, 0.04788970947265625, 0.072235107421875, 0.09658050537109375, 0.1209259033203125, 0.14527130126953125, 0.16961669921875, 0.19396209716796875, 0.2183074951171875, 0.24265289306640625, 0.266998291015625, 0.29134368896484375, 0.3156890869140625, 0.34003448486328125, 0.3643798828125, 0.38872528076171875, 0.4130706787109375, 0.43741607666015625, 0.461761474609375, 0.48610687255859375, 0.5104522705078125, 0.5347976684570312, 0.55914306640625, 0.5834884643554688, 0.6078338623046875, 0.6321792602539062, 0.656524658203125, 0.6808700561523438, 0.7052154541015625, 0.7295608520507812, 0.75390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 8.0, 5.0, 10.0, 13.0, 13.0, 19.0, 43.0, 44.0, 102.0, 114.0, 171.0, 288.0, 460.0, 752.0, 1283.0, 2358.0, 4549.0, 11017.0, 42233.0, 569126.0, 363882.0, 33031.0, 9685.0, 4048.0, 2143.0, 1226.0, 699.0, 423.0, 257.0, 170.0, 131.0, 75.0, 55.0, 40.0, 15.0, 17.0, 14.0, 5.0, 9.0, 10.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186279296875, -0.1807880401611328, -0.17529678344726562, -0.16980552673339844, -0.16431427001953125, -0.15882301330566406, -0.15333175659179688, -0.1478404998779297, -0.1423492431640625, -0.1368579864501953, -0.13136672973632812, -0.12587547302246094, -0.12038421630859375, -0.11489295959472656, -0.10940170288085938, -0.10391044616699219, -0.098419189453125, -0.09292793273925781, -0.08743667602539062, -0.08194541931152344, -0.07645416259765625, -0.07096290588378906, -0.06547164916992188, -0.05998039245605469, -0.0544891357421875, -0.04899787902832031, -0.043506622314453125, -0.03801536560058594, -0.03252410888671875, -0.027032852172851562, -0.021541595458984375, -0.016050338745117188, -0.01055908203125, -0.0050678253173828125, 0.000423431396484375, 0.0059146881103515625, 0.01140594482421875, 0.016897201538085938, 0.022388458251953125, 0.027879714965820312, 0.0333709716796875, 0.03886222839355469, 0.044353485107421875, 0.04984474182128906, 0.05533599853515625, 0.06082725524902344, 0.06631851196289062, 0.07180976867675781, 0.077301025390625, 0.08279228210449219, 0.08828353881835938, 0.09377479553222656, 0.09926605224609375, 0.10475730895996094, 0.11024856567382812, 0.11573982238769531, 0.1212310791015625, 0.1267223358154297, 0.13221359252929688, 0.13770484924316406, 0.14319610595703125, 0.14868736267089844, 0.15417861938476562, 0.1596698760986328, 0.1651611328125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 13.0, 7.0, 14.0, 21.0, 43.0, 75.0, 155.0, 287.0, 180.0, 71.0, 54.0, 23.0, 15.0, 11.0, 11.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.551908493041992e-05, -7.122848182916641e-05, -6.69378787279129e-05, -6.26472756266594e-05, -5.8356672525405884e-05, -5.4066069424152374e-05, -4.9775466322898865e-05, -4.5484863221645355e-05, -4.1194260120391846e-05, -3.6903657019138336e-05, -3.261305391788483e-05, -2.8322450816631317e-05, -2.4031847715377808e-05, -1.9741244614124298e-05, -1.545064151287079e-05, -1.1160038411617279e-05, -6.8694353103637695e-06, -2.57883220911026e-06, 1.7117708921432495e-06, 6.002373993396759e-06, 1.0292977094650269e-05, 1.4583580195903778e-05, 1.8874183297157288e-05, 2.3164786398410797e-05, 2.7455389499664307e-05, 3.1745992600917816e-05, 3.6036595702171326e-05, 4.0327198803424835e-05, 4.4617801904678345e-05, 4.8908405005931854e-05, 5.3199008107185364e-05, 5.748961120843887e-05, 6.178021430969238e-05, 6.607081741094589e-05, 7.03614205121994e-05, 7.465202361345291e-05, 7.894262671470642e-05, 8.323322981595993e-05, 8.752383291721344e-05, 9.181443601846695e-05, 9.610503911972046e-05, 0.00010039564222097397, 0.00010468624532222748, 0.00010897684842348099, 0.0001132674515247345, 0.000117558054625988, 0.00012184865772724152, 0.00012613926082849503, 0.00013042986392974854, 0.00013472046703100204, 0.00013901107013225555, 0.00014330167323350906, 0.00014759227633476257, 0.00015188287943601608, 0.0001561734825372696, 0.0001604640856385231, 0.0001647546887397766, 0.00016904529184103012, 0.00017333589494228363, 0.00017762649804353714, 0.00018191710114479065, 0.00018620770424604416, 0.00019049830734729767, 0.00019478891044855118, 0.0001990795135498047]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 11.0, 6.0, 5.0, 23.0, 25.0, 42.0, 80.0, 117.0, 218.0, 362.0, 639.0, 1124.0, 2592.0, 7609.0, 56994.0, 910768.0, 55468.0, 7314.0, 2463.0, 1149.0, 643.0, 337.0, 212.0, 118.0, 82.0, 62.0, 29.0, 19.0, 7.0, 8.0, 5.0, 4.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.309326171875, -0.3000907897949219, -0.29085540771484375, -0.2816200256347656, -0.2723846435546875, -0.2631492614746094, -0.25391387939453125, -0.24467849731445312, -0.235443115234375, -0.22620773315429688, -0.21697235107421875, -0.20773696899414062, -0.1985015869140625, -0.18926620483398438, -0.18003082275390625, -0.17079544067382812, -0.16156005859375, -0.15232467651367188, -0.14308929443359375, -0.13385391235351562, -0.1246185302734375, -0.11538314819335938, -0.10614776611328125, -0.09691238403320312, -0.087677001953125, -0.07844161987304688, -0.06920623779296875, -0.059970855712890625, -0.0507354736328125, -0.041500091552734375, -0.03226470947265625, -0.023029327392578125, -0.0137939453125, -0.004558563232421875, 0.00467681884765625, 0.013912200927734375, 0.0231475830078125, 0.032382965087890625, 0.04161834716796875, 0.050853729248046875, 0.060089111328125, 0.06932449340820312, 0.07855987548828125, 0.08779525756835938, 0.0970306396484375, 0.10626602172851562, 0.11550140380859375, 0.12473678588867188, 0.13397216796875, 0.14320755004882812, 0.15244293212890625, 0.16167831420898438, 0.1709136962890625, 0.18014907836914062, 0.18938446044921875, 0.19861984252929688, 0.207855224609375, 0.21709060668945312, 0.22632598876953125, 0.23556137084960938, 0.2447967529296875, 0.2540321350097656, 0.26326751708984375, 0.2725028991699219, 0.28173828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 5.0, 20.0, 22.0, 32.0, 68.0, 144.0, 226.0, 211.0, 127.0, 42.0, 26.0, 20.0, 18.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0748291015625, -0.07299947738647461, -0.07116985321044922, -0.06934022903442383, -0.06751060485839844, -0.06568098068237305, -0.06385135650634766, -0.062021732330322266, -0.060192108154296875, -0.058362483978271484, -0.056532859802246094, -0.0547032356262207, -0.05287361145019531, -0.05104398727416992, -0.04921436309814453, -0.04738473892211914, -0.04555511474609375, -0.04372549057006836, -0.04189586639404297, -0.04006624221801758, -0.03823661804199219, -0.0364069938659668, -0.034577369689941406, -0.032747745513916016, -0.030918121337890625, -0.029088497161865234, -0.027258872985839844, -0.025429248809814453, -0.023599624633789062, -0.021770000457763672, -0.01994037628173828, -0.01811075210571289, -0.0162811279296875, -0.01445150375366211, -0.012621879577636719, -0.010792255401611328, -0.008962631225585938, -0.007133007049560547, -0.005303382873535156, -0.0034737586975097656, -0.001644134521484375, 0.00018548965454101562, 0.0020151138305664062, 0.003844738006591797, 0.0056743621826171875, 0.007503986358642578, 0.009333610534667969, 0.01116323471069336, 0.01299285888671875, 0.01482248306274414, 0.01665210723876953, 0.018481731414794922, 0.020311355590820312, 0.022140979766845703, 0.023970603942871094, 0.025800228118896484, 0.027629852294921875, 0.029459476470947266, 0.031289100646972656, 0.03311872482299805, 0.03494834899902344, 0.03677797317504883, 0.03860759735107422, 0.04043722152709961, 0.042266845703125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 11.0, 23.0, 77.0, 147.0, 336.0, 232.0, 89.0, 46.0, 22.0, 8.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.740212619304657, -0.6771643161773682, -0.6141160726547241, -0.5510677695274353, -0.48801949620246887, -0.42497122287750244, -0.3619229197502136, -0.2988746464252472, -0.23582637310028076, -0.17277809977531433, -0.1097298115491867, -0.04668152332305908, 0.01636675000190735, 0.07941502332687378, 0.1424633264541626, 0.20551159977912903, 0.26855987310409546, 0.3316081464290619, 0.3946564197540283, 0.45770472288131714, 0.520753026008606, 0.58380126953125, 0.6468495726585388, 0.7098978757858276, 0.7729461193084717, 0.8359944224357605, 0.8990426659584045, 0.9620909690856934, 1.0251392126083374, 1.0881874561309814, 1.151235818862915, 1.214284062385559, 1.2773323059082031, 1.3403805494308472, 1.4034289121627808, 1.4664771556854248, 1.5295253992080688, 1.592573642730713, 1.6556220054626465, 1.7186702489852905, 1.7817184925079346, 1.8447667360305786, 1.9078150987625122, 1.9708633422851562, 2.03391170501709, 2.0969598293304443, 2.160008192062378, 2.2230565547943115, 2.286104679107666, 2.3491530418395996, 2.412201166152954, 2.4752495288848877, 2.5382978916168213, 2.601346015930176, 2.6643943786621094, 2.727442741394043, 2.7904911041259766, 2.85353946685791, 2.9165875911712646, 2.9796359539031982, 3.042684316635132, 3.1057324409484863, 3.16878080368042, 3.2318291664123535, 3.294877290725708]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 10.0, 20.0, 32.0, 39.0, 43.0, 68.0, 89.0, 63.0, 91.0, 80.0, 93.0, 90.0, 72.0, 52.0, 39.0, 36.0, 23.0, 18.0, 17.0, 8.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1846389770507812, -1.159031867980957, -1.1334247589111328, -1.1078176498413086, -1.0822104215621948, -1.0566033124923706, -1.0309962034225464, -1.0053890943527222, -0.979781985282898, -0.9541748762130737, -0.9285677075386047, -0.9029605984687805, -0.8773534893989563, -0.8517463207244873, -0.8261392116546631, -0.8005321025848389, -0.7749249935150146, -0.7493178844451904, -0.7237107157707214, -0.6981036067008972, -0.672496497631073, -0.646889328956604, -0.6212822198867798, -0.5956751108169556, -0.5700679421424866, -0.5444608330726624, -0.5188536643981934, -0.49324655532836914, -0.4676394462585449, -0.4420323073863983, -0.4164251685142517, -0.3908180594444275, -0.36521095037460327, -0.33960381150245667, -0.31399670243263245, -0.28838956356048584, -0.2627824544906616, -0.23717531561851501, -0.2115681916475296, -0.1859610676765442, -0.16035394370555878, -0.13474681973457336, -0.10913969576358795, -0.08353256434202194, -0.05792544037103653, -0.03231830894947052, -0.006711184978485107, 0.018895938992500305, 0.04450306296348572, 0.07011018693447113, 0.09571731090545654, 0.12132444232702255, 0.14693155884742737, 0.17253869771957397, 0.1981458216905594, 0.2237529456615448, 0.2493600696325302, 0.2749671936035156, 0.30057433247566223, 0.32618144154548645, 0.35178858041763306, 0.3773956894874573, 0.4030028283596039, 0.4286099672317505, 0.4542170763015747]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 11.0, 16.0, 70.0, 159.0, 564.0, 2410.0, 16719.0, 532923.0, 476576.0, 15814.0, 2367.0, 602.0, 171.0, 61.0, 27.0, 10.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.0377044677734375, -1.977752685546875, -1.9178009033203125, -1.85784912109375, -1.7978973388671875, -1.737945556640625, -1.6779937744140625, -1.6180419921875, -1.5580902099609375, -1.498138427734375, -1.4381866455078125, -1.37823486328125, -1.3182830810546875, -1.258331298828125, -1.1983795166015625, -1.138427734375, -1.0784759521484375, -1.018524169921875, -0.9585723876953125, -0.89862060546875, -0.8386688232421875, -0.778717041015625, -0.7187652587890625, -0.6588134765625, -0.5988616943359375, -0.538909912109375, -0.4789581298828125, -0.41900634765625, -0.3590545654296875, -0.299102783203125, -0.2391510009765625, -0.17919921875, -0.1192474365234375, -0.059295654296875, 0.0006561279296875, 0.06060791015625, 0.1205596923828125, 0.180511474609375, 0.2404632568359375, 0.3004150390625, 0.3603668212890625, 0.420318603515625, 0.4802703857421875, 0.54022216796875, 0.6001739501953125, 0.660125732421875, 0.7200775146484375, 0.780029296875, 0.8399810791015625, 0.899932861328125, 0.9598846435546875, 1.01983642578125, 1.0797882080078125, 1.139739990234375, 1.1996917724609375, 1.2596435546875, 1.3195953369140625, 1.379547119140625, 1.4394989013671875, 1.49945068359375, 1.5594024658203125, 1.619354248046875, 1.6793060302734375, 1.7392578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 9.0, 7.0, 8.0, 9.0, 19.0, 20.0, 14.0, 30.0, 33.0, 49.0, 71.0, 48.0, 67.0, 64.0, 73.0, 75.0, 76.0, 71.0, 64.0, 44.0, 30.0, 36.0, 21.0, 24.0, 17.0, 8.0, 8.0, 8.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.779296875, -1.7383346557617188, -1.6973724365234375, -1.6564102172851562, -1.615447998046875, -1.5744857788085938, -1.5335235595703125, -1.4925613403320312, -1.45159912109375, -1.4106369018554688, -1.3696746826171875, -1.3287124633789062, -1.287750244140625, -1.2467880249023438, -1.2058258056640625, -1.1648635864257812, -1.1239013671875, -1.0829391479492188, -1.0419769287109375, -1.0010147094726562, -0.960052490234375, -0.9190902709960938, -0.8781280517578125, -0.8371658325195312, -0.79620361328125, -0.7552413940429688, -0.7142791748046875, -0.6733169555664062, -0.632354736328125, -0.5913925170898438, -0.5504302978515625, -0.5094680786132812, -0.468505859375, -0.42754364013671875, -0.3865814208984375, -0.34561920166015625, -0.304656982421875, -0.26369476318359375, -0.2227325439453125, -0.18177032470703125, -0.14080810546875, -0.09984588623046875, -0.0588836669921875, -0.01792144775390625, 0.023040771484375, 0.06400299072265625, 0.1049652099609375, 0.14592742919921875, 0.1868896484375, 0.22785186767578125, 0.2688140869140625, 0.30977630615234375, 0.350738525390625, 0.39170074462890625, 0.4326629638671875, 0.47362518310546875, 0.51458740234375, 0.5555496215820312, 0.5965118408203125, 0.6374740600585938, 0.678436279296875, 0.7193984985351562, 0.7603607177734375, 0.8013229370117188, 0.84228515625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 6.0, 9.0, 7.0, 6.0, 17.0, 18.0, 22.0, 20.0, 28.0, 39.0, 51.0, 41.0, 64.0, 86.0, 192.0, 821.0, 22365.0, 1011844.0, 11734.0, 622.0, 158.0, 77.0, 71.0, 40.0, 43.0, 26.0, 29.0, 24.0, 15.0, 22.0, 14.0, 4.0, 8.0, 7.0, 3.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5, -3.388641357421875, -3.27728271484375, -3.165924072265625, -3.0545654296875, -2.943206787109375, -2.83184814453125, -2.720489501953125, -2.609130859375, -2.497772216796875, -2.38641357421875, -2.275054931640625, -2.1636962890625, -2.052337646484375, -1.94097900390625, -1.829620361328125, -1.71826171875, -1.606903076171875, -1.49554443359375, -1.384185791015625, -1.2728271484375, -1.161468505859375, -1.05010986328125, -0.938751220703125, -0.827392578125, -0.716033935546875, -0.60467529296875, -0.493316650390625, -0.3819580078125, -0.270599365234375, -0.15924072265625, -0.047882080078125, 0.0634765625, 0.174835205078125, 0.28619384765625, 0.397552490234375, 0.5089111328125, 0.620269775390625, 0.73162841796875, 0.842987060546875, 0.954345703125, 1.065704345703125, 1.17706298828125, 1.288421630859375, 1.3997802734375, 1.511138916015625, 1.62249755859375, 1.733856201171875, 1.84521484375, 1.956573486328125, 2.06793212890625, 2.179290771484375, 2.2906494140625, 2.402008056640625, 2.51336669921875, 2.624725341796875, 2.736083984375, 2.847442626953125, 2.95880126953125, 3.070159912109375, 3.1815185546875, 3.292877197265625, 3.40423583984375, 3.515594482421875, 3.626953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 3.0, 4.0, 8.0, 5.0, 9.0, 10.0, 14.0, 9.0, 27.0, 14.0, 27.0, 25.0, 35.0, 42.0, 47.0, 39.0, 38.0, 49.0, 54.0, 39.0, 56.0, 33.0, 40.0, 47.0, 38.0, 27.0, 31.0, 23.0, 35.0, 35.0, 29.0, 19.0, 16.0, 21.0, 15.0, 7.0, 9.0, 7.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.95068359375, -0.9230422973632812, -0.8954010009765625, -0.8677597045898438, -0.840118408203125, -0.8124771118164062, -0.7848358154296875, -0.7571945190429688, -0.72955322265625, -0.7019119262695312, -0.6742706298828125, -0.6466293334960938, -0.618988037109375, -0.5913467407226562, -0.5637054443359375, -0.5360641479492188, -0.5084228515625, -0.48078155517578125, -0.4531402587890625, -0.42549896240234375, -0.397857666015625, -0.37021636962890625, -0.3425750732421875, -0.31493377685546875, -0.28729248046875, -0.25965118408203125, -0.2320098876953125, -0.20436859130859375, -0.176727294921875, -0.14908599853515625, -0.1214447021484375, -0.09380340576171875, -0.066162109375, -0.03852081298828125, -0.0108795166015625, 0.01676177978515625, 0.044403076171875, 0.07204437255859375, 0.0996856689453125, 0.12732696533203125, 0.15496826171875, 0.18260955810546875, 0.2102508544921875, 0.23789215087890625, 0.265533447265625, 0.29317474365234375, 0.3208160400390625, 0.34845733642578125, 0.3760986328125, 0.40373992919921875, 0.4313812255859375, 0.45902252197265625, 0.486663818359375, 0.5143051147460938, 0.5419464111328125, 0.5695877075195312, 0.59722900390625, 0.6248703002929688, 0.6525115966796875, 0.6801528930664062, 0.707794189453125, 0.7354354858398438, 0.7630767822265625, 0.7907180786132812, 0.818359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 3.0, 3.0, 10.0, 10.0, 11.0, 14.0, 31.0, 25.0, 85.0, 168.0, 316.0, 813.0, 2443.0, 11268.0, 261889.0, 750019.0, 16774.0, 2917.0, 918.0, 380.0, 212.0, 98.0, 56.0, 37.0, 18.0, 11.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5927734375, -0.570892333984375, -0.54901123046875, -0.527130126953125, -0.5052490234375, -0.483367919921875, -0.46148681640625, -0.439605712890625, -0.417724609375, -0.395843505859375, -0.37396240234375, -0.352081298828125, -0.3302001953125, -0.308319091796875, -0.28643798828125, -0.264556884765625, -0.24267578125, -0.220794677734375, -0.19891357421875, -0.177032470703125, -0.1551513671875, -0.133270263671875, -0.11138916015625, -0.089508056640625, -0.067626953125, -0.045745849609375, -0.02386474609375, -0.001983642578125, 0.0198974609375, 0.041778564453125, 0.06365966796875, 0.085540771484375, 0.107421875, 0.129302978515625, 0.15118408203125, 0.173065185546875, 0.1949462890625, 0.216827392578125, 0.23870849609375, 0.260589599609375, 0.282470703125, 0.304351806640625, 0.32623291015625, 0.348114013671875, 0.3699951171875, 0.391876220703125, 0.41375732421875, 0.435638427734375, 0.45751953125, 0.479400634765625, 0.50128173828125, 0.523162841796875, 0.5450439453125, 0.566925048828125, 0.58880615234375, 0.610687255859375, 0.632568359375, 0.654449462890625, 0.67633056640625, 0.698211669921875, 0.7200927734375, 0.741973876953125, 0.76385498046875, 0.785736083984375, 0.8076171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 9.0, 4.0, 14.0, 11.0, 32.0, 28.0, 68.0, 110.0, 208.0, 242.0, 111.0, 57.0, 41.0, 26.0, 10.0, 8.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.624792098999023e-05, -8.392054587602615e-05, -8.159317076206207e-05, -7.926579564809799e-05, -7.693842053413391e-05, -7.461104542016983e-05, -7.228367030620575e-05, -6.995629519224167e-05, -6.762892007827759e-05, -6.530154496431351e-05, -6.297416985034943e-05, -6.0646794736385345e-05, -5.8319419622421265e-05, -5.5992044508457184e-05, -5.36646693944931e-05, -5.133729428052902e-05, -4.900991916656494e-05, -4.668254405260086e-05, -4.435516893863678e-05, -4.20277938246727e-05, -3.970041871070862e-05, -3.737304359674454e-05, -3.5045668482780457e-05, -3.2718293368816376e-05, -3.0390918254852295e-05, -2.8063543140888214e-05, -2.5736168026924133e-05, -2.3408792912960052e-05, -2.108141779899597e-05, -1.875404268503189e-05, -1.642666757106781e-05, -1.409929245710373e-05, -1.1771917343139648e-05, -9.444542229175568e-06, -7.117167115211487e-06, -4.789792001247406e-06, -2.462416887283325e-06, -1.3504177331924438e-07, 2.1923333406448364e-06, 4.519708454608917e-06, 6.847083568572998e-06, 9.174458682537079e-06, 1.150183379650116e-05, 1.382920891046524e-05, 1.615658402442932e-05, 1.8483959138393402e-05, 2.0811334252357483e-05, 2.3138709366321564e-05, 2.5466084480285645e-05, 2.7793459594249725e-05, 3.0120834708213806e-05, 3.244820982217789e-05, 3.477558493614197e-05, 3.710296005010605e-05, 3.943033516407013e-05, 4.175771027803421e-05, 4.408508539199829e-05, 4.641246050596237e-05, 4.873983561992645e-05, 5.1067210733890533e-05, 5.3394585847854614e-05, 5.5721960961818695e-05, 5.8049336075782776e-05, 6.037671118974686e-05, 6.270408630371094e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 8.0, 3.0, 5.0, 8.0, 20.0, 28.0, 32.0, 63.0, 95.0, 206.0, 412.0, 983.0, 2876.0, 12104.0, 122522.0, 858005.0, 41285.0, 6672.0, 1819.0, 737.0, 306.0, 149.0, 74.0, 48.0, 44.0, 19.0, 12.0, 7.0, 6.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.3965606689453125, -0.379547119140625, -0.3625335693359375, -0.34552001953125, -0.3285064697265625, -0.311492919921875, -0.2944793701171875, -0.2774658203125, -0.2604522705078125, -0.243438720703125, -0.2264251708984375, -0.20941162109375, -0.1923980712890625, -0.175384521484375, -0.1583709716796875, -0.141357421875, -0.1243438720703125, -0.107330322265625, -0.0903167724609375, -0.07330322265625, -0.0562896728515625, -0.039276123046875, -0.0222625732421875, -0.0052490234375, 0.0117645263671875, 0.028778076171875, 0.0457916259765625, 0.06280517578125, 0.0798187255859375, 0.096832275390625, 0.1138458251953125, 0.130859375, 0.1478729248046875, 0.164886474609375, 0.1819000244140625, 0.19891357421875, 0.2159271240234375, 0.232940673828125, 0.2499542236328125, 0.2669677734375, 0.2839813232421875, 0.300994873046875, 0.3180084228515625, 0.33502197265625, 0.3520355224609375, 0.369049072265625, 0.3860626220703125, 0.403076171875, 0.4200897216796875, 0.437103271484375, 0.4541168212890625, 0.47113037109375, 0.4881439208984375, 0.505157470703125, 0.5221710205078125, 0.5391845703125, 0.5561981201171875, 0.573211669921875, 0.5902252197265625, 0.60723876953125, 0.6242523193359375, 0.641265869140625, 0.6582794189453125, 0.67529296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 9.0, 4.0, 13.0, 17.0, 23.0, 24.0, 42.0, 48.0, 79.0, 149.0, 193.0, 123.0, 66.0, 64.0, 29.0, 31.0, 13.0, 12.0, 12.0, 7.0, 7.0, 4.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1610107421875, -0.15619468688964844, -0.15137863159179688, -0.1465625762939453, -0.14174652099609375, -0.1369304656982422, -0.13211441040039062, -0.12729835510253906, -0.1224822998046875, -0.11766624450683594, -0.11285018920898438, -0.10803413391113281, -0.10321807861328125, -0.09840202331542969, -0.09358596801757812, -0.08876991271972656, -0.083953857421875, -0.07913780212402344, -0.07432174682617188, -0.06950569152832031, -0.06468963623046875, -0.05987358093261719, -0.055057525634765625, -0.05024147033691406, -0.0454254150390625, -0.04060935974121094, -0.035793304443359375, -0.030977249145507812, -0.02616119384765625, -0.021345138549804688, -0.016529083251953125, -0.011713027954101562, -0.00689697265625, -0.0020809173583984375, 0.002735137939453125, 0.0075511932373046875, 0.01236724853515625, 0.017183303833007812, 0.021999359130859375, 0.026815414428710938, 0.0316314697265625, 0.03644752502441406, 0.041263580322265625, 0.04607963562011719, 0.05089569091796875, 0.05571174621582031, 0.060527801513671875, 0.06534385681152344, 0.070159912109375, 0.07497596740722656, 0.07979202270507812, 0.08460807800292969, 0.08942413330078125, 0.09424018859863281, 0.09905624389648438, 0.10387229919433594, 0.1086883544921875, 0.11350440979003906, 0.11832046508789062, 0.12313652038574219, 0.12795257568359375, 0.1327686309814453, 0.13758468627929688, 0.14240074157714844, 0.147216796875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 21.0, 77.0, 281.0, 425.0, 153.0, 34.0, 15.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.611502647399902, -10.416038513183594, -10.220574378967285, -10.025110244750977, -9.829647064208984, -9.634182929992676, -9.438718795776367, -9.243254661560059, -9.04779052734375, -8.852326393127441, -8.656862258911133, -8.461398124694824, -8.265934944152832, -8.070470809936523, -7.875006675720215, -7.679542541503906, -7.484078407287598, -7.288614273071289, -7.093150615692139, -6.89768648147583, -6.7022223472595215, -6.506758213043213, -6.3112945556640625, -6.115830421447754, -5.9203667640686035, -5.724902629852295, -5.5294389724731445, -5.333974838256836, -5.138510704040527, -4.943046569824219, -4.747582912445068, -4.55211877822876, -4.356654644012451, -4.161190509796143, -3.965726613998413, -3.7702627182006836, -3.574798583984375, -3.3793346881866455, -3.183870792388916, -2.9884066581726074, -2.792942523956299, -2.5974786281585693, -2.4020144939422607, -2.2065505981445312, -2.0110864639282227, -1.8156225681304932, -1.6201585531234741, -1.424694538116455, -1.2292306423187256, -1.0337666273117065, -0.8383026123046875, -0.6428386569023132, -0.4473746418952942, -0.25191062688827515, -0.05644667148590088, 0.13901734352111816, 0.3344813585281372, 0.5299453735351562, 0.7254093885421753, 0.9208733439445496, 1.1163372993469238, 1.3118014335632324, 1.507265329360962, 1.702729344367981, 1.898193359375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 11.0, 9.0, 8.0, 13.0, 16.0, 22.0, 25.0, 40.0, 35.0, 35.0, 35.0, 41.0, 39.0, 54.0, 44.0, 47.0, 49.0, 63.0, 44.0, 44.0, 43.0, 37.0, 39.0, 37.0, 32.0, 21.0, 31.0, 12.0, 11.0, 19.0, 13.0, 11.0, 2.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.689207673072815, -1.6446982622146606, -1.6001887321472168, -1.5556793212890625, -1.5111699104309082, -1.4666603803634644, -1.42215096950531, -1.3776414394378662, -1.333132028579712, -1.2886226177215576, -1.2441130876541138, -1.1996036767959595, -1.1550941467285156, -1.1105847358703613, -1.066075325012207, -1.0215659141540527, -0.9770563840866089, -0.9325469136238098, -0.8880374431610107, -0.8435280323028564, -0.7990185618400574, -0.7545090913772583, -0.709999680519104, -0.6654902100563049, -0.6209807395935059, -0.5764712691307068, -0.5319617986679077, -0.4874523878097534, -0.44294291734695435, -0.3984334468841553, -0.3539240062236786, -0.3094145655632019, -0.2649049758911133, -0.2203955203294754, -0.17588606476783752, -0.13137660920619965, -0.08686715364456177, -0.04235769808292389, 0.0021517574787139893, 0.046661198139190674, 0.09117066860198975, 0.13568012416362762, 0.1801895797252655, 0.22469903528690338, 0.26920849084854126, 0.31371796131134033, 0.358227401971817, 0.4027368426322937, 0.4472463130950928, 0.49175578355789185, 0.5362652540206909, 0.5807746648788452, 0.6252841353416443, 0.6697936058044434, 0.7143030166625977, 0.7588124871253967, 0.8033219575881958, 0.8478314280509949, 0.892340898513794, 0.9368503093719482, 0.9813597798347473, 1.0258692502975464, 1.0703786611557007, 1.1148881912231445, 1.1593976020812988]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 9.0, 8.0, 17.0, 22.0, 46.0, 63.0, 78.0, 141.0, 316.0, 1733.0, 22702.0, 4005653.0, 157868.0, 4493.0, 635.0, 190.0, 106.0, 58.0, 48.0, 34.0, 24.0, 13.0, 8.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.158203125, -3.035186767578125, -2.91217041015625, -2.789154052734375, -2.6661376953125, -2.543121337890625, -2.42010498046875, -2.297088623046875, -2.174072265625, -2.051055908203125, -1.92803955078125, -1.805023193359375, -1.6820068359375, -1.558990478515625, -1.43597412109375, -1.312957763671875, -1.18994140625, -1.066925048828125, -0.94390869140625, -0.820892333984375, -0.6978759765625, -0.574859619140625, -0.45184326171875, -0.328826904296875, -0.205810546875, -0.082794189453125, 0.04022216796875, 0.163238525390625, 0.2862548828125, 0.409271240234375, 0.53228759765625, 0.655303955078125, 0.7783203125, 0.901336669921875, 1.02435302734375, 1.147369384765625, 1.2703857421875, 1.393402099609375, 1.51641845703125, 1.639434814453125, 1.762451171875, 1.885467529296875, 2.00848388671875, 2.131500244140625, 2.2545166015625, 2.377532958984375, 2.50054931640625, 2.623565673828125, 2.74658203125, 2.869598388671875, 2.99261474609375, 3.115631103515625, 3.2386474609375, 3.361663818359375, 3.48468017578125, 3.607696533203125, 3.730712890625, 3.853729248046875, 3.97674560546875, 4.099761962890625, 4.2227783203125, 4.345794677734375, 4.46881103515625, 4.591827392578125, 4.71484375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 5.0, 17.0, 13.0, 17.0, 21.0, 23.0, 20.0, 25.0, 34.0, 44.0, 35.0, 36.0, 51.0, 41.0, 59.0, 55.0, 56.0, 48.0, 47.0, 42.0, 50.0, 31.0, 33.0, 31.0, 29.0, 23.0, 30.0, 16.0, 20.0, 5.0, 10.0, 8.0, 8.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74853515625, -0.7276229858398438, -0.7067108154296875, -0.6857986450195312, -0.664886474609375, -0.6439743041992188, -0.6230621337890625, -0.6021499633789062, -0.58123779296875, -0.5603256225585938, -0.5394134521484375, -0.5185012817382812, -0.497589111328125, -0.47667694091796875, -0.4557647705078125, -0.43485260009765625, -0.4139404296875, -0.39302825927734375, -0.3721160888671875, -0.35120391845703125, -0.330291748046875, -0.30937957763671875, -0.2884674072265625, -0.26755523681640625, -0.24664306640625, -0.22573089599609375, -0.2048187255859375, -0.18390655517578125, -0.162994384765625, -0.14208221435546875, -0.1211700439453125, -0.10025787353515625, -0.079345703125, -0.05843353271484375, -0.0375213623046875, -0.01660919189453125, 0.004302978515625, 0.02521514892578125, 0.0461273193359375, 0.06703948974609375, 0.08795166015625, 0.10886383056640625, 0.1297760009765625, 0.15068817138671875, 0.171600341796875, 0.19251251220703125, 0.2134246826171875, 0.23433685302734375, 0.2552490234375, 0.27616119384765625, 0.2970733642578125, 0.31798553466796875, 0.338897705078125, 0.35980987548828125, 0.3807220458984375, 0.40163421630859375, 0.42254638671875, 0.44345855712890625, 0.4643707275390625, 0.48528289794921875, 0.506195068359375, 0.5271072387695312, 0.5480194091796875, 0.5689315795898438, 0.58984375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 8.0, 2.0, 8.0, 11.0, 9.0, 15.0, 13.0, 45.0, 66.0, 118.0, 268.0, 696.0, 2569.0, 17513.0, 1489528.0, 2658215.0, 21216.0, 2716.0, 697.0, 272.0, 126.0, 59.0, 36.0, 17.0, 7.0, 7.0, 3.0, 3.0, 6.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.37109375, -2.29931640625, -2.2275390625, -2.15576171875, -2.083984375, -2.01220703125, -1.9404296875, -1.86865234375, -1.796875, -1.72509765625, -1.6533203125, -1.58154296875, -1.509765625, -1.43798828125, -1.3662109375, -1.29443359375, -1.22265625, -1.15087890625, -1.0791015625, -1.00732421875, -0.935546875, -0.86376953125, -0.7919921875, -0.72021484375, -0.6484375, -0.57666015625, -0.5048828125, -0.43310546875, -0.361328125, -0.28955078125, -0.2177734375, -0.14599609375, -0.07421875, -0.00244140625, 0.0693359375, 0.14111328125, 0.212890625, 0.28466796875, 0.3564453125, 0.42822265625, 0.5, 0.57177734375, 0.6435546875, 0.71533203125, 0.787109375, 0.85888671875, 0.9306640625, 1.00244140625, 1.07421875, 1.14599609375, 1.2177734375, 1.28955078125, 1.361328125, 1.43310546875, 1.5048828125, 1.57666015625, 1.6484375, 1.72021484375, 1.7919921875, 1.86376953125, 1.935546875, 2.00732421875, 2.0791015625, 2.15087890625, 2.22265625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 6.0, 6.0, 8.0, 21.0, 22.0, 20.0, 28.0, 41.0, 51.0, 81.0, 128.0, 217.0, 391.0, 592.0, 774.0, 647.0, 376.0, 223.0, 133.0, 85.0, 62.0, 44.0, 21.0, 23.0, 16.0, 10.0, 10.0, 5.0, 9.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.27685546875, -0.26747894287109375, -0.2581024169921875, -0.24872589111328125, -0.239349365234375, -0.22997283935546875, -0.2205963134765625, -0.21121978759765625, -0.20184326171875, -0.19246673583984375, -0.1830902099609375, -0.17371368408203125, -0.164337158203125, -0.15496063232421875, -0.1455841064453125, -0.13620758056640625, -0.1268310546875, -0.11745452880859375, -0.1080780029296875, -0.09870147705078125, -0.089324951171875, -0.07994842529296875, -0.0705718994140625, -0.06119537353515625, -0.05181884765625, -0.04244232177734375, -0.0330657958984375, -0.02368927001953125, -0.014312744140625, -0.00493621826171875, 0.0044403076171875, 0.01381683349609375, 0.023193359375, 0.03256988525390625, 0.0419464111328125, 0.05132293701171875, 0.060699462890625, 0.07007598876953125, 0.0794525146484375, 0.08882904052734375, 0.09820556640625, 0.10758209228515625, 0.1169586181640625, 0.12633514404296875, 0.135711669921875, 0.14508819580078125, 0.1544647216796875, 0.16384124755859375, 0.1732177734375, 0.18259429931640625, 0.1919708251953125, 0.20134735107421875, 0.210723876953125, 0.22010040283203125, 0.2294769287109375, 0.23885345458984375, 0.24822998046875, 0.25760650634765625, 0.2669830322265625, 0.27635955810546875, 0.285736083984375, 0.29511260986328125, 0.3044891357421875, 0.31386566162109375, 0.3232421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 10.0, 22.0, 25.0, 43.0, 77.0, 88.0, 140.0, 155.0, 135.0, 115.0, 53.0, 46.0, 33.0, 22.0, 13.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9143352508544922, -0.8651582598686218, -0.8159813284873962, -0.7668043375015259, -0.7176273465156555, -0.6684503555297852, -0.6192734241485596, -0.5700964331626892, -0.5209194421768188, -0.4717424809932709, -0.4225654900074005, -0.37338852882385254, -0.3242115378379822, -0.2750345766544342, -0.22585761547088623, -0.17668062448501587, -0.12750369310379028, -0.07832671701908112, -0.029149748384952545, 0.020027220249176025, 0.06920419633388519, 0.11838117241859436, 0.16755813360214233, 0.2167351245880127, 0.26591208577156067, 0.31508904695510864, 0.364266037940979, 0.413442999124527, 0.46261996030807495, 0.5117969512939453, 0.5609738826751709, 0.610150933265686, 0.6593278646469116, 0.708504855632782, 0.7576817870140076, 0.8068587779998779, 0.8560357689857483, 0.9052127599716187, 0.9543896913528442, 1.0035667419433594, 1.052743673324585, 1.1019206047058105, 1.1510976552963257, 1.2002745866775513, 1.2494515180587769, 1.298628568649292, 1.3478055000305176, 1.3969824314117432, 1.4461593627929688, 1.4953362941741943, 1.5445133447647095, 1.593690276145935, 1.6428672075271606, 1.6920442581176758, 1.7412211894989014, 1.790398120880127, 1.839575171470642, 1.8887521028518677, 1.9379291534423828, 1.9871060848236084, 2.036283016204834, 2.0854599475860596, 2.134636878967285, 2.18381404876709, 2.2329909801483154]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 9.0, 9.0, 12.0, 12.0, 15.0, 17.0, 19.0, 23.0, 27.0, 35.0, 41.0, 47.0, 28.0, 30.0, 39.0, 40.0, 52.0, 46.0, 45.0, 43.0, 34.0, 31.0, 37.0, 40.0, 36.0, 36.0, 33.0, 14.0, 38.0, 29.0, 15.0, 8.0, 14.0, 11.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7121543288230896, -0.6915651559829712, -0.670975923538208, -0.6503867506980896, -0.6297975778579712, -0.609208345413208, -0.5886191725730896, -0.5680299997329712, -0.547440767288208, -0.5268515944480896, -0.5062623620033264, -0.485673189163208, -0.4650839865207672, -0.4444947838783264, -0.423905611038208, -0.4033164083957672, -0.3827272057533264, -0.3621380031108856, -0.3415488004684448, -0.3209596276283264, -0.3003704249858856, -0.2797812223434448, -0.2591920495033264, -0.23860284686088562, -0.21801364421844482, -0.19742444157600403, -0.17683525383472443, -0.15624606609344482, -0.13565686345100403, -0.11506766825914383, -0.09447847306728363, -0.07388928532600403, -0.05330002307891846, -0.03271082788705826, -0.012121632695198059, 0.00846756249666214, 0.02905675768852234, 0.04964595288038254, 0.07023514807224274, 0.09082433581352234, 0.11141353845596313, 0.13200274109840393, 0.15259192883968353, 0.17318111658096313, 0.19377031922340393, 0.21435952186584473, 0.23494870960712433, 0.25553789734840393, 0.2761270999908447, 0.2967163026332855, 0.3173055052757263, 0.3378946781158447, 0.3584838807582855, 0.3790730834007263, 0.3996622562408447, 0.4202514588832855, 0.4408406615257263, 0.4614298641681671, 0.4820190668106079, 0.5026082396507263, 0.5231974124908447, 0.5437866449356079, 0.5643758177757263, 0.5849649906158447, 0.6055542230606079]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 14.0, 19.0, 18.0, 57.0, 161.0, 720.0, 4311.0, 39314.0, 931308.0, 65395.0, 5950.0, 980.0, 165.0, 45.0, 30.0, 16.0, 5.0, 6.0, 8.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.935546875, -0.9016265869140625, -0.867706298828125, -0.8337860107421875, -0.79986572265625, -0.7659454345703125, -0.732025146484375, -0.6981048583984375, -0.6641845703125, -0.6302642822265625, -0.596343994140625, -0.5624237060546875, -0.52850341796875, -0.4945831298828125, -0.460662841796875, -0.4267425537109375, -0.392822265625, -0.3589019775390625, -0.324981689453125, -0.2910614013671875, -0.25714111328125, -0.2232208251953125, -0.189300537109375, -0.1553802490234375, -0.1214599609375, -0.0875396728515625, -0.053619384765625, -0.0196990966796875, 0.01422119140625, 0.0481414794921875, 0.082061767578125, 0.1159820556640625, 0.14990234375, 0.1838226318359375, 0.217742919921875, 0.2516632080078125, 0.28558349609375, 0.3195037841796875, 0.353424072265625, 0.3873443603515625, 0.4212646484375, 0.4551849365234375, 0.489105224609375, 0.5230255126953125, 0.55694580078125, 0.5908660888671875, 0.624786376953125, 0.6587066650390625, 0.692626953125, 0.7265472412109375, 0.760467529296875, 0.7943878173828125, 0.82830810546875, 0.8622283935546875, 0.896148681640625, 0.9300689697265625, 0.9639892578125, 0.9979095458984375, 1.031829833984375, 1.0657501220703125, 1.09967041015625, 1.1335906982421875, 1.167510986328125, 1.2014312744140625, 1.2353515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 4.0, 8.0, 5.0, 13.0, 13.0, 31.0, 17.0, 28.0, 43.0, 44.0, 45.0, 51.0, 49.0, 60.0, 48.0, 59.0, 60.0, 45.0, 57.0, 50.0, 45.0, 48.0, 39.0, 32.0, 25.0, 24.0, 9.0, 14.0, 6.0, 7.0, 12.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.6494140625, -0.6334114074707031, -0.6174087524414062, -0.6014060974121094, -0.5854034423828125, -0.5694007873535156, -0.5533981323242188, -0.5373954772949219, -0.521392822265625, -0.5053901672363281, -0.48938751220703125, -0.4733848571777344, -0.4573822021484375, -0.4413795471191406, -0.42537689208984375, -0.4093742370605469, -0.39337158203125, -0.3773689270019531, -0.36136627197265625, -0.3453636169433594, -0.3293609619140625, -0.3133583068847656, -0.29735565185546875, -0.2813529968261719, -0.265350341796875, -0.24934768676757812, -0.23334503173828125, -0.21734237670898438, -0.2013397216796875, -0.18533706665039062, -0.16933441162109375, -0.15333175659179688, -0.1373291015625, -0.12132644653320312, -0.10532379150390625, -0.08932113647460938, -0.0733184814453125, -0.057315826416015625, -0.04131317138671875, -0.025310516357421875, -0.009307861328125, 0.006694793701171875, 0.02269744873046875, 0.038700103759765625, 0.0547027587890625, 0.07070541381835938, 0.08670806884765625, 0.10271072387695312, 0.11871337890625, 0.13471603393554688, 0.15071868896484375, 0.16672134399414062, 0.1827239990234375, 0.19872665405273438, 0.21472930908203125, 0.23073196411132812, 0.246734619140625, 0.2627372741699219, 0.27873992919921875, 0.2947425842285156, 0.3107452392578125, 0.3267478942871094, 0.34275054931640625, 0.3587532043457031, 0.374755859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 11.0, 16.0, 37.0, 64.0, 83.0, 169.0, 280.0, 571.0, 1095.0, 2431.0, 6002.0, 17706.0, 75479.0, 497030.0, 368393.0, 55289.0, 14594.0, 5006.0, 2126.0, 1000.0, 484.0, 275.0, 149.0, 94.0, 65.0, 28.0, 16.0, 11.0, 12.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.29499053955078125, -0.2860260009765625, -0.27706146240234375, -0.268096923828125, -0.25913238525390625, -0.2501678466796875, -0.24120330810546875, -0.23223876953125, -0.22327423095703125, -0.2143096923828125, -0.20534515380859375, -0.196380615234375, -0.18741607666015625, -0.1784515380859375, -0.16948699951171875, -0.1605224609375, -0.15155792236328125, -0.1425933837890625, -0.13362884521484375, -0.124664306640625, -0.11569976806640625, -0.1067352294921875, -0.09777069091796875, -0.08880615234375, -0.07984161376953125, -0.0708770751953125, -0.06191253662109375, -0.052947998046875, -0.04398345947265625, -0.0350189208984375, -0.02605438232421875, -0.01708984375, -0.00812530517578125, 0.0008392333984375, 0.00980377197265625, 0.018768310546875, 0.02773284912109375, 0.0366973876953125, 0.04566192626953125, 0.05462646484375, 0.06359100341796875, 0.0725555419921875, 0.08152008056640625, 0.090484619140625, 0.09944915771484375, 0.1084136962890625, 0.11737823486328125, 0.1263427734375, 0.13530731201171875, 0.1442718505859375, 0.15323638916015625, 0.162200927734375, 0.17116546630859375, 0.1801300048828125, 0.18909454345703125, 0.19805908203125, 0.20702362060546875, 0.2159881591796875, 0.22495269775390625, 0.233917236328125, 0.24288177490234375, 0.2518463134765625, 0.26081085205078125, 0.269775390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 5.0, 4.0, 7.0, 7.0, 9.0, 10.0, 14.0, 15.0, 24.0, 18.0, 26.0, 26.0, 24.0, 22.0, 24.0, 34.0, 39.0, 47.0, 48.0, 42.0, 54.0, 52.0, 46.0, 43.0, 29.0, 35.0, 31.0, 40.0, 31.0, 26.0, 19.0, 23.0, 18.0, 18.0, 19.0, 13.0, 11.0, 7.0, 7.0, 6.0, 4.0, 10.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6796875, -0.65838623046875, -0.6370849609375, -0.61578369140625, -0.594482421875, -0.57318115234375, -0.5518798828125, -0.53057861328125, -0.50927734375, -0.48797607421875, -0.4666748046875, -0.44537353515625, -0.424072265625, -0.40277099609375, -0.3814697265625, -0.36016845703125, -0.3388671875, -0.31756591796875, -0.2962646484375, -0.27496337890625, -0.253662109375, -0.23236083984375, -0.2110595703125, -0.18975830078125, -0.16845703125, -0.14715576171875, -0.1258544921875, -0.10455322265625, -0.083251953125, -0.06195068359375, -0.0406494140625, -0.01934814453125, 0.001953125, 0.02325439453125, 0.0445556640625, 0.06585693359375, 0.087158203125, 0.10845947265625, 0.1297607421875, 0.15106201171875, 0.17236328125, 0.19366455078125, 0.2149658203125, 0.23626708984375, 0.257568359375, 0.27886962890625, 0.3001708984375, 0.32147216796875, 0.3427734375, 0.36407470703125, 0.3853759765625, 0.40667724609375, 0.427978515625, 0.44927978515625, 0.4705810546875, 0.49188232421875, 0.51318359375, 0.53448486328125, 0.5557861328125, 0.57708740234375, 0.598388671875, 0.61968994140625, 0.6409912109375, 0.66229248046875, 0.68359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 6.0, 5.0, 15.0, 4.0, 18.0, 22.0, 35.0, 47.0, 75.0, 101.0, 136.0, 190.0, 331.0, 414.0, 681.0, 1053.0, 1620.0, 2601.0, 4179.0, 7128.0, 12850.0, 24706.0, 52972.0, 134391.0, 321822.0, 280379.0, 109201.0, 44156.0, 21350.0, 11227.0, 6320.0, 3806.0, 2250.0, 1501.0, 970.0, 629.0, 451.0, 274.0, 178.0, 149.0, 95.0, 51.0, 36.0, 31.0, 21.0, 21.0, 6.0, 14.0, 8.0, 2.0, 7.0, 5.0, 1.0, 3.0, 2.0, 3.0], "bins": [-0.03997802734375, -0.038762569427490234, -0.03754711151123047, -0.0363316535949707, -0.03511619567871094, -0.03390073776245117, -0.032685279846191406, -0.03146982192993164, -0.030254364013671875, -0.02903890609741211, -0.027823448181152344, -0.026607990264892578, -0.025392532348632812, -0.024177074432373047, -0.02296161651611328, -0.021746158599853516, -0.02053070068359375, -0.019315242767333984, -0.01809978485107422, -0.016884326934814453, -0.015668869018554688, -0.014453411102294922, -0.013237953186035156, -0.01202249526977539, -0.010807037353515625, -0.00959157943725586, -0.008376121520996094, -0.007160663604736328, -0.0059452056884765625, -0.004729747772216797, -0.0035142898559570312, -0.0022988319396972656, -0.0010833740234375, 0.00013208389282226562, 0.0013475418090820312, 0.002562999725341797, 0.0037784576416015625, 0.004993915557861328, 0.006209373474121094, 0.007424831390380859, 0.008640289306640625, 0.00985574722290039, 0.011071205139160156, 0.012286663055419922, 0.013502120971679688, 0.014717578887939453, 0.01593303680419922, 0.017148494720458984, 0.01836395263671875, 0.019579410552978516, 0.02079486846923828, 0.022010326385498047, 0.023225784301757812, 0.024441242218017578, 0.025656700134277344, 0.02687215805053711, 0.028087615966796875, 0.02930307388305664, 0.030518531799316406, 0.03173398971557617, 0.03294944763183594, 0.0341649055480957, 0.03538036346435547, 0.036595821380615234, 0.037811279296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 9.0, 18.0, 23.0, 28.0, 55.0, 59.0, 121.0, 161.0, 170.0, 136.0, 71.0, 35.0, 22.0, 18.0, 13.0, 4.0, 9.0, 7.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0650367736816406e-05, -3.89590859413147e-05, -3.726780414581299e-05, -3.557652235031128e-05, -3.388524055480957e-05, -3.219395875930786e-05, -3.0502676963806152e-05, -2.8811395168304443e-05, -2.7120113372802734e-05, -2.5428831577301025e-05, -2.3737549781799316e-05, -2.2046267986297607e-05, -2.03549861907959e-05, -1.866370439529419e-05, -1.697242259979248e-05, -1.528114080429077e-05, -1.3589859008789062e-05, -1.1898577213287354e-05, -1.0207295417785645e-05, -8.516013622283936e-06, -6.8247318267822266e-06, -5.133450031280518e-06, -3.4421682357788086e-06, -1.7508864402770996e-06, -5.960464477539063e-08, 1.6316771507263184e-06, 3.3229589462280273e-06, 5.014240741729736e-06, 6.705522537231445e-06, 8.396804332733154e-06, 1.0088086128234863e-05, 1.1779367923736572e-05, 1.3470649719238281e-05, 1.516193151473999e-05, 1.68532133102417e-05, 1.8544495105743408e-05, 2.0235776901245117e-05, 2.1927058696746826e-05, 2.3618340492248535e-05, 2.5309622287750244e-05, 2.7000904083251953e-05, 2.8692185878753662e-05, 3.038346767425537e-05, 3.207474946975708e-05, 3.376603126525879e-05, 3.54573130607605e-05, 3.714859485626221e-05, 3.8839876651763916e-05, 4.0531158447265625e-05, 4.2222440242767334e-05, 4.391372203826904e-05, 4.560500383377075e-05, 4.729628562927246e-05, 4.898756742477417e-05, 5.067884922027588e-05, 5.237013101577759e-05, 5.40614128112793e-05, 5.5752694606781006e-05, 5.7443976402282715e-05, 5.9135258197784424e-05, 6.082653999328613e-05, 6.251782178878784e-05, 6.420910358428955e-05, 6.590038537979126e-05, 6.759166717529297e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 12.0, 11.0, 20.0, 66.0, 173.0, 816.0, 5592.0, 101636.0, 909208.0, 27561.0, 2731.0, 469.0, 132.0, 45.0, 24.0, 12.0, 7.0, 11.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.28271484375, -0.27533721923828125, -0.2679595947265625, -0.26058197021484375, -0.253204345703125, -0.24582672119140625, -0.2384490966796875, -0.23107147216796875, -0.22369384765625, -0.21631622314453125, -0.2089385986328125, -0.20156097412109375, -0.194183349609375, -0.18680572509765625, -0.1794281005859375, -0.17205047607421875, -0.1646728515625, -0.15729522705078125, -0.1499176025390625, -0.14253997802734375, -0.135162353515625, -0.12778472900390625, -0.1204071044921875, -0.11302947998046875, -0.10565185546875, -0.09827423095703125, -0.0908966064453125, -0.08351898193359375, -0.076141357421875, -0.06876373291015625, -0.0613861083984375, -0.05400848388671875, -0.046630859375, -0.03925323486328125, -0.0318756103515625, -0.02449798583984375, -0.017120361328125, -0.00974273681640625, -0.0023651123046875, 0.00501251220703125, 0.01239013671875, 0.01976776123046875, 0.0271453857421875, 0.03452301025390625, 0.041900634765625, 0.04927825927734375, 0.0566558837890625, 0.06403350830078125, 0.0714111328125, 0.07878875732421875, 0.0861663818359375, 0.09354400634765625, 0.100921630859375, 0.10829925537109375, 0.1156768798828125, 0.12305450439453125, 0.13043212890625, 0.13780975341796875, 0.1451873779296875, 0.15256500244140625, 0.159942626953125, 0.16732025146484375, 0.1746978759765625, 0.18207550048828125, 0.189453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 11.0, 9.0, 9.0, 10.0, 15.0, 22.0, 32.0, 34.0, 58.0, 72.0, 94.0, 104.0, 97.0, 96.0, 85.0, 61.0, 49.0, 34.0, 22.0, 19.0, 19.0, 14.0, 3.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0205078125, -0.019870519638061523, -0.019233226776123047, -0.01859593391418457, -0.017958641052246094, -0.017321348190307617, -0.01668405532836914, -0.016046762466430664, -0.015409469604492188, -0.014772176742553711, -0.014134883880615234, -0.013497591018676758, -0.012860298156738281, -0.012223005294799805, -0.011585712432861328, -0.010948419570922852, -0.010311126708984375, -0.009673833847045898, -0.009036540985107422, -0.008399248123168945, -0.007761955261230469, -0.007124662399291992, -0.006487369537353516, -0.005850076675415039, -0.0052127838134765625, -0.004575490951538086, -0.003938198089599609, -0.003300905227661133, -0.0026636123657226562, -0.0020263195037841797, -0.0013890266418457031, -0.0007517337799072266, -0.00011444091796875, 0.0005228519439697266, 0.0011601448059082031, 0.0017974376678466797, 0.0024347305297851562, 0.003072023391723633, 0.0037093162536621094, 0.004346609115600586, 0.0049839019775390625, 0.005621194839477539, 0.006258487701416016, 0.006895780563354492, 0.007533073425292969, 0.008170366287231445, 0.008807659149169922, 0.009444952011108398, 0.010082244873046875, 0.010719537734985352, 0.011356830596923828, 0.011994123458862305, 0.012631416320800781, 0.013268709182739258, 0.013906002044677734, 0.014543294906616211, 0.015180587768554688, 0.015817880630493164, 0.01645517349243164, 0.017092466354370117, 0.017729759216308594, 0.01836705207824707, 0.019004344940185547, 0.019641637802124023, 0.0202789306640625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 18.0, 79.0, 315.0, 441.0, 120.0, 25.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8653119206428528, -0.770869791507721, -0.6764277219772339, -0.581985592842102, -0.4875434637069702, -0.3931013345718384, -0.2986592650413513, -0.20421713590621948, -0.10977500677108765, -0.015332892537117004, 0.07910922169685364, 0.17355132102966309, 0.2679934501647949, 0.36243557929992676, 0.4568776488304138, 0.5513197779655457, 0.6457619071006775, 0.7402040362358093, 0.8346461057662964, 0.9290882349014282, 1.02353036403656, 1.117972493171692, 1.2124145030975342, 1.306856632232666, 1.4012987613677979, 1.4957408905029297, 1.5901830196380615, 1.6846251487731934, 1.7790672779083252, 1.873509407043457, 1.9679514169692993, 2.0623936653137207, 2.1568355560302734, 2.2512776851654053, 2.345719814300537, 2.440161943435669, 2.534604072570801, 2.6290462017059326, 2.7234883308410645, 2.817930221557617, 2.912372589111328, 3.00681471824646, 3.101256847381592, 3.1956989765167236, 3.2901411056518555, 3.3845832347869873, 3.479025363922119, 3.573467254638672, 3.6679093837738037, 3.7623515129089355, 3.8567936420440674, 3.951235771179199, 4.045677661895752, 4.140120029449463, 4.234561920166016, 4.329004287719727, 4.423446178436279, 4.517888069152832, 4.612330436706543, 4.706772327423096, 4.801214694976807, 4.895656585693359, 4.99009895324707, 5.084540843963623, 5.178983211517334]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 13.0, 18.0, 22.0, 16.0, 31.0, 35.0, 44.0, 44.0, 42.0, 44.0, 56.0, 62.0, 55.0, 62.0, 39.0, 49.0, 42.0, 47.0, 39.0, 39.0, 44.0, 33.0, 28.0, 17.0, 8.0, 13.0, 10.0, 9.0, 10.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5836512446403503, -0.5690324306488037, -0.5544136166572571, -0.5397948026657104, -0.5251759886741638, -0.5105571746826172, -0.49593839049339294, -0.4813195765018463, -0.4667007625102997, -0.45208194851875305, -0.4374631345272064, -0.4228443503379822, -0.40822553634643555, -0.3936067223548889, -0.3789879083633423, -0.36436909437179565, -0.349750280380249, -0.3351314663887024, -0.32051265239715576, -0.30589383840560913, -0.2912750542163849, -0.27665624022483826, -0.2620374262332916, -0.247418612241745, -0.23279982805252075, -0.21818101406097412, -0.20356221497058868, -0.18894340097904205, -0.17432458698749542, -0.15970578789710999, -0.14508697390556335, -0.13046815991401672, -0.11584934592247009, -0.10123053938150406, -0.08661172538995743, -0.0719929188489914, -0.05737410858273506, -0.04275529831647873, -0.028136491775512695, -0.013517677783966064, 0.0011011287569999695, 0.015719939023256302, 0.030338747426867485, 0.04495755583047867, 0.059576366096735, 0.07419517636299133, 0.08881398290395737, 0.103432796895504, 0.11805160343647003, 0.13267041742801666, 0.1472892165184021, 0.16190803050994873, 0.17652684450149536, 0.191145658493042, 0.20576445758342743, 0.22038327157497406, 0.2350020706653595, 0.24962088465690613, 0.26423969864845276, 0.278858482837677, 0.29347729682922363, 0.30809611082077026, 0.3227149248123169, 0.3373337388038635, 0.35195255279541016]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 7.0, 11.0, 6.0, 12.0, 22.0, 41.0, 82.0, 172.0, 377.0, 895.0, 2360.0, 6424.0, 21574.0, 99738.0, 651750.0, 213474.0, 36121.0, 9737.0, 3473.0, 1300.0, 532.0, 221.0, 107.0, 52.0, 23.0, 11.0, 9.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94287109375, -0.9140243530273438, -0.8851776123046875, -0.8563308715820312, -0.827484130859375, -0.7986373901367188, -0.7697906494140625, -0.7409439086914062, -0.71209716796875, -0.6832504272460938, -0.6544036865234375, -0.6255569458007812, -0.596710205078125, -0.5678634643554688, -0.5390167236328125, -0.5101699829101562, -0.4813232421875, -0.45247650146484375, -0.4236297607421875, -0.39478302001953125, -0.365936279296875, -0.33708953857421875, -0.3082427978515625, -0.27939605712890625, -0.25054931640625, -0.22170257568359375, -0.1928558349609375, -0.16400909423828125, -0.135162353515625, -0.10631561279296875, -0.0774688720703125, -0.04862213134765625, -0.019775390625, 0.00907135009765625, 0.0379180908203125, 0.06676483154296875, 0.095611572265625, 0.12445831298828125, 0.1533050537109375, 0.18215179443359375, 0.21099853515625, 0.23984527587890625, 0.2686920166015625, 0.29753875732421875, 0.326385498046875, 0.35523223876953125, 0.3840789794921875, 0.41292572021484375, 0.4417724609375, 0.47061920166015625, 0.4994659423828125, 0.5283126831054688, 0.557159423828125, 0.5860061645507812, 0.6148529052734375, 0.6436996459960938, 0.67254638671875, 0.7013931274414062, 0.7302398681640625, 0.7590866088867188, 0.787933349609375, 0.8167800903320312, 0.8456268310546875, 0.8744735717773438, 0.9033203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 7.0, 2.0, 7.0, 5.0, 11.0, 9.0, 17.0, 17.0, 23.0, 23.0, 36.0, 39.0, 31.0, 49.0, 47.0, 60.0, 56.0, 58.0, 70.0, 55.0, 57.0, 49.0, 45.0, 38.0, 33.0, 39.0, 23.0, 17.0, 26.0, 17.0, 8.0, 13.0, 5.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.109375, -1.079345703125, -1.04931640625, -1.019287109375, -0.9892578125, -0.959228515625, -0.92919921875, -0.899169921875, -0.869140625, -0.839111328125, -0.80908203125, -0.779052734375, -0.7490234375, -0.718994140625, -0.68896484375, -0.658935546875, -0.62890625, -0.598876953125, -0.56884765625, -0.538818359375, -0.5087890625, -0.478759765625, -0.44873046875, -0.418701171875, -0.388671875, -0.358642578125, -0.32861328125, -0.298583984375, -0.2685546875, -0.238525390625, -0.20849609375, -0.178466796875, -0.1484375, -0.118408203125, -0.08837890625, -0.058349609375, -0.0283203125, 0.001708984375, 0.03173828125, 0.061767578125, 0.091796875, 0.121826171875, 0.15185546875, 0.181884765625, 0.2119140625, 0.241943359375, 0.27197265625, 0.302001953125, 0.33203125, 0.362060546875, 0.39208984375, 0.422119140625, 0.4521484375, 0.482177734375, 0.51220703125, 0.542236328125, 0.572265625, 0.602294921875, 0.63232421875, 0.662353515625, 0.6923828125, 0.722412109375, 0.75244140625, 0.782470703125, 0.8125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 5.0, 7.0, 10.0, 16.0, 19.0, 16.0, 26.0, 29.0, 32.0, 42.0, 46.0, 77.0, 107.0, 168.0, 417.0, 2674.0, 64246.0, 957400.0, 20918.0, 1338.0, 334.0, 158.0, 87.0, 74.0, 60.0, 41.0, 40.0, 32.0, 14.0, 17.0, 14.0, 15.0, 9.0, 9.0, 9.0, 13.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.24609375, -2.174468994140625, -2.10284423828125, -2.031219482421875, -1.9595947265625, -1.887969970703125, -1.81634521484375, -1.744720458984375, -1.673095703125, -1.601470947265625, -1.52984619140625, -1.458221435546875, -1.3865966796875, -1.314971923828125, -1.24334716796875, -1.171722412109375, -1.10009765625, -1.028472900390625, -0.95684814453125, -0.885223388671875, -0.8135986328125, -0.741973876953125, -0.67034912109375, -0.598724365234375, -0.527099609375, -0.455474853515625, -0.38385009765625, -0.312225341796875, -0.2406005859375, -0.168975830078125, -0.09735107421875, -0.025726318359375, 0.0458984375, 0.117523193359375, 0.18914794921875, 0.260772705078125, 0.3323974609375, 0.404022216796875, 0.47564697265625, 0.547271728515625, 0.618896484375, 0.690521240234375, 0.76214599609375, 0.833770751953125, 0.9053955078125, 0.977020263671875, 1.04864501953125, 1.120269775390625, 1.19189453125, 1.263519287109375, 1.33514404296875, 1.406768798828125, 1.4783935546875, 1.550018310546875, 1.62164306640625, 1.693267822265625, 1.764892578125, 1.836517333984375, 1.90814208984375, 1.979766845703125, 2.0513916015625, 2.123016357421875, 2.19464111328125, 2.266265869140625, 2.337890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 7.0, 15.0, 11.0, 23.0, 12.0, 19.0, 18.0, 24.0, 23.0, 38.0, 35.0, 28.0, 37.0, 39.0, 39.0, 49.0, 33.0, 52.0, 41.0, 45.0, 51.0, 41.0, 32.0, 32.0, 33.0, 31.0, 24.0, 26.0, 18.0, 15.0, 8.0, 11.0, 13.0, 11.0, 6.0, 6.0, 7.0, 8.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62744140625, -0.6047515869140625, -0.582061767578125, -0.5593719482421875, -0.53668212890625, -0.5139923095703125, -0.491302490234375, -0.4686126708984375, -0.4459228515625, -0.4232330322265625, -0.400543212890625, -0.3778533935546875, -0.35516357421875, -0.3324737548828125, -0.309783935546875, -0.2870941162109375, -0.264404296875, -0.2417144775390625, -0.219024658203125, -0.1963348388671875, -0.17364501953125, -0.1509552001953125, -0.128265380859375, -0.1055755615234375, -0.0828857421875, -0.0601959228515625, -0.037506103515625, -0.0148162841796875, 0.00787353515625, 0.0305633544921875, 0.053253173828125, 0.0759429931640625, 0.0986328125, 0.1213226318359375, 0.144012451171875, 0.1667022705078125, 0.18939208984375, 0.2120819091796875, 0.234771728515625, 0.2574615478515625, 0.2801513671875, 0.3028411865234375, 0.325531005859375, 0.3482208251953125, 0.37091064453125, 0.3936004638671875, 0.416290283203125, 0.4389801025390625, 0.461669921875, 0.4843597412109375, 0.507049560546875, 0.5297393798828125, 0.55242919921875, 0.5751190185546875, 0.597808837890625, 0.6204986572265625, 0.6431884765625, 0.6658782958984375, 0.688568115234375, 0.7112579345703125, 0.73394775390625, 0.7566375732421875, 0.779327392578125, 0.8020172119140625, 0.82470703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 3.0, 10.0, 21.0, 31.0, 38.0, 79.0, 131.0, 278.0, 548.0, 1204.0, 3299.0, 12407.0, 90313.0, 796654.0, 122023.0, 15235.0, 3711.0, 1270.0, 616.0, 287.0, 150.0, 91.0, 49.0, 33.0, 15.0, 9.0, 9.0, 7.0, 6.0, 5.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.328125, -0.3186302185058594, -0.30913543701171875, -0.2996406555175781, -0.2901458740234375, -0.2806510925292969, -0.27115631103515625, -0.2616615295410156, -0.252166748046875, -0.24267196655273438, -0.23317718505859375, -0.22368240356445312, -0.2141876220703125, -0.20469284057617188, -0.19519805908203125, -0.18570327758789062, -0.17620849609375, -0.16671371459960938, -0.15721893310546875, -0.14772415161132812, -0.1382293701171875, -0.12873458862304688, -0.11923980712890625, -0.10974502563476562, -0.100250244140625, -0.09075546264648438, -0.08126068115234375, -0.07176589965820312, -0.0622711181640625, -0.052776336669921875, -0.04328155517578125, -0.033786773681640625, -0.0242919921875, -0.014797210693359375, -0.00530242919921875, 0.004192352294921875, 0.0136871337890625, 0.023181915283203125, 0.03267669677734375, 0.042171478271484375, 0.051666259765625, 0.061161041259765625, 0.07065582275390625, 0.08015060424804688, 0.0896453857421875, 0.09914016723632812, 0.10863494873046875, 0.11812973022460938, 0.12762451171875, 0.13711929321289062, 0.14661407470703125, 0.15610885620117188, 0.1656036376953125, 0.17509841918945312, 0.18459320068359375, 0.19408798217773438, 0.203582763671875, 0.21307754516601562, 0.22257232666015625, 0.23206710815429688, 0.2415618896484375, 0.2510566711425781, 0.26055145263671875, 0.2700462341308594, 0.279541015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 11.0, 14.0, 25.0, 46.0, 73.0, 188.0, 283.0, 158.0, 80.0, 43.0, 33.0, 21.0, 13.0, 6.0, 6.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.955862045288086e-05, -6.759818643331528e-05, -6.56377524137497e-05, -6.367731839418411e-05, -6.171688437461853e-05, -5.975645035505295e-05, -5.7796016335487366e-05, -5.5835582315921783e-05, -5.38751482963562e-05, -5.191471427679062e-05, -4.995428025722504e-05, -4.7993846237659454e-05, -4.603341221809387e-05, -4.407297819852829e-05, -4.211254417896271e-05, -4.0152110159397125e-05, -3.819167613983154e-05, -3.623124212026596e-05, -3.427080810070038e-05, -3.2310374081134796e-05, -3.0349940061569214e-05, -2.838950604200363e-05, -2.642907202243805e-05, -2.4468638002872467e-05, -2.2508203983306885e-05, -2.0547769963741302e-05, -1.858733594417572e-05, -1.6626901924610138e-05, -1.4666467905044556e-05, -1.2706033885478973e-05, -1.0745599865913391e-05, -8.785165846347809e-06, -6.8247318267822266e-06, -4.864297807216644e-06, -2.903863787651062e-06, -9.434297680854797e-07, 1.0170042514801025e-06, 2.977438271045685e-06, 4.937872290611267e-06, 6.898306310176849e-06, 8.858740329742432e-06, 1.0819174349308014e-05, 1.2779608368873596e-05, 1.4740042388439178e-05, 1.670047640800476e-05, 1.8660910427570343e-05, 2.0621344447135925e-05, 2.2581778466701508e-05, 2.454221248626709e-05, 2.6502646505832672e-05, 2.8463080525398254e-05, 3.0423514544963837e-05, 3.238394856452942e-05, 3.4344382584095e-05, 3.6304816603660583e-05, 3.8265250623226166e-05, 4.022568464279175e-05, 4.218611866235733e-05, 4.414655268192291e-05, 4.6106986701488495e-05, 4.806742072105408e-05, 5.002785474061966e-05, 5.198828876018524e-05, 5.3948722779750824e-05, 5.5909156799316406e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 10.0, 20.0, 16.0, 38.0, 63.0, 115.0, 243.0, 489.0, 1150.0, 3799.0, 23596.0, 554629.0, 437965.0, 20652.0, 3642.0, 1095.0, 456.0, 256.0, 117.0, 68.0, 43.0, 30.0, 13.0, 4.0, 6.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.42431640625, -0.4121818542480469, -0.40004730224609375, -0.3879127502441406, -0.3757781982421875, -0.3636436462402344, -0.35150909423828125, -0.3393745422363281, -0.327239990234375, -0.3151054382324219, -0.30297088623046875, -0.2908363342285156, -0.2787017822265625, -0.2665672302246094, -0.25443267822265625, -0.24229812622070312, -0.23016357421875, -0.21802902221679688, -0.20589447021484375, -0.19375991821289062, -0.1816253662109375, -0.16949081420898438, -0.15735626220703125, -0.14522171020507812, -0.133087158203125, -0.12095260620117188, -0.10881805419921875, -0.09668350219726562, -0.0845489501953125, -0.07241439819335938, -0.06027984619140625, -0.048145294189453125, -0.0360107421875, -0.023876190185546875, -0.01174163818359375, 0.000392913818359375, 0.0125274658203125, 0.024662017822265625, 0.03679656982421875, 0.048931121826171875, 0.061065673828125, 0.07320022583007812, 0.08533477783203125, 0.09746932983398438, 0.1096038818359375, 0.12173843383789062, 0.13387298583984375, 0.14600753784179688, 0.15814208984375, 0.17027664184570312, 0.18241119384765625, 0.19454574584960938, 0.2066802978515625, 0.21881484985351562, 0.23094940185546875, 0.24308395385742188, 0.255218505859375, 0.2673530578613281, 0.27948760986328125, 0.2916221618652344, 0.3037567138671875, 0.3158912658691406, 0.32802581787109375, 0.3401603698730469, 0.352294921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 9.0, 5.0, 16.0, 18.0, 28.0, 28.0, 50.0, 54.0, 70.0, 125.0, 121.0, 121.0, 93.0, 67.0, 40.0, 44.0, 29.0, 30.0, 10.0, 6.0, 10.0, 8.0, 6.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.090576171875, -0.0873727798461914, -0.08416938781738281, -0.08096599578857422, -0.07776260375976562, -0.07455921173095703, -0.07135581970214844, -0.06815242767333984, -0.06494903564453125, -0.061745643615722656, -0.05854225158691406, -0.05533885955810547, -0.052135467529296875, -0.04893207550048828, -0.04572868347167969, -0.042525291442871094, -0.0393218994140625, -0.036118507385253906, -0.03291511535644531, -0.02971172332763672, -0.026508331298828125, -0.02330493927001953, -0.020101547241210938, -0.016898155212402344, -0.01369476318359375, -0.010491371154785156, -0.0072879791259765625, -0.004084587097167969, -0.000881195068359375, 0.0023221969604492188, 0.0055255889892578125, 0.008728981018066406, 0.011932373046875, 0.015135765075683594, 0.018339157104492188, 0.02154254913330078, 0.024745941162109375, 0.02794933319091797, 0.031152725219726562, 0.034356117248535156, 0.03755950927734375, 0.040762901306152344, 0.04396629333496094, 0.04716968536376953, 0.050373077392578125, 0.05357646942138672, 0.05677986145019531, 0.059983253479003906, 0.0631866455078125, 0.0663900375366211, 0.06959342956542969, 0.07279682159423828, 0.07600021362304688, 0.07920360565185547, 0.08240699768066406, 0.08561038970947266, 0.08881378173828125, 0.09201717376708984, 0.09522056579589844, 0.09842395782470703, 0.10162734985351562, 0.10483074188232422, 0.10803413391113281, 0.1112375259399414, 0.11444091796875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 23.0, 20.0, 40.0, 68.0, 115.0, 114.0, 169.0, 156.0, 119.0, 60.0, 47.0, 25.0, 20.0, 7.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2506989240646362, -1.1903655529022217, -1.1300321817398071, -1.0696988105773926, -1.009365439414978, -0.9490320682525635, -0.8886986970901489, -0.8283653259277344, -0.7680319547653198, -0.7076985836029053, -0.6473652124404907, -0.5870318412780762, -0.5266984701156616, -0.46636509895324707, -0.4060317277908325, -0.34569835662841797, -0.2853649854660034, -0.22503161430358887, -0.16469824314117432, -0.10436487197875977, -0.044031500816345215, 0.016301870346069336, 0.07663524150848389, 0.13696861267089844, 0.197301983833313, 0.25763535499572754, 0.3179687261581421, 0.37830209732055664, 0.4386354684829712, 0.49896883964538574, 0.5593022108078003, 0.6196355819702148, 0.6799688339233398, 0.7403022050857544, 0.800635576248169, 0.8609689474105835, 0.921302318572998, 0.9816356897354126, 1.0419690608978271, 1.1023024320602417, 1.1626358032226562, 1.2229691743850708, 1.2833025455474854, 1.3436359167099, 1.4039692878723145, 1.464302659034729, 1.5246360301971436, 1.584969401359558, 1.6453027725219727, 1.7056361436843872, 1.7659695148468018, 1.8263028860092163, 1.8866362571716309, 1.9469696283340454, 2.00730299949646, 2.067636489868164, 2.127969741821289, 2.188302993774414, 2.248636484146118, 2.3089699745178223, 2.3693032264709473, 2.4296364784240723, 2.4899699687957764, 2.5503034591674805, 2.6106367111206055]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 3.0, 5.0, 9.0, 8.0, 8.0, 11.0, 13.0, 19.0, 28.0, 25.0, 32.0, 34.0, 36.0, 31.0, 48.0, 42.0, 32.0, 47.0, 48.0, 36.0, 47.0, 43.0, 56.0, 44.0, 47.0, 29.0, 36.0, 27.0, 27.0, 19.0, 21.0, 19.0, 12.0, 13.0, 18.0, 7.0, 4.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.6092500686645508, -1.5667966604232788, -1.5243432521820068, -1.4818898439407349, -1.439436435699463, -1.3969831466674805, -1.354529619216919, -1.3120763301849365, -1.2696229219436646, -1.2271695137023926, -1.1847161054611206, -1.1422626972198486, -1.0998092889785767, -1.0573558807373047, -1.0149025917053223, -0.9724491834640503, -0.9299957156181335, -0.8875423073768616, -0.8450888991355896, -0.8026355504989624, -0.7601821422576904, -0.7177287340164185, -0.6752753257751465, -0.6328219175338745, -0.5903685092926025, -0.5479151010513306, -0.5054616928100586, -0.463008314371109, -0.4205549359321594, -0.37810152769088745, -0.3356481194496155, -0.2931947410106659, -0.2507413625717163, -0.20828796923160553, -0.16583457589149475, -0.12338116765022278, -0.080927774310112, -0.03847438097000122, 0.003979027271270752, 0.04643240571022034, 0.08888581395149231, 0.1313392072916031, 0.17379260063171387, 0.21624600887298584, 0.2586994171142578, 0.3011527955532074, 0.34360620379447937, 0.38605958223342896, 0.4285129904747009, 0.4709663987159729, 0.5134198069572449, 0.5558731555938721, 0.598326563835144, 0.640779972076416, 0.683233380317688, 0.72568678855896, 0.7681401968002319, 0.8105936050415039, 0.8530470132827759, 0.8955004215240479, 0.937953770160675, 0.980407178401947, 1.0228605270385742, 1.0653139352798462, 1.1077673435211182]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 16.0, 26.0, 55.0, 101.0, 420.0, 1819.0, 14191.0, 2519875.0, 1642499.0, 12642.0, 1950.0, 387.0, 140.0, 52.0, 32.0, 21.0, 16.0, 7.0, 5.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.23828125, -3.145660400390625, -3.05303955078125, -2.960418701171875, -2.8677978515625, -2.775177001953125, -2.68255615234375, -2.589935302734375, -2.497314453125, -2.404693603515625, -2.31207275390625, -2.219451904296875, -2.1268310546875, -2.034210205078125, -1.94158935546875, -1.848968505859375, -1.75634765625, -1.663726806640625, -1.57110595703125, -1.478485107421875, -1.3858642578125, -1.293243408203125, -1.20062255859375, -1.108001708984375, -1.015380859375, -0.922760009765625, -0.83013916015625, -0.737518310546875, -0.6448974609375, -0.552276611328125, -0.45965576171875, -0.367034912109375, -0.2744140625, -0.181793212890625, -0.08917236328125, 0.003448486328125, 0.0960693359375, 0.188690185546875, 0.28131103515625, 0.373931884765625, 0.466552734375, 0.559173583984375, 0.65179443359375, 0.744415283203125, 0.8370361328125, 0.929656982421875, 1.02227783203125, 1.114898681640625, 1.20751953125, 1.300140380859375, 1.39276123046875, 1.485382080078125, 1.5780029296875, 1.670623779296875, 1.76324462890625, 1.855865478515625, 1.948486328125, 2.041107177734375, 2.13372802734375, 2.226348876953125, 2.3189697265625, 2.411590576171875, 2.50421142578125, 2.596832275390625, 2.689453125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 13.0, 16.0, 19.0, 21.0, 25.0, 39.0, 50.0, 56.0, 57.0, 55.0, 77.0, 71.0, 65.0, 75.0, 66.0, 59.0, 54.0, 46.0, 36.0, 24.0, 21.0, 9.0, 16.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9677047729492188, -0.9427337646484375, -0.9177627563476562, -0.892791748046875, -0.8678207397460938, -0.8428497314453125, -0.8178787231445312, -0.79290771484375, -0.7679367065429688, -0.7429656982421875, -0.7179946899414062, -0.693023681640625, -0.6680526733398438, -0.6430816650390625, -0.6181106567382812, -0.5931396484375, -0.5681686401367188, -0.5431976318359375, -0.5182266235351562, -0.493255615234375, -0.46828460693359375, -0.4433135986328125, -0.41834259033203125, -0.39337158203125, -0.36840057373046875, -0.3434295654296875, -0.31845855712890625, -0.293487548828125, -0.26851654052734375, -0.2435455322265625, -0.21857452392578125, -0.193603515625, -0.16863250732421875, -0.1436614990234375, -0.11869049072265625, -0.093719482421875, -0.06874847412109375, -0.0437774658203125, -0.01880645751953125, 0.00616455078125, 0.03113555908203125, 0.0561065673828125, 0.08107757568359375, 0.106048583984375, 0.13101959228515625, 0.1559906005859375, 0.18096160888671875, 0.2059326171875, 0.23090362548828125, 0.2558746337890625, 0.28084564208984375, 0.305816650390625, 0.33078765869140625, 0.3557586669921875, 0.38072967529296875, 0.40570068359375, 0.43067169189453125, 0.4556427001953125, 0.48061370849609375, 0.505584716796875, 0.5305557250976562, 0.5555267333984375, 0.5804977416992188, 0.60546875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 13.0, 14.0, 9.0, 22.0, 46.0, 54.0, 84.0, 139.0, 217.0, 415.0, 1017.0, 3731.0, 23063.0, 709918.0, 3399770.0, 47031.0, 5989.0, 1482.0, 557.0, 258.0, 149.0, 86.0, 65.0, 36.0, 28.0, 22.0, 16.0, 12.0, 10.0, 2.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4306640625, -1.384735107421875, -1.33880615234375, -1.292877197265625, -1.2469482421875, -1.201019287109375, -1.15509033203125, -1.109161376953125, -1.063232421875, -1.017303466796875, -0.97137451171875, -0.925445556640625, -0.8795166015625, -0.833587646484375, -0.78765869140625, -0.741729736328125, -0.69580078125, -0.649871826171875, -0.60394287109375, -0.558013916015625, -0.5120849609375, -0.466156005859375, -0.42022705078125, -0.374298095703125, -0.328369140625, -0.282440185546875, -0.23651123046875, -0.190582275390625, -0.1446533203125, -0.098724365234375, -0.05279541015625, -0.006866455078125, 0.0390625, 0.084991455078125, 0.13092041015625, 0.176849365234375, 0.2227783203125, 0.268707275390625, 0.31463623046875, 0.360565185546875, 0.406494140625, 0.452423095703125, 0.49835205078125, 0.544281005859375, 0.5902099609375, 0.636138916015625, 0.68206787109375, 0.727996826171875, 0.77392578125, 0.819854736328125, 0.86578369140625, 0.911712646484375, 0.9576416015625, 1.003570556640625, 1.04949951171875, 1.095428466796875, 1.141357421875, 1.187286376953125, 1.23321533203125, 1.279144287109375, 1.3250732421875, 1.371002197265625, 1.41693115234375, 1.462860107421875, 1.5087890625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 6.0, 7.0, 12.0, 19.0, 28.0, 39.0, 82.0, 139.0, 285.0, 633.0, 1189.0, 876.0, 345.0, 169.0, 95.0, 49.0, 43.0, 19.0, 19.0, 8.0, 10.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.415283203125, -0.4029541015625, -0.390625, -0.3782958984375, -0.365966796875, -0.3536376953125, -0.34130859375, -0.3289794921875, -0.316650390625, -0.3043212890625, -0.2919921875, -0.2796630859375, -0.267333984375, -0.2550048828125, -0.24267578125, -0.2303466796875, -0.218017578125, -0.2056884765625, -0.193359375, -0.1810302734375, -0.168701171875, -0.1563720703125, -0.14404296875, -0.1317138671875, -0.119384765625, -0.1070556640625, -0.0947265625, -0.0823974609375, -0.070068359375, -0.0577392578125, -0.04541015625, -0.0330810546875, -0.020751953125, -0.0084228515625, 0.00390625, 0.0162353515625, 0.028564453125, 0.0408935546875, 0.05322265625, 0.0655517578125, 0.077880859375, 0.0902099609375, 0.1025390625, 0.1148681640625, 0.127197265625, 0.1395263671875, 0.15185546875, 0.1641845703125, 0.176513671875, 0.1888427734375, 0.201171875, 0.2135009765625, 0.225830078125, 0.2381591796875, 0.25048828125, 0.2628173828125, 0.275146484375, 0.2874755859375, 0.2998046875, 0.3121337890625, 0.324462890625, 0.3367919921875, 0.34912109375, 0.3614501953125, 0.373779296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 12.0, 18.0, 38.0, 51.0, 86.0, 146.0, 183.0, 194.0, 126.0, 67.0, 34.0, 22.0, 13.0, 6.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7321183681488037, -0.6793529391288757, -0.6265875101089478, -0.573822021484375, -0.5210566520690918, -0.46829119324684143, -0.41552573442459106, -0.3627603054046631, -0.3099948763847351, -0.25722944736480713, -0.20446400344371796, -0.15169855952262878, -0.0989331305027008, -0.04616770148277283, 0.006597757339477539, 0.05936318635940552, 0.1121286153793335, 0.16489404439926147, 0.21765948832035065, 0.2704249322414398, 0.3231903612613678, 0.3759557902812958, 0.42872124910354614, 0.4814866781234741, 0.5342521071434021, 0.5870175361633301, 0.6397829651832581, 0.692548394203186, 0.7453138828277588, 0.798079252243042, 0.8508447408676147, 0.9036101698875427, 0.9563755989074707, 1.0091410875320435, 1.0619064569473267, 1.1146719455718994, 1.1674373149871826, 1.2202028036117554, 1.2729682922363281, 1.3257336616516113, 1.3784990310668945, 1.4312645196914673, 1.4840298891067505, 1.5367953777313232, 1.5895607471466064, 1.6423262357711792, 1.695091724395752, 1.7478570938110352, 1.800622582435608, 1.8533880710601807, 1.9061534404754639, 1.9589189291000366, 2.0116844177246094, 2.0644497871398926, 2.117215156555176, 2.169980525970459, 2.2227461338043213, 2.2755115032196045, 2.328277111053467, 2.38104248046875, 2.433807849884033, 2.4865732192993164, 2.5393388271331787, 2.592104196548462, 2.644869565963745]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 9.0, 7.0, 18.0, 25.0, 28.0, 26.0, 33.0, 37.0, 49.0, 52.0, 53.0, 57.0, 64.0, 58.0, 74.0, 60.0, 49.0, 40.0, 42.0, 33.0, 39.0, 34.0, 26.0, 21.0, 15.0, 6.0, 10.0, 6.0, 8.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7617505788803101, -0.7377254366874695, -0.7137002944946289, -0.6896751523017883, -0.6656500101089478, -0.6416248679161072, -0.6175997257232666, -0.593574583530426, -0.5695494413375854, -0.5455242991447449, -0.5214991569519043, -0.4974740147590637, -0.47344887256622314, -0.44942373037338257, -0.425398588180542, -0.4013734459877014, -0.37734827399253845, -0.3533231317996979, -0.3292979896068573, -0.3052728474140167, -0.28124770522117615, -0.25722256302833557, -0.2331974059343338, -0.20917226374149323, -0.18514712154865265, -0.16112197935581207, -0.1370968371629715, -0.11307168751955032, -0.08904654532670975, -0.06502140313386917, -0.040996253490448, -0.016971111297607422, 0.007054030895233154, 0.03107917495071888, 0.055104319006204605, 0.07912946492433548, 0.10315460711717606, 0.12717974185943604, 0.1512048989534378, 0.17523004114627838, 0.19925518333911896, 0.22328032553195953, 0.2473054677248001, 0.2713306248188019, 0.29535576701164246, 0.31938090920448303, 0.3434060513973236, 0.3674311935901642, 0.39145633578300476, 0.41548147797584534, 0.4395066201686859, 0.4635317623615265, 0.48755690455436707, 0.51158207654953, 0.5356072187423706, 0.5596323609352112, 0.5836575031280518, 0.6076826453208923, 0.6317077875137329, 0.6557329297065735, 0.6797580718994141, 0.7037832140922546, 0.7278083562850952, 0.7518334984779358, 0.7758586406707764]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 9.0, 11.0, 17.0, 21.0, 48.0, 55.0, 116.0, 311.0, 809.0, 3065.0, 18656.0, 187226.0, 722733.0, 100777.0, 11403.0, 2185.0, 658.0, 204.0, 111.0, 43.0, 35.0, 25.0, 13.0, 7.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2357177734375, -0.22741127014160156, -0.21910476684570312, -0.2107982635498047, -0.20249176025390625, -0.1941852569580078, -0.18587875366210938, -0.17757225036621094, -0.1692657470703125, -0.16095924377441406, -0.15265274047851562, -0.1443462371826172, -0.13603973388671875, -0.1277332305908203, -0.11942672729492188, -0.11112022399902344, -0.102813720703125, -0.09450721740722656, -0.08620071411132812, -0.07789421081542969, -0.06958770751953125, -0.06128120422363281, -0.052974700927734375, -0.04466819763183594, -0.0363616943359375, -0.028055191040039062, -0.019748687744140625, -0.011442184448242188, -0.00313568115234375, 0.0051708221435546875, 0.013477325439453125, 0.021783828735351562, 0.03009033203125, 0.03839683532714844, 0.046703338623046875, 0.05500984191894531, 0.06331634521484375, 0.07162284851074219, 0.07992935180664062, 0.08823585510253906, 0.0965423583984375, 0.10484886169433594, 0.11315536499023438, 0.12146186828613281, 0.12976837158203125, 0.1380748748779297, 0.14638137817382812, 0.15468788146972656, 0.162994384765625, 0.17130088806152344, 0.17960739135742188, 0.1879138946533203, 0.19622039794921875, 0.2045269012451172, 0.21283340454101562, 0.22113990783691406, 0.2294464111328125, 0.23775291442871094, 0.24605941772460938, 0.2543659210205078, 0.26267242431640625, 0.2709789276123047, 0.2792854309082031, 0.28759193420410156, 0.2958984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 9.0, 16.0, 11.0, 24.0, 36.0, 48.0, 60.0, 73.0, 84.0, 96.0, 102.0, 93.0, 79.0, 70.0, 47.0, 42.0, 48.0, 29.0, 11.0, 9.0, 8.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91552734375, -0.8916854858398438, -0.8678436279296875, -0.8440017700195312, -0.820159912109375, -0.7963180541992188, -0.7724761962890625, -0.7486343383789062, -0.72479248046875, -0.7009506225585938, -0.6771087646484375, -0.6532669067382812, -0.629425048828125, -0.6055831909179688, -0.5817413330078125, -0.5578994750976562, -0.5340576171875, -0.5102157592773438, -0.4863739013671875, -0.46253204345703125, -0.438690185546875, -0.41484832763671875, -0.3910064697265625, -0.36716461181640625, -0.34332275390625, -0.31948089599609375, -0.2956390380859375, -0.27179718017578125, -0.247955322265625, -0.22411346435546875, -0.2002716064453125, -0.17642974853515625, -0.152587890625, -0.12874603271484375, -0.1049041748046875, -0.08106231689453125, -0.057220458984375, -0.03337860107421875, -0.0095367431640625, 0.01430511474609375, 0.03814697265625, 0.06198883056640625, 0.0858306884765625, 0.10967254638671875, 0.133514404296875, 0.15735626220703125, 0.1811981201171875, 0.20503997802734375, 0.2288818359375, 0.25272369384765625, 0.2765655517578125, 0.30040740966796875, 0.324249267578125, 0.34809112548828125, 0.3719329833984375, 0.39577484130859375, 0.41961669921875, 0.44345855712890625, 0.4673004150390625, 0.49114227294921875, 0.514984130859375, 0.5388259887695312, 0.5626678466796875, 0.5865097045898438, 0.6103515625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 10.0, 13.0, 24.0, 35.0, 61.0, 128.0, 184.0, 299.0, 680.0, 1417.0, 3947.0, 13169.0, 55323.0, 274765.0, 516057.0, 141012.0, 29207.0, 7497.0, 2489.0, 1085.0, 478.0, 273.0, 143.0, 89.0, 49.0, 29.0, 29.0, 15.0, 10.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.193603515625, -0.18854713439941406, -0.18349075317382812, -0.1784343719482422, -0.17337799072265625, -0.1683216094970703, -0.16326522827148438, -0.15820884704589844, -0.1531524658203125, -0.14809608459472656, -0.14303970336914062, -0.1379833221435547, -0.13292694091796875, -0.1278705596923828, -0.12281417846679688, -0.11775779724121094, -0.112701416015625, -0.10764503479003906, -0.10258865356445312, -0.09753227233886719, -0.09247589111328125, -0.08741950988769531, -0.08236312866210938, -0.07730674743652344, -0.0722503662109375, -0.06719398498535156, -0.062137603759765625, -0.05708122253417969, -0.05202484130859375, -0.04696846008300781, -0.041912078857421875, -0.03685569763183594, -0.03179931640625, -0.026742935180664062, -0.021686553955078125, -0.016630172729492188, -0.01157379150390625, -0.0065174102783203125, -0.001461029052734375, 0.0035953521728515625, 0.0086517333984375, 0.013708114624023438, 0.018764495849609375, 0.023820877075195312, 0.02887725830078125, 0.03393363952636719, 0.038990020751953125, 0.04404640197753906, 0.049102783203125, 0.05415916442871094, 0.059215545654296875, 0.06427192687988281, 0.06932830810546875, 0.07438468933105469, 0.07944107055664062, 0.08449745178222656, 0.0895538330078125, 0.09461021423339844, 0.09966659545898438, 0.10472297668457031, 0.10977935791015625, 0.11483573913574219, 0.11989212036132812, 0.12494850158691406, 0.1300048828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 2.0, 10.0, 9.0, 6.0, 12.0, 17.0, 18.0, 27.0, 24.0, 23.0, 25.0, 17.0, 34.0, 36.0, 40.0, 43.0, 37.0, 45.0, 60.0, 45.0, 45.0, 58.0, 54.0, 47.0, 37.0, 28.0, 26.0, 37.0, 21.0, 25.0, 21.0, 19.0, 10.0, 9.0, 11.0, 10.0, 2.0, 1.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65283203125, -0.6292190551757812, -0.6056060791015625, -0.5819931030273438, -0.558380126953125, -0.5347671508789062, -0.5111541748046875, -0.48754119873046875, -0.46392822265625, -0.44031524658203125, -0.4167022705078125, -0.39308929443359375, -0.369476318359375, -0.34586334228515625, -0.3222503662109375, -0.29863739013671875, -0.2750244140625, -0.25141143798828125, -0.2277984619140625, -0.20418548583984375, -0.180572509765625, -0.15695953369140625, -0.1333465576171875, -0.10973358154296875, -0.08612060546875, -0.06250762939453125, -0.0388946533203125, -0.01528167724609375, 0.008331298828125, 0.03194427490234375, 0.0555572509765625, 0.07917022705078125, 0.102783203125, 0.12639617919921875, 0.1500091552734375, 0.17362213134765625, 0.197235107421875, 0.22084808349609375, 0.2444610595703125, 0.26807403564453125, 0.29168701171875, 0.31529998779296875, 0.3389129638671875, 0.36252593994140625, 0.386138916015625, 0.40975189208984375, 0.4333648681640625, 0.45697784423828125, 0.4805908203125, 0.5042037963867188, 0.5278167724609375, 0.5514297485351562, 0.575042724609375, 0.5986557006835938, 0.6222686767578125, 0.6458816528320312, 0.66949462890625, 0.6931076049804688, 0.7167205810546875, 0.7403335571289062, 0.763946533203125, 0.7875595092773438, 0.8111724853515625, 0.8347854614257812, 0.8583984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 6.0, 7.0, 10.0, 13.0, 23.0, 38.0, 67.0, 118.0, 160.0, 310.0, 544.0, 1059.0, 2104.0, 5011.0, 13291.0, 42873.0, 167786.0, 484776.0, 241581.0, 59449.0, 17571.0, 6420.0, 2629.0, 1254.0, 624.0, 307.0, 183.0, 119.0, 61.0, 43.0, 33.0, 27.0, 13.0, 7.0, 9.0, 8.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.035247802734375, -0.03401660919189453, -0.03278541564941406, -0.031554222106933594, -0.030323028564453125, -0.029091835021972656, -0.027860641479492188, -0.02662944793701172, -0.02539825439453125, -0.02416706085205078, -0.022935867309570312, -0.021704673767089844, -0.020473480224609375, -0.019242286682128906, -0.018011093139648438, -0.01677989959716797, -0.0155487060546875, -0.014317512512207031, -0.013086318969726562, -0.011855125427246094, -0.010623931884765625, -0.009392738342285156, -0.008161544799804688, -0.006930351257324219, -0.00569915771484375, -0.004467964172363281, -0.0032367706298828125, -0.0020055770874023438, -0.000774383544921875, 0.00045680999755859375, 0.0016880035400390625, 0.0029191970825195312, 0.004150390625, 0.005381584167480469, 0.0066127777099609375, 0.007843971252441406, 0.009075164794921875, 0.010306358337402344, 0.011537551879882812, 0.012768745422363281, 0.01399993896484375, 0.015231132507324219, 0.016462326049804688, 0.017693519592285156, 0.018924713134765625, 0.020155906677246094, 0.021387100219726562, 0.02261829376220703, 0.0238494873046875, 0.02508068084716797, 0.026311874389648438, 0.027543067932128906, 0.028774261474609375, 0.030005455017089844, 0.031236648559570312, 0.03246784210205078, 0.03369903564453125, 0.03493022918701172, 0.03616142272949219, 0.037392616271972656, 0.038623809814453125, 0.039855003356933594, 0.04108619689941406, 0.04231739044189453, 0.043548583984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 9.0, 5.0, 10.0, 11.0, 14.0, 12.0, 29.0, 29.0, 43.0, 44.0, 60.0, 71.0, 79.0, 80.0, 85.0, 89.0, 67.0, 64.0, 41.0, 33.0, 27.0, 15.0, 16.0, 6.0, 13.0, 7.0, 8.0, 1.0, 7.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9729137420654297e-05, -1.9126571714878082e-05, -1.8524006009101868e-05, -1.7921440303325653e-05, -1.731887459754944e-05, -1.6716308891773224e-05, -1.611374318599701e-05, -1.5511177480220795e-05, -1.490861177444458e-05, -1.4306046068668365e-05, -1.3703480362892151e-05, -1.3100914657115936e-05, -1.2498348951339722e-05, -1.1895783245563507e-05, -1.1293217539787292e-05, -1.0690651834011078e-05, -1.0088086128234863e-05, -9.485520422458649e-06, -8.882954716682434e-06, -8.28038901090622e-06, -7.677823305130005e-06, -7.07525759935379e-06, -6.472691893577576e-06, -5.870126187801361e-06, -5.2675604820251465e-06, -4.664994776248932e-06, -4.062429070472717e-06, -3.4598633646965027e-06, -2.857297658920288e-06, -2.2547319531440735e-06, -1.6521662473678589e-06, -1.0496005415916443e-06, -4.470348358154297e-07, 1.555308699607849e-07, 7.580965757369995e-07, 1.3606622815132141e-06, 1.9632279872894287e-06, 2.5657936930656433e-06, 3.168359398841858e-06, 3.7709251046180725e-06, 4.373490810394287e-06, 4.976056516170502e-06, 5.578622221946716e-06, 6.181187927722931e-06, 6.7837536334991455e-06, 7.38631933927536e-06, 7.988885045051575e-06, 8.59145075082779e-06, 9.194016456604004e-06, 9.796582162380219e-06, 1.0399147868156433e-05, 1.1001713573932648e-05, 1.1604279279708862e-05, 1.2206844985485077e-05, 1.2809410691261292e-05, 1.3411976397037506e-05, 1.401454210281372e-05, 1.4617107808589935e-05, 1.521967351436615e-05, 1.5822239220142365e-05, 1.642480492591858e-05, 1.7027370631694794e-05, 1.7629936337471008e-05, 1.8232502043247223e-05, 1.8835067749023438e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 9.0, 11.0, 18.0, 9.0, 20.0, 26.0, 37.0, 76.0, 109.0, 157.0, 315.0, 661.0, 1418.0, 3677.0, 10345.0, 33034.0, 122139.0, 414254.0, 334197.0, 89139.0, 25420.0, 8067.0, 2901.0, 1216.0, 576.0, 297.0, 153.0, 92.0, 59.0, 40.0, 32.0, 18.0, 8.0, 12.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037994384765625, -0.03676414489746094, -0.035533905029296875, -0.03430366516113281, -0.03307342529296875, -0.03184318542480469, -0.030612945556640625, -0.029382705688476562, -0.0281524658203125, -0.026922225952148438, -0.025691986083984375, -0.024461746215820312, -0.02323150634765625, -0.022001266479492188, -0.020771026611328125, -0.019540786743164062, -0.018310546875, -0.017080307006835938, -0.015850067138671875, -0.014619827270507812, -0.01338958740234375, -0.012159347534179688, -0.010929107666015625, -0.009698867797851562, -0.0084686279296875, -0.0072383880615234375, -0.006008148193359375, -0.0047779083251953125, -0.00354766845703125, -0.0023174285888671875, -0.001087188720703125, 0.0001430511474609375, 0.001373291015625, 0.0026035308837890625, 0.003833770751953125, 0.0050640106201171875, 0.00629425048828125, 0.0075244903564453125, 0.008754730224609375, 0.009984970092773438, 0.0112152099609375, 0.012445449829101562, 0.013675689697265625, 0.014905929565429688, 0.01613616943359375, 0.017366409301757812, 0.018596649169921875, 0.019826889038085938, 0.02105712890625, 0.022287368774414062, 0.023517608642578125, 0.024747848510742188, 0.02597808837890625, 0.027208328247070312, 0.028438568115234375, 0.029668807983398438, 0.0308990478515625, 0.03212928771972656, 0.033359527587890625, 0.03458976745605469, 0.03582000732421875, 0.03705024719238281, 0.038280487060546875, 0.03951072692871094, 0.040740966796875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 4.0, 12.0, 9.0, 14.0, 12.0, 13.0, 20.0, 25.0, 22.0, 24.0, 28.0, 41.0, 40.0, 32.0, 52.0, 45.0, 54.0, 57.0, 46.0, 54.0, 50.0, 39.0, 38.0, 36.0, 30.0, 34.0, 19.0, 35.0, 18.0, 22.0, 12.0, 6.0, 8.0, 8.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005889892578125, -0.0056498050689697266, -0.005409717559814453, -0.00516963005065918, -0.004929542541503906, -0.004689455032348633, -0.004449367523193359, -0.004209280014038086, -0.0039691925048828125, -0.003729104995727539, -0.0034890174865722656, -0.003248929977416992, -0.0030088424682617188, -0.0027687549591064453, -0.002528667449951172, -0.0022885799407958984, -0.002048492431640625, -0.0018084049224853516, -0.0015683174133300781, -0.0013282299041748047, -0.0010881423950195312, -0.0008480548858642578, -0.0006079673767089844, -0.00036787986755371094, -0.0001277923583984375, 0.00011229515075683594, 0.0003523826599121094, 0.0005924701690673828, 0.0008325576782226562, 0.0010726451873779297, 0.0013127326965332031, 0.0015528202056884766, 0.00179290771484375, 0.0020329952239990234, 0.002273082733154297, 0.0025131702423095703, 0.0027532577514648438, 0.002993345260620117, 0.0032334327697753906, 0.003473520278930664, 0.0037136077880859375, 0.003953695297241211, 0.004193782806396484, 0.004433870315551758, 0.004673957824707031, 0.004914045333862305, 0.005154132843017578, 0.0053942203521728516, 0.005634307861328125, 0.0058743953704833984, 0.006114482879638672, 0.006354570388793945, 0.006594657897949219, 0.006834745407104492, 0.007074832916259766, 0.007314920425415039, 0.0075550079345703125, 0.007795095443725586, 0.00803518295288086, 0.008275270462036133, 0.008515357971191406, 0.00875544548034668, 0.008995532989501953, 0.009235620498657227, 0.0094757080078125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 7.0, 9.0, 136.0, 629.0, 209.0, 23.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.817451536655426, -0.6943567991256714, -0.5712620615959167, -0.4481672942638397, -0.3250725567340851, -0.20197778940200806, -0.07888305187225342, 0.04421168565750122, 0.16730642318725586, 0.2904011607170105, 0.41349589824676514, 0.5365906953811646, 0.6596853733062744, 0.7827801704406738, 0.9058749079704285, 1.028969645500183, 1.152064323425293, 1.2751591205596924, 1.3982537984848022, 1.5213485956192017, 1.6444432735443115, 1.767538070678711, 1.8906328678131104, 2.0137276649475098, 2.13682222366333, 2.2599170207977295, 2.383011817932129, 2.506106376647949, 2.6292011737823486, 2.752295970916748, 2.8753907680511475, 2.998485565185547, 3.1215803623199463, 3.2446751594543457, 3.367769956588745, 3.4908645153045654, 3.613959312438965, 3.7370541095733643, 3.8601489067077637, 3.983243465423584, 4.1063385009765625, 4.229433059692383, 4.352528095245361, 4.475622653961182, 4.59871768951416, 4.7218122482299805, 4.844906806945801, 4.968001842498779, 5.0910964012146, 5.21419095993042, 5.337285995483398, 5.460380554199219, 5.583475589752197, 5.706570148468018, 5.829664707183838, 5.952759742736816, 6.075854301452637, 6.198948860168457, 6.3220438957214355, 6.445138454437256, 6.568233489990234, 6.691328048706055, 6.814422607421875, 6.9375176429748535, 7.060612201690674]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 10.0, 8.0, 14.0, 13.0, 29.0, 34.0, 46.0, 45.0, 70.0, 59.0, 84.0, 87.0, 95.0, 76.0, 65.0, 59.0, 52.0, 56.0, 37.0, 22.0, 13.0, 12.0, 6.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7214376330375671, -0.700748860836029, -0.6800601482391357, -0.6593713760375977, -0.6386826038360596, -0.6179938912391663, -0.5973051190376282, -0.5766164064407349, -0.5559276342391968, -0.5352388620376587, -0.5145501494407654, -0.4938613772392273, -0.4731726348400116, -0.4524838924407959, -0.4317951202392578, -0.4111063778400421, -0.3904176354408264, -0.3697288930416107, -0.349040150642395, -0.32835137844085693, -0.30766263604164124, -0.28697389364242554, -0.26628512144088745, -0.24559637904167175, -0.22490763664245605, -0.20421889424324036, -0.18353013694286346, -0.16284137964248657, -0.14215263724327087, -0.12146388739347458, -0.10077513754367828, -0.08008638024330139, -0.05939757823944092, -0.03870882838964462, -0.018020078539848328, 0.0026686713099479675, 0.023357421159744263, 0.04404617100954056, 0.06473492085933685, 0.08542367815971375, 0.10611242055892944, 0.12680116295814514, 0.14748992025852203, 0.16817867755889893, 0.18886741995811462, 0.20955616235733032, 0.23024491965770721, 0.2509336769580841, 0.2716224193572998, 0.2923111617565155, 0.3129999041557312, 0.3336886763572693, 0.354377418756485, 0.3750661611557007, 0.39575493335723877, 0.41644367575645447, 0.43713241815567017, 0.45782116055488586, 0.47850990295410156, 0.49919867515563965, 0.5198874473571777, 0.540576159954071, 0.5612649321556091, 0.5819536447525024, 0.6026424169540405]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 6.0, 8.0, 9.0, 23.0, 40.0, 40.0, 62.0, 115.0, 154.0, 305.0, 537.0, 1043.0, 2063.0, 4408.0, 10267.0, 28611.0, 105765.0, 467628.0, 322866.0, 69141.0, 20541.0, 7810.0, 3511.0, 1611.0, 862.0, 468.0, 268.0, 141.0, 84.0, 49.0, 40.0, 26.0, 17.0, 8.0, 8.0, 4.0, 0.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5224609375, -0.5060577392578125, -0.489654541015625, -0.4732513427734375, -0.45684814453125, -0.4404449462890625, -0.424041748046875, -0.4076385498046875, -0.3912353515625, -0.3748321533203125, -0.358428955078125, -0.3420257568359375, -0.32562255859375, -0.3092193603515625, -0.292816162109375, -0.2764129638671875, -0.260009765625, -0.2436065673828125, -0.227203369140625, -0.2108001708984375, -0.19439697265625, -0.1779937744140625, -0.161590576171875, -0.1451873779296875, -0.1287841796875, -0.1123809814453125, -0.095977783203125, -0.0795745849609375, -0.06317138671875, -0.0467681884765625, -0.030364990234375, -0.0139617919921875, 0.00244140625, 0.0188446044921875, 0.035247802734375, 0.0516510009765625, 0.06805419921875, 0.0844573974609375, 0.100860595703125, 0.1172637939453125, 0.1336669921875, 0.1500701904296875, 0.166473388671875, 0.1828765869140625, 0.19927978515625, 0.2156829833984375, 0.232086181640625, 0.2484893798828125, 0.264892578125, 0.2812957763671875, 0.297698974609375, 0.3141021728515625, 0.33050537109375, 0.3469085693359375, 0.363311767578125, 0.3797149658203125, 0.3961181640625, 0.4125213623046875, 0.428924560546875, 0.4453277587890625, 0.46173095703125, 0.4781341552734375, 0.494537353515625, 0.5109405517578125, 0.52734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 14.0, 10.0, 12.0, 15.0, 24.0, 22.0, 25.0, 23.0, 36.0, 36.0, 41.0, 45.0, 52.0, 57.0, 57.0, 47.0, 61.0, 45.0, 46.0, 41.0, 40.0, 36.0, 28.0, 32.0, 30.0, 26.0, 21.0, 15.0, 18.0, 3.0, 6.0, 6.0, 4.0, 4.0, 2.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.6639404296875, -0.641357421875, -0.6187744140625, -0.59619140625, -0.5736083984375, -0.551025390625, -0.5284423828125, -0.505859375, -0.4832763671875, -0.460693359375, -0.4381103515625, -0.41552734375, -0.3929443359375, -0.370361328125, -0.3477783203125, -0.3251953125, -0.3026123046875, -0.280029296875, -0.2574462890625, -0.23486328125, -0.2122802734375, -0.189697265625, -0.1671142578125, -0.14453125, -0.1219482421875, -0.099365234375, -0.0767822265625, -0.05419921875, -0.0316162109375, -0.009033203125, 0.0135498046875, 0.0361328125, 0.0587158203125, 0.081298828125, 0.1038818359375, 0.12646484375, 0.1490478515625, 0.171630859375, 0.1942138671875, 0.216796875, 0.2393798828125, 0.261962890625, 0.2845458984375, 0.30712890625, 0.3297119140625, 0.352294921875, 0.3748779296875, 0.3974609375, 0.4200439453125, 0.442626953125, 0.4652099609375, 0.48779296875, 0.5103759765625, 0.532958984375, 0.5555419921875, 0.578125, 0.6007080078125, 0.623291015625, 0.6458740234375, 0.66845703125, 0.6910400390625, 0.713623046875, 0.7362060546875, 0.7587890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 11.0, 7.0, 17.0, 19.0, 31.0, 27.0, 42.0, 51.0, 57.0, 75.0, 108.0, 149.0, 210.0, 369.0, 798.0, 2357.0, 9494.0, 72195.0, 810344.0, 132982.0, 13752.0, 3160.0, 997.0, 421.0, 228.0, 161.0, 112.0, 81.0, 68.0, 47.0, 37.0, 25.0, 30.0, 20.0, 19.0, 11.0, 8.0, 9.0, 9.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.9958267211914062, -0.9652862548828125, -0.9347457885742188, -0.904205322265625, -0.8736648559570312, -0.8431243896484375, -0.8125839233398438, -0.78204345703125, -0.7515029907226562, -0.7209625244140625, -0.6904220581054688, -0.659881591796875, -0.6293411254882812, -0.5988006591796875, -0.5682601928710938, -0.5377197265625, -0.5071792602539062, -0.4766387939453125, -0.44609832763671875, -0.415557861328125, -0.38501739501953125, -0.3544769287109375, -0.32393646240234375, -0.29339599609375, -0.26285552978515625, -0.2323150634765625, -0.20177459716796875, -0.171234130859375, -0.14069366455078125, -0.1101531982421875, -0.07961273193359375, -0.049072265625, -0.01853179931640625, 0.0120086669921875, 0.04254913330078125, 0.073089599609375, 0.10363006591796875, 0.1341705322265625, 0.16471099853515625, 0.19525146484375, 0.22579193115234375, 0.2563323974609375, 0.28687286376953125, 0.317413330078125, 0.34795379638671875, 0.3784942626953125, 0.40903472900390625, 0.4395751953125, 0.47011566162109375, 0.5006561279296875, 0.5311965942382812, 0.561737060546875, 0.5922775268554688, 0.6228179931640625, 0.6533584594726562, 0.68389892578125, 0.7144393920898438, 0.7449798583984375, 0.7755203247070312, 0.806060791015625, 0.8366012573242188, 0.8671417236328125, 0.8976821899414062, 0.92822265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 10.0, 21.0, 15.0, 14.0, 16.0, 31.0, 21.0, 24.0, 22.0, 27.0, 30.0, 31.0, 43.0, 42.0, 45.0, 39.0, 38.0, 38.0, 33.0, 36.0, 39.0, 32.0, 35.0, 43.0, 39.0, 34.0, 27.0, 19.0, 21.0, 19.0, 22.0, 13.0, 11.0, 11.0, 10.0, 9.0, 13.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.6552734375, -0.6362380981445312, -0.6172027587890625, -0.5981674194335938, -0.579132080078125, -0.5600967407226562, -0.5410614013671875, -0.5220260620117188, -0.50299072265625, -0.48395538330078125, -0.4649200439453125, -0.44588470458984375, -0.426849365234375, -0.40781402587890625, -0.3887786865234375, -0.36974334716796875, -0.3507080078125, -0.33167266845703125, -0.3126373291015625, -0.29360198974609375, -0.274566650390625, -0.25553131103515625, -0.2364959716796875, -0.21746063232421875, -0.19842529296875, -0.17938995361328125, -0.1603546142578125, -0.14131927490234375, -0.122283935546875, -0.10324859619140625, -0.0842132568359375, -0.06517791748046875, -0.046142578125, -0.02710723876953125, -0.0080718994140625, 0.01096343994140625, 0.029998779296875, 0.04903411865234375, 0.0680694580078125, 0.08710479736328125, 0.10614013671875, 0.12517547607421875, 0.1442108154296875, 0.16324615478515625, 0.182281494140625, 0.20131683349609375, 0.2203521728515625, 0.23938751220703125, 0.2584228515625, 0.27745819091796875, 0.2964935302734375, 0.31552886962890625, 0.334564208984375, 0.35359954833984375, 0.3726348876953125, 0.39167022705078125, 0.41070556640625, 0.42974090576171875, 0.4487762451171875, 0.46781158447265625, 0.486846923828125, 0.5058822631835938, 0.5249176025390625, 0.5439529418945312, 0.56298828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 8.0, 7.0, 16.0, 22.0, 40.0, 74.0, 160.0, 326.0, 748.0, 2194.0, 9248.0, 89825.0, 883259.0, 52675.0, 6923.0, 1837.0, 613.0, 272.0, 148.0, 75.0, 35.0, 22.0, 13.0, 9.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5634765625, -0.5495338439941406, -0.5355911254882812, -0.5216484069824219, -0.5077056884765625, -0.4937629699707031, -0.47982025146484375, -0.4658775329589844, -0.451934814453125, -0.4379920959472656, -0.42404937744140625, -0.4101066589355469, -0.3961639404296875, -0.3822212219238281, -0.36827850341796875, -0.3543357849121094, -0.34039306640625, -0.3264503479003906, -0.31250762939453125, -0.2985649108886719, -0.2846221923828125, -0.2706794738769531, -0.25673675537109375, -0.24279403686523438, -0.228851318359375, -0.21490859985351562, -0.20096588134765625, -0.18702316284179688, -0.1730804443359375, -0.15913772583007812, -0.14519500732421875, -0.13125228881835938, -0.1173095703125, -0.10336685180664062, -0.08942413330078125, -0.07548141479492188, -0.0615386962890625, -0.047595977783203125, -0.03365325927734375, -0.019710540771484375, -0.005767822265625, 0.008174896240234375, 0.02211761474609375, 0.036060333251953125, 0.0500030517578125, 0.06394577026367188, 0.07788848876953125, 0.09183120727539062, 0.10577392578125, 0.11971664428710938, 0.13365936279296875, 0.14760208129882812, 0.1615447998046875, 0.17548751831054688, 0.18943023681640625, 0.20337295532226562, 0.217315673828125, 0.23125839233398438, 0.24520111083984375, 0.2591438293457031, 0.2730865478515625, 0.2870292663574219, 0.30097198486328125, 0.3149147033691406, 0.328857421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 16.0, 26.0, 49.0, 80.0, 183.0, 245.0, 209.0, 85.0, 47.0, 10.0, 15.0, 4.0, 7.0, 8.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8995018005371094e-05, -4.672631621360779e-05, -4.445761442184448e-05, -4.218891263008118e-05, -3.992021083831787e-05, -3.7651509046554565e-05, -3.538280725479126e-05, -3.3114105463027954e-05, -3.084540367126465e-05, -2.8576701879501343e-05, -2.6308000087738037e-05, -2.403929829597473e-05, -2.1770596504211426e-05, -1.950189471244812e-05, -1.7233192920684814e-05, -1.4964491128921509e-05, -1.2695789337158203e-05, -1.0427087545394897e-05, -8.158385753631592e-06, -5.889683961868286e-06, -3.6209821701049805e-06, -1.3522803783416748e-06, 9.164214134216309e-07, 3.1851232051849365e-06, 5.453824996948242e-06, 7.722526788711548e-06, 9.991228580474854e-06, 1.225993037223816e-05, 1.4528632164001465e-05, 1.679733395576477e-05, 1.9066035747528076e-05, 2.1334737539291382e-05, 2.3603439331054688e-05, 2.5872141122817993e-05, 2.81408429145813e-05, 3.0409544706344604e-05, 3.267824649810791e-05, 3.4946948289871216e-05, 3.721565008163452e-05, 3.948435187339783e-05, 4.175305366516113e-05, 4.402175545692444e-05, 4.6290457248687744e-05, 4.855915904045105e-05, 5.0827860832214355e-05, 5.309656262397766e-05, 5.536526441574097e-05, 5.763396620750427e-05, 5.990266799926758e-05, 6.217136979103088e-05, 6.444007158279419e-05, 6.67087733745575e-05, 6.89774751663208e-05, 7.12461769580841e-05, 7.351487874984741e-05, 7.578358054161072e-05, 7.805228233337402e-05, 8.032098412513733e-05, 8.258968591690063e-05, 8.485838770866394e-05, 8.712708950042725e-05, 8.939579129219055e-05, 9.166449308395386e-05, 9.393319487571716e-05, 9.620189666748047e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 5.0, 8.0, 13.0, 14.0, 27.0, 48.0, 87.0, 274.0, 729.0, 2917.0, 20946.0, 806946.0, 204852.0, 9143.0, 1656.0, 486.0, 192.0, 80.0, 42.0, 30.0, 14.0, 11.0, 12.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324951171875, -0.3093452453613281, -0.29373931884765625, -0.2781333923339844, -0.2625274658203125, -0.24692153930664062, -0.23131561279296875, -0.21570968627929688, -0.200103759765625, -0.18449783325195312, -0.16889190673828125, -0.15328598022460938, -0.1376800537109375, -0.12207412719726562, -0.10646820068359375, -0.09086227416992188, -0.07525634765625, -0.059650421142578125, -0.04404449462890625, -0.028438568115234375, -0.0128326416015625, 0.002773284912109375, 0.01837921142578125, 0.033985137939453125, 0.049591064453125, 0.06519699096679688, 0.08080291748046875, 0.09640884399414062, 0.1120147705078125, 0.12762069702148438, 0.14322662353515625, 0.15883255004882812, 0.1744384765625, 0.19004440307617188, 0.20565032958984375, 0.22125625610351562, 0.2368621826171875, 0.2524681091308594, 0.26807403564453125, 0.2836799621582031, 0.299285888671875, 0.3148918151855469, 0.33049774169921875, 0.3461036682128906, 0.3617095947265625, 0.3773155212402344, 0.39292144775390625, 0.4085273742675781, 0.42413330078125, 0.4397392272949219, 0.45534515380859375, 0.4709510803222656, 0.4865570068359375, 0.5021629333496094, 0.5177688598632812, 0.5333747863769531, 0.548980712890625, 0.5645866394042969, 0.5801925659179688, 0.5957984924316406, 0.6114044189453125, 0.6270103454589844, 0.6426162719726562, 0.6582221984863281, 0.673828125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 8.0, 18.0, 13.0, 14.0, 34.0, 65.0, 57.0, 99.0, 116.0, 103.0, 109.0, 95.0, 79.0, 42.0, 40.0, 26.0, 18.0, 11.0, 4.0, 7.0, 9.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.146728515625, -0.1432971954345703, -0.13986587524414062, -0.13643455505371094, -0.13300323486328125, -0.12957191467285156, -0.12614059448242188, -0.12270927429199219, -0.1192779541015625, -0.11584663391113281, -0.11241531372070312, -0.10898399353027344, -0.10555267333984375, -0.10212135314941406, -0.09869003295898438, -0.09525871276855469, -0.091827392578125, -0.08839607238769531, -0.08496475219726562, -0.08153343200683594, -0.07810211181640625, -0.07467079162597656, -0.07123947143554688, -0.06780815124511719, -0.0643768310546875, -0.06094551086425781, -0.057514190673828125, -0.05408287048339844, -0.05065155029296875, -0.04722023010253906, -0.043788909912109375, -0.04035758972167969, -0.03692626953125, -0.03349494934082031, -0.030063629150390625, -0.026632308959960938, -0.02320098876953125, -0.019769668579101562, -0.016338348388671875, -0.012907028198242188, -0.0094757080078125, -0.0060443878173828125, -0.002613067626953125, 0.0008182525634765625, 0.00424957275390625, 0.0076808929443359375, 0.011112213134765625, 0.014543533325195312, 0.017974853515625, 0.021406173706054688, 0.024837493896484375, 0.028268814086914062, 0.03170013427734375, 0.03513145446777344, 0.038562774658203125, 0.04199409484863281, 0.0454254150390625, 0.04885673522949219, 0.052288055419921875, 0.05571937561035156, 0.05915069580078125, 0.06258201599121094, 0.06601333618164062, 0.06944465637207031, 0.0728759765625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 12.0, 22.0, 42.0, 49.0, 90.0, 129.0, 173.0, 165.0, 114.0, 67.0, 57.0, 32.0, 18.0, 9.0, 10.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4202715158462524, -1.3635207414627075, -1.306769847869873, -1.2500190734863281, -1.1932682991027832, -1.1365175247192383, -1.0797667503356934, -1.0230158567428589, -0.966265082359314, -0.909514307975769, -0.8527634739875793, -0.7960126399993896, -0.7392618656158447, -0.6825110912322998, -0.6257602572441101, -0.5690094232559204, -0.5122586488723755, -0.4555078446865082, -0.39875704050064087, -0.34200623631477356, -0.28525543212890625, -0.22850462794303894, -0.17175382375717163, -0.11500301957130432, -0.05825221538543701, -0.0015014111995697021, 0.05524939298629761, 0.11200019717216492, 0.16875100135803223, 0.22550180554389954, 0.28225260972976685, 0.33900341391563416, 0.395754337310791, 0.4525051414966583, 0.5092559456825256, 0.5660067796707153, 0.6227575540542603, 0.6795083284378052, 0.7362591624259949, 0.7930099964141846, 0.8497607707977295, 0.9065115451812744, 0.9632623791694641, 1.0200132131576538, 1.0767639875411987, 1.1335147619247437, 1.1902656555175781, 1.247016429901123, 1.303767204284668, 1.360517978668213, 1.4172687530517578, 1.4740196466445923, 1.5307704210281372, 1.5875211954116821, 1.6442720890045166, 1.7010228633880615, 1.7577736377716064, 1.8145244121551514, 1.8712751865386963, 1.9280260801315308, 1.9847768545150757, 2.04152774810791, 2.098278522491455, 2.155029296875, 2.211780071258545]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 9.0, 8.0, 12.0, 9.0, 16.0, 21.0, 30.0, 26.0, 25.0, 24.0, 37.0, 38.0, 47.0, 53.0, 38.0, 43.0, 49.0, 39.0, 61.0, 49.0, 43.0, 44.0, 37.0, 35.0, 31.0, 28.0, 24.0, 20.0, 21.0, 18.0, 9.0, 15.0, 8.0, 10.0, 6.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2263832092285156, -1.1879488229751587, -1.1495144367218018, -1.1110800504684448, -1.072645664215088, -1.034211277961731, -0.995776891708374, -0.9573425054550171, -0.9189081192016602, -0.8804737329483032, -0.8420393466949463, -0.8036049604415894, -0.7651705741882324, -0.7267361879348755, -0.6883018016815186, -0.6498674154281616, -0.6114329695701599, -0.572998583316803, -0.534564197063446, -0.4961298108100891, -0.4576954245567322, -0.41926103830337524, -0.3808266222476959, -0.342392235994339, -0.30395784974098206, -0.2655234634876251, -0.2270890772342682, -0.18865467607975006, -0.15022028982639313, -0.1117859035730362, -0.07335150241851807, -0.03491711616516113, 0.0035172700881958008, 0.04195166006684303, 0.08038605004549026, 0.1188204437494278, 0.15725483000278473, 0.19568921625614166, 0.2341236174106598, 0.2725580036640167, 0.31099238991737366, 0.3494267761707306, 0.3878611624240875, 0.42629557847976685, 0.4647299647331238, 0.5031643509864807, 0.5415987372398376, 0.5800331234931946, 0.6184675097465515, 0.6569018959999084, 0.6953362822532654, 0.7337706685066223, 0.7722050547599792, 0.8106394410133362, 0.8490738868713379, 0.8875082731246948, 0.9259426593780518, 0.9643770456314087, 1.0028114318847656, 1.0412458181381226, 1.0796802043914795, 1.1181145906448364, 1.1565489768981934, 1.1949833631515503, 1.2334177494049072]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 6.0, 11.0, 7.0, 15.0, 31.0, 49.0, 94.0, 130.0, 427.0, 1663.0, 11939.0, 1704246.0, 2460075.0, 13086.0, 1722.0, 409.0, 143.0, 68.0, 44.0, 27.0, 15.0, 13.0, 12.0, 6.0, 4.0, 6.0, 1.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.40234375, -2.322357177734375, -2.24237060546875, -2.162384033203125, -2.0823974609375, -2.002410888671875, -1.92242431640625, -1.842437744140625, -1.762451171875, -1.682464599609375, -1.60247802734375, -1.522491455078125, -1.4425048828125, -1.362518310546875, -1.28253173828125, -1.202545166015625, -1.12255859375, -1.042572021484375, -0.96258544921875, -0.882598876953125, -0.8026123046875, -0.722625732421875, -0.64263916015625, -0.562652587890625, -0.482666015625, -0.402679443359375, -0.32269287109375, -0.242706298828125, -0.1627197265625, -0.082733154296875, -0.00274658203125, 0.077239990234375, 0.1572265625, 0.237213134765625, 0.31719970703125, 0.397186279296875, 0.4771728515625, 0.557159423828125, 0.63714599609375, 0.717132568359375, 0.797119140625, 0.877105712890625, 0.95709228515625, 1.037078857421875, 1.1170654296875, 1.197052001953125, 1.27703857421875, 1.357025146484375, 1.43701171875, 1.516998291015625, 1.59698486328125, 1.676971435546875, 1.7569580078125, 1.836944580078125, 1.91693115234375, 1.996917724609375, 2.076904296875, 2.156890869140625, 2.23687744140625, 2.316864013671875, 2.3968505859375, 2.476837158203125, 2.55682373046875, 2.636810302734375, 2.716796875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 9.0, 10.0, 8.0, 17.0, 19.0, 21.0, 30.0, 24.0, 36.0, 40.0, 55.0, 36.0, 70.0, 69.0, 73.0, 54.0, 78.0, 56.0, 48.0, 38.0, 42.0, 44.0, 40.0, 28.0, 18.0, 13.0, 12.0, 2.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51708984375, -0.49542999267578125, -0.4737701416015625, -0.45211029052734375, -0.430450439453125, -0.40879058837890625, -0.3871307373046875, -0.36547088623046875, -0.34381103515625, -0.32215118408203125, -0.3004913330078125, -0.27883148193359375, -0.257171630859375, -0.23551177978515625, -0.2138519287109375, -0.19219207763671875, -0.1705322265625, -0.14887237548828125, -0.1272125244140625, -0.10555267333984375, -0.083892822265625, -0.06223297119140625, -0.0405731201171875, -0.01891326904296875, 0.00274658203125, 0.02440643310546875, 0.0460662841796875, 0.06772613525390625, 0.089385986328125, 0.11104583740234375, 0.1327056884765625, 0.15436553955078125, 0.176025390625, 0.19768524169921875, 0.2193450927734375, 0.24100494384765625, 0.262664794921875, 0.28432464599609375, 0.3059844970703125, 0.32764434814453125, 0.34930419921875, 0.37096405029296875, 0.3926239013671875, 0.41428375244140625, 0.435943603515625, 0.45760345458984375, 0.4792633056640625, 0.5009231567382812, 0.5225830078125, 0.5442428588867188, 0.5659027099609375, 0.5875625610351562, 0.609222412109375, 0.6308822631835938, 0.6525421142578125, 0.6742019653320312, 0.69586181640625, 0.7175216674804688, 0.7391815185546875, 0.7608413696289062, 0.782501220703125, 0.8041610717773438, 0.8258209228515625, 0.8474807739257812, 0.869140625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 8.0, 5.0, 29.0, 32.0, 41.0, 78.0, 151.0, 245.0, 522.0, 1201.0, 3366.0, 14090.0, 120907.0, 3619734.0, 398244.0, 26941.0, 5451.0, 1667.0, 741.0, 323.0, 197.0, 97.0, 71.0, 43.0, 26.0, 17.0, 12.0, 10.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0], "bins": [-1.353515625, -1.3210372924804688, -1.2885589599609375, -1.2560806274414062, -1.223602294921875, -1.1911239624023438, -1.1586456298828125, -1.1261672973632812, -1.09368896484375, -1.0612106323242188, -1.0287322998046875, -0.9962539672851562, -0.963775634765625, -0.9312973022460938, -0.8988189697265625, -0.8663406372070312, -0.8338623046875, -0.8013839721679688, -0.7689056396484375, -0.7364273071289062, -0.703948974609375, -0.6714706420898438, -0.6389923095703125, -0.6065139770507812, -0.57403564453125, -0.5415573120117188, -0.5090789794921875, -0.47660064697265625, -0.444122314453125, -0.41164398193359375, -0.3791656494140625, -0.34668731689453125, -0.314208984375, -0.28173065185546875, -0.2492523193359375, -0.21677398681640625, -0.184295654296875, -0.15181732177734375, -0.1193389892578125, -0.08686065673828125, -0.05438232421875, -0.02190399169921875, 0.0105743408203125, 0.04305267333984375, 0.075531005859375, 0.10800933837890625, 0.1404876708984375, 0.17296600341796875, 0.2054443359375, 0.23792266845703125, 0.2704010009765625, 0.30287933349609375, 0.335357666015625, 0.36783599853515625, 0.4003143310546875, 0.43279266357421875, 0.46527099609375, 0.49774932861328125, 0.5302276611328125, 0.5627059936523438, 0.595184326171875, 0.6276626586914062, 0.6601409912109375, 0.6926193237304688, 0.72509765625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 10.0, 8.0, 10.0, 12.0, 12.0, 26.0, 35.0, 44.0, 61.0, 78.0, 124.0, 205.0, 330.0, 509.0, 672.0, 594.0, 459.0, 345.0, 166.0, 107.0, 57.0, 63.0, 37.0, 32.0, 20.0, 13.0, 12.0, 5.0, 5.0, 5.0, 6.0, 6.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2467041015625, -0.24019622802734375, -0.2336883544921875, -0.22718048095703125, -0.220672607421875, -0.21416473388671875, -0.2076568603515625, -0.20114898681640625, -0.19464111328125, -0.18813323974609375, -0.1816253662109375, -0.17511749267578125, -0.168609619140625, -0.16210174560546875, -0.1555938720703125, -0.14908599853515625, -0.142578125, -0.13607025146484375, -0.1295623779296875, -0.12305450439453125, -0.116546630859375, -0.11003875732421875, -0.1035308837890625, -0.09702301025390625, -0.09051513671875, -0.08400726318359375, -0.0774993896484375, -0.07099151611328125, -0.064483642578125, -0.05797576904296875, -0.0514678955078125, -0.04496002197265625, -0.0384521484375, -0.03194427490234375, -0.0254364013671875, -0.01892852783203125, -0.012420654296875, -0.00591278076171875, 0.0005950927734375, 0.00710296630859375, 0.01361083984375, 0.02011871337890625, 0.0266265869140625, 0.03313446044921875, 0.039642333984375, 0.04615020751953125, 0.0526580810546875, 0.05916595458984375, 0.065673828125, 0.07218170166015625, 0.0786895751953125, 0.08519744873046875, 0.091705322265625, 0.09821319580078125, 0.1047210693359375, 0.11122894287109375, 0.11773681640625, 0.12424468994140625, 0.1307525634765625, 0.13726043701171875, 0.143768310546875, 0.15027618408203125, 0.1567840576171875, 0.16329193115234375, 0.1697998046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 15.0, 6.0, 23.0, 51.0, 104.0, 136.0, 213.0, 193.0, 100.0, 79.0, 36.0, 20.0, 17.0, 9.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9311900734901428, -0.8792020082473755, -0.8272139430046082, -0.7752258777618408, -0.7232378125190735, -0.6712497472763062, -0.6192616820335388, -0.5672736167907715, -0.5152855515480042, -0.4632974863052368, -0.4113094210624695, -0.35932135581970215, -0.3073332905769348, -0.2553452253341675, -0.20335716009140015, -0.1513690948486328, -0.09938102960586548, -0.047392964363098145, 0.0045951008796691895, 0.05658316612243652, 0.10857123136520386, 0.1605592966079712, 0.21254736185073853, 0.26453542709350586, 0.3165234923362732, 0.3685115575790405, 0.42049962282180786, 0.4724876880645752, 0.5244757533073425, 0.5764638185501099, 0.6284518837928772, 0.6804399490356445, 0.7324280738830566, 0.784416139125824, 0.8364042043685913, 0.8883922696113586, 0.940380334854126, 0.9923684000968933, 1.0443564653396606, 1.0963444709777832, 1.1483325958251953, 1.2003207206726074, 1.25230872631073, 1.3042967319488525, 1.3562848567962646, 1.4082729816436768, 1.4602609872817993, 1.5122489929199219, 1.564237117767334, 1.616225242614746, 1.6682132482528687, 1.7202012538909912, 1.7721893787384033, 1.8241775035858154, 1.876165509223938, 1.9281535148620605, 1.9801416397094727, 2.0321297645568848, 2.084117889404297, 2.13610577583313, 2.188093900680542, 2.240082025527954, 2.292069911956787, 2.344058036804199, 2.3960461616516113]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 14.0, 11.0, 15.0, 25.0, 15.0, 24.0, 26.0, 30.0, 33.0, 42.0, 43.0, 60.0, 49.0, 75.0, 44.0, 58.0, 50.0, 61.0, 50.0, 50.0, 38.0, 38.0, 40.0, 26.0, 24.0, 8.0, 10.0, 12.0, 8.0, 9.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.565366268157959, -0.5442867279052734, -0.5232071876525879, -0.5021276473999023, -0.4810481071472168, -0.45996856689453125, -0.4388890564441681, -0.41780951619148254, -0.396729975938797, -0.37565043568611145, -0.3545708954334259, -0.33349138498306274, -0.3124118447303772, -0.29133230447769165, -0.2702527642250061, -0.24917322397232056, -0.228093683719635, -0.20701414346694946, -0.18593460321426392, -0.16485507786273956, -0.14377553761005402, -0.12269599735736847, -0.10161647200584412, -0.08053693175315857, -0.05945739150047302, -0.038377854973077774, -0.017298318445682526, 0.0037812143564224243, 0.02486075460910797, 0.04594029486179352, 0.06701982021331787, 0.08809936046600342, 0.10917896032333374, 0.1302585005760193, 0.15133804082870483, 0.1724175661802292, 0.19349710643291473, 0.21457664668560028, 0.23565617203712463, 0.2567357122898102, 0.2778152525424957, 0.2988947927951813, 0.3199743330478668, 0.34105384349823, 0.3621333837509155, 0.3832129240036011, 0.4042924642562866, 0.42537200450897217, 0.4464515447616577, 0.46753108501434326, 0.4886106252670288, 0.5096901655197144, 0.5307697057723999, 0.5518492460250854, 0.572928786277771, 0.5940083265304565, 0.6150878667831421, 0.6361674070358276, 0.6572469472885132, 0.6783264875411987, 0.6994060277938843, 0.7204855680465698, 0.7415651082992554, 0.7626446485519409, 0.7837241291999817]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 12.0, 22.0, 29.0, 68.0, 185.0, 836.0, 5585.0, 86620.0, 887485.0, 62026.0, 4642.0, 719.0, 156.0, 68.0, 30.0, 13.0, 11.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3916015625, -0.3787422180175781, -0.36588287353515625, -0.3530235290527344, -0.3401641845703125, -0.3273048400878906, -0.31444549560546875, -0.3015861511230469, -0.288726806640625, -0.2758674621582031, -0.26300811767578125, -0.2501487731933594, -0.2372894287109375, -0.22443008422851562, -0.21157073974609375, -0.19871139526367188, -0.18585205078125, -0.17299270629882812, -0.16013336181640625, -0.14727401733398438, -0.1344146728515625, -0.12155532836914062, -0.10869598388671875, -0.09583663940429688, -0.082977294921875, -0.07011795043945312, -0.05725860595703125, -0.044399261474609375, -0.0315399169921875, -0.018680572509765625, -0.00582122802734375, 0.007038116455078125, 0.0198974609375, 0.032756805419921875, 0.04561614990234375, 0.058475494384765625, 0.0713348388671875, 0.08419418334960938, 0.09705352783203125, 0.10991287231445312, 0.122772216796875, 0.13563156127929688, 0.14849090576171875, 0.16135025024414062, 0.1742095947265625, 0.18706893920898438, 0.19992828369140625, 0.21278762817382812, 0.22564697265625, 0.23850631713867188, 0.25136566162109375, 0.2642250061035156, 0.2770843505859375, 0.2899436950683594, 0.30280303955078125, 0.3156623840332031, 0.328521728515625, 0.3413810729980469, 0.35424041748046875, 0.3670997619628906, 0.3799591064453125, 0.3928184509277344, 0.40567779541015625, 0.4185371398925781, 0.431396484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 9.0, 15.0, 16.0, 11.0, 23.0, 24.0, 30.0, 42.0, 45.0, 47.0, 62.0, 59.0, 65.0, 74.0, 72.0, 55.0, 65.0, 54.0, 48.0, 44.0, 40.0, 25.0, 16.0, 15.0, 11.0, 10.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46826171875, -0.451690673828125, -0.43511962890625, -0.418548583984375, -0.4019775390625, -0.385406494140625, -0.36883544921875, -0.352264404296875, -0.335693359375, -0.319122314453125, -0.30255126953125, -0.285980224609375, -0.2694091796875, -0.252838134765625, -0.23626708984375, -0.219696044921875, -0.203125, -0.186553955078125, -0.16998291015625, -0.153411865234375, -0.1368408203125, -0.120269775390625, -0.10369873046875, -0.087127685546875, -0.070556640625, -0.053985595703125, -0.03741455078125, -0.020843505859375, -0.0042724609375, 0.012298583984375, 0.02886962890625, 0.045440673828125, 0.06201171875, 0.078582763671875, 0.09515380859375, 0.111724853515625, 0.1282958984375, 0.144866943359375, 0.16143798828125, 0.178009033203125, 0.194580078125, 0.211151123046875, 0.22772216796875, 0.244293212890625, 0.2608642578125, 0.277435302734375, 0.29400634765625, 0.310577392578125, 0.3271484375, 0.343719482421875, 0.36029052734375, 0.376861572265625, 0.3934326171875, 0.410003662109375, 0.42657470703125, 0.443145751953125, 0.459716796875, 0.476287841796875, 0.49285888671875, 0.509429931640625, 0.5260009765625, 0.542572021484375, 0.55914306640625, 0.575714111328125, 0.59228515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 10.0, 10.0, 13.0, 24.0, 28.0, 42.0, 76.0, 105.0, 173.0, 335.0, 639.0, 1239.0, 2624.0, 5925.0, 15441.0, 48455.0, 184737.0, 467171.0, 229803.0, 60337.0, 18449.0, 6910.0, 2972.0, 1391.0, 688.0, 359.0, 205.0, 138.0, 72.0, 49.0, 43.0, 18.0, 17.0, 7.0, 9.0, 8.0, 5.0, 1.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.13525390625, -0.1314525604248047, -0.12765121459960938, -0.12384986877441406, -0.12004852294921875, -0.11624717712402344, -0.11244583129882812, -0.10864448547363281, -0.1048431396484375, -0.10104179382324219, -0.09724044799804688, -0.09343910217285156, -0.08963775634765625, -0.08583641052246094, -0.08203506469726562, -0.07823371887207031, -0.074432373046875, -0.07063102722167969, -0.06682968139648438, -0.06302833557128906, -0.05922698974609375, -0.05542564392089844, -0.051624298095703125, -0.04782295227050781, -0.0440216064453125, -0.04022026062011719, -0.036418914794921875, -0.03261756896972656, -0.02881622314453125, -0.025014877319335938, -0.021213531494140625, -0.017412185668945312, -0.01361083984375, -0.009809494018554688, -0.006008148193359375, -0.0022068023681640625, 0.00159454345703125, 0.0053958892822265625, 0.009197235107421875, 0.012998580932617188, 0.0167999267578125, 0.020601272583007812, 0.024402618408203125, 0.028203964233398438, 0.03200531005859375, 0.03580665588378906, 0.039608001708984375, 0.04340934753417969, 0.047210693359375, 0.05101203918457031, 0.054813385009765625, 0.05861473083496094, 0.06241607666015625, 0.06621742248535156, 0.07001876831054688, 0.07382011413574219, 0.0776214599609375, 0.08142280578613281, 0.08522415161132812, 0.08902549743652344, 0.09282684326171875, 0.09662818908691406, 0.10042953491210938, 0.10423088073730469, 0.1080322265625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 15.0, 8.0, 10.0, 14.0, 15.0, 18.0, 32.0, 36.0, 40.0, 49.0, 48.0, 44.0, 61.0, 70.0, 65.0, 57.0, 70.0, 47.0, 45.0, 34.0, 43.0, 29.0, 34.0, 24.0, 17.0, 13.0, 13.0, 18.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9384765625, -0.9112091064453125, -0.883941650390625, -0.8566741943359375, -0.82940673828125, -0.8021392822265625, -0.774871826171875, -0.7476043701171875, -0.7203369140625, -0.6930694580078125, -0.665802001953125, -0.6385345458984375, -0.61126708984375, -0.5839996337890625, -0.556732177734375, -0.5294647216796875, -0.502197265625, -0.4749298095703125, -0.447662353515625, -0.4203948974609375, -0.39312744140625, -0.3658599853515625, -0.338592529296875, -0.3113250732421875, -0.2840576171875, -0.2567901611328125, -0.229522705078125, -0.2022552490234375, -0.17498779296875, -0.1477203369140625, -0.120452880859375, -0.0931854248046875, -0.06591796875, -0.0386505126953125, -0.011383056640625, 0.0158843994140625, 0.04315185546875, 0.0704193115234375, 0.097686767578125, 0.1249542236328125, 0.1522216796875, 0.1794891357421875, 0.206756591796875, 0.2340240478515625, 0.26129150390625, 0.2885589599609375, 0.315826416015625, 0.3430938720703125, 0.370361328125, 0.3976287841796875, 0.424896240234375, 0.4521636962890625, 0.47943115234375, 0.5066986083984375, 0.533966064453125, 0.5612335205078125, 0.5885009765625, 0.6157684326171875, 0.643035888671875, 0.6703033447265625, 0.69757080078125, 0.7248382568359375, 0.752105712890625, 0.7793731689453125, 0.806640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 4.0, 8.0, 10.0, 23.0, 27.0, 25.0, 57.0, 84.0, 137.0, 197.0, 328.0, 463.0, 863.0, 1585.0, 3201.0, 6741.0, 16556.0, 46946.0, 145980.0, 355625.0, 302010.0, 108192.0, 35287.0, 12941.0, 5454.0, 2490.0, 1317.0, 761.0, 442.0, 276.0, 160.0, 116.0, 68.0, 54.0, 44.0, 21.0, 18.0, 11.0, 10.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0238037109375, -0.022917747497558594, -0.022031784057617188, -0.02114582061767578, -0.020259857177734375, -0.01937389373779297, -0.018487930297851562, -0.017601966857910156, -0.01671600341796875, -0.015830039978027344, -0.014944076538085938, -0.014058113098144531, -0.013172149658203125, -0.012286186218261719, -0.011400222778320312, -0.010514259338378906, -0.0096282958984375, -0.008742332458496094, -0.007856369018554688, -0.006970405578613281, -0.006084442138671875, -0.005198478698730469, -0.0043125152587890625, -0.0034265518188476562, -0.00254058837890625, -0.0016546249389648438, -0.0007686614990234375, 0.00011730194091796875, 0.001003265380859375, 0.0018892288208007812, 0.0027751922607421875, 0.0036611557006835938, 0.004547119140625, 0.005433082580566406, 0.0063190460205078125, 0.007205009460449219, 0.008090972900390625, 0.008976936340332031, 0.009862899780273438, 0.010748863220214844, 0.01163482666015625, 0.012520790100097656, 0.013406753540039062, 0.014292716979980469, 0.015178680419921875, 0.01606464385986328, 0.016950607299804688, 0.017836570739746094, 0.0187225341796875, 0.019608497619628906, 0.020494461059570312, 0.02138042449951172, 0.022266387939453125, 0.02315235137939453, 0.024038314819335938, 0.024924278259277344, 0.02581024169921875, 0.026696205139160156, 0.027582168579101562, 0.02846813201904297, 0.029354095458984375, 0.03024005889892578, 0.031126022338867188, 0.032011985778808594, 0.03289794921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 12.0, 14.0, 22.0, 28.0, 34.0, 46.0, 51.0, 66.0, 82.0, 103.0, 95.0, 90.0, 90.0, 64.0, 61.0, 35.0, 21.0, 24.0, 16.0, 10.0, 11.0, 5.0, 7.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7954578399658203e-05, -2.7242116630077362e-05, -2.652965486049652e-05, -2.581719309091568e-05, -2.510473132133484e-05, -2.4392269551753998e-05, -2.3679807782173157e-05, -2.2967346012592316e-05, -2.2254884243011475e-05, -2.1542422473430634e-05, -2.0829960703849792e-05, -2.011749893426895e-05, -1.940503716468811e-05, -1.869257539510727e-05, -1.7980113625526428e-05, -1.7267651855945587e-05, -1.6555190086364746e-05, -1.5842728316783905e-05, -1.5130266547203064e-05, -1.4417804777622223e-05, -1.3705343008041382e-05, -1.299288123846054e-05, -1.22804194688797e-05, -1.1567957699298859e-05, -1.0855495929718018e-05, -1.0143034160137177e-05, -9.430572390556335e-06, -8.718110620975494e-06, -8.005648851394653e-06, -7.293187081813812e-06, -6.580725312232971e-06, -5.86826354265213e-06, -5.155801773071289e-06, -4.443340003490448e-06, -3.730878233909607e-06, -3.018416464328766e-06, -2.305954694747925e-06, -1.5934929251670837e-06, -8.810311555862427e-07, -1.685693860054016e-07, 5.438923835754395e-07, 1.2563541531562805e-06, 1.9688159227371216e-06, 2.6812776923179626e-06, 3.3937394618988037e-06, 4.106201231479645e-06, 4.818663001060486e-06, 5.531124770641327e-06, 6.243586540222168e-06, 6.956048309803009e-06, 7.66851007938385e-06, 8.380971848964691e-06, 9.093433618545532e-06, 9.805895388126373e-06, 1.0518357157707214e-05, 1.1230818927288055e-05, 1.1943280696868896e-05, 1.2655742466449738e-05, 1.3368204236030579e-05, 1.408066600561142e-05, 1.479312777519226e-05, 1.5505589544773102e-05, 1.6218051314353943e-05, 1.6930513083934784e-05, 1.7642974853515625e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 10.0, 2.0, 11.0, 13.0, 15.0, 12.0, 26.0, 38.0, 58.0, 79.0, 130.0, 182.0, 312.0, 492.0, 820.0, 1609.0, 3340.0, 7113.0, 16559.0, 41542.0, 109359.0, 258032.0, 322601.0, 172625.0, 66819.0, 25860.0, 10799.0, 4790.0, 2325.0, 1192.0, 658.0, 393.0, 244.0, 162.0, 120.0, 61.0, 41.0, 32.0, 16.0, 17.0, 10.0, 8.0, 4.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.022979736328125, -0.0223085880279541, -0.021637439727783203, -0.020966291427612305, -0.020295143127441406, -0.019623994827270508, -0.01895284652709961, -0.01828169822692871, -0.017610549926757812, -0.016939401626586914, -0.016268253326416016, -0.015597105026245117, -0.014925956726074219, -0.01425480842590332, -0.013583660125732422, -0.012912511825561523, -0.012241363525390625, -0.011570215225219727, -0.010899066925048828, -0.01022791862487793, -0.009556770324707031, -0.008885622024536133, -0.008214473724365234, -0.007543325424194336, -0.0068721771240234375, -0.006201028823852539, -0.005529880523681641, -0.004858732223510742, -0.004187583923339844, -0.0035164356231689453, -0.002845287322998047, -0.0021741390228271484, -0.00150299072265625, -0.0008318424224853516, -0.00016069412231445312, 0.0005104541778564453, 0.0011816024780273438, 0.0018527507781982422, 0.0025238990783691406, 0.003195047378540039, 0.0038661956787109375, 0.004537343978881836, 0.005208492279052734, 0.005879640579223633, 0.006550788879394531, 0.00722193717956543, 0.007893085479736328, 0.008564233779907227, 0.009235382080078125, 0.009906530380249023, 0.010577678680419922, 0.01124882698059082, 0.011919975280761719, 0.012591123580932617, 0.013262271881103516, 0.013933420181274414, 0.014604568481445312, 0.015275716781616211, 0.01594686508178711, 0.016618013381958008, 0.017289161682128906, 0.017960309982299805, 0.018631458282470703, 0.0193026065826416, 0.0199737548828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 4.0, 6.0, 5.0, 13.0, 21.0, 17.0, 19.0, 22.0, 33.0, 45.0, 39.0, 46.0, 45.0, 53.0, 45.0, 62.0, 43.0, 62.0, 66.0, 52.0, 49.0, 38.0, 32.0, 41.0, 23.0, 25.0, 19.0, 17.0, 17.0, 7.0, 6.0, 6.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00606536865234375, -0.005846261978149414, -0.005627155303955078, -0.005408048629760742, -0.005188941955566406, -0.00496983528137207, -0.004750728607177734, -0.0045316219329833984, -0.0043125152587890625, -0.0040934085845947266, -0.0038743019104003906, -0.0036551952362060547, -0.0034360885620117188, -0.003216981887817383, -0.002997875213623047, -0.002778768539428711, -0.002559661865234375, -0.002340555191040039, -0.002121448516845703, -0.0019023418426513672, -0.0016832351684570312, -0.0014641284942626953, -0.0012450218200683594, -0.0010259151458740234, -0.0008068084716796875, -0.0005877017974853516, -0.0003685951232910156, -0.0001494884490966797, 6.961822509765625e-05, 0.0002887248992919922, 0.0005078315734863281, 0.0007269382476806641, 0.000946044921875, 0.001165151596069336, 0.0013842582702636719, 0.0016033649444580078, 0.0018224716186523438, 0.0020415782928466797, 0.0022606849670410156, 0.0024797916412353516, 0.0026988983154296875, 0.0029180049896240234, 0.0031371116638183594, 0.0033562183380126953, 0.0035753250122070312, 0.003794431686401367, 0.004013538360595703, 0.004232645034790039, 0.004451751708984375, 0.004670858383178711, 0.004889965057373047, 0.005109071731567383, 0.005328178405761719, 0.005547285079956055, 0.005766391754150391, 0.0059854984283447266, 0.0062046051025390625, 0.0064237117767333984, 0.006642818450927734, 0.00686192512512207, 0.007081031799316406, 0.007300138473510742, 0.007519245147705078, 0.007738351821899414, 0.00795745849609375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 16.0, 79.0, 518.0, 347.0, 49.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.552289605140686, -0.43884190917015076, -0.3253942131996155, -0.2119465172290802, -0.09849882125854492, 0.014948844909667969, 0.12839657068252563, 0.2418442964553833, 0.3552919626235962, 0.46873965859413147, 0.5821873545646667, 0.6956350803375244, 0.8090827465057373, 0.9225304126739502, 1.035978078842163, 1.1494258642196655, 1.2628735303878784, 1.3763211965560913, 1.4897689819335938, 1.6032166481018066, 1.7166643142700195, 1.8301119804382324, 1.9435596466064453, 2.057007312774658, 2.170454978942871, 2.283902645111084, 2.397350311279297, 2.5107979774475098, 2.6242456436157227, 2.7376933097839355, 2.8511412143707275, 2.9645888805389404, 3.0780367851257324, 3.1914844512939453, 3.304932117462158, 3.418379783630371, 3.531827449798584, 3.645275115966797, 3.758723020553589, 3.8721706867218018, 3.9856183528900146, 4.099066257476807, 4.2125139236450195, 4.325961589813232, 4.439409255981445, 4.552856922149658, 4.666304588317871, 4.779752254486084, 4.893199920654297, 5.00664758682251, 5.120095252990723, 5.2335429191589355, 5.346990585327148, 5.460438251495361, 5.573885917663574, 5.687334060668945, 5.80078125, 5.914228916168213, 6.027676582336426, 6.141124248504639, 6.254571914672852, 6.3680195808410645, 6.481467247009277, 6.594915390014648, 6.708363056182861]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 1.0, 4.0, 7.0, 15.0, 19.0, 27.0, 26.0, 34.0, 38.0, 40.0, 69.0, 70.0, 79.0, 73.0, 81.0, 78.0, 70.0, 64.0, 52.0, 54.0, 37.0, 17.0, 14.0, 11.0, 14.0, 8.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5818410515785217, -0.5629381537437439, -0.5440352559089661, -0.5251323580741882, -0.5062295198440552, -0.48732659220695496, -0.4684237241744995, -0.4495208263397217, -0.43061792850494385, -0.411715030670166, -0.3928121328353882, -0.37390926480293274, -0.3550063669681549, -0.3361034691333771, -0.31720060110092163, -0.2982977032661438, -0.27939480543136597, -0.26049190759658813, -0.2415890246629715, -0.22268614172935486, -0.20378324389457703, -0.1848803460597992, -0.16597746312618256, -0.14707458019256592, -0.12817168235778809, -0.10926879197359085, -0.09036590158939362, -0.07146301120519638, -0.052560120820999146, -0.03365723043680191, -0.014754340052604675, 0.004148542881011963, 0.023051440715789795, 0.04195433109998703, 0.060857221484184265, 0.0797601118683815, 0.09866300225257874, 0.11756589263677597, 0.1364687830209732, 0.15537166595458984, 0.17427456378936768, 0.1931774616241455, 0.21208034455776215, 0.23098322749137878, 0.24988612532615662, 0.26878902316093445, 0.2876918911933899, 0.3065947890281677, 0.32549768686294556, 0.3444005846977234, 0.3633034825325012, 0.38220635056495667, 0.4011092483997345, 0.42001214623451233, 0.4389150142669678, 0.4578179121017456, 0.47672080993652344, 0.49562370777130127, 0.5145266056060791, 0.5334295034408569, 0.5523324012756348, 0.5712352395057678, 0.5901381373405457, 0.6090410351753235, 0.6279439330101013]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 7.0, 7.0, 2.0, 11.0, 19.0, 50.0, 77.0, 178.0, 462.0, 1373.0, 4734.0, 31057.0, 679383.0, 310139.0, 16249.0, 3162.0, 980.0, 354.0, 149.0, 69.0, 39.0, 19.0, 13.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92138671875, -0.8883132934570312, -0.8552398681640625, -0.8221664428710938, -0.789093017578125, -0.7560195922851562, -0.7229461669921875, -0.6898727416992188, -0.65679931640625, -0.6237258911132812, -0.5906524658203125, -0.5575790405273438, -0.524505615234375, -0.49143218994140625, -0.4583587646484375, -0.42528533935546875, -0.3922119140625, -0.35913848876953125, -0.3260650634765625, -0.29299163818359375, -0.259918212890625, -0.22684478759765625, -0.1937713623046875, -0.16069793701171875, -0.12762451171875, -0.09455108642578125, -0.0614776611328125, -0.02840423583984375, 0.004669189453125, 0.03774261474609375, 0.0708160400390625, 0.10388946533203125, 0.136962890625, 0.17003631591796875, 0.2031097412109375, 0.23618316650390625, 0.269256591796875, 0.30233001708984375, 0.3354034423828125, 0.36847686767578125, 0.40155029296875, 0.43462371826171875, 0.4676971435546875, 0.5007705688476562, 0.533843994140625, 0.5669174194335938, 0.5999908447265625, 0.6330642700195312, 0.6661376953125, 0.6992111206054688, 0.7322845458984375, 0.7653579711914062, 0.798431396484375, 0.8315048217773438, 0.8645782470703125, 0.8976516723632812, 0.93072509765625, 0.9637985229492188, 0.9968719482421875, 1.0299453735351562, 1.063018798828125, 1.0960922241210938, 1.1291656494140625, 1.1622390747070312, 1.1953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 7.0, 11.0, 13.0, 18.0, 17.0, 23.0, 34.0, 37.0, 29.0, 47.0, 58.0, 57.0, 84.0, 61.0, 75.0, 80.0, 67.0, 55.0, 55.0, 53.0, 40.0, 28.0, 17.0, 11.0, 13.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85205078125, -0.8191146850585938, -0.7861785888671875, -0.7532424926757812, -0.720306396484375, -0.6873703002929688, -0.6544342041015625, -0.6214981079101562, -0.58856201171875, -0.5556259155273438, -0.5226898193359375, -0.48975372314453125, -0.456817626953125, -0.42388153076171875, -0.3909454345703125, -0.35800933837890625, -0.3250732421875, -0.29213714599609375, -0.2592010498046875, -0.22626495361328125, -0.193328857421875, -0.16039276123046875, -0.1274566650390625, -0.09452056884765625, -0.06158447265625, -0.02864837646484375, 0.0042877197265625, 0.03722381591796875, 0.070159912109375, 0.10309600830078125, 0.1360321044921875, 0.16896820068359375, 0.201904296875, 0.23484039306640625, 0.2677764892578125, 0.30071258544921875, 0.333648681640625, 0.36658477783203125, 0.3995208740234375, 0.43245697021484375, 0.46539306640625, 0.49832916259765625, 0.5312652587890625, 0.5642013549804688, 0.597137451171875, 0.6300735473632812, 0.6630096435546875, 0.6959457397460938, 0.7288818359375, 0.7618179321289062, 0.7947540283203125, 0.8276901245117188, 0.860626220703125, 0.8935623168945312, 0.9264984130859375, 0.9594345092773438, 0.99237060546875, 1.0253067016601562, 1.0582427978515625, 1.0911788940429688, 1.124114990234375, 1.1570510864257812, 1.1899871826171875, 1.2229232788085938, 1.255859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 11.0, 17.0, 18.0, 21.0, 28.0, 43.0, 61.0, 134.0, 202.0, 414.0, 948.0, 3538.0, 38669.0, 925332.0, 72026.0, 4833.0, 1191.0, 475.0, 237.0, 135.0, 74.0, 41.0, 29.0, 21.0, 14.0, 8.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.259765625, -1.221099853515625, -1.18243408203125, -1.143768310546875, -1.1051025390625, -1.066436767578125, -1.02777099609375, -0.989105224609375, -0.950439453125, -0.911773681640625, -0.87310791015625, -0.834442138671875, -0.7957763671875, -0.757110595703125, -0.71844482421875, -0.679779052734375, -0.64111328125, -0.602447509765625, -0.56378173828125, -0.525115966796875, -0.4864501953125, -0.447784423828125, -0.40911865234375, -0.370452880859375, -0.331787109375, -0.293121337890625, -0.25445556640625, -0.215789794921875, -0.1771240234375, -0.138458251953125, -0.09979248046875, -0.061126708984375, -0.0224609375, 0.016204833984375, 0.05487060546875, 0.093536376953125, 0.1322021484375, 0.170867919921875, 0.20953369140625, 0.248199462890625, 0.286865234375, 0.325531005859375, 0.36419677734375, 0.402862548828125, 0.4415283203125, 0.480194091796875, 0.51885986328125, 0.557525634765625, 0.59619140625, 0.634857177734375, 0.67352294921875, 0.712188720703125, 0.7508544921875, 0.789520263671875, 0.82818603515625, 0.866851806640625, 0.905517578125, 0.944183349609375, 0.98284912109375, 1.021514892578125, 1.0601806640625, 1.098846435546875, 1.13751220703125, 1.176177978515625, 1.21484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 9.0, 6.0, 6.0, 11.0, 12.0, 17.0, 27.0, 24.0, 26.0, 34.0, 22.0, 42.0, 43.0, 32.0, 55.0, 50.0, 48.0, 61.0, 39.0, 40.0, 46.0, 55.0, 38.0, 34.0, 39.0, 36.0, 27.0, 18.0, 17.0, 21.0, 9.0, 16.0, 8.0, 11.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8349609375, -0.8076858520507812, -0.7804107666015625, -0.7531356811523438, -0.725860595703125, -0.6985855102539062, -0.6713104248046875, -0.6440353393554688, -0.61676025390625, -0.5894851684570312, -0.5622100830078125, -0.5349349975585938, -0.507659912109375, -0.48038482666015625, -0.4531097412109375, -0.42583465576171875, -0.3985595703125, -0.37128448486328125, -0.3440093994140625, -0.31673431396484375, -0.289459228515625, -0.26218414306640625, -0.2349090576171875, -0.20763397216796875, -0.18035888671875, -0.15308380126953125, -0.1258087158203125, -0.09853363037109375, -0.071258544921875, -0.04398345947265625, -0.0167083740234375, 0.01056671142578125, 0.037841796875, 0.06511688232421875, 0.0923919677734375, 0.11966705322265625, 0.146942138671875, 0.17421722412109375, 0.2014923095703125, 0.22876739501953125, 0.25604248046875, 0.28331756591796875, 0.3105926513671875, 0.33786773681640625, 0.365142822265625, 0.39241790771484375, 0.4196929931640625, 0.44696807861328125, 0.4742431640625, 0.5015182495117188, 0.5287933349609375, 0.5560684204101562, 0.583343505859375, 0.6106185913085938, 0.6378936767578125, 0.6651687622070312, 0.69244384765625, 0.7197189331054688, 0.7469940185546875, 0.7742691040039062, 0.801544189453125, 0.8288192749023438, 0.8560943603515625, 0.8833694458007812, 0.91064453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 8.0, 21.0, 33.0, 48.0, 125.0, 320.0, 924.0, 4029.0, 46473.0, 949471.0, 41996.0, 3709.0, 881.0, 292.0, 109.0, 46.0, 27.0, 13.0, 7.0, 5.0, 5.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59521484375, -0.5784416198730469, -0.5616683959960938, -0.5448951721191406, -0.5281219482421875, -0.5113487243652344, -0.49457550048828125, -0.4778022766113281, -0.461029052734375, -0.4442558288574219, -0.42748260498046875, -0.4107093811035156, -0.3939361572265625, -0.3771629333496094, -0.36038970947265625, -0.3436164855957031, -0.32684326171875, -0.3100700378417969, -0.29329681396484375, -0.2765235900878906, -0.2597503662109375, -0.24297714233398438, -0.22620391845703125, -0.20943069458007812, -0.192657470703125, -0.17588424682617188, -0.15911102294921875, -0.14233779907226562, -0.1255645751953125, -0.10879135131835938, -0.09201812744140625, -0.07524490356445312, -0.0584716796875, -0.041698455810546875, -0.02492523193359375, -0.008152008056640625, 0.0086212158203125, 0.025394439697265625, 0.04216766357421875, 0.058940887451171875, 0.075714111328125, 0.09248733520507812, 0.10926055908203125, 0.12603378295898438, 0.1428070068359375, 0.15958023071289062, 0.17635345458984375, 0.19312667846679688, 0.20989990234375, 0.22667312622070312, 0.24344635009765625, 0.2602195739746094, 0.2769927978515625, 0.2937660217285156, 0.31053924560546875, 0.3273124694824219, 0.344085693359375, 0.3608589172363281, 0.37763214111328125, 0.3944053649902344, 0.4111785888671875, 0.4279518127441406, 0.44472503662109375, 0.4614982604980469, 0.478271484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 6.0, 8.0, 12.0, 29.0, 55.0, 145.0, 245.0, 225.0, 135.0, 68.0, 19.0, 15.0, 13.0, 7.0, 10.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.598234176635742e-05, -6.384868174791336e-05, -6.17150217294693e-05, -5.958136171102524e-05, -5.744770169258118e-05, -5.5314041674137115e-05, -5.3180381655693054e-05, -5.104672163724899e-05, -4.891306161880493e-05, -4.677940160036087e-05, -4.464574158191681e-05, -4.251208156347275e-05, -4.0378421545028687e-05, -3.8244761526584625e-05, -3.6111101508140564e-05, -3.39774414896965e-05, -3.184378147125244e-05, -2.971012145280838e-05, -2.757646143436432e-05, -2.5442801415920258e-05, -2.3309141397476196e-05, -2.1175481379032135e-05, -1.9041821360588074e-05, -1.6908161342144012e-05, -1.4774501323699951e-05, -1.264084130525589e-05, -1.0507181286811829e-05, -8.373521268367767e-06, -6.239861249923706e-06, -4.106201231479645e-06, -1.9725412130355835e-06, 1.6111880540847778e-07, 2.294778823852539e-06, 4.4284388422966e-06, 6.562098860740662e-06, 8.695758879184723e-06, 1.0829418897628784e-05, 1.2963078916072845e-05, 1.5096738934516907e-05, 1.7230398952960968e-05, 1.936405897140503e-05, 2.149771898984909e-05, 2.3631379008293152e-05, 2.5765039026737213e-05, 2.7898699045181274e-05, 3.0032359063625336e-05, 3.21660190820694e-05, 3.429967910051346e-05, 3.643333911895752e-05, 3.856699913740158e-05, 4.070065915584564e-05, 4.28343191742897e-05, 4.4967979192733765e-05, 4.7101639211177826e-05, 4.923529922962189e-05, 5.136895924806595e-05, 5.350261926651001e-05, 5.563627928495407e-05, 5.776993930339813e-05, 5.9903599321842194e-05, 6.203725934028625e-05, 6.417091935873032e-05, 6.630457937717438e-05, 6.843823939561844e-05, 7.05718994140625e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 11.0, 14.0, 19.0, 38.0, 61.0, 119.0, 236.0, 696.0, 3640.0, 41239.0, 944495.0, 52547.0, 4077.0, 809.0, 252.0, 121.0, 51.0, 31.0, 19.0, 16.0, 14.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56787109375, -0.5523262023925781, -0.5367813110351562, -0.5212364196777344, -0.5056915283203125, -0.4901466369628906, -0.47460174560546875, -0.4590568542480469, -0.443511962890625, -0.4279670715332031, -0.41242218017578125, -0.3968772888183594, -0.3813323974609375, -0.3657875061035156, -0.35024261474609375, -0.3346977233886719, -0.31915283203125, -0.3036079406738281, -0.28806304931640625, -0.2725181579589844, -0.2569732666015625, -0.24142837524414062, -0.22588348388671875, -0.21033859252929688, -0.194793701171875, -0.17924880981445312, -0.16370391845703125, -0.14815902709960938, -0.1326141357421875, -0.11706924438476562, -0.10152435302734375, -0.08597946166992188, -0.0704345703125, -0.054889678955078125, -0.03934478759765625, -0.023799896240234375, -0.0082550048828125, 0.007289886474609375, 0.02283477783203125, 0.038379669189453125, 0.053924560546875, 0.06946945190429688, 0.08501434326171875, 0.10055923461914062, 0.1161041259765625, 0.13164901733398438, 0.14719390869140625, 0.16273880004882812, 0.17828369140625, 0.19382858276367188, 0.20937347412109375, 0.22491836547851562, 0.2404632568359375, 0.2560081481933594, 0.27155303955078125, 0.2870979309082031, 0.302642822265625, 0.3181877136230469, 0.33373260498046875, 0.3492774963378906, 0.3648223876953125, 0.3803672790527344, 0.39591217041015625, 0.4114570617675781, 0.427001953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 10.0, 6.0, 15.0, 12.0, 21.0, 34.0, 41.0, 74.0, 78.0, 119.0, 121.0, 111.0, 93.0, 77.0, 53.0, 45.0, 27.0, 13.0, 11.0, 10.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.112060546875, -0.10871505737304688, -0.10536956787109375, -0.10202407836914062, -0.0986785888671875, -0.09533309936523438, -0.09198760986328125, -0.08864212036132812, -0.085296630859375, -0.08195114135742188, -0.07860565185546875, -0.07526016235351562, -0.0719146728515625, -0.06856918334960938, -0.06522369384765625, -0.061878204345703125, -0.05853271484375, -0.055187225341796875, -0.05184173583984375, -0.048496246337890625, -0.0451507568359375, -0.041805267333984375, -0.03845977783203125, -0.035114288330078125, -0.031768798828125, -0.028423309326171875, -0.02507781982421875, -0.021732330322265625, -0.0183868408203125, -0.015041351318359375, -0.01169586181640625, -0.008350372314453125, -0.0050048828125, -0.001659393310546875, 0.00168609619140625, 0.005031585693359375, 0.0083770751953125, 0.011722564697265625, 0.01506805419921875, 0.018413543701171875, 0.021759033203125, 0.025104522705078125, 0.02845001220703125, 0.031795501708984375, 0.0351409912109375, 0.038486480712890625, 0.04183197021484375, 0.045177459716796875, 0.04852294921875, 0.051868438720703125, 0.05521392822265625, 0.058559417724609375, 0.0619049072265625, 0.06525039672851562, 0.06859588623046875, 0.07194137573242188, 0.075286865234375, 0.07863235473632812, 0.08197784423828125, 0.08532333374023438, 0.0886688232421875, 0.09201431274414062, 0.09535980224609375, 0.09870529174804688, 0.10205078125]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 12.0, 25.0, 37.0, 84.0, 130.0, 191.0, 187.0, 154.0, 83.0, 41.0, 22.0, 17.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.028669595718384, -1.9635827541351318, -1.8984960317611694, -1.8334091901779175, -1.768322467803955, -1.7032356262207031, -1.6381487846374512, -1.5730619430541992, -1.5079752206802368, -1.4428883790969849, -1.3778016567230225, -1.3127148151397705, -1.2476279735565186, -1.1825412511825562, -1.1174544095993042, -1.0523676872253418, -0.9872808456420898, -0.9221940636634827, -0.8571072816848755, -0.7920204401016235, -0.7269336581230164, -0.6618468761444092, -0.5967600345611572, -0.53167325258255, -0.46658647060394287, -0.4014996886253357, -0.33641287684440613, -0.27132606506347656, -0.20623928308486938, -0.1411525011062622, -0.07606568932533264, -0.010978877544403076, 0.0541081428527832, 0.11919493973255157, 0.18428173661231995, 0.24936853349208832, 0.3144553303718567, 0.37954211235046387, 0.44462892413139343, 0.509715735912323, 0.5748025178909302, 0.6398892998695374, 0.7049760818481445, 0.7700629234313965, 0.8351497054100037, 0.9002364873886108, 0.9653233289718628, 1.0304100513458252, 1.0954968929290771, 1.160583734512329, 1.2256704568862915, 1.2907572984695435, 1.3558440208435059, 1.4209308624267578, 1.4860177040100098, 1.5511045455932617, 1.6161912679672241, 1.681278109550476, 1.7463648319244385, 1.8114516735076904, 1.8765385150909424, 1.9416252374649048, 2.006711959838867, 2.071798801422119, 2.136885643005371]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 4.0, 8.0, 11.0, 6.0, 12.0, 12.0, 13.0, 23.0, 26.0, 31.0, 23.0, 26.0, 27.0, 22.0, 30.0, 26.0, 32.0, 47.0, 33.0, 40.0, 37.0, 30.0, 26.0, 45.0, 31.0, 38.0, 38.0, 39.0, 41.0, 29.0, 26.0, 21.0, 23.0, 18.0, 15.0, 12.0, 7.0, 11.0, 10.0, 15.0, 6.0, 6.0, 6.0, 3.0, 5.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.162905216217041, -1.1256847381591797, -1.0884641408920288, -1.0512436628341675, -1.0140231847763062, -0.9768026471138, -0.939582109451294, -0.9023616313934326, -0.8651410937309265, -0.8279205560684204, -0.7907000780105591, -0.753479540348053, -0.7162590026855469, -0.6790385246276855, -0.6418179869651794, -0.6045974493026733, -0.567376971244812, -0.5301564335823059, -0.4929359555244446, -0.4557154178619385, -0.41849491000175476, -0.38127440214157104, -0.34405386447906494, -0.3068333566188812, -0.2696128487586975, -0.2323923408985138, -0.19517181813716888, -0.15795129537582397, -0.12073078751564026, -0.08351027965545654, -0.04628975689411163, -0.009069234132766724, 0.028151273727416992, 0.0653717890381813, 0.10259230434894562, 0.13981282711029053, 0.17703333497047424, 0.21425384283065796, 0.25147438049316406, 0.2886948883533478, 0.3259153962135315, 0.3631359040737152, 0.4003564119338989, 0.43757694959640503, 0.47479745745658875, 0.5120179653167725, 0.5492385029792786, 0.5864590406417847, 0.623679518699646, 0.6609000563621521, 0.6981205344200134, 0.7353410720825195, 0.7725615501403809, 0.809782087802887, 0.8470026254653931, 0.8842231035232544, 0.9214436411857605, 0.9586641788482666, 0.9958846569061279, 1.0331051349639893, 1.0703257322311401, 1.1075462102890015, 1.1447666883468628, 1.1819872856140137, 1.219207763671875]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 9.0, 10.0, 12.0, 18.0, 38.0, 78.0, 252.0, 776.0, 3620.0, 116087.0, 4041468.0, 28230.0, 2576.0, 676.0, 209.0, 96.0, 44.0, 34.0, 11.0, 5.0, 9.0, 6.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7236328125, -1.6465606689453125, -1.569488525390625, -1.4924163818359375, -1.41534423828125, -1.3382720947265625, -1.261199951171875, -1.1841278076171875, -1.1070556640625, -1.0299835205078125, -0.952911376953125, -0.8758392333984375, -0.79876708984375, -0.7216949462890625, -0.644622802734375, -0.5675506591796875, -0.490478515625, -0.4134063720703125, -0.336334228515625, -0.2592620849609375, -0.18218994140625, -0.1051177978515625, -0.028045654296875, 0.0490264892578125, 0.1260986328125, 0.2031707763671875, 0.280242919921875, 0.3573150634765625, 0.43438720703125, 0.5114593505859375, 0.588531494140625, 0.6656036376953125, 0.74267578125, 0.8197479248046875, 0.896820068359375, 0.9738922119140625, 1.05096435546875, 1.1280364990234375, 1.205108642578125, 1.2821807861328125, 1.3592529296875, 1.4363250732421875, 1.513397216796875, 1.5904693603515625, 1.66754150390625, 1.7446136474609375, 1.821685791015625, 1.8987579345703125, 1.975830078125, 2.0529022216796875, 2.129974365234375, 2.2070465087890625, 2.28411865234375, 2.3611907958984375, 2.438262939453125, 2.5153350830078125, 2.5924072265625, 2.6694793701171875, 2.746551513671875, 2.8236236572265625, 2.90069580078125, 2.9777679443359375, 3.054840087890625, 3.1319122314453125, 3.208984375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 7.0, 9.0, 11.0, 10.0, 17.0, 13.0, 18.0, 27.0, 32.0, 42.0, 41.0, 37.0, 42.0, 48.0, 52.0, 52.0, 57.0, 50.0, 60.0, 52.0, 60.0, 48.0, 47.0, 27.0, 34.0, 25.0, 16.0, 22.0, 14.0, 13.0, 4.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5763702392578125, -0.558990478515625, -0.5416107177734375, -0.52423095703125, -0.5068511962890625, -0.489471435546875, -0.4720916748046875, -0.4547119140625, -0.4373321533203125, -0.419952392578125, -0.4025726318359375, -0.38519287109375, -0.3678131103515625, -0.350433349609375, -0.3330535888671875, -0.315673828125, -0.2982940673828125, -0.280914306640625, -0.2635345458984375, -0.24615478515625, -0.2287750244140625, -0.211395263671875, -0.1940155029296875, -0.1766357421875, -0.1592559814453125, -0.141876220703125, -0.1244964599609375, -0.10711669921875, -0.0897369384765625, -0.072357177734375, -0.0549774169921875, -0.03759765625, -0.0202178955078125, -0.002838134765625, 0.0145416259765625, 0.03192138671875, 0.0493011474609375, 0.066680908203125, 0.0840606689453125, 0.1014404296875, 0.1188201904296875, 0.136199951171875, 0.1535797119140625, 0.17095947265625, 0.1883392333984375, 0.205718994140625, 0.2230987548828125, 0.240478515625, 0.2578582763671875, 0.275238037109375, 0.2926177978515625, 0.30999755859375, 0.3273773193359375, 0.344757080078125, 0.3621368408203125, 0.3795166015625, 0.3968963623046875, 0.414276123046875, 0.4316558837890625, 0.44903564453125, 0.4664154052734375, 0.483795166015625, 0.5011749267578125, 0.5185546875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 7.0, 5.0, 10.0, 12.0, 18.0, 29.0, 51.0, 72.0, 132.0, 227.0, 433.0, 1015.0, 2607.0, 10166.0, 86525.0, 3734014.0, 331870.0, 20141.0, 4185.0, 1406.0, 611.0, 316.0, 151.0, 95.0, 76.0, 36.0, 23.0, 14.0, 13.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.94091796875, -0.9069290161132812, -0.8729400634765625, -0.8389511108398438, -0.804962158203125, -0.7709732055664062, -0.7369842529296875, -0.7029953002929688, -0.66900634765625, -0.6350173950195312, -0.6010284423828125, -0.5670394897460938, -0.533050537109375, -0.49906158447265625, -0.4650726318359375, -0.43108367919921875, -0.3970947265625, -0.36310577392578125, -0.3291168212890625, -0.29512786865234375, -0.261138916015625, -0.22714996337890625, -0.1931610107421875, -0.15917205810546875, -0.12518310546875, -0.09119415283203125, -0.0572052001953125, -0.02321624755859375, 0.010772705078125, 0.04476165771484375, 0.0787506103515625, 0.11273956298828125, 0.146728515625, 0.18071746826171875, 0.2147064208984375, 0.24869537353515625, 0.282684326171875, 0.31667327880859375, 0.3506622314453125, 0.38465118408203125, 0.41864013671875, 0.45262908935546875, 0.4866180419921875, 0.5206069946289062, 0.554595947265625, 0.5885848999023438, 0.6225738525390625, 0.6565628051757812, 0.6905517578125, 0.7245407104492188, 0.7585296630859375, 0.7925186157226562, 0.826507568359375, 0.8604965209960938, 0.8944854736328125, 0.9284744262695312, 0.96246337890625, 0.9964523315429688, 1.0304412841796875, 1.0644302368164062, 1.098419189453125, 1.1324081420898438, 1.1663970947265625, 1.2003860473632812, 1.234375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 13.0, 15.0, 25.0, 35.0, 37.0, 80.0, 133.0, 269.0, 556.0, 876.0, 904.0, 527.0, 241.0, 135.0, 82.0, 37.0, 29.0, 20.0, 11.0, 11.0, 8.0, 5.0, 3.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31103515625, -0.3023948669433594, -0.29375457763671875, -0.2851142883300781, -0.2764739990234375, -0.2678337097167969, -0.25919342041015625, -0.2505531311035156, -0.241912841796875, -0.23327255249023438, -0.22463226318359375, -0.21599197387695312, -0.2073516845703125, -0.19871139526367188, -0.19007110595703125, -0.18143081665039062, -0.17279052734375, -0.16415023803710938, -0.15550994873046875, -0.14686965942382812, -0.1382293701171875, -0.12958908081054688, -0.12094879150390625, -0.11230850219726562, -0.103668212890625, -0.09502792358398438, -0.08638763427734375, -0.07774734497070312, -0.0691070556640625, -0.060466766357421875, -0.05182647705078125, -0.043186187744140625, -0.0345458984375, -0.025905609130859375, -0.01726531982421875, -0.008625030517578125, 1.52587890625e-05, 0.008655548095703125, 0.01729583740234375, 0.025936126708984375, 0.034576416015625, 0.043216705322265625, 0.05185699462890625, 0.060497283935546875, 0.0691375732421875, 0.07777786254882812, 0.08641815185546875, 0.09505844116210938, 0.10369873046875, 0.11233901977539062, 0.12097930908203125, 0.12961959838867188, 0.1382598876953125, 0.14690017700195312, 0.15554046630859375, 0.16418075561523438, 0.172821044921875, 0.18146133422851562, 0.19010162353515625, 0.19874191284179688, 0.2073822021484375, 0.21602249145507812, 0.22466278076171875, 0.23330307006835938, 0.241943359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 7.0, 10.0, 20.0, 28.0, 44.0, 64.0, 80.0, 108.0, 124.0, 129.0, 102.0, 88.0, 69.0, 52.0, 17.0, 13.0, 8.0, 11.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6997055411338806, -0.6683148741722107, -0.636924147605896, -0.6055334806442261, -0.5741427540779114, -0.5427520871162415, -0.5113613605499268, -0.47997069358825684, -0.4485799968242645, -0.4171893000602722, -0.3857986032962799, -0.3544079065322876, -0.3230172395706177, -0.291626513004303, -0.26023584604263306, -0.22884514927864075, -0.19745445251464844, -0.16606375575065613, -0.13467305898666382, -0.1032823771238327, -0.0718916803598404, -0.040500983595848083, -0.009110301733016968, 0.022280395030975342, 0.05367109179496765, 0.08506178855895996, 0.11645247787237167, 0.1478431671857834, 0.1792338639497757, 0.210624560713768, 0.24201524257659912, 0.27340593934059143, 0.3047966957092285, 0.3361873924732208, 0.36757808923721313, 0.39896875619888306, 0.43035948276519775, 0.4617501497268677, 0.49314084649086, 0.5245315432548523, 0.555922269821167, 0.5873129367828369, 0.6187036633491516, 0.6500943303108215, 0.6814850568771362, 0.7128757238388062, 0.7442663908004761, 0.7756571173667908, 0.8070477843284607, 0.8384384512901306, 0.8698291778564453, 0.9012198448181152, 0.9326105713844299, 0.9640012383460999, 0.9953919649124146, 1.0267826318740845, 1.0581732988357544, 1.0895639657974243, 1.1209546327590942, 1.1523454189300537, 1.1837360858917236, 1.2151267528533936, 1.2465174198150635, 1.2779080867767334, 1.3092988729476929]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 10.0, 9.0, 4.0, 2.0, 13.0, 9.0, 14.0, 24.0, 25.0, 28.0, 29.0, 32.0, 33.0, 36.0, 33.0, 47.0, 49.0, 44.0, 52.0, 58.0, 56.0, 46.0, 47.0, 43.0, 27.0, 44.0, 26.0, 39.0, 25.0, 19.0, 19.0, 22.0, 9.0, 3.0, 8.0, 8.0, 2.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.568087100982666, -0.5508230924606323, -0.5335590839385986, -0.5162950754165649, -0.49903109669685364, -0.48176708817481995, -0.46450310945510864, -0.44723910093307495, -0.42997509241104126, -0.41271108388900757, -0.3954470753669739, -0.3781830966472626, -0.3609190881252289, -0.3436550796031952, -0.3263911008834839, -0.3091270923614502, -0.2918630838394165, -0.2745990753173828, -0.2573350667953491, -0.24007108807563782, -0.22280707955360413, -0.20554307103157043, -0.18827907741069794, -0.17101508378982544, -0.15375107526779175, -0.13648706674575806, -0.11922307312488556, -0.10195907205343246, -0.08469507098197937, -0.06743106991052628, -0.05016706883907318, -0.03290306776762009, -0.015639126300811768, 0.001624874770641327, 0.01888887584209442, 0.036152876913547516, 0.05341687798500061, 0.0706808790564537, 0.0879448801279068, 0.1052088811993599, 0.12247288227081299, 0.13973689079284668, 0.15700088441371918, 0.17426487803459167, 0.19152888655662537, 0.20879289507865906, 0.22605688869953156, 0.24332088232040405, 0.26058489084243774, 0.27784889936447144, 0.2951129078865051, 0.31237688660621643, 0.3296408951282501, 0.3469049036502838, 0.3641688823699951, 0.3814328908920288, 0.3986968994140625, 0.4159609079360962, 0.4332249164581299, 0.4504888951778412, 0.4677529036998749, 0.48501691222190857, 0.5022808909416199, 0.5195448994636536, 0.5368089079856873]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 10.0, 13.0, 11.0, 21.0, 24.0, 38.0, 36.0, 48.0, 96.0, 130.0, 233.0, 438.0, 908.0, 2320.0, 6577.0, 20707.0, 72908.0, 267041.0, 447933.0, 163474.0, 44807.0, 13212.0, 4342.0, 1600.0, 699.0, 337.0, 183.0, 116.0, 65.0, 47.0, 41.0, 28.0, 21.0, 17.0, 16.0, 8.0, 5.0, 11.0, 7.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1070556640625, -0.10393524169921875, -0.1008148193359375, -0.09769439697265625, -0.094573974609375, -0.09145355224609375, -0.0883331298828125, -0.08521270751953125, -0.08209228515625, -0.07897186279296875, -0.0758514404296875, -0.07273101806640625, -0.069610595703125, -0.06649017333984375, -0.0633697509765625, -0.06024932861328125, -0.05712890625, -0.05400848388671875, -0.0508880615234375, -0.04776763916015625, -0.044647216796875, -0.04152679443359375, -0.0384063720703125, -0.03528594970703125, -0.03216552734375, -0.02904510498046875, -0.0259246826171875, -0.02280426025390625, -0.019683837890625, -0.01656341552734375, -0.0134429931640625, -0.01032257080078125, -0.0072021484375, -0.00408172607421875, -0.0009613037109375, 0.00215911865234375, 0.005279541015625, 0.00839996337890625, 0.0115203857421875, 0.01464080810546875, 0.01776123046875, 0.02088165283203125, 0.0240020751953125, 0.02712249755859375, 0.030242919921875, 0.03336334228515625, 0.0364837646484375, 0.03960418701171875, 0.042724609375, 0.04584503173828125, 0.0489654541015625, 0.05208587646484375, 0.055206298828125, 0.05832672119140625, 0.0614471435546875, 0.06456756591796875, 0.06768798828125, 0.07080841064453125, 0.0739288330078125, 0.07704925537109375, 0.080169677734375, 0.08329010009765625, 0.0864105224609375, 0.08953094482421875, 0.0926513671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 9.0, 6.0, 10.0, 17.0, 22.0, 25.0, 26.0, 40.0, 42.0, 48.0, 52.0, 56.0, 84.0, 60.0, 82.0, 66.0, 64.0, 50.0, 55.0, 36.0, 48.0, 27.0, 19.0, 21.0, 14.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487060546875, -0.4712333679199219, -0.45540618896484375, -0.4395790100097656, -0.4237518310546875, -0.4079246520996094, -0.39209747314453125, -0.3762702941894531, -0.360443115234375, -0.3446159362792969, -0.32878875732421875, -0.3129615783691406, -0.2971343994140625, -0.2813072204589844, -0.26548004150390625, -0.24965286254882812, -0.23382568359375, -0.21799850463867188, -0.20217132568359375, -0.18634414672851562, -0.1705169677734375, -0.15468978881835938, -0.13886260986328125, -0.12303543090820312, -0.107208251953125, -0.09138107299804688, -0.07555389404296875, -0.059726715087890625, -0.0438995361328125, -0.028072357177734375, -0.01224517822265625, 0.003582000732421875, 0.0194091796875, 0.035236358642578125, 0.05106353759765625, 0.06689071655273438, 0.0827178955078125, 0.09854507446289062, 0.11437225341796875, 0.13019943237304688, 0.146026611328125, 0.16185379028320312, 0.17768096923828125, 0.19350814819335938, 0.2093353271484375, 0.22516250610351562, 0.24098968505859375, 0.2568168640136719, 0.27264404296875, 0.2884712219238281, 0.30429840087890625, 0.3201255798339844, 0.3359527587890625, 0.3517799377441406, 0.36760711669921875, 0.3834342956542969, 0.399261474609375, 0.4150886535644531, 0.43091583251953125, 0.4467430114746094, 0.4625701904296875, 0.4783973693847656, 0.49422454833984375, 0.5100517272949219, 0.52587890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 10.0, 5.0, 14.0, 30.0, 33.0, 46.0, 81.0, 80.0, 139.0, 213.0, 336.0, 541.0, 1063.0, 2049.0, 4406.0, 9798.0, 23652.0, 60011.0, 155003.0, 325482.0, 274212.0, 115579.0, 43979.0, 17432.0, 7327.0, 3221.0, 1558.0, 864.0, 472.0, 308.0, 187.0, 133.0, 75.0, 58.0, 44.0, 30.0, 15.0, 16.0, 13.0, 10.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0594482421875, -0.057312965393066406, -0.05517768859863281, -0.05304241180419922, -0.050907135009765625, -0.04877185821533203, -0.04663658142089844, -0.044501304626464844, -0.04236602783203125, -0.040230751037597656, -0.03809547424316406, -0.03596019744873047, -0.033824920654296875, -0.03168964385986328, -0.029554367065429688, -0.027419090270996094, -0.0252838134765625, -0.023148536682128906, -0.021013259887695312, -0.01887798309326172, -0.016742706298828125, -0.014607429504394531, -0.012472152709960938, -0.010336875915527344, -0.00820159912109375, -0.006066322326660156, -0.0039310455322265625, -0.0017957687377929688, 0.000339508056640625, 0.0024747848510742188, 0.0046100616455078125, 0.006745338439941406, 0.008880615234375, 0.011015892028808594, 0.013151168823242188, 0.015286445617675781, 0.017421722412109375, 0.01955699920654297, 0.021692276000976562, 0.023827552795410156, 0.02596282958984375, 0.028098106384277344, 0.030233383178710938, 0.03236865997314453, 0.034503936767578125, 0.03663921356201172, 0.03877449035644531, 0.040909767150878906, 0.0430450439453125, 0.045180320739746094, 0.04731559753417969, 0.04945087432861328, 0.051586151123046875, 0.05372142791748047, 0.05585670471191406, 0.057991981506347656, 0.06012725830078125, 0.062262535095214844, 0.06439781188964844, 0.06653308868408203, 0.06866836547851562, 0.07080364227294922, 0.07293891906738281, 0.0750741958618164, 0.07720947265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 5.0, 2.0, 9.0, 9.0, 9.0, 12.0, 15.0, 15.0, 18.0, 19.0, 24.0, 29.0, 35.0, 56.0, 45.0, 43.0, 44.0, 55.0, 57.0, 64.0, 62.0, 61.0, 45.0, 40.0, 43.0, 36.0, 27.0, 26.0, 19.0, 16.0, 12.0, 21.0, 6.0, 12.0, 7.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7216796875, -0.6975173950195312, -0.6733551025390625, -0.6491928100585938, -0.625030517578125, -0.6008682250976562, -0.5767059326171875, -0.5525436401367188, -0.52838134765625, -0.5042190551757812, -0.4800567626953125, -0.45589447021484375, -0.431732177734375, -0.40756988525390625, -0.3834075927734375, -0.35924530029296875, -0.3350830078125, -0.31092071533203125, -0.2867584228515625, -0.26259613037109375, -0.238433837890625, -0.21427154541015625, -0.1901092529296875, -0.16594696044921875, -0.14178466796875, -0.11762237548828125, -0.0934600830078125, -0.06929779052734375, -0.045135498046875, -0.02097320556640625, 0.0031890869140625, 0.02735137939453125, 0.051513671875, 0.07567596435546875, 0.0998382568359375, 0.12400054931640625, 0.148162841796875, 0.17232513427734375, 0.1964874267578125, 0.22064971923828125, 0.24481201171875, 0.26897430419921875, 0.2931365966796875, 0.31729888916015625, 0.341461181640625, 0.36562347412109375, 0.3897857666015625, 0.41394805908203125, 0.4381103515625, 0.46227264404296875, 0.4864349365234375, 0.5105972290039062, 0.534759521484375, 0.5589218139648438, 0.5830841064453125, 0.6072463989257812, 0.63140869140625, 0.6555709838867188, 0.6797332763671875, 0.7038955688476562, 0.728057861328125, 0.7522201538085938, 0.7763824462890625, 0.8005447387695312, 0.82470703125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 11.0, 14.0, 12.0, 26.0, 26.0, 52.0, 74.0, 127.0, 204.0, 354.0, 638.0, 1124.0, 2229.0, 5134.0, 14471.0, 52213.0, 239600.0, 502744.0, 171103.0, 38398.0, 11466.0, 4261.0, 1912.0, 1021.0, 545.0, 278.0, 182.0, 116.0, 62.0, 43.0, 27.0, 21.0, 17.0, 15.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0240631103515625, -0.023184537887573242, -0.022305965423583984, -0.021427392959594727, -0.02054882049560547, -0.01967024803161621, -0.018791675567626953, -0.017913103103637695, -0.017034530639648438, -0.01615595817565918, -0.015277385711669922, -0.014398813247680664, -0.013520240783691406, -0.012641668319702148, -0.01176309585571289, -0.010884523391723633, -0.010005950927734375, -0.009127378463745117, -0.00824880599975586, -0.0073702335357666016, -0.006491661071777344, -0.005613088607788086, -0.004734516143798828, -0.0038559436798095703, -0.0029773712158203125, -0.0020987987518310547, -0.0012202262878417969, -0.00034165382385253906, 0.0005369186401367188, 0.0014154911041259766, 0.0022940635681152344, 0.003172636032104492, 0.00405120849609375, 0.004929780960083008, 0.005808353424072266, 0.0066869258880615234, 0.007565498352050781, 0.008444070816040039, 0.009322643280029297, 0.010201215744018555, 0.011079788208007812, 0.01195836067199707, 0.012836933135986328, 0.013715505599975586, 0.014594078063964844, 0.015472650527954102, 0.01635122299194336, 0.017229795455932617, 0.018108367919921875, 0.018986940383911133, 0.01986551284790039, 0.02074408531188965, 0.021622657775878906, 0.022501230239868164, 0.023379802703857422, 0.02425837516784668, 0.025136947631835938, 0.026015520095825195, 0.026894092559814453, 0.02777266502380371, 0.02865123748779297, 0.029529809951782227, 0.030408382415771484, 0.03128695487976074, 0.03216552734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 16.0, 12.0, 23.0, 24.0, 68.0, 61.0, 79.0, 106.0, 99.0, 115.0, 103.0, 82.0, 71.0, 28.0, 30.0, 18.0, 14.0, 11.0, 8.0, 4.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.704692840576172e-05, -1.6475096344947815e-05, -1.590326428413391e-05, -1.5331432223320007e-05, -1.4759600162506104e-05, -1.41877681016922e-05, -1.3615936040878296e-05, -1.3044103980064392e-05, -1.2472271919250488e-05, -1.1900439858436584e-05, -1.132860779762268e-05, -1.0756775736808777e-05, -1.0184943675994873e-05, -9.61311161518097e-06, -9.041279554367065e-06, -8.469447493553162e-06, -7.897615432739258e-06, -7.325783371925354e-06, -6.75395131111145e-06, -6.182119250297546e-06, -5.610287189483643e-06, -5.038455128669739e-06, -4.466623067855835e-06, -3.894791007041931e-06, -3.3229589462280273e-06, -2.7511268854141235e-06, -2.1792948246002197e-06, -1.607462763786316e-06, -1.0356307029724121e-06, -4.637986421585083e-07, 1.0803341865539551e-07, 6.798654794692993e-07, 1.2516975402832031e-06, 1.823529601097107e-06, 2.3953616619110107e-06, 2.9671937227249146e-06, 3.5390257835388184e-06, 4.110857844352722e-06, 4.682689905166626e-06, 5.25452196598053e-06, 5.826354026794434e-06, 6.398186087608337e-06, 6.970018148422241e-06, 7.541850209236145e-06, 8.113682270050049e-06, 8.685514330863953e-06, 9.257346391677856e-06, 9.82917845249176e-06, 1.0401010513305664e-05, 1.0972842574119568e-05, 1.1544674634933472e-05, 1.2116506695747375e-05, 1.268833875656128e-05, 1.3260170817375183e-05, 1.3832002878189087e-05, 1.440383493900299e-05, 1.4975666999816895e-05, 1.55474990606308e-05, 1.6119331121444702e-05, 1.6691163182258606e-05, 1.726299524307251e-05, 1.7834827303886414e-05, 1.8406659364700317e-05, 1.897849142551422e-05, 1.9550323486328125e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 9.0, 7.0, 9.0, 15.0, 27.0, 26.0, 46.0, 72.0, 101.0, 150.0, 175.0, 330.0, 516.0, 891.0, 1675.0, 3216.0, 6713.0, 15010.0, 36160.0, 89049.0, 205464.0, 311340.0, 214908.0, 93805.0, 38272.0, 15955.0, 7151.0, 3350.0, 1698.0, 886.0, 520.0, 301.0, 222.0, 134.0, 97.0, 68.0, 39.0, 38.0, 24.0, 21.0, 15.0, 7.0, 12.0, 6.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0190582275390625, -0.018489837646484375, -0.01792144775390625, -0.017353057861328125, -0.01678466796875, -0.016216278076171875, -0.01564788818359375, -0.015079498291015625, -0.0145111083984375, -0.013942718505859375, -0.01337432861328125, -0.012805938720703125, -0.012237548828125, -0.011669158935546875, -0.01110076904296875, -0.010532379150390625, -0.0099639892578125, -0.009395599365234375, -0.00882720947265625, -0.008258819580078125, -0.0076904296875, -0.007122039794921875, -0.00655364990234375, -0.005985260009765625, -0.0054168701171875, -0.004848480224609375, -0.00428009033203125, -0.003711700439453125, -0.003143310546875, -0.002574920654296875, -0.00200653076171875, -0.001438140869140625, -0.0008697509765625, -0.000301361083984375, 0.00026702880859375, 0.000835418701171875, 0.00140380859375, 0.001972198486328125, 0.00254058837890625, 0.003108978271484375, 0.0036773681640625, 0.004245758056640625, 0.00481414794921875, 0.005382537841796875, 0.005950927734375, 0.006519317626953125, 0.00708770751953125, 0.007656097412109375, 0.0082244873046875, 0.008792877197265625, 0.00936126708984375, 0.009929656982421875, 0.010498046875, 0.011066436767578125, 0.01163482666015625, 0.012203216552734375, 0.0127716064453125, 0.013339996337890625, 0.01390838623046875, 0.014476776123046875, 0.015045166015625, 0.015613555908203125, 0.01618194580078125, 0.016750335693359375, 0.0173187255859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 3.0, 4.0, 13.0, 6.0, 9.0, 8.0, 12.0, 11.0, 17.0, 15.0, 14.0, 21.0, 18.0, 33.0, 29.0, 33.0, 38.0, 38.0, 52.0, 60.0, 43.0, 41.0, 51.0, 46.0, 37.0, 37.0, 32.0, 29.0, 37.0, 34.0, 24.0, 25.0, 24.0, 16.0, 13.0, 14.0, 11.0, 12.0, 12.0, 8.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0054473876953125, -0.005285143852233887, -0.0051229000091552734, -0.00496065616607666, -0.004798412322998047, -0.004636168479919434, -0.00447392463684082, -0.004311680793762207, -0.004149436950683594, -0.0039871931076049805, -0.003824949264526367, -0.003662705421447754, -0.0035004615783691406, -0.0033382177352905273, -0.003175973892211914, -0.0030137300491333008, -0.0028514862060546875, -0.0026892423629760742, -0.002526998519897461, -0.0023647546768188477, -0.0022025108337402344, -0.002040266990661621, -0.0018780231475830078, -0.0017157793045043945, -0.0015535354614257812, -0.001391291618347168, -0.0012290477752685547, -0.0010668039321899414, -0.0009045600891113281, -0.0007423162460327148, -0.0005800724029541016, -0.0004178285598754883, -0.000255584716796875, -9.334087371826172e-05, 6.890296936035156e-05, 0.00023114681243896484, 0.0003933906555175781, 0.0005556344985961914, 0.0007178783416748047, 0.000880122184753418, 0.0010423660278320312, 0.0012046098709106445, 0.0013668537139892578, 0.001529097557067871, 0.0016913414001464844, 0.0018535852432250977, 0.002015829086303711, 0.0021780729293823242, 0.0023403167724609375, 0.0025025606155395508, 0.002664804458618164, 0.0028270483016967773, 0.0029892921447753906, 0.003151535987854004, 0.003313779830932617, 0.0034760236740112305, 0.0036382675170898438, 0.003800511360168457, 0.00396275520324707, 0.004124999046325684, 0.004287242889404297, 0.00444948673248291, 0.0046117305755615234, 0.004773974418640137, 0.00493621826171875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 30.0, 114.0, 258.0, 363.0, 163.0, 47.0, 20.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8652573227882385, -0.8086316585540771, -0.7520060539245605, -0.6953803896903992, -0.6387547254562378, -0.5821291208267212, -0.5255034565925598, -0.4688778221607208, -0.41225218772888184, -0.35562655329704285, -0.29900091886520386, -0.24237525463104248, -0.1857496201992035, -0.1291239857673645, -0.07249832153320312, -0.015872687101364136, 0.040752947330474854, 0.09737858921289444, 0.15400423109531403, 0.2106298804283142, 0.2672555148601532, 0.3238811492919922, 0.38050681352615356, 0.43713244795799255, 0.49375808238983154, 0.5503837466239929, 0.6070093512535095, 0.6636350154876709, 0.7202606201171875, 0.7768862843513489, 0.8335119485855103, 0.8901375532150269, 0.946763277053833, 1.0033888816833496, 1.0600146055221558, 1.1166402101516724, 1.173265814781189, 1.2298915386199951, 1.2865171432495117, 1.3431427478790283, 1.399768352508545, 1.4563939571380615, 1.5130196809768677, 1.5696452856063843, 1.6262708902359009, 1.682896614074707, 1.7395222187042236, 1.7961478233337402, 1.8527735471725464, 1.909399151802063, 1.9660248756408691, 2.0226504802703857, 2.0792760848999023, 2.135901689529419, 2.1925272941589355, 2.2491531372070312, 2.305778741836548, 2.3624043464660645, 2.419029951095581, 2.4756555557250977, 2.5322813987731934, 2.58890700340271, 2.6455326080322266, 2.702158212661743, 2.7587838172912598]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 4.0, 3.0, 9.0, 8.0, 9.0, 14.0, 18.0, 33.0, 34.0, 33.0, 46.0, 42.0, 51.0, 68.0, 61.0, 72.0, 79.0, 61.0, 71.0, 47.0, 41.0, 54.0, 41.0, 21.0, 28.0, 22.0, 7.0, 6.0, 10.0, 5.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.501637876033783, -0.4867832660675049, -0.4719286859035492, -0.4570740759372711, -0.44221946597099304, -0.42736488580703735, -0.4125102758407593, -0.3976556658744812, -0.3828010559082031, -0.36794644594192505, -0.35309186577796936, -0.3382372558116913, -0.3233826458454132, -0.3085280656814575, -0.29367345571517944, -0.27881884574890137, -0.2639642655849457, -0.2491096705198288, -0.23425506055355072, -0.21940046548843384, -0.20454585552215576, -0.18969126045703888, -0.174836665391922, -0.15998205542564392, -0.14512746036052704, -0.13027286529541016, -0.11541825532913208, -0.1005636602640152, -0.08570905774831772, -0.07085445523262024, -0.05599986016750336, -0.04114525765180588, -0.0262906551361084, -0.011436054483056068, 0.0034185461699962616, 0.018273144960403442, 0.03312774747610092, 0.0479823499917984, 0.06283694505691528, 0.07769154757261276, 0.09254615008831024, 0.10740075260400772, 0.1222553551197052, 0.13710995018482208, 0.15196454524993896, 0.16681915521621704, 0.18167375028133392, 0.1965283453464508, 0.21138295531272888, 0.22623755037784576, 0.24109216034412384, 0.2559467554092407, 0.2708013653755188, 0.2856559753417969, 0.30051055550575256, 0.31536516547203064, 0.33021974563598633, 0.3450743556022644, 0.3599289357662201, 0.37478354573249817, 0.38963815569877625, 0.40449273586273193, 0.41934734582901, 0.4342019557952881, 0.44905656576156616]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 4.0, 4.0, 21.0, 36.0, 34.0, 56.0, 79.0, 139.0, 222.0, 367.0, 648.0, 1133.0, 2248.0, 5011.0, 12351.0, 36456.0, 144824.0, 535044.0, 229319.0, 52051.0, 16186.0, 6236.0, 2801.0, 1372.0, 753.0, 428.0, 235.0, 160.0, 95.0, 71.0, 38.0, 28.0, 31.0, 14.0, 12.0, 13.0, 5.0, 5.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.32470703125, -0.3133697509765625, -0.302032470703125, -0.2906951904296875, -0.27935791015625, -0.2680206298828125, -0.256683349609375, -0.2453460693359375, -0.2340087890625, -0.2226715087890625, -0.211334228515625, -0.1999969482421875, -0.18865966796875, -0.1773223876953125, -0.165985107421875, -0.1546478271484375, -0.143310546875, -0.1319732666015625, -0.120635986328125, -0.1092987060546875, -0.09796142578125, -0.0866241455078125, -0.075286865234375, -0.0639495849609375, -0.0526123046875, -0.0412750244140625, -0.029937744140625, -0.0186004638671875, -0.00726318359375, 0.0040740966796875, 0.015411376953125, 0.0267486572265625, 0.0380859375, 0.0494232177734375, 0.060760498046875, 0.0720977783203125, 0.08343505859375, 0.0947723388671875, 0.106109619140625, 0.1174468994140625, 0.1287841796875, 0.1401214599609375, 0.151458740234375, 0.1627960205078125, 0.17413330078125, 0.1854705810546875, 0.196807861328125, 0.2081451416015625, 0.219482421875, 0.2308197021484375, 0.242156982421875, 0.2534942626953125, 0.26483154296875, 0.2761688232421875, 0.287506103515625, 0.2988433837890625, 0.3101806640625, 0.3215179443359375, 0.332855224609375, 0.3441925048828125, 0.35552978515625, 0.3668670654296875, 0.378204345703125, 0.3895416259765625, 0.40087890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 8.0, 5.0, 11.0, 17.0, 16.0, 25.0, 22.0, 22.0, 28.0, 26.0, 40.0, 55.0, 46.0, 48.0, 58.0, 51.0, 50.0, 50.0, 55.0, 58.0, 46.0, 49.0, 46.0, 25.0, 27.0, 21.0, 20.0, 15.0, 16.0, 7.0, 4.0, 5.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.90380859375, -0.8793792724609375, -0.854949951171875, -0.8305206298828125, -0.80609130859375, -0.7816619873046875, -0.757232666015625, -0.7328033447265625, -0.7083740234375, -0.6839447021484375, -0.659515380859375, -0.6350860595703125, -0.61065673828125, -0.5862274169921875, -0.561798095703125, -0.5373687744140625, -0.512939453125, -0.4885101318359375, -0.464080810546875, -0.4396514892578125, -0.41522216796875, -0.3907928466796875, -0.366363525390625, -0.3419342041015625, -0.3175048828125, -0.2930755615234375, -0.268646240234375, -0.2442169189453125, -0.21978759765625, -0.1953582763671875, -0.170928955078125, -0.1464996337890625, -0.1220703125, -0.0976409912109375, -0.073211669921875, -0.0487823486328125, -0.02435302734375, 7.62939453125e-05, 0.024505615234375, 0.0489349365234375, 0.0733642578125, 0.0977935791015625, 0.122222900390625, 0.1466522216796875, 0.17108154296875, 0.1955108642578125, 0.219940185546875, 0.2443695068359375, 0.268798828125, 0.2932281494140625, 0.317657470703125, 0.3420867919921875, 0.36651611328125, 0.3909454345703125, 0.415374755859375, 0.4398040771484375, 0.4642333984375, 0.4886627197265625, 0.513092041015625, 0.5375213623046875, 0.56195068359375, 0.5863800048828125, 0.610809326171875, 0.6352386474609375, 0.65966796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 3.0, 5.0, 11.0, 12.0, 16.0, 19.0, 29.0, 46.0, 57.0, 91.0, 136.0, 278.0, 586.0, 1762.0, 7364.0, 77331.0, 869601.0, 80430.0, 7607.0, 1796.0, 636.0, 260.0, 137.0, 100.0, 64.0, 51.0, 28.0, 16.0, 16.0, 20.0, 6.0, 9.0, 4.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7783203125, -0.7536163330078125, -0.728912353515625, -0.7042083740234375, -0.67950439453125, -0.6548004150390625, -0.630096435546875, -0.6053924560546875, -0.5806884765625, -0.5559844970703125, -0.531280517578125, -0.5065765380859375, -0.48187255859375, -0.4571685791015625, -0.432464599609375, -0.4077606201171875, -0.383056640625, -0.3583526611328125, -0.333648681640625, -0.3089447021484375, -0.28424072265625, -0.2595367431640625, -0.234832763671875, -0.2101287841796875, -0.1854248046875, -0.1607208251953125, -0.136016845703125, -0.1113128662109375, -0.08660888671875, -0.0619049072265625, -0.037200927734375, -0.0124969482421875, 0.01220703125, 0.0369110107421875, 0.061614990234375, 0.0863189697265625, 0.11102294921875, 0.1357269287109375, 0.160430908203125, 0.1851348876953125, 0.2098388671875, 0.2345428466796875, 0.259246826171875, 0.2839508056640625, 0.30865478515625, 0.3333587646484375, 0.358062744140625, 0.3827667236328125, 0.407470703125, 0.4321746826171875, 0.456878662109375, 0.4815826416015625, 0.50628662109375, 0.5309906005859375, 0.555694580078125, 0.5803985595703125, 0.6051025390625, 0.6298065185546875, 0.654510498046875, 0.6792144775390625, 0.70391845703125, 0.7286224365234375, 0.753326416015625, 0.7780303955078125, 0.802734375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 8.0, 6.0, 5.0, 6.0, 4.0, 8.0, 11.0, 15.0, 28.0, 25.0, 33.0, 41.0, 33.0, 37.0, 29.0, 53.0, 52.0, 47.0, 47.0, 57.0, 53.0, 58.0, 51.0, 50.0, 50.0, 19.0, 32.0, 21.0, 20.0, 21.0, 16.0, 16.0, 11.0, 11.0, 8.0, 8.0, 5.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.951171875, -0.9241790771484375, -0.897186279296875, -0.8701934814453125, -0.84320068359375, -0.8162078857421875, -0.789215087890625, -0.7622222900390625, -0.7352294921875, -0.7082366943359375, -0.681243896484375, -0.6542510986328125, -0.62725830078125, -0.6002655029296875, -0.573272705078125, -0.5462799072265625, -0.519287109375, -0.4922943115234375, -0.465301513671875, -0.4383087158203125, -0.41131591796875, -0.3843231201171875, -0.357330322265625, -0.3303375244140625, -0.3033447265625, -0.2763519287109375, -0.249359130859375, -0.2223663330078125, -0.19537353515625, -0.1683807373046875, -0.141387939453125, -0.1143951416015625, -0.08740234375, -0.0604095458984375, -0.033416748046875, -0.0064239501953125, 0.02056884765625, 0.0475616455078125, 0.074554443359375, 0.1015472412109375, 0.1285400390625, 0.1555328369140625, 0.182525634765625, 0.2095184326171875, 0.23651123046875, 0.2635040283203125, 0.290496826171875, 0.3174896240234375, 0.344482421875, 0.3714752197265625, 0.398468017578125, 0.4254608154296875, 0.45245361328125, 0.4794464111328125, 0.506439208984375, 0.5334320068359375, 0.5604248046875, 0.5874176025390625, 0.614410400390625, 0.6414031982421875, 0.66839599609375, 0.6953887939453125, 0.722381591796875, 0.7493743896484375, 0.7763671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 4.0, 11.0, 7.0, 27.0, 25.0, 74.0, 126.0, 284.0, 813.0, 2638.0, 13921.0, 761171.0, 257954.0, 8494.0, 1906.0, 610.0, 224.0, 116.0, 61.0, 33.0, 13.0, 13.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389892578125, -0.37726593017578125, -0.3646392822265625, -0.35201263427734375, -0.339385986328125, -0.32675933837890625, -0.3141326904296875, -0.30150604248046875, -0.28887939453125, -0.27625274658203125, -0.2636260986328125, -0.25099945068359375, -0.238372802734375, -0.22574615478515625, -0.2131195068359375, -0.20049285888671875, -0.1878662109375, -0.17523956298828125, -0.1626129150390625, -0.14998626708984375, -0.137359619140625, -0.12473297119140625, -0.1121063232421875, -0.09947967529296875, -0.08685302734375, -0.07422637939453125, -0.0615997314453125, -0.04897308349609375, -0.036346435546875, -0.02371978759765625, -0.0110931396484375, 0.00153350830078125, 0.01416015625, 0.02678680419921875, 0.0394134521484375, 0.05204010009765625, 0.064666748046875, 0.07729339599609375, 0.0899200439453125, 0.10254669189453125, 0.11517333984375, 0.12779998779296875, 0.1404266357421875, 0.15305328369140625, 0.165679931640625, 0.17830657958984375, 0.1909332275390625, 0.20355987548828125, 0.2161865234375, 0.22881317138671875, 0.2414398193359375, 0.25406646728515625, 0.266693115234375, 0.27931976318359375, 0.2919464111328125, 0.30457305908203125, 0.31719970703125, 0.32982635498046875, 0.3424530029296875, 0.35507965087890625, 0.367706298828125, 0.38033294677734375, 0.3929595947265625, 0.40558624267578125, 0.418212890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 3.0, 6.0, 12.0, 15.0, 34.0, 51.0, 64.0, 115.0, 173.0, 172.0, 103.0, 98.0, 60.0, 41.0, 17.0, 13.0, 7.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.369020462036133e-05, -4.254840314388275e-05, -4.1406601667404175e-05, -4.02648001909256e-05, -3.912299871444702e-05, -3.7981197237968445e-05, -3.683939576148987e-05, -3.569759428501129e-05, -3.4555792808532715e-05, -3.341399133205414e-05, -3.227218985557556e-05, -3.1130388379096985e-05, -2.9988586902618408e-05, -2.884678542613983e-05, -2.7704983949661255e-05, -2.6563182473182678e-05, -2.54213809967041e-05, -2.4279579520225525e-05, -2.3137778043746948e-05, -2.199597656726837e-05, -2.0854175090789795e-05, -1.9712373614311218e-05, -1.857057213783264e-05, -1.7428770661354065e-05, -1.6286969184875488e-05, -1.5145167708396912e-05, -1.4003366231918335e-05, -1.2861564755439758e-05, -1.1719763278961182e-05, -1.0577961802482605e-05, -9.436160326004028e-06, -8.294358849525452e-06, -7.152557373046875e-06, -6.010755896568298e-06, -4.868954420089722e-06, -3.727152943611145e-06, -2.5853514671325684e-06, -1.4435499906539917e-06, -3.0174851417541504e-07, 8.400529623031616e-07, 1.9818544387817383e-06, 3.123655915260315e-06, 4.265457391738892e-06, 5.407258868217468e-06, 6.549060344696045e-06, 7.690861821174622e-06, 8.832663297653198e-06, 9.974464774131775e-06, 1.1116266250610352e-05, 1.2258067727088928e-05, 1.3399869203567505e-05, 1.4541670680046082e-05, 1.5683472156524658e-05, 1.6825273633003235e-05, 1.796707510948181e-05, 1.9108876585960388e-05, 2.0250678062438965e-05, 2.139247953891754e-05, 2.2534281015396118e-05, 2.3676082491874695e-05, 2.481788396835327e-05, 2.5959685444831848e-05, 2.7101486921310425e-05, 2.8243288397789e-05, 2.9385089874267578e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 10.0, 14.0, 12.0, 19.0, 30.0, 61.0, 130.0, 279.0, 808.0, 2836.0, 16044.0, 673291.0, 340279.0, 11238.0, 2335.0, 652.0, 244.0, 112.0, 50.0, 33.0, 15.0, 8.0, 12.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.35498046875, -0.3441963195800781, -0.33341217041015625, -0.3226280212402344, -0.3118438720703125, -0.3010597229003906, -0.29027557373046875, -0.2794914245605469, -0.268707275390625, -0.2579231262207031, -0.24713897705078125, -0.23635482788085938, -0.2255706787109375, -0.21478652954101562, -0.20400238037109375, -0.19321823120117188, -0.18243408203125, -0.17164993286132812, -0.16086578369140625, -0.15008163452148438, -0.1392974853515625, -0.12851333618164062, -0.11772918701171875, -0.10694503784179688, -0.096160888671875, -0.08537673950195312, -0.07459259033203125, -0.06380844116210938, -0.0530242919921875, -0.042240142822265625, -0.03145599365234375, -0.020671844482421875, -0.0098876953125, 0.000896453857421875, 0.01168060302734375, 0.022464752197265625, 0.0332489013671875, 0.044033050537109375, 0.05481719970703125, 0.06560134887695312, 0.076385498046875, 0.08716964721679688, 0.09795379638671875, 0.10873794555664062, 0.1195220947265625, 0.13030624389648438, 0.14109039306640625, 0.15187454223632812, 0.16265869140625, 0.17344284057617188, 0.18422698974609375, 0.19501113891601562, 0.2057952880859375, 0.21657943725585938, 0.22736358642578125, 0.23814773559570312, 0.248931884765625, 0.2597160339355469, 0.27050018310546875, 0.2812843322753906, 0.2920684814453125, 0.3028526306152344, 0.31363677978515625, 0.3244209289550781, 0.335205078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 13.0, 20.0, 28.0, 46.0, 42.0, 48.0, 91.0, 95.0, 113.0, 134.0, 82.0, 66.0, 58.0, 38.0, 22.0, 25.0, 21.0, 5.0, 6.0, 9.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0809326171875, -0.0784749984741211, -0.07601737976074219, -0.07355976104736328, -0.07110214233398438, -0.06864452362060547, -0.06618690490722656, -0.06372928619384766, -0.06127166748046875, -0.058814048767089844, -0.05635643005371094, -0.05389881134033203, -0.051441192626953125, -0.04898357391357422, -0.04652595520019531, -0.044068336486816406, -0.0416107177734375, -0.039153099060058594, -0.03669548034667969, -0.03423786163330078, -0.031780242919921875, -0.02932262420654297, -0.026865005493164062, -0.024407386779785156, -0.02194976806640625, -0.019492149353027344, -0.017034530639648438, -0.014576911926269531, -0.012119293212890625, -0.009661674499511719, -0.0072040557861328125, -0.004746437072753906, -0.002288818359375, 0.00016880035400390625, 0.0026264190673828125, 0.005084037780761719, 0.007541656494140625, 0.009999275207519531, 0.012456893920898438, 0.014914512634277344, 0.01737213134765625, 0.019829750061035156, 0.022287368774414062, 0.02474498748779297, 0.027202606201171875, 0.02966022491455078, 0.03211784362792969, 0.034575462341308594, 0.0370330810546875, 0.039490699768066406, 0.04194831848144531, 0.04440593719482422, 0.046863555908203125, 0.04932117462158203, 0.05177879333496094, 0.054236412048339844, 0.05669403076171875, 0.059151649475097656, 0.06160926818847656, 0.06406688690185547, 0.06652450561523438, 0.06898212432861328, 0.07143974304199219, 0.0738973617553711, 0.07635498046875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 14.0, 13.0, 36.0, 40.0, 78.0, 92.0, 154.0, 159.0, 146.0, 102.0, 55.0, 45.0, 24.0, 16.0, 8.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5553004741668701, -1.5075490474700928, -1.459797739982605, -1.4120464324951172, -1.3642950057983398, -1.3165435791015625, -1.2687922716140747, -1.221040964126587, -1.1732895374298096, -1.1255381107330322, -1.0777868032455444, -1.0300354957580566, -0.9822840690612793, -0.9345327019691467, -0.8867813348770142, -0.8390299677848816, -0.791278600692749, -0.7435272336006165, -0.6957758665084839, -0.6480244994163513, -0.6002731323242188, -0.5525217652320862, -0.5047703981399536, -0.45701903104782104, -0.4092676639556885, -0.3615162968635559, -0.31376492977142334, -0.26601356267929077, -0.2182621955871582, -0.17051082849502563, -0.12275946140289307, -0.0750080943107605, -0.02725684642791748, 0.020494520664215088, 0.06824588775634766, 0.11599725484848022, 0.1637486219406128, 0.21149998903274536, 0.25925135612487793, 0.3070027232170105, 0.35475409030914307, 0.40250545740127563, 0.4502568244934082, 0.49800819158554077, 0.5457595586776733, 0.5935109257698059, 0.6412622928619385, 0.689013659954071, 0.7367650270462036, 0.7845163941383362, 0.8322677612304688, 0.8800191283226013, 0.9277704954147339, 0.9755218625068665, 1.023273229598999, 1.0710246562957764, 1.1187759637832642, 1.166527271270752, 1.2142786979675293, 1.2620301246643066, 1.3097814321517944, 1.3575327396392822, 1.4052841663360596, 1.453035593032837, 1.5007869005203247]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 11.0, 15.0, 13.0, 13.0, 17.0, 18.0, 27.0, 16.0, 24.0, 18.0, 40.0, 37.0, 28.0, 35.0, 33.0, 27.0, 36.0, 32.0, 35.0, 30.0, 39.0, 40.0, 33.0, 33.0, 33.0, 36.0, 29.0, 31.0, 25.0, 23.0, 19.0, 24.0, 18.0, 21.0, 11.0, 14.0, 11.0, 9.0, 7.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0419141054153442, -1.0074104070663452, -0.972906768321991, -0.9384031295776367, -0.9038994312286377, -0.8693957328796387, -0.8348920941352844, -0.8003884553909302, -0.7658847570419312, -0.7313810586929321, -0.6968774199485779, -0.6623737812042236, -0.6278700828552246, -0.5933663845062256, -0.5588627457618713, -0.5243591070175171, -0.48985540866851807, -0.45535174012184143, -0.4208480715751648, -0.38634440302848816, -0.3518407344818115, -0.3173370659351349, -0.28283339738845825, -0.24832972884178162, -0.21382606029510498, -0.17932239174842834, -0.1448187232017517, -0.11031505465507507, -0.07581138610839844, -0.0413077175617218, -0.006804049015045166, 0.02769961953163147, 0.062203288078308105, 0.09670695662498474, 0.13121062517166138, 0.165714293718338, 0.20021796226501465, 0.23472163081169128, 0.2692252993583679, 0.30372896790504456, 0.3382326364517212, 0.3727363049983978, 0.40723997354507446, 0.4417436420917511, 0.47624731063842773, 0.5107510089874268, 0.545254647731781, 0.5797582864761353, 0.6142619848251343, 0.6487656831741333, 0.6832693219184875, 0.7177729606628418, 0.7522766590118408, 0.7867803573608398, 0.8212839961051941, 0.8557876348495483, 0.8902913331985474, 0.9247950315475464, 0.9592986702919006, 0.9938023090362549, 1.028306007385254, 1.062809705734253, 1.097313404083252, 1.1318169832229614, 1.1663206815719604]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 0.0, 3.0, 4.0, 2.0, 9.0, 8.0, 14.0, 18.0, 23.0, 34.0, 63.0, 94.0, 211.0, 439.0, 1064.0, 3054.0, 16104.0, 701109.0, 3405019.0, 56152.0, 7030.0, 2159.0, 873.0, 376.0, 174.0, 98.0, 46.0, 32.0, 22.0, 17.0, 10.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4951171875, -1.4501190185546875, -1.405120849609375, -1.3601226806640625, -1.31512451171875, -1.2701263427734375, -1.225128173828125, -1.1801300048828125, -1.1351318359375, -1.0901336669921875, -1.045135498046875, -1.0001373291015625, -0.95513916015625, -0.9101409912109375, -0.865142822265625, -0.8201446533203125, -0.775146484375, -0.7301483154296875, -0.685150146484375, -0.6401519775390625, -0.59515380859375, -0.5501556396484375, -0.505157470703125, -0.4601593017578125, -0.4151611328125, -0.3701629638671875, -0.325164794921875, -0.2801666259765625, -0.23516845703125, -0.1901702880859375, -0.145172119140625, -0.1001739501953125, -0.05517578125, -0.0101776123046875, 0.034820556640625, 0.0798187255859375, 0.12481689453125, 0.1698150634765625, 0.214813232421875, 0.2598114013671875, 0.3048095703125, 0.3498077392578125, 0.394805908203125, 0.4398040771484375, 0.48480224609375, 0.5298004150390625, 0.574798583984375, 0.6197967529296875, 0.664794921875, 0.7097930908203125, 0.754791259765625, 0.7997894287109375, 0.84478759765625, 0.8897857666015625, 0.934783935546875, 0.9797821044921875, 1.0247802734375, 1.0697784423828125, 1.114776611328125, 1.1597747802734375, 1.20477294921875, 1.2497711181640625, 1.294769287109375, 1.3397674560546875, 1.384765625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 7.0, 13.0, 9.0, 15.0, 19.0, 29.0, 36.0, 25.0, 45.0, 63.0, 65.0, 57.0, 68.0, 77.0, 60.0, 64.0, 66.0, 65.0, 44.0, 44.0, 33.0, 26.0, 20.0, 10.0, 16.0, 4.0, 6.0, 2.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.70703125, -0.6886024475097656, -0.6701736450195312, -0.6517448425292969, -0.6333160400390625, -0.6148872375488281, -0.5964584350585938, -0.5780296325683594, -0.559600830078125, -0.5411720275878906, -0.5227432250976562, -0.5043144226074219, -0.4858856201171875, -0.4674568176269531, -0.44902801513671875, -0.4305992126464844, -0.41217041015625, -0.3937416076660156, -0.37531280517578125, -0.3568840026855469, -0.3384552001953125, -0.3200263977050781, -0.30159759521484375, -0.2831687927246094, -0.264739990234375, -0.24631118774414062, -0.22788238525390625, -0.20945358276367188, -0.1910247802734375, -0.17259597778320312, -0.15416717529296875, -0.13573837280273438, -0.1173095703125, -0.09888076782226562, -0.08045196533203125, -0.062023162841796875, -0.0435943603515625, -0.025165557861328125, -0.00673675537109375, 0.011692047119140625, 0.030120849609375, 0.048549652099609375, 0.06697845458984375, 0.08540725708007812, 0.1038360595703125, 0.12226486206054688, 0.14069366455078125, 0.15912246704101562, 0.17755126953125, 0.19598007202148438, 0.21440887451171875, 0.23283767700195312, 0.2512664794921875, 0.2696952819824219, 0.28812408447265625, 0.3065528869628906, 0.324981689453125, 0.3434104919433594, 0.36183929443359375, 0.3802680969238281, 0.3986968994140625, 0.4171257019042969, 0.43555450439453125, 0.4539833068847656, 0.472412109375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 13.0, 22.0, 20.0, 20.0, 48.0, 61.0, 109.0, 157.0, 288.0, 461.0, 947.0, 1939.0, 5080.0, 18834.0, 150455.0, 3562274.0, 409711.0, 31588.0, 7244.0, 2504.0, 1093.0, 571.0, 327.0, 184.0, 105.0, 59.0, 45.0, 26.0, 21.0, 12.0, 6.0, 8.0, 11.0, 3.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.84521484375, -0.820098876953125, -0.79498291015625, -0.769866943359375, -0.7447509765625, -0.719635009765625, -0.69451904296875, -0.669403076171875, -0.644287109375, -0.619171142578125, -0.59405517578125, -0.568939208984375, -0.5438232421875, -0.518707275390625, -0.49359130859375, -0.468475341796875, -0.443359375, -0.418243408203125, -0.39312744140625, -0.368011474609375, -0.3428955078125, -0.317779541015625, -0.29266357421875, -0.267547607421875, -0.242431640625, -0.217315673828125, -0.19219970703125, -0.167083740234375, -0.1419677734375, -0.116851806640625, -0.09173583984375, -0.066619873046875, -0.04150390625, -0.016387939453125, 0.00872802734375, 0.033843994140625, 0.0589599609375, 0.084075927734375, 0.10919189453125, 0.134307861328125, 0.159423828125, 0.184539794921875, 0.20965576171875, 0.234771728515625, 0.2598876953125, 0.285003662109375, 0.31011962890625, 0.335235595703125, 0.3603515625, 0.385467529296875, 0.41058349609375, 0.435699462890625, 0.4608154296875, 0.485931396484375, 0.51104736328125, 0.536163330078125, 0.561279296875, 0.586395263671875, 0.61151123046875, 0.636627197265625, 0.6617431640625, 0.686859130859375, 0.71197509765625, 0.737091064453125, 0.76220703125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 17.0, 11.0, 15.0, 42.0, 54.0, 97.0, 190.0, 409.0, 810.0, 992.0, 672.0, 343.0, 143.0, 96.0, 56.0, 43.0, 24.0, 14.0, 10.0, 5.0, 6.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.19141769409179688, -0.18288421630859375, -0.17435073852539062, -0.1658172607421875, -0.15728378295898438, -0.14875030517578125, -0.14021682739257812, -0.131683349609375, -0.12314987182617188, -0.11461639404296875, -0.10608291625976562, -0.0975494384765625, -0.08901596069335938, -0.08048248291015625, -0.07194900512695312, -0.06341552734375, -0.054882049560546875, -0.04634857177734375, -0.037815093994140625, -0.0292816162109375, -0.020748138427734375, -0.01221466064453125, -0.003681182861328125, 0.004852294921875, 0.013385772705078125, 0.02191925048828125, 0.030452728271484375, 0.0389862060546875, 0.047519683837890625, 0.05605316162109375, 0.06458663940429688, 0.0731201171875, 0.08165359497070312, 0.09018707275390625, 0.09872055053710938, 0.1072540283203125, 0.11578750610351562, 0.12432098388671875, 0.13285446166992188, 0.141387939453125, 0.14992141723632812, 0.15845489501953125, 0.16698837280273438, 0.1755218505859375, 0.18405532836914062, 0.19258880615234375, 0.20112228393554688, 0.20965576171875, 0.21818923950195312, 0.22672271728515625, 0.23525619506835938, 0.2437896728515625, 0.2523231506347656, 0.26085662841796875, 0.2693901062011719, 0.277923583984375, 0.2864570617675781, 0.29499053955078125, 0.3035240173339844, 0.3120574951171875, 0.3205909729003906, 0.32912445068359375, 0.3376579284667969, 0.34619140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 8.0, 5.0, 6.0, 13.0, 28.0, 55.0, 104.0, 116.0, 183.0, 159.0, 135.0, 85.0, 36.0, 34.0, 14.0, 7.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0781259536743164, -1.039666771888733, -1.0012074708938599, -0.9627482891082764, -0.9242891073226929, -0.8858298659324646, -0.8473706245422363, -0.8089114427566528, -0.7704522609710693, -0.7319930195808411, -0.6935338377952576, -0.6550745964050293, -0.6166154146194458, -0.5781561732292175, -0.5396969318389893, -0.5012377500534058, -0.4627785086631775, -0.4243192970752716, -0.3858600854873657, -0.34740084409713745, -0.30894166231155396, -0.2704824209213257, -0.2320232093334198, -0.19356399774551392, -0.15510478615760803, -0.11664557456970215, -0.07818635553121567, -0.03972713649272919, -0.0012679249048233032, 0.03719128668308258, 0.07565051317214966, 0.11410972476005554, 0.15256893634796143, 0.1910281479358673, 0.2294873595237732, 0.26794660091400146, 0.30640578269958496, 0.34486502408981323, 0.3833242356777191, 0.421783447265625, 0.4602426588535309, 0.49870187044143677, 0.537161111831665, 0.5756202936172485, 0.6140795350074768, 0.6525387167930603, 0.6909979581832886, 0.7294571399688721, 0.7679163813591003, 0.8063756227493286, 0.8448348045349121, 0.8832940459251404, 0.9217532277107239, 0.9602124691009521, 0.9986716508865356, 1.0371308326721191, 1.0755901336669922, 1.1140493154525757, 1.1525086164474487, 1.1909677982330322, 1.2294269800186157, 1.2678861618041992, 1.3063454627990723, 1.3448046445846558, 1.3832638263702393]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 7.0, 7.0, 9.0, 9.0, 17.0, 9.0, 14.0, 12.0, 21.0, 28.0, 49.0, 42.0, 36.0, 41.0, 42.0, 53.0, 49.0, 46.0, 42.0, 55.0, 44.0, 44.0, 42.0, 40.0, 44.0, 33.0, 30.0, 24.0, 31.0, 20.0, 13.0, 12.0, 12.0, 7.0, 4.0, 4.0, 7.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4527290165424347, -0.4377433955669403, -0.4227577745914459, -0.40777212381362915, -0.39278650283813477, -0.3778008818626404, -0.362815260887146, -0.3478296399116516, -0.3328440189361572, -0.31785839796066284, -0.30287277698516846, -0.2878871560096741, -0.2729015052318573, -0.2579158842563629, -0.24293026328086853, -0.22794464230537415, -0.21295899152755737, -0.197973370552063, -0.1829877346754074, -0.16800211369991302, -0.15301647782325745, -0.13803085684776306, -0.12304523587226868, -0.1080596074461937, -0.09307397902011871, -0.07808835059404373, -0.06310272216796875, -0.048117101192474365, -0.033131472766399384, -0.018145844340324402, -0.003160223364830017, 0.011825405061244965, 0.02681100368499756, 0.04179663211107254, 0.056782256811857224, 0.0717678815126419, 0.08675350993871689, 0.10173913836479187, 0.11672475934028625, 0.13171038031578064, 0.14669601619243622, 0.1616816371679306, 0.17666727304458618, 0.19165289402008057, 0.20663851499557495, 0.22162415087223053, 0.23660977184772491, 0.2515954077243805, 0.2665810286998749, 0.28156664967536926, 0.29655227065086365, 0.3115379214286804, 0.3265235424041748, 0.3415091633796692, 0.3564947843551636, 0.37148040533065796, 0.38646602630615234, 0.40145164728164673, 0.4164372682571411, 0.4314228892326355, 0.44640854001045227, 0.46139416098594666, 0.47637978196144104, 0.4913654029369354, 0.5063510537147522]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 8.0, 15.0, 21.0, 47.0, 49.0, 97.0, 184.0, 362.0, 955.0, 3073.0, 14277.0, 96470.0, 568385.0, 312957.0, 41440.0, 7103.0, 1809.0, 631.0, 303.0, 149.0, 76.0, 40.0, 36.0, 22.0, 9.0, 7.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.170166015625, -0.1655406951904297, -0.16091537475585938, -0.15629005432128906, -0.15166473388671875, -0.14703941345214844, -0.14241409301757812, -0.1377887725830078, -0.1331634521484375, -0.1285381317138672, -0.12391281127929688, -0.11928749084472656, -0.11466217041015625, -0.11003684997558594, -0.10541152954101562, -0.10078620910644531, -0.096160888671875, -0.09153556823730469, -0.08691024780273438, -0.08228492736816406, -0.07765960693359375, -0.07303428649902344, -0.06840896606445312, -0.06378364562988281, -0.0591583251953125, -0.05453300476074219, -0.049907684326171875, -0.04528236389160156, -0.04065704345703125, -0.03603172302246094, -0.031406402587890625, -0.026781082153320312, -0.02215576171875, -0.017530441284179688, -0.012905120849609375, -0.008279800415039062, -0.00365447998046875, 0.0009708404541015625, 0.005596160888671875, 0.010221481323242188, 0.0148468017578125, 0.019472122192382812, 0.024097442626953125, 0.028722763061523438, 0.03334808349609375, 0.03797340393066406, 0.042598724365234375, 0.04722404479980469, 0.051849365234375, 0.05647468566894531, 0.061100006103515625, 0.06572532653808594, 0.07035064697265625, 0.07497596740722656, 0.07960128784179688, 0.08422660827636719, 0.0888519287109375, 0.09347724914550781, 0.09810256958007812, 0.10272789001464844, 0.10735321044921875, 0.11197853088378906, 0.11660385131835938, 0.12122917175292969, 0.1258544921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 5.0, 7.0, 16.0, 12.0, 21.0, 25.0, 25.0, 48.0, 58.0, 36.0, 54.0, 65.0, 54.0, 73.0, 71.0, 55.0, 61.0, 45.0, 54.0, 42.0, 37.0, 39.0, 23.0, 22.0, 10.0, 9.0, 11.0, 7.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.3429069519042969, -0.32961273193359375, -0.3163185119628906, -0.3030242919921875, -0.2897300720214844, -0.27643585205078125, -0.2631416320800781, -0.249847412109375, -0.23655319213867188, -0.22325897216796875, -0.20996475219726562, -0.1966705322265625, -0.18337631225585938, -0.17008209228515625, -0.15678787231445312, -0.14349365234375, -0.13019943237304688, -0.11690521240234375, -0.10361099243164062, -0.0903167724609375, -0.07702255249023438, -0.06372833251953125, -0.050434112548828125, -0.037139892578125, -0.023845672607421875, -0.01055145263671875, 0.002742767333984375, 0.0160369873046875, 0.029331207275390625, 0.04262542724609375, 0.055919647216796875, 0.0692138671875, 0.08250808715820312, 0.09580230712890625, 0.10909652709960938, 0.1223907470703125, 0.13568496704101562, 0.14897918701171875, 0.16227340698242188, 0.175567626953125, 0.18886184692382812, 0.20215606689453125, 0.21545028686523438, 0.2287445068359375, 0.24203872680664062, 0.25533294677734375, 0.2686271667480469, 0.28192138671875, 0.2952156066894531, 0.30850982666015625, 0.3218040466308594, 0.3350982666015625, 0.3483924865722656, 0.36168670654296875, 0.3749809265136719, 0.388275146484375, 0.4015693664550781, 0.41486358642578125, 0.4281578063964844, 0.4414520263671875, 0.4547462463378906, 0.46804046630859375, 0.4813346862792969, 0.49462890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 12.0, 18.0, 19.0, 27.0, 44.0, 56.0, 68.0, 99.0, 140.0, 226.0, 342.0, 595.0, 1116.0, 2070.0, 3924.0, 8248.0, 17360.0, 38770.0, 87638.0, 187849.0, 286571.0, 218173.0, 106622.0, 47418.0, 21001.0, 9672.0, 4664.0, 2454.0, 1308.0, 750.0, 481.0, 261.0, 168.0, 99.0, 75.0, 44.0, 39.0, 28.0, 24.0, 14.0, 14.0, 8.0, 9.0, 6.0, 5.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.054901123046875, -0.05321788787841797, -0.05153465270996094, -0.049851417541503906, -0.048168182373046875, -0.046484947204589844, -0.04480171203613281, -0.04311847686767578, -0.04143524169921875, -0.03975200653076172, -0.03806877136230469, -0.036385536193847656, -0.034702301025390625, -0.033019065856933594, -0.03133583068847656, -0.02965259552001953, -0.0279693603515625, -0.02628612518310547, -0.024602890014648438, -0.022919654846191406, -0.021236419677734375, -0.019553184509277344, -0.017869949340820312, -0.01618671417236328, -0.01450347900390625, -0.012820243835449219, -0.011137008666992188, -0.009453773498535156, -0.007770538330078125, -0.006087303161621094, -0.0044040679931640625, -0.0027208328247070312, -0.00103759765625, 0.0006456375122070312, 0.0023288726806640625, 0.004012107849121094, 0.005695343017578125, 0.007378578186035156, 0.009061813354492188, 0.010745048522949219, 0.01242828369140625, 0.014111518859863281, 0.015794754028320312, 0.017477989196777344, 0.019161224365234375, 0.020844459533691406, 0.022527694702148438, 0.02421092987060547, 0.0258941650390625, 0.02757740020751953, 0.029260635375976562, 0.030943870544433594, 0.032627105712890625, 0.034310340881347656, 0.03599357604980469, 0.03767681121826172, 0.03936004638671875, 0.04104328155517578, 0.04272651672363281, 0.044409751892089844, 0.046092987060546875, 0.047776222229003906, 0.04945945739746094, 0.05114269256591797, 0.052825927734375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 9.0, 6.0, 7.0, 7.0, 11.0, 11.0, 10.0, 16.0, 21.0, 18.0, 20.0, 21.0, 32.0, 37.0, 40.0, 37.0, 37.0, 40.0, 31.0, 45.0, 43.0, 43.0, 34.0, 36.0, 40.0, 51.0, 51.0, 36.0, 28.0, 22.0, 26.0, 21.0, 15.0, 20.0, 12.0, 12.0, 15.0, 8.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.5244140625, -0.5072784423828125, -0.490142822265625, -0.4730072021484375, -0.45587158203125, -0.4387359619140625, -0.421600341796875, -0.4044647216796875, -0.3873291015625, -0.3701934814453125, -0.353057861328125, -0.3359222412109375, -0.31878662109375, -0.3016510009765625, -0.284515380859375, -0.2673797607421875, -0.250244140625, -0.2331085205078125, -0.215972900390625, -0.1988372802734375, -0.18170166015625, -0.1645660400390625, -0.147430419921875, -0.1302947998046875, -0.1131591796875, -0.0960235595703125, -0.078887939453125, -0.0617523193359375, -0.04461669921875, -0.0274810791015625, -0.010345458984375, 0.0067901611328125, 0.02392578125, 0.0410614013671875, 0.058197021484375, 0.0753326416015625, 0.09246826171875, 0.1096038818359375, 0.126739501953125, 0.1438751220703125, 0.1610107421875, 0.1781463623046875, 0.195281982421875, 0.2124176025390625, 0.22955322265625, 0.2466888427734375, 0.263824462890625, 0.2809600830078125, 0.298095703125, 0.3152313232421875, 0.332366943359375, 0.3495025634765625, 0.36663818359375, 0.3837738037109375, 0.400909423828125, 0.4180450439453125, 0.4351806640625, 0.4523162841796875, 0.469451904296875, 0.4865875244140625, 0.50372314453125, 0.5208587646484375, 0.537994384765625, 0.5551300048828125, 0.572265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 8.0, 12.0, 24.0, 37.0, 64.0, 90.0, 154.0, 285.0, 541.0, 991.0, 1941.0, 4465.0, 12059.0, 44690.0, 198392.0, 472241.0, 235894.0, 53220.0, 14072.0, 4877.0, 2141.0, 1055.0, 536.0, 306.0, 172.0, 93.0, 70.0, 35.0, 26.0, 20.0, 8.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0239715576171875, -0.023160696029663086, -0.022349834442138672, -0.021538972854614258, -0.020728111267089844, -0.01991724967956543, -0.019106388092041016, -0.0182955265045166, -0.017484664916992188, -0.016673803329467773, -0.01586294174194336, -0.015052080154418945, -0.014241218566894531, -0.013430356979370117, -0.012619495391845703, -0.011808633804321289, -0.010997772216796875, -0.010186910629272461, -0.009376049041748047, -0.008565187454223633, -0.007754325866699219, -0.006943464279174805, -0.006132602691650391, -0.0053217411041259766, -0.0045108795166015625, -0.0037000179290771484, -0.0028891563415527344, -0.0020782947540283203, -0.0012674331665039062, -0.0004565715789794922, 0.0003542900085449219, 0.001165151596069336, 0.00197601318359375, 0.002786874771118164, 0.003597736358642578, 0.004408597946166992, 0.005219459533691406, 0.00603032112121582, 0.006841182708740234, 0.0076520442962646484, 0.008462905883789062, 0.009273767471313477, 0.01008462905883789, 0.010895490646362305, 0.011706352233886719, 0.012517213821411133, 0.013328075408935547, 0.014138936996459961, 0.014949798583984375, 0.01576066017150879, 0.016571521759033203, 0.017382383346557617, 0.01819324493408203, 0.019004106521606445, 0.01981496810913086, 0.020625829696655273, 0.021436691284179688, 0.0222475528717041, 0.023058414459228516, 0.02386927604675293, 0.024680137634277344, 0.025490999221801758, 0.026301860809326172, 0.027112722396850586, 0.027923583984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 2.0, 4.0, 6.0, 7.0, 9.0, 13.0, 22.0, 18.0, 22.0, 37.0, 42.0, 39.0, 60.0, 70.0, 71.0, 54.0, 73.0, 79.0, 68.0, 51.0, 40.0, 41.0, 36.0, 31.0, 26.0, 17.0, 15.0, 9.0, 12.0, 5.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68899917602539e-06, -7.360242307186127e-06, -7.031485438346863e-06, -6.702728569507599e-06, -6.373971700668335e-06, -6.045214831829071e-06, -5.716457962989807e-06, -5.387701094150543e-06, -5.058944225311279e-06, -4.730187356472015e-06, -4.4014304876327515e-06, -4.0726736187934875e-06, -3.7439167499542236e-06, -3.4151598811149597e-06, -3.086403012275696e-06, -2.757646143436432e-06, -2.428889274597168e-06, -2.100132405757904e-06, -1.7713755369186401e-06, -1.4426186680793762e-06, -1.1138617992401123e-06, -7.851049304008484e-07, -4.5634806156158447e-07, -1.2759119272232056e-07, 2.0116567611694336e-07, 5.299225449562073e-07, 8.586794137954712e-07, 1.1874362826347351e-06, 1.516193151473999e-06, 1.844950020313263e-06, 2.173706889152527e-06, 2.5024637579917908e-06, 2.8312206268310547e-06, 3.1599774956703186e-06, 3.4887343645095825e-06, 3.8174912333488464e-06, 4.14624810218811e-06, 4.475004971027374e-06, 4.803761839866638e-06, 5.132518708705902e-06, 5.461275577545166e-06, 5.79003244638443e-06, 6.118789315223694e-06, 6.447546184062958e-06, 6.776303052902222e-06, 7.105059921741486e-06, 7.4338167905807495e-06, 7.762573659420013e-06, 8.091330528259277e-06, 8.420087397098541e-06, 8.748844265937805e-06, 9.077601134777069e-06, 9.406358003616333e-06, 9.735114872455597e-06, 1.006387174129486e-05, 1.0392628610134125e-05, 1.0721385478973389e-05, 1.1050142347812653e-05, 1.1378899216651917e-05, 1.170765608549118e-05, 1.2036412954330444e-05, 1.2365169823169708e-05, 1.2693926692008972e-05, 1.3022683560848236e-05, 1.33514404296875e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 6.0, 4.0, 7.0, 11.0, 18.0, 31.0, 33.0, 59.0, 82.0, 130.0, 183.0, 273.0, 487.0, 808.0, 1484.0, 3369.0, 7941.0, 20290.0, 54557.0, 147394.0, 297044.0, 289253.0, 139351.0, 52170.0, 19050.0, 7520.0, 3320.0, 1574.0, 812.0, 467.0, 310.0, 145.0, 124.0, 70.0, 49.0, 35.0, 20.0, 22.0, 13.0, 4.0, 6.0, 5.0, 6.0, 3.0, 1.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01873779296875, -0.01815176010131836, -0.01756572723388672, -0.016979694366455078, -0.016393661499023438, -0.015807628631591797, -0.015221595764160156, -0.014635562896728516, -0.014049530029296875, -0.013463497161865234, -0.012877464294433594, -0.012291431427001953, -0.011705398559570312, -0.011119365692138672, -0.010533332824707031, -0.00994729995727539, -0.00936126708984375, -0.00877523422241211, -0.008189201354980469, -0.007603168487548828, -0.0070171356201171875, -0.006431102752685547, -0.005845069885253906, -0.005259037017822266, -0.004673004150390625, -0.004086971282958984, -0.0035009384155273438, -0.002914905548095703, -0.0023288726806640625, -0.0017428398132324219, -0.0011568069458007812, -0.0005707740783691406, 1.52587890625e-05, 0.0006012916564941406, 0.0011873245239257812, 0.0017733573913574219, 0.0023593902587890625, 0.002945423126220703, 0.0035314559936523438, 0.004117488861083984, 0.004703521728515625, 0.005289554595947266, 0.005875587463378906, 0.006461620330810547, 0.0070476531982421875, 0.007633686065673828, 0.008219718933105469, 0.00880575180053711, 0.00939178466796875, 0.00997781753540039, 0.010563850402832031, 0.011149883270263672, 0.011735916137695312, 0.012321949005126953, 0.012907981872558594, 0.013494014739990234, 0.014080047607421875, 0.014666080474853516, 0.015252113342285156, 0.015838146209716797, 0.016424179077148438, 0.017010211944580078, 0.01759624481201172, 0.01818227767944336, 0.018768310546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 5.0, 5.0, 4.0, 10.0, 18.0, 11.0, 18.0, 22.0, 27.0, 25.0, 42.0, 50.0, 45.0, 46.0, 55.0, 56.0, 61.0, 49.0, 54.0, 50.0, 68.0, 42.0, 26.0, 29.0, 25.0, 25.0, 27.0, 22.0, 16.0, 15.0, 11.0, 4.0, 11.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0057525634765625, -0.005561530590057373, -0.005370497703552246, -0.005179464817047119, -0.004988431930541992, -0.004797399044036865, -0.004606366157531738, -0.004415333271026611, -0.004224300384521484, -0.004033267498016357, -0.0038422346115112305, -0.0036512017250061035, -0.0034601688385009766, -0.0032691359519958496, -0.0030781030654907227, -0.0028870701789855957, -0.0026960372924804688, -0.002505004405975342, -0.002313971519470215, -0.002122938632965088, -0.001931905746459961, -0.001740872859954834, -0.001549839973449707, -0.00135880708694458, -0.0011677742004394531, -0.0009767413139343262, -0.0007857084274291992, -0.0005946755409240723, -0.0004036426544189453, -0.00021260976791381836, -2.1576881408691406e-05, 0.00016945600509643555, 0.0003604888916015625, 0.0005515217781066895, 0.0007425546646118164, 0.0009335875511169434, 0.0011246204376220703, 0.0013156533241271973, 0.0015066862106323242, 0.0016977190971374512, 0.0018887519836425781, 0.002079784870147705, 0.002270817756652832, 0.002461850643157959, 0.002652883529663086, 0.002843916416168213, 0.00303494930267334, 0.003225982189178467, 0.0034170150756835938, 0.0036080479621887207, 0.0037990808486938477, 0.003990113735198975, 0.0041811466217041016, 0.0043721795082092285, 0.0045632123947143555, 0.004754245281219482, 0.004945278167724609, 0.005136311054229736, 0.005327343940734863, 0.00551837682723999, 0.005709409713745117, 0.005900442600250244, 0.006091475486755371, 0.006282508373260498, 0.006473541259765625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 5.0, 10.0, 22.0, 43.0, 108.0, 238.0, 252.0, 183.0, 78.0, 30.0, 20.0, 9.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7442717552185059, -0.7094017267227173, -0.6745316386222839, -0.6396615505218506, -0.604791522026062, -0.5699214935302734, -0.5350514054298401, -0.5001813173294067, -0.46531128883361816, -0.4304412305355072, -0.39557117223739624, -0.3607011139392853, -0.3258310556411743, -0.29096099734306335, -0.2560909390449524, -0.22122088074684143, -0.18635082244873047, -0.1514807641506195, -0.11661070585250854, -0.08174064755439758, -0.04687058925628662, -0.01200053095817566, 0.022869527339935303, 0.057739585638046265, 0.09260964393615723, 0.1274797022342682, 0.16234976053237915, 0.1972198188304901, 0.23208987712860107, 0.26695993542671204, 0.301829993724823, 0.33670005202293396, 0.37156999111175537, 0.40644004940986633, 0.4413101077079773, 0.47618016600608826, 0.5110502243041992, 0.5459202527999878, 0.5807903409004211, 0.6156604290008545, 0.6505304574966431, 0.6854004859924316, 0.720270574092865, 0.7551406621932983, 0.7900106906890869, 0.8248807191848755, 0.8597508072853088, 0.8946208953857422, 0.9294909238815308, 0.9643609523773193, 0.9992310404777527, 1.034101128578186, 1.0689711570739746, 1.1038411855697632, 1.1387112140655518, 1.1735813617706299, 1.2084513902664185, 1.243321418762207, 1.2781915664672852, 1.3130615949630737, 1.3479316234588623, 1.3828016519546509, 1.4176716804504395, 1.4525418281555176, 1.4874118566513062]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 15.0, 10.0, 16.0, 17.0, 23.0, 30.0, 36.0, 57.0, 53.0, 53.0, 60.0, 61.0, 64.0, 54.0, 59.0, 65.0, 46.0, 58.0, 49.0, 30.0, 29.0, 34.0, 19.0, 15.0, 13.0, 7.0, 4.0, 8.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3560403883457184, -0.34330275654792786, -0.33056512475013733, -0.3178274929523468, -0.3050898611545563, -0.29235222935676575, -0.2796146273612976, -0.2668769955635071, -0.25413936376571655, -0.24140173196792603, -0.2286641001701355, -0.21592646837234497, -0.20318883657455444, -0.19045120477676392, -0.17771358788013458, -0.16497595608234406, -0.15223830938339233, -0.1395006775856018, -0.12676304578781128, -0.11402542144060135, -0.10128778964281082, -0.0885501578450203, -0.07581253349781036, -0.06307490170001984, -0.05033726990222931, -0.03759963810443878, -0.024862010031938553, -0.012124381959438324, 0.0006132498383522034, 0.01335088163614273, 0.02608850598335266, 0.03882613778114319, 0.05156373977661133, 0.06430137157440186, 0.07703900337219238, 0.08977662771940231, 0.10251425951719284, 0.11525189131498337, 0.1279895156621933, 0.14072714745998383, 0.15346477925777435, 0.16620241105556488, 0.1789400428533554, 0.19167765974998474, 0.20441529154777527, 0.2171529233455658, 0.22989055514335632, 0.24262818694114685, 0.2553658187389374, 0.2681034505367279, 0.28084108233451843, 0.29357871413230896, 0.3063163459300995, 0.31905397772789, 0.33179157972335815, 0.3445292115211487, 0.3572668433189392, 0.37000447511672974, 0.38274210691452026, 0.3954797387123108, 0.4082173705101013, 0.42095500230789185, 0.4336926341056824, 0.4464302659034729, 0.4591678977012634]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 4.0, 4.0, 12.0, 10.0, 12.0, 23.0, 17.0, 54.0, 56.0, 80.0, 140.0, 203.0, 293.0, 429.0, 678.0, 1136.0, 2028.0, 3539.0, 6731.0, 13703.0, 31930.0, 85351.0, 257311.0, 397036.0, 152016.0, 52730.0, 21625.0, 9914.0, 4799.0, 2746.0, 1450.0, 908.0, 519.0, 335.0, 255.0, 156.0, 92.0, 61.0, 35.0, 36.0, 22.0, 21.0, 13.0, 12.0, 5.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2183837890625, -0.2111682891845703, -0.20395278930664062, -0.19673728942871094, -0.18952178955078125, -0.18230628967285156, -0.17509078979492188, -0.1678752899169922, -0.1606597900390625, -0.1534442901611328, -0.14622879028320312, -0.13901329040527344, -0.13179779052734375, -0.12458229064941406, -0.11736679077148438, -0.11015129089355469, -0.102935791015625, -0.09572029113769531, -0.08850479125976562, -0.08128929138183594, -0.07407379150390625, -0.06685829162597656, -0.059642791748046875, -0.05242729187011719, -0.0452117919921875, -0.03799629211425781, -0.030780792236328125, -0.023565292358398438, -0.01634979248046875, -0.009134292602539062, -0.001918792724609375, 0.0052967071533203125, 0.01251220703125, 0.019727706909179688, 0.026943206787109375, 0.03415870666503906, 0.04137420654296875, 0.04858970642089844, 0.055805206298828125, 0.06302070617675781, 0.0702362060546875, 0.07745170593261719, 0.08466720581054688, 0.09188270568847656, 0.09909820556640625, 0.10631370544433594, 0.11352920532226562, 0.12074470520019531, 0.127960205078125, 0.1351757049560547, 0.14239120483398438, 0.14960670471191406, 0.15682220458984375, 0.16403770446777344, 0.17125320434570312, 0.1784687042236328, 0.1856842041015625, 0.1928997039794922, 0.20011520385742188, 0.20733070373535156, 0.21454620361328125, 0.22176170349121094, 0.22897720336914062, 0.2361927032470703, 0.243408203125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 12.0, 4.0, 15.0, 15.0, 16.0, 27.0, 37.0, 47.0, 49.0, 49.0, 50.0, 77.0, 64.0, 59.0, 62.0, 68.0, 57.0, 59.0, 42.0, 45.0, 36.0, 34.0, 20.0, 14.0, 14.0, 4.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7294921875, -0.7029266357421875, -0.676361083984375, -0.6497955322265625, -0.62322998046875, -0.5966644287109375, -0.570098876953125, -0.5435333251953125, -0.5169677734375, -0.4904022216796875, -0.463836669921875, -0.4372711181640625, -0.41070556640625, -0.3841400146484375, -0.357574462890625, -0.3310089111328125, -0.304443359375, -0.2778778076171875, -0.251312255859375, -0.2247467041015625, -0.19818115234375, -0.1716156005859375, -0.145050048828125, -0.1184844970703125, -0.0919189453125, -0.0653533935546875, -0.038787841796875, -0.0122222900390625, 0.01434326171875, 0.0409088134765625, 0.067474365234375, 0.0940399169921875, 0.12060546875, 0.1471710205078125, 0.173736572265625, 0.2003021240234375, 0.22686767578125, 0.2534332275390625, 0.279998779296875, 0.3065643310546875, 0.3331298828125, 0.3596954345703125, 0.386260986328125, 0.4128265380859375, 0.43939208984375, 0.4659576416015625, 0.492523193359375, 0.5190887451171875, 0.545654296875, 0.5722198486328125, 0.598785400390625, 0.6253509521484375, 0.65191650390625, 0.6784820556640625, 0.705047607421875, 0.7316131591796875, 0.7581787109375, 0.7847442626953125, 0.811309814453125, 0.8378753662109375, 0.86444091796875, 0.8910064697265625, 0.917572021484375, 0.9441375732421875, 0.970703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 2.0, 6.0, 2.0, 8.0, 9.0, 14.0, 13.0, 33.0, 26.0, 52.0, 67.0, 137.0, 175.0, 415.0, 1043.0, 3971.0, 28812.0, 667328.0, 325370.0, 16596.0, 2805.0, 799.0, 325.0, 180.0, 114.0, 61.0, 51.0, 33.0, 20.0, 19.0, 22.0, 15.0, 11.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.732421875, -0.71142578125, -0.6904296875, -0.66943359375, -0.6484375, -0.62744140625, -0.6064453125, -0.58544921875, -0.564453125, -0.54345703125, -0.5224609375, -0.50146484375, -0.48046875, -0.45947265625, -0.4384765625, -0.41748046875, -0.396484375, -0.37548828125, -0.3544921875, -0.33349609375, -0.3125, -0.29150390625, -0.2705078125, -0.24951171875, -0.228515625, -0.20751953125, -0.1865234375, -0.16552734375, -0.14453125, -0.12353515625, -0.1025390625, -0.08154296875, -0.060546875, -0.03955078125, -0.0185546875, 0.00244140625, 0.0234375, 0.04443359375, 0.0654296875, 0.08642578125, 0.107421875, 0.12841796875, 0.1494140625, 0.17041015625, 0.19140625, 0.21240234375, 0.2333984375, 0.25439453125, 0.275390625, 0.29638671875, 0.3173828125, 0.33837890625, 0.359375, 0.38037109375, 0.4013671875, 0.42236328125, 0.443359375, 0.46435546875, 0.4853515625, 0.50634765625, 0.52734375, 0.54833984375, 0.5693359375, 0.59033203125, 0.611328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 5.0, 9.0, 13.0, 14.0, 10.0, 16.0, 19.0, 14.0, 28.0, 23.0, 30.0, 27.0, 43.0, 27.0, 40.0, 39.0, 49.0, 54.0, 49.0, 28.0, 42.0, 28.0, 29.0, 45.0, 26.0, 33.0, 39.0, 27.0, 19.0, 30.0, 19.0, 20.0, 18.0, 15.0, 5.0, 11.0, 8.0, 6.0, 5.0, 4.0, 5.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65185546875, -0.6307601928710938, -0.6096649169921875, -0.5885696411132812, -0.567474365234375, -0.5463790893554688, -0.5252838134765625, -0.5041885375976562, -0.48309326171875, -0.46199798583984375, -0.4409027099609375, -0.41980743408203125, -0.398712158203125, -0.37761688232421875, -0.3565216064453125, -0.33542633056640625, -0.3143310546875, -0.29323577880859375, -0.2721405029296875, -0.25104522705078125, -0.229949951171875, -0.20885467529296875, -0.1877593994140625, -0.16666412353515625, -0.14556884765625, -0.12447357177734375, -0.1033782958984375, -0.08228302001953125, -0.061187744140625, -0.04009246826171875, -0.0189971923828125, 0.00209808349609375, 0.023193359375, 0.04428863525390625, 0.0653839111328125, 0.08647918701171875, 0.107574462890625, 0.12866973876953125, 0.1497650146484375, 0.17086029052734375, 0.19195556640625, 0.21305084228515625, 0.2341461181640625, 0.25524139404296875, 0.276336669921875, 0.29743194580078125, 0.3185272216796875, 0.33962249755859375, 0.3607177734375, 0.38181304931640625, 0.4029083251953125, 0.42400360107421875, 0.445098876953125, 0.46619415283203125, 0.4872894287109375, 0.5083847045898438, 0.52947998046875, 0.5505752563476562, 0.5716705322265625, 0.5927658081054688, 0.613861083984375, 0.6349563598632812, 0.6560516357421875, 0.6771469116210938, 0.6982421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 5.0, 4.0, 7.0, 9.0, 9.0, 17.0, 34.0, 38.0, 53.0, 113.0, 212.0, 515.0, 1319.0, 4510.0, 44514.0, 855820.0, 130851.0, 7546.0, 1743.0, 651.0, 287.0, 127.0, 67.0, 37.0, 24.0, 14.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27392578125, -0.26578521728515625, -0.2576446533203125, -0.24950408935546875, -0.241363525390625, -0.23322296142578125, -0.2250823974609375, -0.21694183349609375, -0.20880126953125, -0.20066070556640625, -0.1925201416015625, -0.18437957763671875, -0.176239013671875, -0.16809844970703125, -0.1599578857421875, -0.15181732177734375, -0.1436767578125, -0.13553619384765625, -0.1273956298828125, -0.11925506591796875, -0.111114501953125, -0.10297393798828125, -0.0948333740234375, -0.08669281005859375, -0.07855224609375, -0.07041168212890625, -0.0622711181640625, -0.05413055419921875, -0.045989990234375, -0.03784942626953125, -0.0297088623046875, -0.02156829833984375, -0.013427734375, -0.00528717041015625, 0.0028533935546875, 0.01099395751953125, 0.019134521484375, 0.02727508544921875, 0.0354156494140625, 0.04355621337890625, 0.05169677734375, 0.05983734130859375, 0.0679779052734375, 0.07611846923828125, 0.084259033203125, 0.09239959716796875, 0.1005401611328125, 0.10868072509765625, 0.1168212890625, 0.12496185302734375, 0.1331024169921875, 0.14124298095703125, 0.149383544921875, 0.15752410888671875, 0.1656646728515625, 0.17380523681640625, 0.18194580078125, 0.19008636474609375, 0.1982269287109375, 0.20636749267578125, 0.214508056640625, 0.22264862060546875, 0.2307891845703125, 0.23892974853515625, 0.2470703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 15.0, 28.0, 55.0, 137.0, 236.0, 249.0, 159.0, 72.0, 34.0, 9.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.848573684692383e-05, -6.668455898761749e-05, -6.488338112831116e-05, -6.308220326900482e-05, -6.128102540969849e-05, -5.947984755039215e-05, -5.7678669691085815e-05, -5.587749183177948e-05, -5.4076313972473145e-05, -5.227513611316681e-05, -5.0473958253860474e-05, -4.867278039455414e-05, -4.68716025352478e-05, -4.507042467594147e-05, -4.326924681663513e-05, -4.1468068957328796e-05, -3.966689109802246e-05, -3.7865713238716125e-05, -3.606453537940979e-05, -3.4263357520103455e-05, -3.246217966079712e-05, -3.0661001801490784e-05, -2.8859823942184448e-05, -2.7058646082878113e-05, -2.5257468223571777e-05, -2.3456290364265442e-05, -2.1655112504959106e-05, -1.985393464565277e-05, -1.8052756786346436e-05, -1.62515789270401e-05, -1.4450401067733765e-05, -1.264922320842743e-05, -1.0848045349121094e-05, -9.046867489814758e-06, -7.245689630508423e-06, -5.444511771202087e-06, -3.643333911895752e-06, -1.8421560525894165e-06, -4.0978193283081055e-08, 1.7601996660232544e-06, 3.56137752532959e-06, 5.362555384635925e-06, 7.163733243942261e-06, 8.964911103248596e-06, 1.0766088962554932e-05, 1.2567266821861267e-05, 1.4368444681167603e-05, 1.6169622540473938e-05, 1.7970800399780273e-05, 1.977197825908661e-05, 2.1573156118392944e-05, 2.337433397769928e-05, 2.5175511837005615e-05, 2.697668969631195e-05, 2.8777867555618286e-05, 3.057904541492462e-05, 3.238022327423096e-05, 3.418140113353729e-05, 3.598257899284363e-05, 3.778375685214996e-05, 3.95849347114563e-05, 4.1386112570762634e-05, 4.318729043006897e-05, 4.4988468289375305e-05, 4.678964614868164e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 3.0, 9.0, 19.0, 15.0, 36.0, 60.0, 157.0, 278.0, 669.0, 1657.0, 5664.0, 52290.0, 864274.0, 111860.0, 7885.0, 2104.0, 859.0, 367.0, 175.0, 71.0, 38.0, 23.0, 12.0, 10.0, 6.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265380859375, -0.2567100524902344, -0.24803924560546875, -0.23936843872070312, -0.2306976318359375, -0.22202682495117188, -0.21335601806640625, -0.20468521118164062, -0.196014404296875, -0.18734359741210938, -0.17867279052734375, -0.17000198364257812, -0.1613311767578125, -0.15266036987304688, -0.14398956298828125, -0.13531875610351562, -0.12664794921875, -0.11797714233398438, -0.10930633544921875, -0.10063552856445312, -0.0919647216796875, -0.08329391479492188, -0.07462310791015625, -0.06595230102539062, -0.057281494140625, -0.048610687255859375, -0.03993988037109375, -0.031269073486328125, -0.0225982666015625, -0.013927459716796875, -0.00525665283203125, 0.003414154052734375, 0.0120849609375, 0.020755767822265625, 0.02942657470703125, 0.038097381591796875, 0.0467681884765625, 0.055438995361328125, 0.06410980224609375, 0.07278060913085938, 0.081451416015625, 0.09012222290039062, 0.09879302978515625, 0.10746383666992188, 0.1161346435546875, 0.12480545043945312, 0.13347625732421875, 0.14214706420898438, 0.15081787109375, 0.15948867797851562, 0.16815948486328125, 0.17683029174804688, 0.1855010986328125, 0.19417190551757812, 0.20284271240234375, 0.21151351928710938, 0.220184326171875, 0.22885513305664062, 0.23752593994140625, 0.24619674682617188, 0.2548675537109375, 0.2635383605957031, 0.27220916748046875, 0.2808799743652344, 0.28955078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 5.0, 9.0, 17.0, 18.0, 25.0, 29.0, 48.0, 70.0, 57.0, 83.0, 116.0, 118.0, 86.0, 78.0, 59.0, 42.0, 39.0, 22.0, 26.0, 20.0, 10.0, 11.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06317138671875, -0.06114959716796875, -0.0591278076171875, -0.05710601806640625, -0.055084228515625, -0.05306243896484375, -0.0510406494140625, -0.04901885986328125, -0.0469970703125, -0.04497528076171875, -0.0429534912109375, -0.04093170166015625, -0.038909912109375, -0.03688812255859375, -0.0348663330078125, -0.03284454345703125, -0.03082275390625, -0.02880096435546875, -0.0267791748046875, -0.02475738525390625, -0.022735595703125, -0.02071380615234375, -0.0186920166015625, -0.01667022705078125, -0.0146484375, -0.01262664794921875, -0.0106048583984375, -0.00858306884765625, -0.006561279296875, -0.00453948974609375, -0.0025177001953125, -0.00049591064453125, 0.00152587890625, 0.00354766845703125, 0.0055694580078125, 0.00759124755859375, 0.009613037109375, 0.01163482666015625, 0.0136566162109375, 0.01567840576171875, 0.0177001953125, 0.01972198486328125, 0.0217437744140625, 0.02376556396484375, 0.025787353515625, 0.02780914306640625, 0.0298309326171875, 0.03185272216796875, 0.03387451171875, 0.03589630126953125, 0.0379180908203125, 0.03993988037109375, 0.041961669921875, 0.04398345947265625, 0.0460052490234375, 0.04802703857421875, 0.050048828125, 0.05207061767578125, 0.0540924072265625, 0.05611419677734375, 0.058135986328125, 0.06015777587890625, 0.0621795654296875, 0.06420135498046875, 0.06622314453125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 4.0, 3.0, 14.0, 30.0, 47.0, 95.0, 155.0, 186.0, 176.0, 118.0, 94.0, 25.0, 22.0, 16.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1412497758865356, -1.0889570713043213, -1.0366644859313965, -0.9843717813491821, -0.9320791363716125, -0.879786491394043, -0.8274937868118286, -0.775201141834259, -0.7229084968566895, -0.6706158518791199, -0.6183232069015503, -0.5660305023193359, -0.5137378573417664, -0.4614452123641968, -0.4091525375843048, -0.35685986280441284, -0.30456721782684326, -0.2522745728492737, -0.1999818980693817, -0.14768923819065094, -0.09539657831192017, -0.043103933334350586, 0.009188741445541382, 0.06148141622543335, 0.11377406120300293, 0.1660667210817337, 0.21835938096046448, 0.27065205574035645, 0.322944700717926, 0.3752373456954956, 0.4275300204753876, 0.47982269525527954, 0.5321152210235596, 0.5844078660011292, 0.6367005109786987, 0.6889932155609131, 0.7412858605384827, 0.7935785055160522, 0.8458712100982666, 0.8981638550758362, 0.9504565000534058, 1.0027492046356201, 1.055041790008545, 1.1073344945907593, 1.1596271991729736, 1.2119197845458984, 1.2642124891281128, 1.3165051937103271, 1.368797779083252, 1.4210904836654663, 1.4733830690383911, 1.5256757736206055, 1.5779683589935303, 1.6302610635757446, 1.682553768157959, 1.7348463535308838, 1.7871390581130981, 1.8394317626953125, 1.8917243480682373, 1.9440170526504517, 1.996309757232666, 2.048602342605591, 2.1008949279785156, 2.1531877517700195, 2.2054803371429443]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 5.0, 4.0, 10.0, 5.0, 10.0, 12.0, 15.0, 21.0, 30.0, 23.0, 20.0, 21.0, 27.0, 25.0, 35.0, 32.0, 36.0, 42.0, 42.0, 44.0, 41.0, 51.0, 43.0, 37.0, 41.0, 42.0, 32.0, 28.0, 29.0, 21.0, 23.0, 21.0, 17.0, 18.0, 12.0, 11.0, 10.0, 10.0, 13.0, 8.0, 3.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8651425838470459, -0.8339269757270813, -0.8027114272117615, -0.7714958190917969, -0.740280270576477, -0.7090646624565125, -0.6778490543365479, -0.646633505821228, -0.6154178977012634, -0.5842022895812988, -0.552986741065979, -0.5217711329460144, -0.4905555546283722, -0.45933997631073, -0.42812439799308777, -0.39690881967544556, -0.36569324135780334, -0.33447766304016113, -0.3032620847225189, -0.2720465064048767, -0.2408308982849121, -0.2096153199672699, -0.17839974164962769, -0.14718414843082428, -0.11596857011318207, -0.08475298434495926, -0.05353740230202675, -0.02232182025909424, 0.00889376550912857, 0.04010935127735138, 0.07132492959499359, 0.102540522813797, 0.1337561011314392, 0.16497167944908142, 0.19618727266788483, 0.22740285098552704, 0.25861844420433044, 0.28983402252197266, 0.32104960083961487, 0.3522651791572571, 0.3834807872772217, 0.4146963655948639, 0.4459119439125061, 0.4771275520324707, 0.5083431005477905, 0.5395587086677551, 0.5707743167877197, 0.6019898653030396, 0.6332054138183594, 0.664421021938324, 0.6956365704536438, 0.7268521785736084, 0.7580677270889282, 0.7892833352088928, 0.8204989433288574, 0.8517144918441772, 0.8829300999641418, 0.9141457080841064, 0.9453612565994263, 0.9765768647193909, 1.0077924728393555, 1.0390080213546753, 1.0702235698699951, 1.1014392375946045, 1.1326547861099243]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 11.0, 15.0, 19.0, 27.0, 48.0, 106.0, 232.0, 574.0, 1982.0, 8617.0, 186418.0, 3893197.0, 92337.0, 7390.0, 2071.0, 702.0, 271.0, 114.0, 61.0, 39.0, 9.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.669921875, -1.62530517578125, -1.5806884765625, -1.53607177734375, -1.491455078125, -1.44683837890625, -1.4022216796875, -1.35760498046875, -1.31298828125, -1.26837158203125, -1.2237548828125, -1.17913818359375, -1.134521484375, -1.08990478515625, -1.0452880859375, -1.00067138671875, -0.9560546875, -0.91143798828125, -0.8668212890625, -0.82220458984375, -0.777587890625, -0.73297119140625, -0.6883544921875, -0.64373779296875, -0.59912109375, -0.55450439453125, -0.5098876953125, -0.46527099609375, -0.420654296875, -0.37603759765625, -0.3314208984375, -0.28680419921875, -0.2421875, -0.19757080078125, -0.1529541015625, -0.10833740234375, -0.063720703125, -0.01910400390625, 0.0255126953125, 0.07012939453125, 0.11474609375, 0.15936279296875, 0.2039794921875, 0.24859619140625, 0.293212890625, 0.33782958984375, 0.3824462890625, 0.42706298828125, 0.4716796875, 0.51629638671875, 0.5609130859375, 0.60552978515625, 0.650146484375, 0.69476318359375, 0.7393798828125, 0.78399658203125, 0.82861328125, 0.87322998046875, 0.9178466796875, 0.96246337890625, 1.007080078125, 1.05169677734375, 1.0963134765625, 1.14093017578125, 1.185546875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 7.0, 3.0, 7.0, 9.0, 18.0, 23.0, 23.0, 36.0, 62.0, 57.0, 86.0, 70.0, 80.0, 91.0, 78.0, 68.0, 68.0, 52.0, 52.0, 30.0, 29.0, 19.0, 11.0, 8.0, 9.0, 1.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6904296875, -0.6718482971191406, -0.6532669067382812, -0.6346855163574219, -0.6161041259765625, -0.5975227355957031, -0.5789413452148438, -0.5603599548339844, -0.541778564453125, -0.5231971740722656, -0.5046157836914062, -0.4860343933105469, -0.4674530029296875, -0.4488716125488281, -0.43029022216796875, -0.4117088317871094, -0.39312744140625, -0.3745460510253906, -0.35596466064453125, -0.3373832702636719, -0.3188018798828125, -0.3002204895019531, -0.28163909912109375, -0.2630577087402344, -0.244476318359375, -0.22589492797851562, -0.20731353759765625, -0.18873214721679688, -0.1701507568359375, -0.15156936645507812, -0.13298797607421875, -0.11440658569335938, -0.0958251953125, -0.07724380493164062, -0.05866241455078125, -0.040081024169921875, -0.0214996337890625, -0.002918243408203125, 0.01566314697265625, 0.034244537353515625, 0.052825927734375, 0.07140731811523438, 0.08998870849609375, 0.10857009887695312, 0.1271514892578125, 0.14573287963867188, 0.16431427001953125, 0.18289566040039062, 0.20147705078125, 0.22005844116210938, 0.23863983154296875, 0.2572212219238281, 0.2758026123046875, 0.2943840026855469, 0.31296539306640625, 0.3315467834472656, 0.350128173828125, 0.3687095642089844, 0.38729095458984375, 0.4058723449707031, 0.4244537353515625, 0.4430351257324219, 0.46161651611328125, 0.4801979064941406, 0.498779296875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 11.0, 18.0, 34.0, 54.0, 92.0, 186.0, 403.0, 1019.0, 3279.0, 20414.0, 1273973.0, 2861047.0, 27864.0, 3698.0, 1153.0, 510.0, 205.0, 131.0, 72.0, 39.0, 17.0, 12.0, 9.0, 12.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80859375, -0.77020263671875, -0.7318115234375, -0.69342041015625, -0.655029296875, -0.61663818359375, -0.5782470703125, -0.53985595703125, -0.50146484375, -0.46307373046875, -0.4246826171875, -0.38629150390625, -0.347900390625, -0.30950927734375, -0.2711181640625, -0.23272705078125, -0.1943359375, -0.15594482421875, -0.1175537109375, -0.07916259765625, -0.040771484375, -0.00238037109375, 0.0360107421875, 0.07440185546875, 0.11279296875, 0.15118408203125, 0.1895751953125, 0.22796630859375, 0.266357421875, 0.30474853515625, 0.3431396484375, 0.38153076171875, 0.419921875, 0.45831298828125, 0.4967041015625, 0.53509521484375, 0.573486328125, 0.61187744140625, 0.6502685546875, 0.68865966796875, 0.72705078125, 0.76544189453125, 0.8038330078125, 0.84222412109375, 0.880615234375, 0.91900634765625, 0.9573974609375, 0.99578857421875, 1.0341796875, 1.07257080078125, 1.1109619140625, 1.14935302734375, 1.187744140625, 1.22613525390625, 1.2645263671875, 1.30291748046875, 1.34130859375, 1.37969970703125, 1.4180908203125, 1.45648193359375, 1.494873046875, 1.53326416015625, 1.5716552734375, 1.61004638671875, 1.6484375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 13.0, 12.0, 35.0, 34.0, 59.0, 79.0, 137.0, 267.0, 570.0, 937.0, 837.0, 460.0, 260.0, 127.0, 70.0, 50.0, 39.0, 20.0, 10.0, 12.0, 8.0, 11.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.275390625, -0.26791954040527344, -0.2604484558105469, -0.2529773712158203, -0.24550628662109375, -0.2380352020263672, -0.23056411743164062, -0.22309303283691406, -0.2156219482421875, -0.20815086364746094, -0.20067977905273438, -0.1932086944580078, -0.18573760986328125, -0.1782665252685547, -0.17079544067382812, -0.16332435607910156, -0.155853271484375, -0.14838218688964844, -0.14091110229492188, -0.1334400177001953, -0.12596893310546875, -0.11849784851074219, -0.11102676391601562, -0.10355567932128906, -0.0960845947265625, -0.08861351013183594, -0.08114242553710938, -0.07367134094238281, -0.06620025634765625, -0.05872917175292969, -0.051258087158203125, -0.04378700256347656, -0.03631591796875, -0.028844833374023438, -0.021373748779296875, -0.013902664184570312, -0.00643157958984375, 0.0010395050048828125, 0.008510589599609375, 0.015981674194335938, 0.0234527587890625, 0.030923843383789062, 0.038394927978515625, 0.04586601257324219, 0.05333709716796875, 0.06080818176269531, 0.06827926635742188, 0.07575035095214844, 0.083221435546875, 0.09069252014160156, 0.09816360473632812, 0.10563468933105469, 0.11310577392578125, 0.12057685852050781, 0.12804794311523438, 0.13551902770996094, 0.1429901123046875, 0.15046119689941406, 0.15793228149414062, 0.1654033660888672, 0.17287445068359375, 0.1803455352783203, 0.18781661987304688, 0.19528770446777344, 0.2027587890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 10.0, 15.0, 8.0, 38.0, 49.0, 71.0, 97.0, 131.0, 128.0, 125.0, 95.0, 73.0, 54.0, 35.0, 36.0, 11.0, 5.0, 10.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9480636119842529, -0.9206008315086365, -0.8931381106376648, -0.8656753301620483, -0.8382126092910767, -0.8107498288154602, -0.7832870483398438, -0.7558243274688721, -0.7283615469932556, -0.7008987665176392, -0.6734360456466675, -0.645973265171051, -0.6185104846954346, -0.5910477638244629, -0.5635849833488464, -0.53612220287323, -0.5086594820022583, -0.48119673132896423, -0.45373398065567017, -0.4262712001800537, -0.39880844950675964, -0.3713456988334656, -0.3438829183578491, -0.31642016768455505, -0.288957417011261, -0.2614946663379669, -0.23403190076351166, -0.2065691351890564, -0.17910638451576233, -0.15164363384246826, -0.124180868268013, -0.09671810269355774, -0.0692552924156189, -0.04179253429174423, -0.014329776167869568, 0.013132981956005096, 0.04059574007987976, 0.06805849075317383, 0.09552125632762909, 0.12298402190208435, 0.15044677257537842, 0.17790952324867249, 0.20537228882312775, 0.232835054397583, 0.2602978050708771, 0.28776055574417114, 0.3152233362197876, 0.34268608689308167, 0.37014883756637573, 0.3976115882396698, 0.42507433891296387, 0.4525371193885803, 0.4799998700618744, 0.5074626207351685, 0.5349254012107849, 0.5623881816864014, 0.589850902557373, 0.6173136830329895, 0.6447764039039612, 0.6722391843795776, 0.6997019052505493, 0.7271646857261658, 0.7546274662017822, 0.7820901870727539, 0.8095529675483704]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 3.0, 4.0, 7.0, 7.0, 12.0, 12.0, 14.0, 14.0, 23.0, 24.0, 31.0, 36.0, 27.0, 37.0, 47.0, 49.0, 32.0, 39.0, 39.0, 52.0, 46.0, 40.0, 36.0, 42.0, 48.0, 39.0, 33.0, 29.0, 22.0, 27.0, 28.0, 19.0, 12.0, 14.0, 7.0, 9.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3701837360858917, -0.3575890064239502, -0.3449942469596863, -0.33239951729774475, -0.3198047876358032, -0.3072100281715393, -0.2946152985095978, -0.28202056884765625, -0.26942580938339233, -0.2568310797214508, -0.2442363202571869, -0.23164159059524536, -0.21904684603214264, -0.20645210146903992, -0.1938573718070984, -0.18126262724399567, -0.16866788268089294, -0.15607313811779022, -0.1434783935546875, -0.13088366389274597, -0.11828891932964325, -0.10569417476654053, -0.0930994376540184, -0.08050470054149628, -0.06790995597839355, -0.05531521514058113, -0.04272047430276871, -0.030125733464956284, -0.01753099262714386, -0.004936248064041138, 0.0076584890484809875, 0.020253226161003113, 0.03284800052642822, 0.045442741364240646, 0.05803748220205307, 0.0706322193145752, 0.08322696387767792, 0.09582170844078064, 0.10841644555330276, 0.12101118266582489, 0.1336059272289276, 0.14620067179203033, 0.15879541635513306, 0.17139014601707458, 0.1839848905801773, 0.19657963514328003, 0.20917436480522156, 0.22176910936832428, 0.234363853931427, 0.24695859849452972, 0.25955334305763245, 0.272148072719574, 0.2847428321838379, 0.2973375618457794, 0.30993229150772095, 0.32252705097198486, 0.3351217806339264, 0.3477165102958679, 0.36031126976013184, 0.37290599942207336, 0.3855007290840149, 0.3980954885482788, 0.41069021821022034, 0.42328494787216187, 0.4358797073364258]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 2.0, 8.0, 11.0, 6.0, 12.0, 10.0, 22.0, 47.0, 72.0, 179.0, 398.0, 1140.0, 3326.0, 13795.0, 116139.0, 760696.0, 132414.0, 14623.0, 3654.0, 1187.0, 423.0, 159.0, 79.0, 40.0, 23.0, 13.0, 8.0, 10.0, 6.0, 12.0, 5.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.22705078125, -0.2206592559814453, -0.21426773071289062, -0.20787620544433594, -0.20148468017578125, -0.19509315490722656, -0.18870162963867188, -0.1823101043701172, -0.1759185791015625, -0.1695270538330078, -0.16313552856445312, -0.15674400329589844, -0.15035247802734375, -0.14396095275878906, -0.13756942749023438, -0.1311779022216797, -0.124786376953125, -0.11839485168457031, -0.11200332641601562, -0.10561180114746094, -0.09922027587890625, -0.09282875061035156, -0.08643722534179688, -0.08004570007324219, -0.0736541748046875, -0.06726264953613281, -0.060871124267578125, -0.05447959899902344, -0.04808807373046875, -0.04169654846191406, -0.035305023193359375, -0.028913497924804688, -0.02252197265625, -0.016130447387695312, -0.009738922119140625, -0.0033473968505859375, 0.00304412841796875, 0.009435653686523438, 0.015827178955078125, 0.022218704223632812, 0.0286102294921875, 0.03500175476074219, 0.041393280029296875, 0.04778480529785156, 0.05417633056640625, 0.06056785583496094, 0.06695938110351562, 0.07335090637207031, 0.079742431640625, 0.08613395690917969, 0.09252548217773438, 0.09891700744628906, 0.10530853271484375, 0.11170005798339844, 0.11809158325195312, 0.12448310852050781, 0.1308746337890625, 0.1372661590576172, 0.14365768432617188, 0.15004920959472656, 0.15644073486328125, 0.16283226013183594, 0.16922378540039062, 0.1756153106689453, 0.1820068359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 11.0, 6.0, 7.0, 16.0, 15.0, 17.0, 23.0, 44.0, 48.0, 44.0, 47.0, 61.0, 58.0, 45.0, 63.0, 59.0, 56.0, 55.0, 43.0, 47.0, 43.0, 36.0, 35.0, 31.0, 18.0, 13.0, 8.0, 9.0, 8.0, 6.0, 6.0, 4.0, 7.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26025390625, -0.24976348876953125, -0.2392730712890625, -0.22878265380859375, -0.218292236328125, -0.20780181884765625, -0.1973114013671875, -0.18682098388671875, -0.17633056640625, -0.16584014892578125, -0.1553497314453125, -0.14485931396484375, -0.134368896484375, -0.12387847900390625, -0.1133880615234375, -0.10289764404296875, -0.0924072265625, -0.08191680908203125, -0.0714263916015625, -0.06093597412109375, -0.050445556640625, -0.03995513916015625, -0.0294647216796875, -0.01897430419921875, -0.00848388671875, 0.00200653076171875, 0.0124969482421875, 0.02298736572265625, 0.033477783203125, 0.04396820068359375, 0.0544586181640625, 0.06494903564453125, 0.075439453125, 0.08592987060546875, 0.0964202880859375, 0.10691070556640625, 0.117401123046875, 0.12789154052734375, 0.1383819580078125, 0.14887237548828125, 0.15936279296875, 0.16985321044921875, 0.1803436279296875, 0.19083404541015625, 0.201324462890625, 0.21181488037109375, 0.2223052978515625, 0.23279571533203125, 0.2432861328125, 0.25377655029296875, 0.2642669677734375, 0.27475738525390625, 0.285247802734375, 0.29573822021484375, 0.3062286376953125, 0.31671905517578125, 0.32720947265625, 0.33769989013671875, 0.3481903076171875, 0.35868072509765625, 0.369171142578125, 0.37966156005859375, 0.3901519775390625, 0.40064239501953125, 0.4111328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 11.0, 21.0, 22.0, 31.0, 40.0, 75.0, 102.0, 143.0, 235.0, 366.0, 660.0, 1043.0, 1929.0, 3981.0, 9011.0, 24622.0, 88070.0, 315246.0, 409046.0, 135251.0, 35914.0, 11889.0, 5031.0, 2474.0, 1300.0, 747.0, 460.0, 275.0, 189.0, 116.0, 66.0, 60.0, 38.0, 23.0, 19.0, 11.0, 7.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.088043212890625, -0.08538818359375, -0.082733154296875, -0.080078125, -0.077423095703125, -0.07476806640625, -0.072113037109375, -0.0694580078125, -0.066802978515625, -0.06414794921875, -0.061492919921875, -0.058837890625, -0.056182861328125, -0.05352783203125, -0.050872802734375, -0.0482177734375, -0.045562744140625, -0.04290771484375, -0.040252685546875, -0.03759765625, -0.034942626953125, -0.03228759765625, -0.029632568359375, -0.0269775390625, -0.024322509765625, -0.02166748046875, -0.019012451171875, -0.016357421875, -0.013702392578125, -0.01104736328125, -0.008392333984375, -0.0057373046875, -0.003082275390625, -0.00042724609375, 0.002227783203125, 0.0048828125, 0.007537841796875, 0.01019287109375, 0.012847900390625, 0.0155029296875, 0.018157958984375, 0.02081298828125, 0.023468017578125, 0.026123046875, 0.028778076171875, 0.03143310546875, 0.034088134765625, 0.0367431640625, 0.039398193359375, 0.04205322265625, 0.044708251953125, 0.04736328125, 0.050018310546875, 0.05267333984375, 0.055328369140625, 0.0579833984375, 0.060638427734375, 0.06329345703125, 0.065948486328125, 0.068603515625, 0.071258544921875, 0.07391357421875, 0.076568603515625, 0.0792236328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 3.0, 8.0, 10.0, 17.0, 19.0, 11.0, 18.0, 18.0, 27.0, 27.0, 25.0, 46.0, 46.0, 43.0, 51.0, 51.0, 36.0, 46.0, 46.0, 43.0, 33.0, 40.0, 46.0, 48.0, 37.0, 41.0, 31.0, 22.0, 16.0, 17.0, 19.0, 11.0, 6.0, 5.0, 9.0, 6.0, 3.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.583984375, -0.566680908203125, -0.54937744140625, -0.532073974609375, -0.5147705078125, -0.497467041015625, -0.48016357421875, -0.462860107421875, -0.445556640625, -0.428253173828125, -0.41094970703125, -0.393646240234375, -0.3763427734375, -0.359039306640625, -0.34173583984375, -0.324432373046875, -0.30712890625, -0.289825439453125, -0.27252197265625, -0.255218505859375, -0.2379150390625, -0.220611572265625, -0.20330810546875, -0.186004638671875, -0.168701171875, -0.151397705078125, -0.13409423828125, -0.116790771484375, -0.0994873046875, -0.082183837890625, -0.06488037109375, -0.047576904296875, -0.0302734375, -0.012969970703125, 0.00433349609375, 0.021636962890625, 0.0389404296875, 0.056243896484375, 0.07354736328125, 0.090850830078125, 0.108154296875, 0.125457763671875, 0.14276123046875, 0.160064697265625, 0.1773681640625, 0.194671630859375, 0.21197509765625, 0.229278564453125, 0.24658203125, 0.263885498046875, 0.28118896484375, 0.298492431640625, 0.3157958984375, 0.333099365234375, 0.35040283203125, 0.367706298828125, 0.385009765625, 0.402313232421875, 0.41961669921875, 0.436920166015625, 0.4542236328125, 0.471527099609375, 0.48883056640625, 0.506134033203125, 0.5234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 16.0, 14.0, 33.0, 43.0, 54.0, 81.0, 131.0, 214.0, 382.0, 677.0, 1378.0, 2977.0, 7206.0, 21174.0, 94362.0, 424977.0, 383616.0, 80181.0, 18870.0, 6431.0, 2801.0, 1325.0, 670.0, 379.0, 202.0, 120.0, 74.0, 45.0, 40.0, 13.0, 17.0, 8.0, 9.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0294647216796875, -0.02851271629333496, -0.027560710906982422, -0.026608705520629883, -0.025656700134277344, -0.024704694747924805, -0.023752689361572266, -0.022800683975219727, -0.021848678588867188, -0.02089667320251465, -0.01994466781616211, -0.01899266242980957, -0.01804065704345703, -0.017088651657104492, -0.016136646270751953, -0.015184640884399414, -0.014232635498046875, -0.013280630111694336, -0.012328624725341797, -0.011376619338989258, -0.010424613952636719, -0.00947260856628418, -0.00852060317993164, -0.0075685977935791016, -0.0066165924072265625, -0.0056645870208740234, -0.004712581634521484, -0.0037605762481689453, -0.0028085708618164062, -0.0018565654754638672, -0.0009045600891113281, 4.744529724121094e-05, 0.00099945068359375, 0.001951456069946289, 0.002903461456298828, 0.003855466842651367, 0.004807472229003906, 0.005759477615356445, 0.006711483001708984, 0.0076634883880615234, 0.008615493774414062, 0.009567499160766602, 0.01051950454711914, 0.01147150993347168, 0.012423515319824219, 0.013375520706176758, 0.014327526092529297, 0.015279531478881836, 0.016231536865234375, 0.017183542251586914, 0.018135547637939453, 0.019087553024291992, 0.02003955841064453, 0.02099156379699707, 0.02194356918334961, 0.02289557456970215, 0.023847579956054688, 0.024799585342407227, 0.025751590728759766, 0.026703596115112305, 0.027655601501464844, 0.028607606887817383, 0.029559612274169922, 0.03051161766052246, 0.031463623046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 11.0, 6.0, 17.0, 18.0, 32.0, 44.0, 52.0, 70.0, 95.0, 134.0, 113.0, 105.0, 69.0, 70.0, 41.0, 31.0, 27.0, 18.0, 5.0, 9.0, 5.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5139579772949219e-05, -1.4603137969970703e-05, -1.4066696166992188e-05, -1.3530254364013672e-05, -1.2993812561035156e-05, -1.245737075805664e-05, -1.1920928955078125e-05, -1.138448715209961e-05, -1.0848045349121094e-05, -1.0311603546142578e-05, -9.775161743164062e-06, -9.238719940185547e-06, -8.702278137207031e-06, -8.165836334228516e-06, -7.62939453125e-06, -7.092952728271484e-06, -6.556510925292969e-06, -6.020069122314453e-06, -5.4836273193359375e-06, -4.947185516357422e-06, -4.410743713378906e-06, -3.874301910400391e-06, -3.337860107421875e-06, -2.8014183044433594e-06, -2.2649765014648438e-06, -1.7285346984863281e-06, -1.1920928955078125e-06, -6.556510925292969e-07, -1.1920928955078125e-07, 4.172325134277344e-07, 9.5367431640625e-07, 1.4901161193847656e-06, 2.0265579223632812e-06, 2.562999725341797e-06, 3.0994415283203125e-06, 3.635883331298828e-06, 4.172325134277344e-06, 4.708766937255859e-06, 5.245208740234375e-06, 5.781650543212891e-06, 6.318092346191406e-06, 6.854534149169922e-06, 7.3909759521484375e-06, 7.927417755126953e-06, 8.463859558105469e-06, 9.000301361083984e-06, 9.5367431640625e-06, 1.0073184967041016e-05, 1.0609626770019531e-05, 1.1146068572998047e-05, 1.1682510375976562e-05, 1.2218952178955078e-05, 1.2755393981933594e-05, 1.329183578491211e-05, 1.3828277587890625e-05, 1.436471939086914e-05, 1.4901161193847656e-05, 1.5437602996826172e-05, 1.5974044799804688e-05, 1.6510486602783203e-05, 1.704692840576172e-05, 1.7583370208740234e-05, 1.811981201171875e-05, 1.8656253814697266e-05, 1.919269561767578e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 10.0, 24.0, 34.0, 49.0, 77.0, 133.0, 215.0, 366.0, 668.0, 1070.0, 1974.0, 4146.0, 9310.0, 27832.0, 109755.0, 400573.0, 359966.0, 91702.0, 24346.0, 8333.0, 3600.0, 1830.0, 999.0, 618.0, 379.0, 203.0, 126.0, 72.0, 41.0, 33.0, 21.0, 13.0, 9.0, 8.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0360107421875, -0.03506159782409668, -0.03411245346069336, -0.03316330909729004, -0.03221416473388672, -0.0312650203704834, -0.030315876007080078, -0.029366731643676758, -0.028417587280273438, -0.027468442916870117, -0.026519298553466797, -0.025570154190063477, -0.024621009826660156, -0.023671865463256836, -0.022722721099853516, -0.021773576736450195, -0.020824432373046875, -0.019875288009643555, -0.018926143646240234, -0.017976999282836914, -0.017027854919433594, -0.016078710556030273, -0.015129566192626953, -0.014180421829223633, -0.013231277465820312, -0.012282133102416992, -0.011332988739013672, -0.010383844375610352, -0.009434700012207031, -0.008485555648803711, -0.007536411285400391, -0.00658726692199707, -0.00563812255859375, -0.00468897819519043, -0.0037398338317871094, -0.002790689468383789, -0.0018415451049804688, -0.0008924007415771484, 5.6743621826171875e-05, 0.0010058879852294922, 0.0019550323486328125, 0.002904176712036133, 0.003853321075439453, 0.0048024654388427734, 0.005751609802246094, 0.006700754165649414, 0.007649898529052734, 0.008599042892456055, 0.009548187255859375, 0.010497331619262695, 0.011446475982666016, 0.012395620346069336, 0.013344764709472656, 0.014293909072875977, 0.015243053436279297, 0.016192197799682617, 0.017141342163085938, 0.018090486526489258, 0.019039630889892578, 0.0199887752532959, 0.02093791961669922, 0.02188706398010254, 0.02283620834350586, 0.02378535270690918, 0.0247344970703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 8.0, 6.0, 11.0, 3.0, 11.0, 18.0, 16.0, 33.0, 36.0, 57.0, 53.0, 67.0, 77.0, 72.0, 69.0, 81.0, 57.0, 61.0, 47.0, 41.0, 33.0, 30.0, 27.0, 21.0, 12.0, 9.0, 3.0, 8.0, 3.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.008331298828125, -0.008081316947937012, -0.007831335067749023, -0.007581353187561035, -0.007331371307373047, -0.007081389427185059, -0.00683140754699707, -0.006581425666809082, -0.006331443786621094, -0.0060814619064331055, -0.005831480026245117, -0.005581498146057129, -0.005331516265869141, -0.005081534385681152, -0.004831552505493164, -0.004581570625305176, -0.0043315887451171875, -0.004081606864929199, -0.003831624984741211, -0.0035816431045532227, -0.0033316612243652344, -0.003081679344177246, -0.002831697463989258, -0.0025817155838012695, -0.0023317337036132812, -0.002081751823425293, -0.0018317699432373047, -0.0015817880630493164, -0.0013318061828613281, -0.0010818243026733398, -0.0008318424224853516, -0.0005818605422973633, -0.000331878662109375, -8.189678192138672e-05, 0.00016808509826660156, 0.00041806697845458984, 0.0006680488586425781, 0.0009180307388305664, 0.0011680126190185547, 0.001417994499206543, 0.0016679763793945312, 0.0019179582595825195, 0.002167940139770508, 0.002417922019958496, 0.0026679039001464844, 0.0029178857803344727, 0.003167867660522461, 0.0034178495407104492, 0.0036678314208984375, 0.003917813301086426, 0.004167795181274414, 0.004417777061462402, 0.004667758941650391, 0.004917740821838379, 0.005167722702026367, 0.0054177045822143555, 0.005667686462402344, 0.005917668342590332, 0.00616765022277832, 0.006417632102966309, 0.006667613983154297, 0.006917595863342285, 0.0071675777435302734, 0.007417559623718262, 0.00766754150390625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 11.0, 34.0, 65.0, 145.0, 214.0, 238.0, 153.0, 79.0, 35.0, 12.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.691898763179779, -0.6619037985801697, -0.6319088339805603, -0.6019138693809509, -0.5719189047813416, -0.5419239401817322, -0.5119289755821228, -0.4819340109825134, -0.45193904638290405, -0.4219440817832947, -0.3919491171836853, -0.3619541525840759, -0.33195918798446655, -0.3019642233848572, -0.2719692587852478, -0.24197429418563843, -0.21197932958602905, -0.18198436498641968, -0.1519894003868103, -0.12199443578720093, -0.09199947118759155, -0.06200450658798218, -0.0320095419883728, -0.0020145773887634277, 0.027980387210845947, 0.05797535181045532, 0.0879703164100647, 0.11796528100967407, 0.14796024560928345, 0.17795521020889282, 0.2079501748085022, 0.23794513940811157, 0.2679401636123657, 0.2979351282119751, 0.3279300928115845, 0.35792505741119385, 0.3879200220108032, 0.4179149866104126, 0.447909951210022, 0.47790491580963135, 0.5078998804092407, 0.5378948450088501, 0.5678898096084595, 0.5978847742080688, 0.6278797388076782, 0.6578747034072876, 0.687869668006897, 0.7178646326065063, 0.7478595972061157, 0.7778545618057251, 0.8078495264053345, 0.8378444910049438, 0.8678394556045532, 0.8978344202041626, 0.927829384803772, 0.9578243494033813, 0.9878193140029907, 1.0178142786026, 1.0478092432022095, 1.0778042078018188, 1.1077991724014282, 1.1377941370010376, 1.167789101600647, 1.1977840662002563, 1.2277790307998657]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 6.0, 9.0, 13.0, 10.0, 12.0, 19.0, 21.0, 23.0, 47.0, 37.0, 28.0, 45.0, 65.0, 42.0, 46.0, 60.0, 56.0, 52.0, 40.0, 52.0, 47.0, 49.0, 35.0, 38.0, 29.0, 24.0, 14.0, 22.0, 7.0, 7.0, 8.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2623453438282013, -0.2529442012310028, -0.24354302883148193, -0.23414188623428345, -0.22474072873592377, -0.2153395712375641, -0.2059384137392044, -0.19653725624084473, -0.18713611364364624, -0.17773495614528656, -0.16833379864692688, -0.1589326560497284, -0.1495314985513687, -0.14013034105300903, -0.13072918355464935, -0.12132803350687027, -0.11192686855792999, -0.10252571105957031, -0.09312456101179123, -0.08372340351343155, -0.07432225346565247, -0.06492109596729279, -0.055519938468933105, -0.04611878842115402, -0.03671763092279434, -0.02731647714972496, -0.01791532151401043, -0.008514165878295898, 0.0008869878947734833, 0.010288141667842865, 0.019689299166202545, 0.02909044921398163, 0.03849160671234131, 0.04789276048541069, 0.05729391425848007, 0.06669507175683975, 0.07609622180461884, 0.08549737930297852, 0.0948985368013382, 0.10429968684911728, 0.11370084434747696, 0.12310200184583664, 0.13250315189361572, 0.1419043093919754, 0.15130546689033508, 0.16070660948753357, 0.17010778188705444, 0.17950892448425293, 0.1889100819826126, 0.1983112394809723, 0.20771239697933197, 0.21711355447769165, 0.22651469707489014, 0.23591585457324982, 0.2453170120716095, 0.254718154668808, 0.26411932706832886, 0.27352046966552734, 0.2829216420650482, 0.2923227846622467, 0.3017239570617676, 0.31112509965896606, 0.32052624225616455, 0.3299274146556854, 0.3393285572528839]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 7.0, 8.0, 7.0, 4.0, 14.0, 44.0, 54.0, 85.0, 149.0, 268.0, 568.0, 1301.0, 3526.0, 11035.0, 43254.0, 342061.0, 569590.0, 55920.0, 13728.0, 4134.0, 1447.0, 611.0, 298.0, 175.0, 95.0, 62.0, 27.0, 20.0, 19.0, 16.0, 5.0, 10.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.50244140625, -0.4888916015625, -0.475341796875, -0.4617919921875, -0.4482421875, -0.4346923828125, -0.421142578125, -0.4075927734375, -0.39404296875, -0.3804931640625, -0.366943359375, -0.3533935546875, -0.33984375, -0.3262939453125, -0.312744140625, -0.2991943359375, -0.28564453125, -0.2720947265625, -0.258544921875, -0.2449951171875, -0.2314453125, -0.2178955078125, -0.204345703125, -0.1907958984375, -0.17724609375, -0.1636962890625, -0.150146484375, -0.1365966796875, -0.123046875, -0.1094970703125, -0.095947265625, -0.0823974609375, -0.06884765625, -0.0552978515625, -0.041748046875, -0.0281982421875, -0.0146484375, -0.0010986328125, 0.012451171875, 0.0260009765625, 0.03955078125, 0.0531005859375, 0.066650390625, 0.0802001953125, 0.09375, 0.1072998046875, 0.120849609375, 0.1343994140625, 0.14794921875, 0.1614990234375, 0.175048828125, 0.1885986328125, 0.2021484375, 0.2156982421875, 0.229248046875, 0.2427978515625, 0.25634765625, 0.2698974609375, 0.283447265625, 0.2969970703125, 0.310546875, 0.3240966796875, 0.337646484375, 0.3511962890625, 0.36474609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 1.0, 6.0, 7.0, 11.0, 9.0, 15.0, 26.0, 13.0, 36.0, 34.0, 30.0, 37.0, 46.0, 37.0, 44.0, 57.0, 53.0, 51.0, 58.0, 48.0, 52.0, 57.0, 37.0, 53.0, 37.0, 17.0, 22.0, 19.0, 12.0, 16.0, 14.0, 6.0, 5.0, 10.0, 5.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5498046875, -0.5316925048828125, -0.513580322265625, -0.4954681396484375, -0.47735595703125, -0.4592437744140625, -0.441131591796875, -0.4230194091796875, -0.4049072265625, -0.3867950439453125, -0.368682861328125, -0.3505706787109375, -0.33245849609375, -0.3143463134765625, -0.296234130859375, -0.2781219482421875, -0.260009765625, -0.2418975830078125, -0.223785400390625, -0.2056732177734375, -0.18756103515625, -0.1694488525390625, -0.151336669921875, -0.1332244873046875, -0.1151123046875, -0.0970001220703125, -0.078887939453125, -0.0607757568359375, -0.04266357421875, -0.0245513916015625, -0.006439208984375, 0.0116729736328125, 0.02978515625, 0.0478973388671875, 0.066009521484375, 0.0841217041015625, 0.10223388671875, 0.1203460693359375, 0.138458251953125, 0.1565704345703125, 0.1746826171875, 0.1927947998046875, 0.210906982421875, 0.2290191650390625, 0.24713134765625, 0.2652435302734375, 0.283355712890625, 0.3014678955078125, 0.319580078125, 0.3376922607421875, 0.355804443359375, 0.3739166259765625, 0.39202880859375, 0.4101409912109375, 0.428253173828125, 0.4463653564453125, 0.4644775390625, 0.4825897216796875, 0.500701904296875, 0.5188140869140625, 0.53692626953125, 0.5550384521484375, 0.573150634765625, 0.5912628173828125, 0.609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 6.0, 6.0, 4.0, 6.0, 7.0, 10.0, 9.0, 12.0, 13.0, 12.0, 19.0, 23.0, 36.0, 42.0, 69.0, 71.0, 116.0, 158.0, 290.0, 605.0, 1836.0, 11212.0, 225697.0, 783161.0, 20809.0, 2648.0, 695.0, 321.0, 183.0, 131.0, 88.0, 59.0, 41.0, 33.0, 25.0, 22.0, 17.0, 21.0, 20.0, 6.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6583709716796875, -0.632171630859375, -0.6059722900390625, -0.57977294921875, -0.5535736083984375, -0.527374267578125, -0.5011749267578125, -0.4749755859375, -0.4487762451171875, -0.422576904296875, -0.3963775634765625, -0.37017822265625, -0.3439788818359375, -0.317779541015625, -0.2915802001953125, -0.265380859375, -0.2391815185546875, -0.212982177734375, -0.1867828369140625, -0.16058349609375, -0.1343841552734375, -0.108184814453125, -0.0819854736328125, -0.0557861328125, -0.0295867919921875, -0.003387451171875, 0.0228118896484375, 0.04901123046875, 0.0752105712890625, 0.101409912109375, 0.1276092529296875, 0.15380859375, 0.1800079345703125, 0.206207275390625, 0.2324066162109375, 0.25860595703125, 0.2848052978515625, 0.311004638671875, 0.3372039794921875, 0.3634033203125, 0.3896026611328125, 0.415802001953125, 0.4420013427734375, 0.46820068359375, 0.4944000244140625, 0.520599365234375, 0.5467987060546875, 0.572998046875, 0.5991973876953125, 0.625396728515625, 0.6515960693359375, 0.67779541015625, 0.7039947509765625, 0.730194091796875, 0.7563934326171875, 0.7825927734375, 0.8087921142578125, 0.834991455078125, 0.8611907958984375, 0.88739013671875, 0.9135894775390625, 0.939788818359375, 0.9659881591796875, 0.9921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 8.0, 3.0, 7.0, 14.0, 12.0, 15.0, 10.0, 15.0, 13.0, 21.0, 26.0, 30.0, 26.0, 44.0, 28.0, 38.0, 55.0, 45.0, 67.0, 63.0, 41.0, 46.0, 45.0, 45.0, 32.0, 37.0, 35.0, 21.0, 31.0, 16.0, 19.0, 20.0, 21.0, 17.0, 7.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.578125, -0.557525634765625, -0.53692626953125, -0.516326904296875, -0.4957275390625, -0.475128173828125, -0.45452880859375, -0.433929443359375, -0.413330078125, -0.392730712890625, -0.37213134765625, -0.351531982421875, -0.3309326171875, -0.310333251953125, -0.28973388671875, -0.269134521484375, -0.24853515625, -0.227935791015625, -0.20733642578125, -0.186737060546875, -0.1661376953125, -0.145538330078125, -0.12493896484375, -0.104339599609375, -0.083740234375, -0.063140869140625, -0.04254150390625, -0.021942138671875, -0.0013427734375, 0.019256591796875, 0.03985595703125, 0.060455322265625, 0.0810546875, 0.101654052734375, 0.12225341796875, 0.142852783203125, 0.1634521484375, 0.184051513671875, 0.20465087890625, 0.225250244140625, 0.245849609375, 0.266448974609375, 0.28704833984375, 0.307647705078125, 0.3282470703125, 0.348846435546875, 0.36944580078125, 0.390045166015625, 0.41064453125, 0.431243896484375, 0.45184326171875, 0.472442626953125, 0.4930419921875, 0.513641357421875, 0.53424072265625, 0.554840087890625, 0.575439453125, 0.596038818359375, 0.61663818359375, 0.637237548828125, 0.6578369140625, 0.678436279296875, 0.69903564453125, 0.719635009765625, 0.740234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 13.0, 18.0, 20.0, 34.0, 56.0, 113.0, 183.0, 382.0, 987.0, 5579.0, 634468.0, 399931.0, 4978.0, 979.0, 368.0, 182.0, 97.0, 61.0, 25.0, 28.0, 15.0, 9.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.55224609375, -0.5396881103515625, -0.527130126953125, -0.5145721435546875, -0.50201416015625, -0.4894561767578125, -0.476898193359375, -0.4643402099609375, -0.4517822265625, -0.4392242431640625, -0.426666259765625, -0.4141082763671875, -0.40155029296875, -0.3889923095703125, -0.376434326171875, -0.3638763427734375, -0.351318359375, -0.3387603759765625, -0.326202392578125, -0.3136444091796875, -0.30108642578125, -0.2885284423828125, -0.275970458984375, -0.2634124755859375, -0.2508544921875, -0.2382965087890625, -0.225738525390625, -0.2131805419921875, -0.20062255859375, -0.1880645751953125, -0.175506591796875, -0.1629486083984375, -0.150390625, -0.1378326416015625, -0.125274658203125, -0.1127166748046875, -0.10015869140625, -0.0876007080078125, -0.075042724609375, -0.0624847412109375, -0.0499267578125, -0.0373687744140625, -0.024810791015625, -0.0122528076171875, 0.00030517578125, 0.0128631591796875, 0.025421142578125, 0.0379791259765625, 0.050537109375, 0.0630950927734375, 0.075653076171875, 0.0882110595703125, 0.10076904296875, 0.1133270263671875, 0.125885009765625, 0.1384429931640625, 0.1510009765625, 0.1635589599609375, 0.176116943359375, 0.1886749267578125, 0.20123291015625, 0.2137908935546875, 0.226348876953125, 0.2389068603515625, 0.25146484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 14.0, 20.0, 69.0, 218.0, 505.0, 115.0, 41.0, 11.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001373291015625, -0.00013459939509630203, -0.00013186968863010406, -0.0001291399821639061, -0.00012641027569770813, -0.00012368056923151016, -0.0001209508627653122, -0.00011822115629911423, -0.00011549144983291626, -0.00011276174336671829, -0.00011003203690052032, -0.00010730233043432236, -0.00010457262396812439, -0.00010184291750192642, -9.911321103572845e-05, -9.638350456953049e-05, -9.365379810333252e-05, -9.092409163713455e-05, -8.819438517093658e-05, -8.546467870473862e-05, -8.273497223854065e-05, -8.000526577234268e-05, -7.727555930614471e-05, -7.454585283994675e-05, -7.181614637374878e-05, -6.908643990755081e-05, -6.635673344135284e-05, -6.362702697515488e-05, -6.089732050895691e-05, -5.816761404275894e-05, -5.5437907576560974e-05, -5.2708201110363007e-05, -4.997849464416504e-05, -4.724878817796707e-05, -4.4519081711769104e-05, -4.1789375245571136e-05, -3.905966877937317e-05, -3.63299623131752e-05, -3.3600255846977234e-05, -3.0870549380779266e-05, -2.81408429145813e-05, -2.541113644838333e-05, -2.2681429982185364e-05, -1.9951723515987396e-05, -1.722201704978943e-05, -1.4492310583591461e-05, -1.1762604117393494e-05, -9.032897651195526e-06, -6.303191184997559e-06, -3.573484718799591e-06, -8.437782526016235e-07, 1.885928213596344e-06, 4.6156346797943115e-06, 7.345341145992279e-06, 1.0075047612190247e-05, 1.2804754078388214e-05, 1.553446054458618e-05, 1.826416701078415e-05, 2.0993873476982117e-05, 2.3723579943180084e-05, 2.6453286409378052e-05, 2.918299287557602e-05, 3.191269934177399e-05, 3.4642405807971954e-05, 3.737211227416992e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 10.0, 34.0, 53.0, 130.0, 300.0, 1018.0, 11944.0, 1021441.0, 12082.0, 1028.0, 276.0, 105.0, 56.0, 28.0, 23.0, 11.0, 7.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54248046875, -0.5220108032226562, -0.5015411376953125, -0.48107147216796875, -0.460601806640625, -0.44013214111328125, -0.4196624755859375, -0.39919281005859375, -0.37872314453125, -0.35825347900390625, -0.3377838134765625, -0.31731414794921875, -0.296844482421875, -0.27637481689453125, -0.2559051513671875, -0.23543548583984375, -0.2149658203125, -0.19449615478515625, -0.1740264892578125, -0.15355682373046875, -0.133087158203125, -0.11261749267578125, -0.0921478271484375, -0.07167816162109375, -0.05120849609375, -0.03073883056640625, -0.0102691650390625, 0.01020050048828125, 0.030670166015625, 0.05113983154296875, 0.0716094970703125, 0.09207916259765625, 0.112548828125, 0.13301849365234375, 0.1534881591796875, 0.17395782470703125, 0.194427490234375, 0.21489715576171875, 0.2353668212890625, 0.25583648681640625, 0.27630615234375, 0.29677581787109375, 0.3172454833984375, 0.33771514892578125, 0.358184814453125, 0.37865447998046875, 0.3991241455078125, 0.41959381103515625, 0.4400634765625, 0.46053314208984375, 0.4810028076171875, 0.5014724731445312, 0.521942138671875, 0.5424118041992188, 0.5628814697265625, 0.5833511352539062, 0.60382080078125, 0.6242904663085938, 0.6447601318359375, 0.6652297973632812, 0.685699462890625, 0.7061691284179688, 0.7266387939453125, 0.7471084594726562, 0.767578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 16.0, 22.0, 29.0, 51.0, 68.0, 148.0, 294.0, 148.0, 89.0, 51.0, 25.0, 21.0, 11.0, 10.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140869140625, -0.1373891830444336, -0.1339092254638672, -0.13042926788330078, -0.12694931030273438, -0.12346935272216797, -0.11998939514160156, -0.11650943756103516, -0.11302947998046875, -0.10954952239990234, -0.10606956481933594, -0.10258960723876953, -0.09910964965820312, -0.09562969207763672, -0.09214973449707031, -0.0886697769165039, -0.0851898193359375, -0.0817098617553711, -0.07822990417480469, -0.07474994659423828, -0.07126998901367188, -0.06779003143310547, -0.06431007385253906, -0.060830116271972656, -0.05735015869140625, -0.053870201110839844, -0.05039024353027344, -0.04691028594970703, -0.043430328369140625, -0.03995037078857422, -0.03647041320800781, -0.032990455627441406, -0.029510498046875, -0.026030540466308594, -0.022550582885742188, -0.01907062530517578, -0.015590667724609375, -0.012110710144042969, -0.008630752563476562, -0.005150794982910156, -0.00167083740234375, 0.0018091201782226562, 0.0052890777587890625, 0.008769035339355469, 0.012248992919921875, 0.01572895050048828, 0.019208908081054688, 0.022688865661621094, 0.0261688232421875, 0.029648780822753906, 0.03312873840332031, 0.03660869598388672, 0.040088653564453125, 0.04356861114501953, 0.04704856872558594, 0.050528526306152344, 0.05400848388671875, 0.057488441467285156, 0.06096839904785156, 0.06444835662841797, 0.06792831420898438, 0.07140827178955078, 0.07488822937011719, 0.0783681869506836, 0.08184814453125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 8.0, 9.0, 13.0, 27.0, 36.0, 50.0, 80.0, 111.0, 125.0, 137.0, 111.0, 78.0, 79.0, 55.0, 24.0, 26.0, 15.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1382230520248413, -1.105010747909546, -1.07179856300354, -1.0385863780975342, -1.0053740739822388, -0.9721618294715881, -0.9389495849609375, -0.9057373404502869, -0.8725250959396362, -0.8393128514289856, -0.806100606918335, -0.7728883624076843, -0.7396761178970337, -0.7064638733863831, -0.6732516288757324, -0.6400393843650818, -0.6068271398544312, -0.5736148953437805, -0.5404026508331299, -0.5071904063224792, -0.4739781618118286, -0.440765917301178, -0.40755367279052734, -0.3743414282798767, -0.3411291837692261, -0.30791693925857544, -0.2747046947479248, -0.24149245023727417, -0.20828020572662354, -0.1750679612159729, -0.14185571670532227, -0.10864347219467163, -0.07543134689331055, -0.04221910238265991, -0.009006857872009277, 0.024205386638641357, 0.05741763114929199, 0.09062987565994263, 0.12384212017059326, 0.1570543646812439, 0.19026660919189453, 0.22347885370254517, 0.2566910982131958, 0.28990334272384644, 0.32311558723449707, 0.3563278317451477, 0.38954007625579834, 0.422752320766449, 0.4559645652770996, 0.48917680978775024, 0.5223890542984009, 0.5556012988090515, 0.5888135433197021, 0.6220257878303528, 0.6552380323410034, 0.688450276851654, 0.7216625213623047, 0.7548747658729553, 0.788087010383606, 0.8212992548942566, 0.8545114994049072, 0.8877237439155579, 0.9209359884262085, 0.9541482329368591, 0.9873604774475098]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 10.0, 8.0, 7.0, 13.0, 15.0, 22.0, 9.0, 18.0, 28.0, 26.0, 36.0, 25.0, 30.0, 34.0, 32.0, 40.0, 45.0, 35.0, 41.0, 51.0, 42.0, 31.0, 41.0, 34.0, 40.0, 26.0, 36.0, 44.0, 16.0, 16.0, 12.0, 18.0, 17.0, 12.0, 16.0, 12.0, 7.0, 6.0, 10.0, 6.0, 9.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0], "bins": [-0.9578178524971008, -0.9307506680488586, -0.9036834836006165, -0.8766162991523743, -0.8495491147041321, -0.8224819302558899, -0.7954146862030029, -0.7683475017547607, -0.7412803173065186, -0.7142131328582764, -0.6871459484100342, -0.660078763961792, -0.6330115795135498, -0.6059443950653076, -0.5788772106170654, -0.5518100261688232, -0.524742841720581, -0.49767565727233887, -0.4706084728240967, -0.4435412883758545, -0.4164741039276123, -0.3894069194793701, -0.36233970522880554, -0.33527252078056335, -0.30820533633232117, -0.281138151884079, -0.2540709674358368, -0.2270037680864334, -0.19993658363819122, -0.17286939918994904, -0.14580219984054565, -0.11873501539230347, -0.0916677713394165, -0.06460058689117432, -0.03753339499235153, -0.010466203093528748, 0.01660098135471344, 0.04366816580295563, 0.07073536515235901, 0.0978025496006012, 0.12486973404884338, 0.15193691849708557, 0.17900410294532776, 0.20607130229473114, 0.23313848674297333, 0.2602056860923767, 0.2872728705406189, 0.3143400549888611, 0.34140723943710327, 0.36847442388534546, 0.39554160833358765, 0.42260879278182983, 0.449675977230072, 0.4767431616783142, 0.5038104057312012, 0.5308775901794434, 0.5579447746276855, 0.5850119590759277, 0.6120791435241699, 0.6391463279724121, 0.6662135124206543, 0.6932806968688965, 0.7203478813171387, 0.7474150657653809, 0.774482250213623]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 5.0, 5.0, 2.0, 5.0, 9.0, 11.0, 15.0, 24.0, 38.0, 61.0, 103.0, 151.0, 262.0, 576.0, 1469.0, 5180.0, 33146.0, 1774142.0, 2329801.0, 40134.0, 6099.0, 1778.0, 602.0, 274.0, 166.0, 79.0, 53.0, 36.0, 21.0, 14.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3427734375, -1.309234619140625, -1.27569580078125, -1.242156982421875, -1.2086181640625, -1.175079345703125, -1.14154052734375, -1.108001708984375, -1.074462890625, -1.040924072265625, -1.00738525390625, -0.973846435546875, -0.9403076171875, -0.906768798828125, -0.87322998046875, -0.839691162109375, -0.80615234375, -0.772613525390625, -0.73907470703125, -0.705535888671875, -0.6719970703125, -0.638458251953125, -0.60491943359375, -0.571380615234375, -0.537841796875, -0.504302978515625, -0.47076416015625, -0.437225341796875, -0.4036865234375, -0.370147705078125, -0.33660888671875, -0.303070068359375, -0.26953125, -0.235992431640625, -0.20245361328125, -0.168914794921875, -0.1353759765625, -0.101837158203125, -0.06829833984375, -0.034759521484375, -0.001220703125, 0.032318115234375, 0.06585693359375, 0.099395751953125, 0.1329345703125, 0.166473388671875, 0.20001220703125, 0.233551025390625, 0.26708984375, 0.300628662109375, 0.33416748046875, 0.367706298828125, 0.4012451171875, 0.434783935546875, 0.46832275390625, 0.501861572265625, 0.535400390625, 0.568939208984375, 0.60247802734375, 0.636016845703125, 0.6695556640625, 0.703094482421875, 0.73663330078125, 0.770172119140625, 0.8037109375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 7.0, 11.0, 9.0, 5.0, 10.0, 15.0, 17.0, 28.0, 27.0, 35.0, 40.0, 37.0, 49.0, 65.0, 51.0, 59.0, 62.0, 53.0, 63.0, 48.0, 57.0, 39.0, 39.0, 27.0, 34.0, 26.0, 21.0, 13.0, 15.0, 10.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.3009033203125, -0.2890625, -0.2772216796875, -0.265380859375, -0.2535400390625, -0.24169921875, -0.2298583984375, -0.218017578125, -0.2061767578125, -0.1943359375, -0.1824951171875, -0.170654296875, -0.1588134765625, -0.14697265625, -0.1351318359375, -0.123291015625, -0.1114501953125, -0.099609375, -0.0877685546875, -0.075927734375, -0.0640869140625, -0.05224609375, -0.0404052734375, -0.028564453125, -0.0167236328125, -0.0048828125, 0.0069580078125, 0.018798828125, 0.0306396484375, 0.04248046875, 0.0543212890625, 0.066162109375, 0.0780029296875, 0.08984375, 0.1016845703125, 0.113525390625, 0.1253662109375, 0.13720703125, 0.1490478515625, 0.160888671875, 0.1727294921875, 0.1845703125, 0.1964111328125, 0.208251953125, 0.2200927734375, 0.23193359375, 0.2437744140625, 0.255615234375, 0.2674560546875, 0.279296875, 0.2911376953125, 0.302978515625, 0.3148193359375, 0.32666015625, 0.3385009765625, 0.350341796875, 0.3621826171875, 0.3740234375, 0.3858642578125, 0.397705078125, 0.4095458984375, 0.42138671875, 0.4332275390625, 0.445068359375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 10.0, 12.0, 19.0, 24.0, 32.0, 61.0, 80.0, 144.0, 260.0, 542.0, 1276.0, 4394.0, 25120.0, 1038126.0, 3074041.0, 41197.0, 5852.0, 1640.0, 640.0, 355.0, 156.0, 99.0, 60.0, 33.0, 24.0, 30.0, 12.0, 12.0, 9.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.65545654296875, -0.6243896484375, -0.59332275390625, -0.562255859375, -0.53118896484375, -0.5001220703125, -0.46905517578125, -0.43798828125, -0.40692138671875, -0.3758544921875, -0.34478759765625, -0.313720703125, -0.28265380859375, -0.2515869140625, -0.22052001953125, -0.189453125, -0.15838623046875, -0.1273193359375, -0.09625244140625, -0.065185546875, -0.03411865234375, -0.0030517578125, 0.02801513671875, 0.05908203125, 0.09014892578125, 0.1212158203125, 0.15228271484375, 0.183349609375, 0.21441650390625, 0.2454833984375, 0.27655029296875, 0.3076171875, 0.33868408203125, 0.3697509765625, 0.40081787109375, 0.431884765625, 0.46295166015625, 0.4940185546875, 0.52508544921875, 0.55615234375, 0.58721923828125, 0.6182861328125, 0.64935302734375, 0.680419921875, 0.71148681640625, 0.7425537109375, 0.77362060546875, 0.8046875, 0.83575439453125, 0.8668212890625, 0.89788818359375, 0.928955078125, 0.96002197265625, 0.9910888671875, 1.02215576171875, 1.05322265625, 1.08428955078125, 1.1153564453125, 1.14642333984375, 1.177490234375, 1.20855712890625, 1.2396240234375, 1.27069091796875, 1.3017578125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 14.0, 14.0, 18.0, 16.0, 37.0, 28.0, 48.0, 72.0, 114.0, 179.0, 293.0, 544.0, 691.0, 726.0, 491.0, 327.0, 159.0, 90.0, 71.0, 28.0, 24.0, 15.0, 15.0, 15.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1976318359375, -0.1921253204345703, -0.18661880493164062, -0.18111228942871094, -0.17560577392578125, -0.17009925842285156, -0.16459274291992188, -0.1590862274169922, -0.1535797119140625, -0.1480731964111328, -0.14256668090820312, -0.13706016540527344, -0.13155364990234375, -0.12604713439941406, -0.12054061889648438, -0.11503410339355469, -0.109527587890625, -0.10402107238769531, -0.09851455688476562, -0.09300804138183594, -0.08750152587890625, -0.08199501037597656, -0.07648849487304688, -0.07098197937011719, -0.0654754638671875, -0.05996894836425781, -0.054462432861328125, -0.04895591735839844, -0.04344940185546875, -0.03794288635253906, -0.032436370849609375, -0.026929855346679688, -0.02142333984375, -0.015916824340820312, -0.010410308837890625, -0.0049037933349609375, 0.00060272216796875, 0.0061092376708984375, 0.011615753173828125, 0.017122268676757812, 0.0226287841796875, 0.028135299682617188, 0.033641815185546875, 0.03914833068847656, 0.04465484619140625, 0.05016136169433594, 0.055667877197265625, 0.06117439270019531, 0.066680908203125, 0.07218742370605469, 0.07769393920898438, 0.08320045471191406, 0.08870697021484375, 0.09421348571777344, 0.09972000122070312, 0.10522651672363281, 0.1107330322265625, 0.11623954772949219, 0.12174606323242188, 0.12725257873535156, 0.13275909423828125, 0.13826560974121094, 0.14377212524414062, 0.1492786407470703, 0.15478515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 9.0, 10.0, 15.0, 21.0, 24.0, 50.0, 73.0, 76.0, 101.0, 121.0, 105.0, 106.0, 84.0, 59.0, 55.0, 30.0, 20.0, 16.0, 4.0, 10.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6262499690055847, -0.6048156023025513, -0.5833812355995178, -0.5619468688964844, -0.5405125617980957, -0.5190781950950623, -0.4976438283920288, -0.47620946168899536, -0.4547750949859619, -0.43334072828292847, -0.411906361579895, -0.39047202467918396, -0.3690376579761505, -0.34760329127311707, -0.326168954372406, -0.30473458766937256, -0.2833002209663391, -0.26186585426330566, -0.2404315024614334, -0.21899715065956116, -0.1975627839565277, -0.17612841725349426, -0.154694065451622, -0.13325971364974976, -0.11182534694671631, -0.09039098769426346, -0.06895662844181061, -0.04752226918935776, -0.026087909936904907, -0.004653550684452057, 0.016780808568000793, 0.03821516036987305, 0.05964958667755127, 0.08108394593000412, 0.10251830518245697, 0.12395266443490982, 0.14538702368736267, 0.16682139039039612, 0.18825574219226837, 0.20969009399414062, 0.23112446069717407, 0.2525588274002075, 0.27399319410324097, 0.295427531003952, 0.3168618977069855, 0.3382962644100189, 0.35973060131073, 0.3811649680137634, 0.4025993347167969, 0.4240337014198303, 0.44546806812286377, 0.46690240502357483, 0.4883367717266083, 0.5097711086273193, 0.5312054753303528, 0.5526398420333862, 0.5740742087364197, 0.5955085754394531, 0.6169429421424866, 0.63837730884552, 0.6598116159439087, 0.6812459826469421, 0.7026803493499756, 0.724114716053009, 0.7455490827560425]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 4.0, 3.0, 8.0, 10.0, 14.0, 10.0, 10.0, 13.0, 20.0, 27.0, 22.0, 15.0, 31.0, 37.0, 44.0, 51.0, 47.0, 45.0, 43.0, 47.0, 53.0, 35.0, 43.0, 31.0, 48.0, 41.0, 41.0, 25.0, 31.0, 18.0, 15.0, 19.0, 18.0, 20.0, 13.0, 14.0, 12.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3579709529876709, -0.34680646657943726, -0.3356419801712036, -0.32447749376296997, -0.31331300735473633, -0.3021485209465027, -0.29098403453826904, -0.2798195481300354, -0.26865506172180176, -0.2574905753135681, -0.24632608890533447, -0.23516160249710083, -0.2239971160888672, -0.21283262968063354, -0.2016681432723999, -0.19050365686416626, -0.17933915555477142, -0.16817466914653778, -0.15701018273830414, -0.1458456963300705, -0.13468120992183685, -0.12351672351360321, -0.11235222965478897, -0.10118774324655533, -0.09002325683832169, -0.07885877043008804, -0.0676942840218544, -0.05652979388833046, -0.04536530748009682, -0.034200821071863174, -0.023036330938339233, -0.01187184453010559, -0.0007073581218719482, 0.010457129217684269, 0.021621616557240486, 0.03278610482811928, 0.04395059123635292, 0.05511507764458656, 0.0662795677781105, 0.07744405418634415, 0.08860854059457779, 0.09977302700281143, 0.11093751341104507, 0.12210200726985931, 0.13326649367809296, 0.1444309800863266, 0.15559546649456024, 0.16675995290279388, 0.17792443931102753, 0.18908892571926117, 0.2002534121274948, 0.21141789853572845, 0.2225823849439621, 0.23374687135219574, 0.24491137266159058, 0.2560758590698242, 0.26724034547805786, 0.2784048318862915, 0.28956931829452515, 0.3007338047027588, 0.31189829111099243, 0.3230627775192261, 0.3342272639274597, 0.34539175033569336, 0.356556236743927]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 17.0, 13.0, 22.0, 31.0, 56.0, 122.0, 265.0, 642.0, 1739.0, 5457.0, 20905.0, 257899.0, 703172.0, 45013.0, 8894.0, 2647.0, 882.0, 363.0, 167.0, 85.0, 48.0, 28.0, 17.0, 11.0, 13.0, 5.0, 8.0, 3.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.2805061340332031, -0.27121734619140625, -0.2619285583496094, -0.2526397705078125, -0.24335098266601562, -0.23406219482421875, -0.22477340698242188, -0.215484619140625, -0.20619583129882812, -0.19690704345703125, -0.18761825561523438, -0.1783294677734375, -0.16904067993164062, -0.15975189208984375, -0.15046310424804688, -0.14117431640625, -0.13188552856445312, -0.12259674072265625, -0.11330795288085938, -0.1040191650390625, -0.09473037719726562, -0.08544158935546875, -0.07615280151367188, -0.066864013671875, -0.057575225830078125, -0.04828643798828125, -0.038997650146484375, -0.0297088623046875, -0.020420074462890625, -0.01113128662109375, -0.001842498779296875, 0.0074462890625, 0.016735076904296875, 0.02602386474609375, 0.035312652587890625, 0.0446014404296875, 0.053890228271484375, 0.06317901611328125, 0.07246780395507812, 0.081756591796875, 0.09104537963867188, 0.10033416748046875, 0.10962295532226562, 0.1189117431640625, 0.12820053100585938, 0.13748931884765625, 0.14677810668945312, 0.15606689453125, 0.16535568237304688, 0.17464447021484375, 0.18393325805664062, 0.1932220458984375, 0.20251083374023438, 0.21179962158203125, 0.22108840942382812, 0.230377197265625, 0.23966598510742188, 0.24895477294921875, 0.2582435607910156, 0.2675323486328125, 0.2768211364746094, 0.28610992431640625, 0.2953987121582031, 0.3046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 12.0, 14.0, 11.0, 21.0, 21.0, 33.0, 28.0, 34.0, 44.0, 59.0, 57.0, 55.0, 48.0, 61.0, 52.0, 54.0, 49.0, 53.0, 46.0, 34.0, 30.0, 29.0, 29.0, 21.0, 19.0, 20.0, 8.0, 14.0, 6.0, 3.0, 5.0, 2.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.368896484375, -0.35936546325683594, -0.3498344421386719, -0.3403034210205078, -0.33077239990234375, -0.3212413787841797, -0.3117103576660156, -0.30217933654785156, -0.2926483154296875, -0.28311729431152344, -0.2735862731933594, -0.2640552520751953, -0.25452423095703125, -0.2449932098388672, -0.23546218872070312, -0.22593116760253906, -0.216400146484375, -0.20686912536621094, -0.19733810424804688, -0.1878070831298828, -0.17827606201171875, -0.1687450408935547, -0.15921401977539062, -0.14968299865722656, -0.1401519775390625, -0.13062095642089844, -0.12108993530273438, -0.11155891418457031, -0.10202789306640625, -0.09249687194824219, -0.08296585083007812, -0.07343482971191406, -0.06390380859375, -0.05437278747558594, -0.044841766357421875, -0.03531074523925781, -0.02577972412109375, -0.016248703002929688, -0.006717681884765625, 0.0028133392333984375, 0.0123443603515625, 0.021875381469726562, 0.031406402587890625, 0.04093742370605469, 0.05046844482421875, 0.05999946594238281, 0.06953048706054688, 0.07906150817871094, 0.088592529296875, 0.09812355041503906, 0.10765457153320312, 0.11718559265136719, 0.12671661376953125, 0.1362476348876953, 0.14577865600585938, 0.15530967712402344, 0.1648406982421875, 0.17437171936035156, 0.18390274047851562, 0.1934337615966797, 0.20296478271484375, 0.2124958038330078, 0.22202682495117188, 0.23155784606933594, 0.2410888671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 12.0, 12.0, 33.0, 36.0, 60.0, 121.0, 240.0, 554.0, 1143.0, 2907.0, 9311.0, 40356.0, 279672.0, 590104.0, 97597.0, 17936.0, 5011.0, 1886.0, 774.0, 377.0, 173.0, 106.0, 52.0, 28.0, 21.0, 8.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1385498046875, -0.13346481323242188, -0.12837982177734375, -0.12329483032226562, -0.1182098388671875, -0.11312484741210938, -0.10803985595703125, -0.10295486450195312, -0.097869873046875, -0.09278488159179688, -0.08769989013671875, -0.08261489868164062, -0.0775299072265625, -0.07244491577148438, -0.06735992431640625, -0.062274932861328125, -0.05718994140625, -0.052104949951171875, -0.04701995849609375, -0.041934967041015625, -0.0368499755859375, -0.031764984130859375, -0.02667999267578125, -0.021595001220703125, -0.016510009765625, -0.011425018310546875, -0.00634002685546875, -0.001255035400390625, 0.0038299560546875, 0.008914947509765625, 0.01399993896484375, 0.019084930419921875, 0.024169921875, 0.029254913330078125, 0.03433990478515625, 0.039424896240234375, 0.0445098876953125, 0.049594879150390625, 0.05467987060546875, 0.059764862060546875, 0.064849853515625, 0.06993484497070312, 0.07501983642578125, 0.08010482788085938, 0.0851898193359375, 0.09027481079101562, 0.09535980224609375, 0.10044479370117188, 0.10552978515625, 0.11061477661132812, 0.11569976806640625, 0.12078475952148438, 0.1258697509765625, 0.13095474243164062, 0.13603973388671875, 0.14112472534179688, 0.146209716796875, 0.15129470825195312, 0.15637969970703125, 0.16146469116210938, 0.1665496826171875, 0.17163467407226562, 0.17671966552734375, 0.18180465698242188, 0.1868896484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 2.0, 2.0, 7.0, 8.0, 11.0, 10.0, 19.0, 17.0, 18.0, 20.0, 33.0, 36.0, 41.0, 34.0, 43.0, 49.0, 40.0, 59.0, 44.0, 47.0, 53.0, 37.0, 43.0, 43.0, 46.0, 38.0, 38.0, 34.0, 25.0, 23.0, 15.0, 7.0, 12.0, 6.0, 8.0, 6.0, 7.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5302047729492188, -0.5115814208984375, -0.49295806884765625, -0.474334716796875, -0.45571136474609375, -0.4370880126953125, -0.41846466064453125, -0.39984130859375, -0.38121795654296875, -0.3625946044921875, -0.34397125244140625, -0.325347900390625, -0.30672454833984375, -0.2881011962890625, -0.26947784423828125, -0.2508544921875, -0.23223114013671875, -0.2136077880859375, -0.19498443603515625, -0.176361083984375, -0.15773773193359375, -0.1391143798828125, -0.12049102783203125, -0.10186767578125, -0.08324432373046875, -0.0646209716796875, -0.04599761962890625, -0.027374267578125, -0.00875091552734375, 0.0098724365234375, 0.02849578857421875, 0.047119140625, 0.06574249267578125, 0.0843658447265625, 0.10298919677734375, 0.121612548828125, 0.14023590087890625, 0.1588592529296875, 0.17748260498046875, 0.19610595703125, 0.21472930908203125, 0.2333526611328125, 0.25197601318359375, 0.270599365234375, 0.28922271728515625, 0.3078460693359375, 0.32646942138671875, 0.3450927734375, 0.36371612548828125, 0.3823394775390625, 0.40096282958984375, 0.419586181640625, 0.43820953369140625, 0.4568328857421875, 0.47545623779296875, 0.49407958984375, 0.5127029418945312, 0.5313262939453125, 0.5499496459960938, 0.568572998046875, 0.5871963500976562, 0.6058197021484375, 0.6244430541992188, 0.64306640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 10.0, 20.0, 17.0, 36.0, 46.0, 55.0, 115.0, 201.0, 409.0, 744.0, 1776.0, 4142.0, 11670.0, 44173.0, 242268.0, 540233.0, 156746.0, 30897.0, 8871.0, 3343.0, 1411.0, 618.0, 327.0, 176.0, 106.0, 59.0, 23.0, 20.0, 10.0, 9.0, 10.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.042022705078125, -0.04092764854431152, -0.03983259201049805, -0.03873753547668457, -0.037642478942871094, -0.03654742240905762, -0.03545236587524414, -0.034357309341430664, -0.03326225280761719, -0.03216719627380371, -0.031072139739990234, -0.029977083206176758, -0.02888202667236328, -0.027786970138549805, -0.026691913604736328, -0.02559685707092285, -0.024501800537109375, -0.0234067440032959, -0.022311687469482422, -0.021216630935668945, -0.02012157440185547, -0.019026517868041992, -0.017931461334228516, -0.01683640480041504, -0.015741348266601562, -0.014646291732788086, -0.01355123519897461, -0.012456178665161133, -0.011361122131347656, -0.01026606559753418, -0.009171009063720703, -0.008075952529907227, -0.00698089599609375, -0.0058858394622802734, -0.004790782928466797, -0.0036957263946533203, -0.0026006698608398438, -0.0015056133270263672, -0.0004105567932128906, 0.0006844997406005859, 0.0017795562744140625, 0.002874612808227539, 0.003969669342041016, 0.005064725875854492, 0.006159782409667969, 0.007254838943481445, 0.008349895477294922, 0.009444952011108398, 0.010540008544921875, 0.011635065078735352, 0.012730121612548828, 0.013825178146362305, 0.014920234680175781, 0.016015291213989258, 0.017110347747802734, 0.01820540428161621, 0.019300460815429688, 0.020395517349243164, 0.02149057388305664, 0.022585630416870117, 0.023680686950683594, 0.02477574348449707, 0.025870800018310547, 0.026965856552124023, 0.0280609130859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 9.0, 11.0, 18.0, 25.0, 44.0, 35.0, 62.0, 79.0, 86.0, 94.0, 107.0, 94.0, 88.0, 58.0, 51.0, 43.0, 22.0, 14.0, 14.0, 11.0, 5.0, 3.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6033649444580078e-05, -1.54813751578331e-05, -1.492910087108612e-05, -1.4376826584339142e-05, -1.3824552297592163e-05, -1.3272278010845184e-05, -1.2720003724098206e-05, -1.2167729437351227e-05, -1.1615455150604248e-05, -1.106318086385727e-05, -1.051090657711029e-05, -9.958632290363312e-06, -9.406358003616333e-06, -8.854083716869354e-06, -8.301809430122375e-06, -7.749535143375397e-06, -7.197260856628418e-06, -6.644986569881439e-06, -6.0927122831344604e-06, -5.540437996387482e-06, -4.988163709640503e-06, -4.435889422893524e-06, -3.883615136146545e-06, -3.3313408493995667e-06, -2.779066562652588e-06, -2.226792275905609e-06, -1.6745179891586304e-06, -1.1222437024116516e-06, -5.699694156646729e-07, -1.7695128917694092e-08, 5.345791578292847e-07, 1.0868534445762634e-06, 1.6391277313232422e-06, 2.191402018070221e-06, 2.7436763048171997e-06, 3.2959505915641785e-06, 3.848224878311157e-06, 4.400499165058136e-06, 4.952773451805115e-06, 5.5050477385520935e-06, 6.057322025299072e-06, 6.609596312046051e-06, 7.16187059879303e-06, 7.714144885540009e-06, 8.266419172286987e-06, 8.818693459033966e-06, 9.370967745780945e-06, 9.923242032527924e-06, 1.0475516319274902e-05, 1.1027790606021881e-05, 1.158006489276886e-05, 1.2132339179515839e-05, 1.2684613466262817e-05, 1.3236887753009796e-05, 1.3789162039756775e-05, 1.4341436326503754e-05, 1.4893710613250732e-05, 1.544598489999771e-05, 1.599825918674469e-05, 1.655053347349167e-05, 1.7102807760238647e-05, 1.7655082046985626e-05, 1.8207356333732605e-05, 1.8759630620479584e-05, 1.9311904907226562e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 5.0, 9.0, 8.0, 10.0, 16.0, 15.0, 25.0, 35.0, 43.0, 47.0, 82.0, 139.0, 230.0, 406.0, 776.0, 1634.0, 3617.0, 10003.0, 30793.0, 119041.0, 396944.0, 348208.0, 95760.0, 25998.0, 8421.0, 3220.0, 1412.0, 728.0, 335.0, 196.0, 120.0, 79.0, 61.0, 34.0, 29.0, 17.0, 11.0, 15.0, 15.0, 7.0, 3.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0343017578125, -0.03325986862182617, -0.032217979431152344, -0.031176090240478516, -0.030134201049804688, -0.02909231185913086, -0.02805042266845703, -0.027008533477783203, -0.025966644287109375, -0.024924755096435547, -0.02388286590576172, -0.02284097671508789, -0.021799087524414062, -0.020757198333740234, -0.019715309143066406, -0.018673419952392578, -0.01763153076171875, -0.016589641571044922, -0.015547752380371094, -0.014505863189697266, -0.013463973999023438, -0.01242208480834961, -0.011380195617675781, -0.010338306427001953, -0.009296417236328125, -0.008254528045654297, -0.007212638854980469, -0.006170749664306641, -0.0051288604736328125, -0.004086971282958984, -0.0030450820922851562, -0.002003192901611328, -0.0009613037109375, 8.058547973632812e-05, 0.0011224746704101562, 0.0021643638610839844, 0.0032062530517578125, 0.004248142242431641, 0.005290031433105469, 0.006331920623779297, 0.007373809814453125, 0.008415699005126953, 0.009457588195800781, 0.01049947738647461, 0.011541366577148438, 0.012583255767822266, 0.013625144958496094, 0.014667034149169922, 0.01570892333984375, 0.016750812530517578, 0.017792701721191406, 0.018834590911865234, 0.019876480102539062, 0.02091836929321289, 0.02196025848388672, 0.023002147674560547, 0.024044036865234375, 0.025085926055908203, 0.02612781524658203, 0.02716970443725586, 0.028211593627929688, 0.029253482818603516, 0.030295372009277344, 0.03133726119995117, 0.032379150390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 7.0, 5.0, 10.0, 6.0, 8.0, 10.0, 10.0, 20.0, 27.0, 40.0, 52.0, 53.0, 69.0, 74.0, 67.0, 86.0, 85.0, 66.0, 67.0, 47.0, 41.0, 34.0, 29.0, 23.0, 12.0, 11.0, 13.0, 9.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0117950439453125, -0.011431217193603516, -0.011067390441894531, -0.010703563690185547, -0.010339736938476562, -0.009975910186767578, -0.009612083435058594, -0.00924825668334961, -0.008884429931640625, -0.00852060317993164, -0.008156776428222656, -0.007792949676513672, -0.0074291229248046875, -0.007065296173095703, -0.006701469421386719, -0.006337642669677734, -0.00597381591796875, -0.005609989166259766, -0.005246162414550781, -0.004882335662841797, -0.0045185089111328125, -0.004154682159423828, -0.0037908554077148438, -0.0034270286560058594, -0.003063201904296875, -0.0026993751525878906, -0.0023355484008789062, -0.001971721649169922, -0.0016078948974609375, -0.0012440681457519531, -0.0008802413940429688, -0.0005164146423339844, -0.000152587890625, 0.00021123886108398438, 0.0005750656127929688, 0.0009388923645019531, 0.0013027191162109375, 0.0016665458679199219, 0.0020303726196289062, 0.0023941993713378906, 0.002758026123046875, 0.0031218528747558594, 0.0034856796264648438, 0.003849506378173828, 0.0042133331298828125, 0.004577159881591797, 0.004940986633300781, 0.005304813385009766, 0.00566864013671875, 0.006032466888427734, 0.006396293640136719, 0.006760120391845703, 0.0071239471435546875, 0.007487773895263672, 0.007851600646972656, 0.00821542739868164, 0.008579254150390625, 0.00894308090209961, 0.009306907653808594, 0.009670734405517578, 0.010034561157226562, 0.010398387908935547, 0.010762214660644531, 0.011126041412353516, 0.0114898681640625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 21.0, 29.0, 44.0, 73.0, 112.0, 162.0, 146.0, 146.0, 106.0, 62.0, 30.0, 24.0, 14.0, 9.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3167197108268738, -0.2973078489303589, -0.277895987033844, -0.2584841251373291, -0.2390722781419754, -0.2196604162454605, -0.2002485692501068, -0.18083670735359192, -0.16142484545707703, -0.14201298356056213, -0.12260112911462784, -0.10318927466869354, -0.08377741277217865, -0.06436555087566376, -0.04495369642972946, -0.025541841983795166, -0.0061299800872802734, 0.01328187808394432, 0.032693736255168915, 0.05210559442639351, 0.0715174525976181, 0.090929314494133, 0.11034116894006729, 0.1297530233860016, 0.14916488528251648, 0.16857674717903137, 0.18798860907554626, 0.20740045607089996, 0.22681231796741486, 0.24622417986392975, 0.26563602685928345, 0.28504788875579834, 0.304459810256958, 0.3238716721534729, 0.3432835340499878, 0.3626953959465027, 0.3821072578430176, 0.40151911973953247, 0.420930951833725, 0.44034281373023987, 0.45975467562675476, 0.47916653752326965, 0.49857839941978455, 0.517990231513977, 0.5374020934104919, 0.5568139553070068, 0.5762258172035217, 0.5956376791000366, 0.6150495409965515, 0.6344614028930664, 0.6538732647895813, 0.6732851266860962, 0.6926969885826111, 0.712108850479126, 0.7315207123756409, 0.7509325742721558, 0.7703443765640259, 0.7897562384605408, 0.8091681003570557, 0.8285799622535706, 0.8479918241500854, 0.8674036860466003, 0.8868155479431152, 0.9062273502349854, 0.925639271736145]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 8.0, 0.0, 8.0, 9.0, 17.0, 13.0, 10.0, 18.0, 25.0, 35.0, 26.0, 41.0, 44.0, 52.0, 61.0, 55.0, 63.0, 55.0, 56.0, 52.0, 51.0, 46.0, 41.0, 34.0, 31.0, 27.0, 23.0, 24.0, 13.0, 22.0, 12.0, 12.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.32876110076904297, -0.3194924592971802, -0.3102238178253174, -0.3009551763534546, -0.2916865348815918, -0.2824179232120514, -0.2731492817401886, -0.2638806402683258, -0.254611998796463, -0.24534335732460022, -0.23607471585273743, -0.22680608928203583, -0.21753744781017303, -0.20826880633831024, -0.19900017976760864, -0.18973153829574585, -0.18046289682388306, -0.17119425535202026, -0.16192561388015747, -0.15265698730945587, -0.14338834583759308, -0.13411970436573029, -0.12485107034444809, -0.1155824363231659, -0.1063137948513031, -0.09704515337944031, -0.08777651935815811, -0.07850788533687592, -0.06923924386501312, -0.05997060611844063, -0.050701968371868134, -0.04143333435058594, -0.032164692878723145, -0.02289605513215065, -0.013627417385578156, -0.004358779639005661, 0.0049098581075668335, 0.014178495854139328, 0.023447133600711823, 0.03271576762199402, 0.04198440909385681, 0.051253046840429306, 0.0605216845870018, 0.069790318608284, 0.07905896008014679, 0.08832760155200958, 0.09759623557329178, 0.10686486959457397, 0.11613351106643677, 0.12540215253829956, 0.13467079401016235, 0.14393942058086395, 0.15320806205272675, 0.16247670352458954, 0.17174533009529114, 0.18101397156715393, 0.19028261303901672, 0.19955125451087952, 0.2088198959827423, 0.2180885225534439, 0.2273571640253067, 0.2366258054971695, 0.2458944320678711, 0.2551630735397339, 0.2644317150115967]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 8.0, 8.0, 4.0, 16.0, 18.0, 28.0, 38.0, 74.0, 81.0, 118.0, 180.0, 324.0, 527.0, 986.0, 1903.0, 4050.0, 9725.0, 27038.0, 87634.0, 417301.0, 373462.0, 81825.0, 25895.0, 9214.0, 3963.0, 1836.0, 895.0, 531.0, 282.0, 210.0, 127.0, 69.0, 52.0, 38.0, 27.0, 25.0, 10.0, 12.0, 5.0, 3.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.283447265625, -0.2739906311035156, -0.26453399658203125, -0.2550773620605469, -0.2456207275390625, -0.23616409301757812, -0.22670745849609375, -0.21725082397460938, -0.207794189453125, -0.19833755493164062, -0.18888092041015625, -0.17942428588867188, -0.1699676513671875, -0.16051101684570312, -0.15105438232421875, -0.14159774780273438, -0.13214111328125, -0.12268447875976562, -0.11322784423828125, -0.10377120971679688, -0.0943145751953125, -0.08485794067382812, -0.07540130615234375, -0.06594467163085938, -0.056488037109375, -0.047031402587890625, -0.03757476806640625, -0.028118133544921875, -0.0186614990234375, -0.009204864501953125, 0.00025177001953125, 0.009708404541015625, 0.0191650390625, 0.028621673583984375, 0.03807830810546875, 0.047534942626953125, 0.0569915771484375, 0.06644821166992188, 0.07590484619140625, 0.08536148071289062, 0.094818115234375, 0.10427474975585938, 0.11373138427734375, 0.12318801879882812, 0.1326446533203125, 0.14210128784179688, 0.15155792236328125, 0.16101455688476562, 0.17047119140625, 0.17992782592773438, 0.18938446044921875, 0.19884109497070312, 0.2082977294921875, 0.21775436401367188, 0.22721099853515625, 0.23666763305664062, 0.246124267578125, 0.2555809020996094, 0.26503753662109375, 0.2744941711425781, 0.2839508056640625, 0.2934074401855469, 0.30286407470703125, 0.3123207092285156, 0.32177734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 7.0, 12.0, 8.0, 17.0, 6.0, 13.0, 22.0, 24.0, 28.0, 36.0, 38.0, 44.0, 49.0, 52.0, 53.0, 55.0, 51.0, 50.0, 50.0, 52.0, 53.0, 41.0, 39.0, 27.0, 31.0, 23.0, 27.0, 18.0, 11.0, 19.0, 10.0, 8.0, 4.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5478515625, -0.5316963195800781, -0.5155410766601562, -0.4993858337402344, -0.4832305908203125, -0.4670753479003906, -0.45092010498046875, -0.4347648620605469, -0.418609619140625, -0.4024543762207031, -0.38629913330078125, -0.3701438903808594, -0.3539886474609375, -0.3378334045410156, -0.32167816162109375, -0.3055229187011719, -0.28936767578125, -0.2732124328613281, -0.25705718994140625, -0.24090194702148438, -0.2247467041015625, -0.20859146118164062, -0.19243621826171875, -0.17628097534179688, -0.160125732421875, -0.14397048950195312, -0.12781524658203125, -0.11166000366210938, -0.0955047607421875, -0.07934951782226562, -0.06319427490234375, -0.047039031982421875, -0.0308837890625, -0.014728546142578125, 0.00142669677734375, 0.017581939697265625, 0.0337371826171875, 0.049892425537109375, 0.06604766845703125, 0.08220291137695312, 0.098358154296875, 0.11451339721679688, 0.13066864013671875, 0.14682388305664062, 0.1629791259765625, 0.17913436889648438, 0.19528961181640625, 0.21144485473632812, 0.22760009765625, 0.24375534057617188, 0.25991058349609375, 0.2760658264160156, 0.2922210693359375, 0.3083763122558594, 0.32453155517578125, 0.3406867980957031, 0.356842041015625, 0.3729972839355469, 0.38915252685546875, 0.4053077697753906, 0.4214630126953125, 0.4376182556152344, 0.45377349853515625, 0.4699287414550781, 0.486083984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 5.0, 6.0, 5.0, 13.0, 11.0, 18.0, 28.0, 32.0, 37.0, 65.0, 75.0, 152.0, 231.0, 622.0, 3398.0, 148431.0, 882284.0, 11268.0, 1017.0, 332.0, 174.0, 100.0, 69.0, 46.0, 28.0, 25.0, 20.0, 17.0, 12.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.853515625, -0.8167266845703125, -0.779937744140625, -0.7431488037109375, -0.70635986328125, -0.6695709228515625, -0.632781982421875, -0.5959930419921875, -0.5592041015625, -0.5224151611328125, -0.485626220703125, -0.4488372802734375, -0.41204833984375, -0.3752593994140625, -0.338470458984375, -0.3016815185546875, -0.264892578125, -0.2281036376953125, -0.191314697265625, -0.1545257568359375, -0.11773681640625, -0.0809478759765625, -0.044158935546875, -0.0073699951171875, 0.0294189453125, 0.0662078857421875, 0.102996826171875, 0.1397857666015625, 0.17657470703125, 0.2133636474609375, 0.250152587890625, 0.2869415283203125, 0.32373046875, 0.3605194091796875, 0.397308349609375, 0.4340972900390625, 0.47088623046875, 0.5076751708984375, 0.544464111328125, 0.5812530517578125, 0.6180419921875, 0.6548309326171875, 0.691619873046875, 0.7284088134765625, 0.76519775390625, 0.8019866943359375, 0.838775634765625, 0.8755645751953125, 0.912353515625, 0.9491424560546875, 0.985931396484375, 1.0227203369140625, 1.05950927734375, 1.0962982177734375, 1.133087158203125, 1.1698760986328125, 1.2066650390625, 1.2434539794921875, 1.280242919921875, 1.3170318603515625, 1.35382080078125, 1.3906097412109375, 1.427398681640625, 1.4641876220703125, 1.5009765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 3.0, 16.0, 11.0, 14.0, 22.0, 32.0, 36.0, 28.0, 37.0, 38.0, 62.0, 63.0, 59.0, 56.0, 59.0, 76.0, 58.0, 49.0, 53.0, 38.0, 38.0, 26.0, 28.0, 21.0, 12.0, 12.0, 9.0, 7.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59716796875, -0.5736083984375, -0.550048828125, -0.5264892578125, -0.5029296875, -0.4793701171875, -0.455810546875, -0.4322509765625, -0.40869140625, -0.3851318359375, -0.361572265625, -0.3380126953125, -0.314453125, -0.2908935546875, -0.267333984375, -0.2437744140625, -0.22021484375, -0.1966552734375, -0.173095703125, -0.1495361328125, -0.1259765625, -0.1024169921875, -0.078857421875, -0.0552978515625, -0.03173828125, -0.0081787109375, 0.015380859375, 0.0389404296875, 0.0625, 0.0860595703125, 0.109619140625, 0.1331787109375, 0.15673828125, 0.1802978515625, 0.203857421875, 0.2274169921875, 0.2509765625, 0.2745361328125, 0.298095703125, 0.3216552734375, 0.34521484375, 0.3687744140625, 0.392333984375, 0.4158935546875, 0.439453125, 0.4630126953125, 0.486572265625, 0.5101318359375, 0.53369140625, 0.5572509765625, 0.580810546875, 0.6043701171875, 0.6279296875, 0.6514892578125, 0.675048828125, 0.6986083984375, 0.72216796875, 0.7457275390625, 0.769287109375, 0.7928466796875, 0.81640625, 0.8399658203125, 0.863525390625, 0.8870849609375, 0.91064453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 3.0, 0.0, 7.0, 7.0, 8.0, 6.0, 13.0, 11.0, 15.0, 25.0, 40.0, 64.0, 138.0, 208.0, 396.0, 847.0, 1842.0, 5714.0, 39182.0, 865648.0, 119764.0, 9676.0, 2629.0, 1110.0, 511.0, 265.0, 139.0, 93.0, 56.0, 33.0, 26.0, 15.0, 12.0, 8.0, 5.0, 8.0, 5.0, 7.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.20741653442382812, -0.19901275634765625, -0.19060897827148438, -0.1822052001953125, -0.17380142211914062, -0.16539764404296875, -0.15699386596679688, -0.148590087890625, -0.14018630981445312, -0.13178253173828125, -0.12337875366210938, -0.1149749755859375, -0.10657119750976562, -0.09816741943359375, -0.08976364135742188, -0.08135986328125, -0.07295608520507812, -0.06455230712890625, -0.056148529052734375, -0.0477447509765625, -0.039340972900390625, -0.03093719482421875, -0.022533416748046875, -0.014129638671875, -0.005725860595703125, 0.00267791748046875, 0.011081695556640625, 0.0194854736328125, 0.027889251708984375, 0.03629302978515625, 0.044696807861328125, 0.0531005859375, 0.061504364013671875, 0.06990814208984375, 0.07831192016601562, 0.0867156982421875, 0.09511947631835938, 0.10352325439453125, 0.11192703247070312, 0.120330810546875, 0.12873458862304688, 0.13713836669921875, 0.14554214477539062, 0.1539459228515625, 0.16234970092773438, 0.17075347900390625, 0.17915725708007812, 0.18756103515625, 0.19596481323242188, 0.20436859130859375, 0.21277236938476562, 0.2211761474609375, 0.22957992553710938, 0.23798370361328125, 0.24638748168945312, 0.254791259765625, 0.2631950378417969, 0.27159881591796875, 0.2800025939941406, 0.2884063720703125, 0.2968101501464844, 0.30521392822265625, 0.3136177062988281, 0.322021484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 8.0, 8.0, 17.0, 30.0, 68.0, 179.0, 413.0, 154.0, 57.0, 20.0, 14.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.218122482299805e-05, -7.00848177075386e-05, -6.798841059207916e-05, -6.589200347661972e-05, -6.379559636116028e-05, -6.169918924570084e-05, -5.9602782130241394e-05, -5.750637501478195e-05, -5.540996789932251e-05, -5.331356078386307e-05, -5.1217153668403625e-05, -4.912074655294418e-05, -4.702433943748474e-05, -4.49279323220253e-05, -4.283152520656586e-05, -4.0735118091106415e-05, -3.863871097564697e-05, -3.654230386018753e-05, -3.444589674472809e-05, -3.2349489629268646e-05, -3.0253082513809204e-05, -2.8156675398349762e-05, -2.606026828289032e-05, -2.3963861167430878e-05, -2.1867454051971436e-05, -1.9771046936511993e-05, -1.767463982105255e-05, -1.557823270559311e-05, -1.3481825590133667e-05, -1.1385418474674225e-05, -9.289011359214783e-06, -7.1926042437553406e-06, -5.0961971282958984e-06, -2.9997900128364563e-06, -9.033828973770142e-07, 1.193024218082428e-06, 3.28943133354187e-06, 5.385838449001312e-06, 7.482245564460754e-06, 9.578652679920197e-06, 1.1675059795379639e-05, 1.377146691083908e-05, 1.5867874026298523e-05, 1.7964281141757965e-05, 2.0060688257217407e-05, 2.215709537267685e-05, 2.425350248813629e-05, 2.6349909603595734e-05, 2.8446316719055176e-05, 3.054272383451462e-05, 3.263913094997406e-05, 3.47355380654335e-05, 3.6831945180892944e-05, 3.8928352296352386e-05, 4.102475941181183e-05, 4.312116652727127e-05, 4.521757364273071e-05, 4.7313980758190155e-05, 4.94103878736496e-05, 5.150679498910904e-05, 5.360320210456848e-05, 5.5699609220027924e-05, 5.7796016335487366e-05, 5.989242345094681e-05, 6.198883056640625e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 4.0, 10.0, 12.0, 28.0, 37.0, 46.0, 104.0, 182.0, 346.0, 656.0, 1328.0, 2811.0, 8712.0, 55712.0, 754919.0, 196531.0, 18845.0, 4487.0, 1790.0, 859.0, 495.0, 239.0, 134.0, 92.0, 45.0, 31.0, 24.0, 18.0, 10.0, 10.0, 5.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2266845703125, -0.22015953063964844, -0.21363449096679688, -0.2071094512939453, -0.20058441162109375, -0.1940593719482422, -0.18753433227539062, -0.18100929260253906, -0.1744842529296875, -0.16795921325683594, -0.16143417358398438, -0.1549091339111328, -0.14838409423828125, -0.1418590545654297, -0.13533401489257812, -0.12880897521972656, -0.122283935546875, -0.11575889587402344, -0.10923385620117188, -0.10270881652832031, -0.09618377685546875, -0.08965873718261719, -0.08313369750976562, -0.07660865783691406, -0.0700836181640625, -0.06355857849121094, -0.057033538818359375, -0.05050849914550781, -0.04398345947265625, -0.03745841979980469, -0.030933380126953125, -0.024408340454101562, -0.01788330078125, -0.011358261108398438, -0.004833221435546875, 0.0016918182373046875, 0.00821685791015625, 0.014741897583007812, 0.021266937255859375, 0.027791976928710938, 0.0343170166015625, 0.04084205627441406, 0.047367095947265625, 0.05389213562011719, 0.06041717529296875, 0.06694221496582031, 0.07346725463867188, 0.07999229431152344, 0.086517333984375, 0.09304237365722656, 0.09956741333007812, 0.10609245300292969, 0.11261749267578125, 0.11914253234863281, 0.12566757202148438, 0.13219261169433594, 0.1387176513671875, 0.14524269104003906, 0.15176773071289062, 0.1582927703857422, 0.16481781005859375, 0.1713428497314453, 0.17786788940429688, 0.18439292907714844, 0.19091796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 7.0, 7.0, 13.0, 8.0, 21.0, 24.0, 20.0, 31.0, 33.0, 59.0, 70.0, 127.0, 155.0, 124.0, 77.0, 64.0, 52.0, 32.0, 26.0, 9.0, 16.0, 2.0, 8.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0665283203125, -0.06427288055419922, -0.06201744079589844, -0.059762001037597656, -0.057506561279296875, -0.055251121520996094, -0.05299568176269531, -0.05074024200439453, -0.04848480224609375, -0.04622936248779297, -0.04397392272949219, -0.041718482971191406, -0.039463043212890625, -0.037207603454589844, -0.03495216369628906, -0.03269672393798828, -0.0304412841796875, -0.02818584442138672, -0.025930404663085938, -0.023674964904785156, -0.021419525146484375, -0.019164085388183594, -0.016908645629882812, -0.014653205871582031, -0.01239776611328125, -0.010142326354980469, -0.007886886596679688, -0.005631446838378906, -0.003376007080078125, -0.0011205673217773438, 0.0011348724365234375, 0.0033903121948242188, 0.005645751953125, 0.007901191711425781, 0.010156631469726562, 0.012412071228027344, 0.014667510986328125, 0.016922950744628906, 0.019178390502929688, 0.02143383026123047, 0.02368927001953125, 0.02594470977783203, 0.028200149536132812, 0.030455589294433594, 0.032711029052734375, 0.034966468811035156, 0.03722190856933594, 0.03947734832763672, 0.0417327880859375, 0.04398822784423828, 0.04624366760253906, 0.048499107360839844, 0.050754547119140625, 0.053009986877441406, 0.05526542663574219, 0.05752086639404297, 0.05977630615234375, 0.06203174591064453, 0.06428718566894531, 0.0665426254272461, 0.06879806518554688, 0.07105350494384766, 0.07330894470214844, 0.07556438446044922, 0.07781982421875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 5.0, 20.0, 94.0, 418.0, 370.0, 88.0, 15.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6520538926124573, -0.5211829543113708, -0.39031198620796204, -0.2594410181045532, -0.1285700798034668, 0.002300858497619629, 0.13317185640335083, 0.26404279470443726, 0.3949137330055237, 0.5257846713066101, 0.6566556692123413, 0.7875266075134277, 0.9183975458145142, 1.0492684841156006, 1.1801395416259766, 1.3110103607177734, 1.4418814182281494, 1.5727523565292358, 1.7036232948303223, 1.8344943523406982, 1.9653651714324951, 2.096236228942871, 2.227107048034668, 2.357978105545044, 2.488848924636841, 2.619719982147217, 2.7505908012390137, 2.8814618587493896, 3.0123326778411865, 3.1432037353515625, 3.2740745544433594, 3.4049456119537354, 3.535816192626953, 3.666687250137329, 3.797558069229126, 3.928429126739502, 4.059299945831299, 4.190170764923096, 4.321042060852051, 4.451912879943848, 4.5827836990356445, 4.713654518127441, 4.8445258140563965, 4.975396633148193, 5.10626745223999, 5.237138271331787, 5.368009567260742, 5.498880386352539, 5.629751205444336, 5.760622024536133, 5.891493320465088, 6.022364139556885, 6.153234958648682, 6.2841057777404785, 6.414977073669434, 6.5458478927612305, 6.6767191886901855, 6.807590007781982, 6.9384613037109375, 7.069332122802734, 7.200202941894531, 7.331073760986328, 7.461945056915283, 7.59281587600708, 7.723686695098877]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 6.0, 10.0, 7.0, 6.0, 13.0, 13.0, 12.0, 8.0, 22.0, 22.0, 20.0, 28.0, 40.0, 33.0, 37.0, 42.0, 41.0, 43.0, 39.0, 57.0, 34.0, 37.0, 56.0, 42.0, 33.0, 27.0, 37.0, 22.0, 25.0, 27.0, 14.0, 24.0, 20.0, 13.0, 14.0, 16.0, 19.0, 10.0, 10.0, 3.0, 3.0, 8.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.9124016761779785, -0.8852574825286865, -0.8581132292747498, -0.8309690356254578, -0.803824782371521, -0.776680588722229, -0.749536395072937, -0.722392201423645, -0.6952479481697083, -0.6681037545204163, -0.6409595012664795, -0.6138153076171875, -0.5866711139678955, -0.5595268607139587, -0.5323826670646667, -0.50523841381073, -0.478094220161438, -0.4509499967098236, -0.42380577325820923, -0.39666157960891724, -0.36951735615730286, -0.3423731327056885, -0.3152289390563965, -0.2880847156047821, -0.2609404921531677, -0.23379626870155334, -0.20665206015110016, -0.17950785160064697, -0.1523636281490326, -0.1252194046974182, -0.09807519614696503, -0.07093098759651184, -0.04378676414489746, -0.016642548143863678, 0.010501667857170105, 0.03764588385820389, 0.06479009985923767, 0.09193432331085205, 0.11907853186130524, 0.14622274041175842, 0.1733669638633728, 0.20051118731498718, 0.22765539586544037, 0.25479960441589355, 0.28194382786750793, 0.3090880513191223, 0.3362322449684143, 0.3633764684200287, 0.39052069187164307, 0.41766491532325745, 0.4448091387748718, 0.4719533324241638, 0.4990975558757782, 0.5262417793273926, 0.5533859729766846, 0.5805301666259766, 0.6076744198799133, 0.6348186135292053, 0.6619628667831421, 0.6891070604324341, 0.7162512540817261, 0.7433955073356628, 0.7705397009849548, 0.7976839542388916, 0.8248281478881836]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 4.0, 4.0, 6.0, 13.0, 20.0, 23.0, 34.0, 52.0, 76.0, 119.0, 225.0, 331.0, 545.0, 998.0, 1715.0, 3538.0, 7700.0, 21466.0, 119056.0, 1604383.0, 2215191.0, 173061.0, 26946.0, 9600.0, 4242.0, 2052.0, 1199.0, 636.0, 396.0, 227.0, 151.0, 84.0, 54.0, 50.0, 25.0, 17.0, 13.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.59521484375, -0.5787200927734375, -0.562225341796875, -0.5457305908203125, -0.52923583984375, -0.5127410888671875, -0.496246337890625, -0.4797515869140625, -0.4632568359375, -0.4467620849609375, -0.430267333984375, -0.4137725830078125, -0.39727783203125, -0.3807830810546875, -0.364288330078125, -0.3477935791015625, -0.331298828125, -0.3148040771484375, -0.298309326171875, -0.2818145751953125, -0.26531982421875, -0.2488250732421875, -0.232330322265625, -0.2158355712890625, -0.1993408203125, -0.1828460693359375, -0.166351318359375, -0.1498565673828125, -0.13336181640625, -0.1168670654296875, -0.100372314453125, -0.0838775634765625, -0.0673828125, -0.0508880615234375, -0.034393310546875, -0.0178985595703125, -0.00140380859375, 0.0150909423828125, 0.031585693359375, 0.0480804443359375, 0.0645751953125, 0.0810699462890625, 0.097564697265625, 0.1140594482421875, 0.13055419921875, 0.1470489501953125, 0.163543701171875, 0.1800384521484375, 0.196533203125, 0.2130279541015625, 0.229522705078125, 0.2460174560546875, 0.26251220703125, 0.2790069580078125, 0.295501708984375, 0.3119964599609375, 0.3284912109375, 0.3449859619140625, 0.361480712890625, 0.3779754638671875, 0.39447021484375, 0.4109649658203125, 0.427459716796875, 0.4439544677734375, 0.46044921875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 2.0, 10.0, 6.0, 8.0, 11.0, 16.0, 28.0, 22.0, 23.0, 26.0, 28.0, 46.0, 39.0, 41.0, 45.0, 44.0, 50.0, 57.0, 42.0, 48.0, 50.0, 37.0, 36.0, 42.0, 39.0, 22.0, 24.0, 21.0, 22.0, 10.0, 23.0, 21.0, 8.0, 5.0, 6.0, 6.0, 7.0, 2.0, 4.0, 3.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24895477294921875, -0.2403411865234375, -0.23172760009765625, -0.223114013671875, -0.21450042724609375, -0.2058868408203125, -0.19727325439453125, -0.18865966796875, -0.18004608154296875, -0.1714324951171875, -0.16281890869140625, -0.154205322265625, -0.14559173583984375, -0.1369781494140625, -0.12836456298828125, -0.1197509765625, -0.11113739013671875, -0.1025238037109375, -0.09391021728515625, -0.085296630859375, -0.07668304443359375, -0.0680694580078125, -0.05945587158203125, -0.05084228515625, -0.04222869873046875, -0.0336151123046875, -0.02500152587890625, -0.016387939453125, -0.00777435302734375, 0.0008392333984375, 0.00945281982421875, 0.01806640625, 0.02667999267578125, 0.0352935791015625, 0.04390716552734375, 0.052520751953125, 0.06113433837890625, 0.0697479248046875, 0.07836151123046875, 0.08697509765625, 0.09558868408203125, 0.1042022705078125, 0.11281585693359375, 0.121429443359375, 0.13004302978515625, 0.1386566162109375, 0.14727020263671875, 0.1558837890625, 0.16449737548828125, 0.1731109619140625, 0.18172454833984375, 0.190338134765625, 0.19895172119140625, 0.2075653076171875, 0.21617889404296875, 0.22479248046875, 0.23340606689453125, 0.2420196533203125, 0.25063323974609375, 0.259246826171875, 0.26786041259765625, 0.2764739990234375, 0.28508758544921875, 0.293701171875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 3.0, 10.0, 10.0, 18.0, 16.0, 30.0, 46.0, 61.0, 164.0, 344.0, 909.0, 2903.0, 14628.0, 267454.0, 3823876.0, 73297.0, 7431.0, 1866.0, 622.0, 251.0, 131.0, 63.0, 39.0, 27.0, 23.0, 8.0, 12.0, 5.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0673828125, -1.0353546142578125, -1.003326416015625, -0.9712982177734375, -0.93927001953125, -0.9072418212890625, -0.875213623046875, -0.8431854248046875, -0.8111572265625, -0.7791290283203125, -0.747100830078125, -0.7150726318359375, -0.68304443359375, -0.6510162353515625, -0.618988037109375, -0.5869598388671875, -0.554931640625, -0.5229034423828125, -0.490875244140625, -0.4588470458984375, -0.42681884765625, -0.3947906494140625, -0.362762451171875, -0.3307342529296875, -0.2987060546875, -0.2666778564453125, -0.234649658203125, -0.2026214599609375, -0.17059326171875, -0.1385650634765625, -0.106536865234375, -0.0745086669921875, -0.04248046875, -0.0104522705078125, 0.021575927734375, 0.0536041259765625, 0.08563232421875, 0.1176605224609375, 0.149688720703125, 0.1817169189453125, 0.2137451171875, 0.2457733154296875, 0.277801513671875, 0.3098297119140625, 0.34185791015625, 0.3738861083984375, 0.405914306640625, 0.4379425048828125, 0.469970703125, 0.5019989013671875, 0.534027099609375, 0.5660552978515625, 0.59808349609375, 0.6301116943359375, 0.662139892578125, 0.6941680908203125, 0.7261962890625, 0.7582244873046875, 0.790252685546875, 0.8222808837890625, 0.85430908203125, 0.8863372802734375, 0.918365478515625, 0.9503936767578125, 0.982421875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 4.0, 8.0, 9.0, 14.0, 18.0, 31.0, 25.0, 51.0, 85.0, 125.0, 218.0, 368.0, 614.0, 755.0, 654.0, 429.0, 220.0, 147.0, 78.0, 59.0, 51.0, 30.0, 19.0, 11.0, 6.0, 9.0, 9.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1708984375, -0.1653118133544922, -0.15972518920898438, -0.15413856506347656, -0.14855194091796875, -0.14296531677246094, -0.13737869262695312, -0.1317920684814453, -0.1262054443359375, -0.12061882019042969, -0.11503219604492188, -0.10944557189941406, -0.10385894775390625, -0.09827232360839844, -0.09268569946289062, -0.08709907531738281, -0.081512451171875, -0.07592582702636719, -0.07033920288085938, -0.06475257873535156, -0.05916595458984375, -0.05357933044433594, -0.047992706298828125, -0.04240608215332031, -0.0368194580078125, -0.031232833862304688, -0.025646209716796875, -0.020059585571289062, -0.01447296142578125, -0.008886337280273438, -0.003299713134765625, 0.0022869110107421875, 0.00787353515625, 0.013460159301757812, 0.019046783447265625, 0.024633407592773438, 0.03022003173828125, 0.03580665588378906, 0.041393280029296875, 0.04697990417480469, 0.0525665283203125, 0.05815315246582031, 0.06373977661132812, 0.06932640075683594, 0.07491302490234375, 0.08049964904785156, 0.08608627319335938, 0.09167289733886719, 0.097259521484375, 0.10284614562988281, 0.10843276977539062, 0.11401939392089844, 0.11960601806640625, 0.12519264221191406, 0.13077926635742188, 0.1363658905029297, 0.1419525146484375, 0.1475391387939453, 0.15312576293945312, 0.15871238708496094, 0.16429901123046875, 0.16988563537597656, 0.17547225952148438, 0.1810588836669922, 0.1866455078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 5.0, 3.0, 3.0, 4.0, 6.0, 16.0, 13.0, 16.0, 23.0, 22.0, 34.0, 23.0, 26.0, 37.0, 42.0, 56.0, 47.0, 69.0, 41.0, 59.0, 62.0, 57.0, 51.0, 46.0, 42.0, 30.0, 28.0, 31.0, 26.0, 11.0, 17.0, 11.0, 6.0, 9.0, 3.0, 9.0, 1.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3081919848918915, -0.29761067032814026, -0.28702932596206665, -0.27644801139831543, -0.2658666670322418, -0.2552853524684906, -0.244704008102417, -0.23412269353866577, -0.22354134917259216, -0.21296001970767975, -0.20237869024276733, -0.19179736077785492, -0.1812160313129425, -0.1706347018480301, -0.16005337238311768, -0.14947205781936646, -0.13889072835445404, -0.12830939888954163, -0.11772806942462921, -0.1071467399597168, -0.09656541049480438, -0.08598408102989197, -0.07540275901556015, -0.06482142955064774, -0.05424010008573532, -0.043658770620822906, -0.03307744115591049, -0.022496115416288376, -0.011914785951375961, -0.0013334564864635468, 0.00924786925315857, 0.019829198718070984, 0.0304105281829834, 0.04099185764789581, 0.05157318711280823, 0.062154512852430344, 0.07273584604263306, 0.08331717550754547, 0.09389849752187729, 0.1044798269867897, 0.11506115645170212, 0.12564247846603394, 0.13622380793094635, 0.14680513739585876, 0.15738646686077118, 0.1679677963256836, 0.178549125790596, 0.18913045525550842, 0.19971178472042084, 0.21029311418533325, 0.22087444365024567, 0.23145577311515808, 0.2420371025800705, 0.2526184320449829, 0.26319974660873413, 0.27378109097480774, 0.28436240553855896, 0.2949437201023102, 0.3055250644683838, 0.316106379032135, 0.3266877233982086, 0.33726903796195984, 0.34785038232803345, 0.35843169689178467, 0.3690130412578583]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 16.0, 16.0, 13.0, 11.0, 20.0, 20.0, 22.0, 28.0, 36.0, 37.0, 32.0, 44.0, 40.0, 37.0, 32.0, 33.0, 48.0, 47.0, 42.0, 39.0, 34.0, 28.0, 43.0, 37.0, 25.0, 34.0, 24.0, 22.0, 25.0, 27.0, 14.0, 9.0, 17.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.34922969341278076, -0.3395542502403259, -0.3298787772655487, -0.32020333409309387, -0.31052789092063904, -0.3008524179458618, -0.291176974773407, -0.28150153160095215, -0.2718260884284973, -0.2621506452560425, -0.25247517228126526, -0.24279972910881042, -0.2331242859363556, -0.22344882786273956, -0.21377336978912354, -0.2040979266166687, -0.19442245364189148, -0.18474699556827545, -0.17507155239582062, -0.1653960943222046, -0.15572065114974976, -0.14604519307613373, -0.1363697350025177, -0.12669429183006287, -0.11701883375644684, -0.10734338313341141, -0.09766793251037598, -0.08799247443675995, -0.07831702381372452, -0.06864157319068909, -0.05896611884236336, -0.04929066449403763, -0.0396152138710022, -0.029939761385321617, -0.020264308899641037, -0.010588856413960457, -0.0009134039282798767, 0.008762046694755554, 0.018437501043081284, 0.028112955391407013, 0.037788406014442444, 0.047463856637477875, 0.057139310985803604, 0.06681476533412933, 0.07649021595716476, 0.0861656665802002, 0.09584112465381622, 0.10551657527685165, 0.11519202589988708, 0.12486747652292252, 0.13454292714595795, 0.14421838521957397, 0.1538938283920288, 0.16356928646564484, 0.17324474453926086, 0.1829201877117157, 0.19259564578533173, 0.20227110385894775, 0.2119465470314026, 0.22162200510501862, 0.23129746317863464, 0.24097290635108948, 0.2506483495235443, 0.26032382249832153, 0.26999926567077637]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 3.0, 11.0, 15.0, 22.0, 39.0, 45.0, 111.0, 170.0, 286.0, 566.0, 1082.0, 2261.0, 4893.0, 11670.0, 46057.0, 494701.0, 426095.0, 40603.0, 10923.0, 4539.0, 2170.0, 1032.0, 567.0, 282.0, 179.0, 89.0, 50.0, 29.0, 18.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1954345703125, -0.18912315368652344, -0.18281173706054688, -0.1765003204345703, -0.17018890380859375, -0.1638774871826172, -0.15756607055664062, -0.15125465393066406, -0.1449432373046875, -0.13863182067871094, -0.13232040405273438, -0.1260089874267578, -0.11969757080078125, -0.11338615417480469, -0.10707473754882812, -0.10076332092285156, -0.094451904296875, -0.08814048767089844, -0.08182907104492188, -0.07551765441894531, -0.06920623779296875, -0.06289482116699219, -0.056583404541015625, -0.05027198791503906, -0.0439605712890625, -0.03764915466308594, -0.031337738037109375, -0.025026321411132812, -0.01871490478515625, -0.012403488159179688, -0.006092071533203125, 0.0002193450927734375, 0.00653076171875, 0.012842178344726562, 0.019153594970703125, 0.025465011596679688, 0.03177642822265625, 0.03808784484863281, 0.044399261474609375, 0.05071067810058594, 0.0570220947265625, 0.06333351135253906, 0.06964492797851562, 0.07595634460449219, 0.08226776123046875, 0.08857917785644531, 0.09489059448242188, 0.10120201110839844, 0.107513427734375, 0.11382484436035156, 0.12013626098632812, 0.1264476776123047, 0.13275909423828125, 0.1390705108642578, 0.14538192749023438, 0.15169334411621094, 0.1580047607421875, 0.16431617736816406, 0.17062759399414062, 0.1769390106201172, 0.18325042724609375, 0.1895618438720703, 0.19587326049804688, 0.20218467712402344, 0.20849609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 4.0, 13.0, 8.0, 11.0, 9.0, 22.0, 20.0, 17.0, 45.0, 31.0, 32.0, 33.0, 45.0, 37.0, 46.0, 44.0, 41.0, 45.0, 49.0, 38.0, 32.0, 52.0, 41.0, 35.0, 29.0, 23.0, 30.0, 36.0, 20.0, 21.0, 18.0, 15.0, 7.0, 7.0, 9.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1912841796875, -0.1852264404296875, -0.179168701171875, -0.1731109619140625, -0.16705322265625, -0.1609954833984375, -0.154937744140625, -0.1488800048828125, -0.142822265625, -0.1367645263671875, -0.130706787109375, -0.1246490478515625, -0.11859130859375, -0.1125335693359375, -0.106475830078125, -0.1004180908203125, -0.0943603515625, -0.0883026123046875, -0.082244873046875, -0.0761871337890625, -0.07012939453125, -0.0640716552734375, -0.058013916015625, -0.0519561767578125, -0.0458984375, -0.0398406982421875, -0.033782958984375, -0.0277252197265625, -0.02166748046875, -0.0156097412109375, -0.009552001953125, -0.0034942626953125, 0.0025634765625, 0.0086212158203125, 0.014678955078125, 0.0207366943359375, 0.02679443359375, 0.0328521728515625, 0.038909912109375, 0.0449676513671875, 0.051025390625, 0.0570831298828125, 0.063140869140625, 0.0691986083984375, 0.07525634765625, 0.0813140869140625, 0.087371826171875, 0.0934295654296875, 0.0994873046875, 0.1055450439453125, 0.111602783203125, 0.1176605224609375, 0.12371826171875, 0.1297760009765625, 0.135833740234375, 0.1418914794921875, 0.14794921875, 0.1540069580078125, 0.160064697265625, 0.1661224365234375, 0.17218017578125, 0.1782379150390625, 0.184295654296875, 0.1903533935546875, 0.1964111328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 9.0, 17.0, 17.0, 18.0, 36.0, 48.0, 108.0, 178.0, 242.0, 389.0, 709.0, 1283.0, 2466.0, 5143.0, 11917.0, 36092.0, 144844.0, 463156.0, 280099.0, 67514.0, 19529.0, 7412.0, 3433.0, 1697.0, 852.0, 526.0, 314.0, 170.0, 115.0, 71.0, 48.0, 27.0, 20.0, 19.0, 10.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0872802734375, -0.08452987670898438, -0.08177947998046875, -0.07902908325195312, -0.0762786865234375, -0.07352828979492188, -0.07077789306640625, -0.06802749633789062, -0.065277099609375, -0.06252670288085938, -0.05977630615234375, -0.057025909423828125, -0.0542755126953125, -0.051525115966796875, -0.04877471923828125, -0.046024322509765625, -0.04327392578125, -0.040523529052734375, -0.03777313232421875, -0.035022735595703125, -0.0322723388671875, -0.029521942138671875, -0.02677154541015625, -0.024021148681640625, -0.021270751953125, -0.018520355224609375, -0.01576995849609375, -0.013019561767578125, -0.0102691650390625, -0.007518768310546875, -0.00476837158203125, -0.002017974853515625, 0.000732421875, 0.003482818603515625, 0.00623321533203125, 0.008983612060546875, 0.0117340087890625, 0.014484405517578125, 0.01723480224609375, 0.019985198974609375, 0.022735595703125, 0.025485992431640625, 0.02823638916015625, 0.030986785888671875, 0.0337371826171875, 0.036487579345703125, 0.03923797607421875, 0.041988372802734375, 0.04473876953125, 0.047489166259765625, 0.05023956298828125, 0.052989959716796875, 0.0557403564453125, 0.058490753173828125, 0.06124114990234375, 0.06399154663085938, 0.066741943359375, 0.06949234008789062, 0.07224273681640625, 0.07499313354492188, 0.0777435302734375, 0.08049392700195312, 0.08324432373046875, 0.08599472045898438, 0.0887451171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 9.0, 3.0, 13.0, 9.0, 17.0, 11.0, 21.0, 24.0, 29.0, 25.0, 41.0, 35.0, 28.0, 54.0, 42.0, 39.0, 38.0, 51.0, 45.0, 48.0, 38.0, 50.0, 45.0, 31.0, 33.0, 30.0, 28.0, 25.0, 13.0, 25.0, 20.0, 9.0, 14.0, 12.0, 10.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.39990234375, -0.387969970703125, -0.37603759765625, -0.364105224609375, -0.3521728515625, -0.340240478515625, -0.32830810546875, -0.316375732421875, -0.304443359375, -0.292510986328125, -0.28057861328125, -0.268646240234375, -0.2567138671875, -0.244781494140625, -0.23284912109375, -0.220916748046875, -0.208984375, -0.197052001953125, -0.18511962890625, -0.173187255859375, -0.1612548828125, -0.149322509765625, -0.13739013671875, -0.125457763671875, -0.113525390625, -0.101593017578125, -0.08966064453125, -0.077728271484375, -0.0657958984375, -0.053863525390625, -0.04193115234375, -0.029998779296875, -0.01806640625, -0.006134033203125, 0.00579833984375, 0.017730712890625, 0.0296630859375, 0.041595458984375, 0.05352783203125, 0.065460205078125, 0.077392578125, 0.089324951171875, 0.10125732421875, 0.113189697265625, 0.1251220703125, 0.137054443359375, 0.14898681640625, 0.160919189453125, 0.1728515625, 0.184783935546875, 0.19671630859375, 0.208648681640625, 0.2205810546875, 0.232513427734375, 0.24444580078125, 0.256378173828125, 0.268310546875, 0.280242919921875, 0.29217529296875, 0.304107666015625, 0.3160400390625, 0.327972412109375, 0.33990478515625, 0.351837158203125, 0.36376953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 6.0, 15.0, 13.0, 28.0, 43.0, 59.0, 118.0, 199.0, 362.0, 696.0, 1450.0, 3438.0, 9486.0, 33031.0, 166531.0, 542348.0, 228352.0, 43471.0, 11487.0, 3983.0, 1646.0, 786.0, 420.0, 234.0, 129.0, 79.0, 53.0, 29.0, 14.0, 12.0, 7.0, 6.0, 3.0, 2.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03350830078125, -0.03248023986816406, -0.031452178955078125, -0.030424118041992188, -0.02939605712890625, -0.028367996215820312, -0.027339935302734375, -0.026311874389648438, -0.0252838134765625, -0.024255752563476562, -0.023227691650390625, -0.022199630737304688, -0.02117156982421875, -0.020143508911132812, -0.019115447998046875, -0.018087387084960938, -0.017059326171875, -0.016031265258789062, -0.015003204345703125, -0.013975143432617188, -0.01294708251953125, -0.011919021606445312, -0.010890960693359375, -0.009862899780273438, -0.0088348388671875, -0.0078067779541015625, -0.006778717041015625, -0.0057506561279296875, -0.00472259521484375, -0.0036945343017578125, -0.002666473388671875, -0.0016384124755859375, -0.0006103515625, 0.0004177093505859375, 0.001445770263671875, 0.0024738311767578125, 0.00350189208984375, 0.0045299530029296875, 0.005558013916015625, 0.0065860748291015625, 0.0076141357421875, 0.008642196655273438, 0.009670257568359375, 0.010698318481445312, 0.01172637939453125, 0.012754440307617188, 0.013782501220703125, 0.014810562133789062, 0.015838623046875, 0.016866683959960938, 0.017894744873046875, 0.018922805786132812, 0.01995086669921875, 0.020978927612304688, 0.022006988525390625, 0.023035049438476562, 0.0240631103515625, 0.025091171264648438, 0.026119232177734375, 0.027147293090820312, 0.02817535400390625, 0.029203414916992188, 0.030231475830078125, 0.03125953674316406, 0.03228759765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 6.0, 8.0, 7.0, 9.0, 15.0, 33.0, 30.0, 38.0, 60.0, 91.0, 78.0, 86.0, 111.0, 85.0, 85.0, 54.0, 63.0, 36.0, 28.0, 24.0, 13.0, 7.0, 8.0, 8.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.424551010131836e-05, -1.368299126625061e-05, -1.3120472431182861e-05, -1.2557953596115112e-05, -1.1995434761047363e-05, -1.1432915925979614e-05, -1.0870397090911865e-05, -1.0307878255844116e-05, -9.745359420776367e-06, -9.182840585708618e-06, -8.620321750640869e-06, -8.05780291557312e-06, -7.495284080505371e-06, -6.932765245437622e-06, -6.370246410369873e-06, -5.807727575302124e-06, -5.245208740234375e-06, -4.682689905166626e-06, -4.120171070098877e-06, -3.557652235031128e-06, -2.995133399963379e-06, -2.43261456489563e-06, -1.8700957298278809e-06, -1.3075768947601318e-06, -7.450580596923828e-07, -1.825392246246338e-07, 3.7997961044311523e-07, 9.424984455108643e-07, 1.5050172805786133e-06, 2.0675361156463623e-06, 2.6300549507141113e-06, 3.1925737857818604e-06, 3.7550926208496094e-06, 4.317611455917358e-06, 4.880130290985107e-06, 5.4426491260528564e-06, 6.0051679611206055e-06, 6.5676867961883545e-06, 7.1302056312561035e-06, 7.692724466323853e-06, 8.255243301391602e-06, 8.81776213645935e-06, 9.3802809715271e-06, 9.942799806594849e-06, 1.0505318641662598e-05, 1.1067837476730347e-05, 1.1630356311798096e-05, 1.2192875146865845e-05, 1.2755393981933594e-05, 1.3317912817001343e-05, 1.3880431652069092e-05, 1.444295048713684e-05, 1.500546932220459e-05, 1.556798815727234e-05, 1.6130506992340088e-05, 1.6693025827407837e-05, 1.7255544662475586e-05, 1.7818063497543335e-05, 1.8380582332611084e-05, 1.8943101167678833e-05, 1.9505620002746582e-05, 2.006813883781433e-05, 2.063065767288208e-05, 2.119317650794983e-05, 2.1755695343017578e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 7.0, 3.0, 6.0, 14.0, 10.0, 22.0, 27.0, 26.0, 49.0, 68.0, 108.0, 162.0, 295.0, 571.0, 1033.0, 2029.0, 4287.0, 10237.0, 28266.0, 97623.0, 357638.0, 385061.0, 109319.0, 31305.0, 11049.0, 4718.0, 2122.0, 1041.0, 596.0, 327.0, 193.0, 118.0, 70.0, 44.0, 26.0, 18.0, 17.0, 12.0, 9.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0316162109375, -0.030563831329345703, -0.029511451721191406, -0.02845907211303711, -0.027406692504882812, -0.026354312896728516, -0.02530193328857422, -0.024249553680419922, -0.023197174072265625, -0.022144794464111328, -0.02109241485595703, -0.020040035247802734, -0.018987655639648438, -0.01793527603149414, -0.016882896423339844, -0.015830516815185547, -0.01477813720703125, -0.013725757598876953, -0.012673377990722656, -0.01162099838256836, -0.010568618774414062, -0.009516239166259766, -0.008463859558105469, -0.007411479949951172, -0.006359100341796875, -0.005306720733642578, -0.004254341125488281, -0.0032019615173339844, -0.0021495819091796875, -0.0010972023010253906, -4.482269287109375e-05, 0.0010075569152832031, 0.0020599365234375, 0.003112316131591797, 0.004164695739746094, 0.005217075347900391, 0.0062694549560546875, 0.007321834564208984, 0.008374214172363281, 0.009426593780517578, 0.010478973388671875, 0.011531352996826172, 0.012583732604980469, 0.013636112213134766, 0.014688491821289062, 0.01574087142944336, 0.016793251037597656, 0.017845630645751953, 0.01889801025390625, 0.019950389862060547, 0.021002769470214844, 0.02205514907836914, 0.023107528686523438, 0.024159908294677734, 0.02521228790283203, 0.026264667510986328, 0.027317047119140625, 0.028369426727294922, 0.02942180633544922, 0.030474185943603516, 0.03152656555175781, 0.03257894515991211, 0.033631324768066406, 0.0346837043762207, 0.035736083984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 7.0, 10.0, 9.0, 18.0, 17.0, 26.0, 31.0, 53.0, 54.0, 61.0, 80.0, 68.0, 93.0, 79.0, 89.0, 51.0, 48.0, 39.0, 23.0, 28.0, 16.0, 18.0, 16.0, 6.0, 8.0, 6.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.008270263671875, -0.00800621509552002, -0.007742166519165039, -0.007478117942810059, -0.007214069366455078, -0.006950020790100098, -0.006685972213745117, -0.006421923637390137, -0.006157875061035156, -0.005893826484680176, -0.005629777908325195, -0.005365729331970215, -0.005101680755615234, -0.004837632179260254, -0.0045735836029052734, -0.004309535026550293, -0.0040454864501953125, -0.003781437873840332, -0.0035173892974853516, -0.003253340721130371, -0.0029892921447753906, -0.00272524356842041, -0.0024611949920654297, -0.0021971464157104492, -0.0019330978393554688, -0.0016690492630004883, -0.0014050006866455078, -0.0011409521102905273, -0.0008769035339355469, -0.0006128549575805664, -0.00034880638122558594, -8.475780487060547e-05, 0.000179290771484375, 0.00044333934783935547, 0.0007073879241943359, 0.0009714365005493164, 0.0012354850769042969, 0.0014995336532592773, 0.0017635822296142578, 0.0020276308059692383, 0.0022916793823242188, 0.0025557279586791992, 0.0028197765350341797, 0.00308382511138916, 0.0033478736877441406, 0.003611922264099121, 0.0038759708404541016, 0.004140019416809082, 0.0044040679931640625, 0.004668116569519043, 0.0049321651458740234, 0.005196213722229004, 0.005460262298583984, 0.005724310874938965, 0.005988359451293945, 0.006252408027648926, 0.006516456604003906, 0.006780505180358887, 0.007044553756713867, 0.007308602333068848, 0.007572650909423828, 0.007836699485778809, 0.008100748062133789, 0.00836479663848877, 0.00862884521484375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 11.0, 8.0, 18.0, 12.0, 21.0, 33.0, 32.0, 46.0, 57.0, 60.0, 60.0, 73.0, 65.0, 69.0, 71.0, 69.0, 56.0, 47.0, 37.0, 29.0, 23.0, 32.0, 14.0, 12.0, 13.0, 5.0, 4.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.26439544558525085, -0.25705698132514954, -0.2497185468673706, -0.2423800826072693, -0.23504163324832916, -0.22770318388938904, -0.22036471962928772, -0.2130262702703476, -0.20568782091140747, -0.19834937155246735, -0.19101092219352722, -0.1836724579334259, -0.17633400857448578, -0.16899555921554565, -0.16165709495544434, -0.1543186455965042, -0.1469801962375641, -0.13964174687862396, -0.13230329751968384, -0.12496483325958252, -0.1176263839006424, -0.11028793454170227, -0.10294947773218155, -0.09561102092266083, -0.0882725715637207, -0.08093412220478058, -0.07359566539525986, -0.06625720858573914, -0.05891875922679901, -0.05158030614256859, -0.044241853058338165, -0.03690339997410774, -0.029564961791038513, -0.02222650870680809, -0.014888055622577667, -0.007549602538347244, -0.0002111494541168213, 0.007127303630113602, 0.014465756714344025, 0.021804209798574448, 0.02914266288280487, 0.036481115967035294, 0.04381956905126572, 0.05115802213549614, 0.05849647521972656, 0.06583492457866669, 0.07317338138818741, 0.08051183819770813, 0.08785028755664825, 0.09518873691558838, 0.1025271937251091, 0.10986565053462982, 0.11720409989356995, 0.12454254925251007, 0.1318809986114502, 0.1392194628715515, 0.14655791223049164, 0.15389636158943176, 0.16123482584953308, 0.1685732752084732, 0.17591172456741333, 0.18325017392635345, 0.19058862328529358, 0.1979270875453949, 0.20526553690433502]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 0.0, 5.0, 5.0, 6.0, 10.0, 12.0, 9.0, 12.0, 19.0, 19.0, 19.0, 31.0, 23.0, 42.0, 40.0, 48.0, 32.0, 41.0, 28.0, 47.0, 46.0, 55.0, 45.0, 37.0, 34.0, 36.0, 40.0, 31.0, 27.0, 30.0, 32.0, 27.0, 17.0, 24.0, 20.0, 8.0, 14.0, 8.0, 6.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1884523332118988, -0.18275634944438934, -0.17706038057804108, -0.17136439681053162, -0.16566841304302216, -0.1599724441766739, -0.15427646040916443, -0.14858049154281616, -0.1428845077753067, -0.13718852400779724, -0.13149255514144897, -0.12579657137393951, -0.12010059505701065, -0.11440461874008179, -0.10870863497257233, -0.10301265865564346, -0.097316674888134, -0.09162069857120514, -0.08592471480369568, -0.08022873848676682, -0.07453276216983795, -0.06883677840232849, -0.06314080208539963, -0.057444825768470764, -0.0517488457262516, -0.04605286568403244, -0.04035688936710358, -0.034660909324884415, -0.028964931145310402, -0.02326895296573639, -0.017572972923517227, -0.011876996606588364, -0.006181016564369202, -0.0004850379191339016, 0.0052109407261013985, 0.010906919836997986, 0.016602898016572, 0.02229887619614601, 0.027994856238365173, 0.03369083255529404, 0.0393868125975132, 0.04508279263973236, 0.050778768956661224, 0.056474748998880386, 0.06217072904109955, 0.06786670535802841, 0.07356268167495728, 0.07925866544246674, 0.0849546417593956, 0.09065061807632446, 0.09634660184383392, 0.10204257816076279, 0.10773855447769165, 0.11343453824520111, 0.11913051456212997, 0.12482649087905884, 0.1305224746465683, 0.13621845841407776, 0.14191442728042603, 0.14761041104793549, 0.15330639481544495, 0.1590023636817932, 0.16469834744930267, 0.17039433121681213, 0.1760903000831604]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 12.0, 11.0, 23.0, 38.0, 68.0, 78.0, 145.0, 276.0, 595.0, 1241.0, 2979.0, 7678.0, 21775.0, 75310.0, 478366.0, 368030.0, 61636.0, 18532.0, 6828.0, 2634.0, 1156.0, 488.0, 283.0, 161.0, 87.0, 38.0, 30.0, 12.0, 14.0, 11.0, 6.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.37255859375, -0.3601112365722656, -0.34766387939453125, -0.3352165222167969, -0.3227691650390625, -0.3103218078613281, -0.29787445068359375, -0.2854270935058594, -0.272979736328125, -0.2605323791503906, -0.24808502197265625, -0.23563766479492188, -0.2231903076171875, -0.21074295043945312, -0.19829559326171875, -0.18584823608398438, -0.17340087890625, -0.16095352172851562, -0.14850616455078125, -0.13605880737304688, -0.1236114501953125, -0.11116409301757812, -0.09871673583984375, -0.08626937866210938, -0.073822021484375, -0.061374664306640625, -0.04892730712890625, -0.036479949951171875, -0.0240325927734375, -0.011585235595703125, 0.00086212158203125, 0.013309478759765625, 0.0257568359375, 0.038204193115234375, 0.05065155029296875, 0.06309890747070312, 0.0755462646484375, 0.08799362182617188, 0.10044097900390625, 0.11288833618164062, 0.125335693359375, 0.13778305053710938, 0.15023040771484375, 0.16267776489257812, 0.1751251220703125, 0.18757247924804688, 0.20001983642578125, 0.21246719360351562, 0.22491455078125, 0.23736190795898438, 0.24980926513671875, 0.2622566223144531, 0.2747039794921875, 0.2871513366699219, 0.29959869384765625, 0.3120460510253906, 0.324493408203125, 0.3369407653808594, 0.34938812255859375, 0.3618354797363281, 0.3742828369140625, 0.3867301940917969, 0.39917755126953125, 0.4116249084472656, 0.424072265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 3.0, 4.0, 7.0, 8.0, 9.0, 11.0, 11.0, 17.0, 15.0, 20.0, 30.0, 23.0, 28.0, 21.0, 30.0, 39.0, 42.0, 38.0, 49.0, 53.0, 44.0, 39.0, 37.0, 50.0, 28.0, 35.0, 37.0, 34.0, 41.0, 27.0, 23.0, 25.0, 16.0, 19.0, 19.0, 7.0, 13.0, 10.0, 10.0, 7.0, 9.0, 4.0, 2.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.405517578125, -0.39430999755859375, -0.3831024169921875, -0.37189483642578125, -0.360687255859375, -0.34947967529296875, -0.3382720947265625, -0.32706451416015625, -0.31585693359375, -0.30464935302734375, -0.2934417724609375, -0.28223419189453125, -0.271026611328125, -0.25981903076171875, -0.2486114501953125, -0.23740386962890625, -0.2261962890625, -0.21498870849609375, -0.2037811279296875, -0.19257354736328125, -0.181365966796875, -0.17015838623046875, -0.1589508056640625, -0.14774322509765625, -0.13653564453125, -0.12532806396484375, -0.1141204833984375, -0.10291290283203125, -0.091705322265625, -0.08049774169921875, -0.0692901611328125, -0.05808258056640625, -0.046875, -0.03566741943359375, -0.0244598388671875, -0.01325225830078125, -0.002044677734375, 0.00916290283203125, 0.0203704833984375, 0.03157806396484375, 0.04278564453125, 0.05399322509765625, 0.0652008056640625, 0.07640838623046875, 0.087615966796875, 0.09882354736328125, 0.1100311279296875, 0.12123870849609375, 0.1324462890625, 0.14365386962890625, 0.1548614501953125, 0.16606903076171875, 0.177276611328125, 0.18848419189453125, 0.1996917724609375, 0.21089935302734375, 0.22210693359375, 0.23331451416015625, 0.2445220947265625, 0.25572967529296875, 0.266937255859375, 0.27814483642578125, 0.2893524169921875, 0.30055999755859375, 0.311767578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 2.0, 6.0, 5.0, 4.0, 7.0, 10.0, 15.0, 20.0, 34.0, 46.0, 39.0, 66.0, 106.0, 171.0, 406.0, 813.0, 2220.0, 7198.0, 30664.0, 264768.0, 662741.0, 60834.0, 12566.0, 3496.0, 1136.0, 499.0, 230.0, 143.0, 80.0, 55.0, 44.0, 33.0, 18.0, 21.0, 10.0, 8.0, 10.0, 5.0, 6.0, 3.0, 6.0, 5.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.495361328125, -0.4799766540527344, -0.46459197998046875, -0.4492073059082031, -0.4338226318359375, -0.4184379577636719, -0.40305328369140625, -0.3876686096191406, -0.372283935546875, -0.3568992614746094, -0.34151458740234375, -0.3261299133300781, -0.3107452392578125, -0.2953605651855469, -0.27997589111328125, -0.2645912170410156, -0.24920654296875, -0.23382186889648438, -0.21843719482421875, -0.20305252075195312, -0.1876678466796875, -0.17228317260742188, -0.15689849853515625, -0.14151382446289062, -0.126129150390625, -0.11074447631835938, -0.09535980224609375, -0.07997512817382812, -0.0645904541015625, -0.049205780029296875, -0.03382110595703125, -0.018436431884765625, -0.0030517578125, 0.012332916259765625, 0.02771759033203125, 0.043102264404296875, 0.0584869384765625, 0.07387161254882812, 0.08925628662109375, 0.10464096069335938, 0.120025634765625, 0.13541030883789062, 0.15079498291015625, 0.16617965698242188, 0.1815643310546875, 0.19694900512695312, 0.21233367919921875, 0.22771835327148438, 0.24310302734375, 0.2584877014160156, 0.27387237548828125, 0.2892570495605469, 0.3046417236328125, 0.3200263977050781, 0.33541107177734375, 0.3507957458496094, 0.366180419921875, 0.3815650939941406, 0.39694976806640625, 0.4123344421386719, 0.4277191162109375, 0.4431037902832031, 0.45848846435546875, 0.4738731384277344, 0.4892578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 9.0, 7.0, 15.0, 11.0, 16.0, 11.0, 15.0, 14.0, 20.0, 28.0, 25.0, 30.0, 34.0, 44.0, 33.0, 45.0, 34.0, 44.0, 47.0, 59.0, 44.0, 39.0, 48.0, 54.0, 37.0, 40.0, 30.0, 28.0, 27.0, 18.0, 12.0, 20.0, 13.0, 14.0, 8.0, 5.0, 6.0, 3.0, 3.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33251953125, -0.3195762634277344, -0.30663299560546875, -0.2936897277832031, -0.2807464599609375, -0.2678031921386719, -0.25485992431640625, -0.24191665649414062, -0.228973388671875, -0.21603012084960938, -0.20308685302734375, -0.19014358520507812, -0.1772003173828125, -0.16425704956054688, -0.15131378173828125, -0.13837051391601562, -0.12542724609375, -0.11248397827148438, -0.09954071044921875, -0.08659744262695312, -0.0736541748046875, -0.060710906982421875, -0.04776763916015625, -0.034824371337890625, -0.021881103515625, -0.008937835693359375, 0.00400543212890625, 0.016948699951171875, 0.0298919677734375, 0.042835235595703125, 0.05577850341796875, 0.06872177124023438, 0.0816650390625, 0.09460830688476562, 0.10755157470703125, 0.12049484252929688, 0.1334381103515625, 0.14638137817382812, 0.15932464599609375, 0.17226791381835938, 0.185211181640625, 0.19815444946289062, 0.21109771728515625, 0.22404098510742188, 0.2369842529296875, 0.24992752075195312, 0.26287078857421875, 0.2758140563964844, 0.28875732421875, 0.3017005920410156, 0.31464385986328125, 0.3275871276855469, 0.3405303955078125, 0.3534736633300781, 0.36641693115234375, 0.3793601989746094, 0.392303466796875, 0.4052467346191406, 0.41819000244140625, 0.4311332702636719, 0.4440765380859375, 0.4570198059082031, 0.46996307373046875, 0.4829063415527344, 0.495849609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 8.0, 3.0, 5.0, 7.0, 8.0, 11.0, 29.0, 34.0, 73.0, 128.0, 265.0, 574.0, 1732.0, 7310.0, 61695.0, 771117.0, 186317.0, 14688.0, 2844.0, 911.0, 372.0, 170.0, 89.0, 50.0, 33.0, 28.0, 14.0, 5.0, 10.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1512451171875, -0.1471233367919922, -0.14300155639648438, -0.13887977600097656, -0.13475799560546875, -0.13063621520996094, -0.12651443481445312, -0.12239265441894531, -0.1182708740234375, -0.11414909362792969, -0.11002731323242188, -0.10590553283691406, -0.10178375244140625, -0.09766197204589844, -0.09354019165039062, -0.08941841125488281, -0.085296630859375, -0.08117485046386719, -0.07705307006835938, -0.07293128967285156, -0.06880950927734375, -0.06468772888183594, -0.060565948486328125, -0.05644416809082031, -0.0523223876953125, -0.04820060729980469, -0.044078826904296875, -0.03995704650878906, -0.03583526611328125, -0.03171348571777344, -0.027591705322265625, -0.023469924926757812, -0.01934814453125, -0.015226364135742188, -0.011104583740234375, -0.0069828033447265625, -0.00286102294921875, 0.0012607574462890625, 0.005382537841796875, 0.009504318237304688, 0.0136260986328125, 0.017747879028320312, 0.021869659423828125, 0.025991439819335938, 0.03011322021484375, 0.03423500061035156, 0.038356781005859375, 0.04247856140136719, 0.046600341796875, 0.05072212219238281, 0.054843902587890625, 0.05896568298339844, 0.06308746337890625, 0.06720924377441406, 0.07133102416992188, 0.07545280456542969, 0.0795745849609375, 0.08369636535644531, 0.08781814575195312, 0.09193992614746094, 0.09606170654296875, 0.10018348693847656, 0.10430526733398438, 0.10842704772949219, 0.112548828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 3.0, 9.0, 13.0, 16.0, 29.0, 34.0, 34.0, 57.0, 83.0, 91.0, 154.0, 133.0, 89.0, 76.0, 64.0, 30.0, 26.0, 16.0, 12.0, 6.0, 3.0, 3.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.09808349609375e-05, -2.043880522251129e-05, -1.9896775484085083e-05, -1.9354745745658875e-05, -1.8812716007232666e-05, -1.8270686268806458e-05, -1.772865653038025e-05, -1.718662679195404e-05, -1.6644597053527832e-05, -1.6102567315101624e-05, -1.5560537576675415e-05, -1.5018507838249207e-05, -1.4476478099822998e-05, -1.393444836139679e-05, -1.3392418622970581e-05, -1.2850388884544373e-05, -1.2308359146118164e-05, -1.1766329407691956e-05, -1.1224299669265747e-05, -1.0682269930839539e-05, -1.014024019241333e-05, -9.598210453987122e-06, -9.056180715560913e-06, -8.514150977134705e-06, -7.972121238708496e-06, -7.430091500282288e-06, -6.888061761856079e-06, -6.346032023429871e-06, -5.804002285003662e-06, -5.261972546577454e-06, -4.719942808151245e-06, -4.177913069725037e-06, -3.635883331298828e-06, -3.0938535928726196e-06, -2.551823854446411e-06, -2.0097941160202026e-06, -1.4677643775939941e-06, -9.257346391677856e-07, -3.8370490074157715e-07, 1.5832483768463135e-07, 7.003545761108398e-07, 1.2423843145370483e-06, 1.7844140529632568e-06, 2.3264437913894653e-06, 2.868473529815674e-06, 3.4105032682418823e-06, 3.952533006668091e-06, 4.494562745094299e-06, 5.036592483520508e-06, 5.578622221946716e-06, 6.120651960372925e-06, 6.662681698799133e-06, 7.204711437225342e-06, 7.74674117565155e-06, 8.288770914077759e-06, 8.830800652503967e-06, 9.372830390930176e-06, 9.914860129356384e-06, 1.0456889867782593e-05, 1.0998919606208801e-05, 1.154094934463501e-05, 1.2082979083061218e-05, 1.2625008821487427e-05, 1.3167038559913635e-05, 1.3709068298339844e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 10.0, 4.0, 5.0, 19.0, 38.0, 60.0, 82.0, 117.0, 198.0, 347.0, 544.0, 1060.0, 2201.0, 5792.0, 22872.0, 191742.0, 713037.0, 88756.0, 13717.0, 4104.0, 1711.0, 916.0, 487.0, 286.0, 176.0, 96.0, 51.0, 46.0, 23.0, 18.0, 10.0, 7.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.153564453125, -0.1493387222290039, -0.1451129913330078, -0.14088726043701172, -0.13666152954101562, -0.13243579864501953, -0.12821006774902344, -0.12398433685302734, -0.11975860595703125, -0.11553287506103516, -0.11130714416503906, -0.10708141326904297, -0.10285568237304688, -0.09862995147705078, -0.09440422058105469, -0.0901784896850586, -0.0859527587890625, -0.0817270278930664, -0.07750129699707031, -0.07327556610107422, -0.06904983520507812, -0.06482410430908203, -0.06059837341308594, -0.056372642517089844, -0.05214691162109375, -0.047921180725097656, -0.04369544982910156, -0.03946971893310547, -0.035243988037109375, -0.03101825714111328, -0.026792526245117188, -0.022566795349121094, -0.018341064453125, -0.014115333557128906, -0.009889602661132812, -0.005663871765136719, -0.001438140869140625, 0.0027875900268554688, 0.0070133209228515625, 0.011239051818847656, 0.01546478271484375, 0.019690513610839844, 0.023916244506835938, 0.02814197540283203, 0.032367706298828125, 0.03659343719482422, 0.04081916809082031, 0.045044898986816406, 0.0492706298828125, 0.053496360778808594, 0.05772209167480469, 0.06194782257080078, 0.06617355346679688, 0.07039928436279297, 0.07462501525878906, 0.07885074615478516, 0.08307647705078125, 0.08730220794677734, 0.09152793884277344, 0.09575366973876953, 0.09997940063476562, 0.10420513153076172, 0.10843086242675781, 0.1126565933227539, 0.11688232421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 15.0, 16.0, 21.0, 19.0, 32.0, 31.0, 42.0, 68.0, 80.0, 110.0, 119.0, 111.0, 66.0, 56.0, 56.0, 26.0, 28.0, 25.0, 12.0, 15.0, 8.0, 6.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0457763671875, -0.044361114501953125, -0.04294586181640625, -0.041530609130859375, -0.0401153564453125, -0.038700103759765625, -0.03728485107421875, -0.035869598388671875, -0.034454345703125, -0.033039093017578125, -0.03162384033203125, -0.030208587646484375, -0.0287933349609375, -0.027378082275390625, -0.02596282958984375, -0.024547576904296875, -0.02313232421875, -0.021717071533203125, -0.02030181884765625, -0.018886566162109375, -0.0174713134765625, -0.016056060791015625, -0.01464080810546875, -0.013225555419921875, -0.011810302734375, -0.010395050048828125, -0.00897979736328125, -0.007564544677734375, -0.0061492919921875, -0.004734039306640625, -0.00331878662109375, -0.001903533935546875, -0.00048828125, 0.000926971435546875, 0.00234222412109375, 0.003757476806640625, 0.0051727294921875, 0.006587982177734375, 0.00800323486328125, 0.009418487548828125, 0.010833740234375, 0.012248992919921875, 0.01366424560546875, 0.015079498291015625, 0.0164947509765625, 0.017910003662109375, 0.01932525634765625, 0.020740509033203125, 0.02215576171875, 0.023571014404296875, 0.02498626708984375, 0.026401519775390625, 0.0278167724609375, 0.029232025146484375, 0.03064727783203125, 0.032062530517578125, 0.033477783203125, 0.034893035888671875, 0.03630828857421875, 0.037723541259765625, 0.0391387939453125, 0.040554046630859375, 0.04196929931640625, 0.043384552001953125, 0.0447998046875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 9.0, 22.0, 35.0, 65.0, 93.0, 136.0, 131.0, 145.0, 132.0, 89.0, 53.0, 44.0, 28.0, 9.0, 8.0, 2.0, 5.0, 1.0, 2.0], "bins": [-1.6661275625228882, -1.6341406106948853, -1.6021536588668823, -1.5701667070388794, -1.5381797552108765, -1.5061928033828735, -1.4742058515548706, -1.4422187805175781, -1.4102318286895752, -1.3782448768615723, -1.3462579250335693, -1.3142709732055664, -1.2822840213775635, -1.2502970695495605, -1.2183101177215576, -1.1863231658935547, -1.1543362140655518, -1.1223492622375488, -1.090362310409546, -1.058375358581543, -1.02638840675354, -0.9944014549255371, -0.9624144434928894, -0.9304274916648865, -0.8984405398368835, -0.8664535880088806, -0.8344666361808777, -0.8024796843528748, -0.770492672920227, -0.7385057210922241, -0.7065187692642212, -0.6745318174362183, -0.6425447463989258, -0.6105577945709229, -0.5785708427429199, -0.546583890914917, -0.5145969390869141, -0.48260995745658875, -0.4506229758262634, -0.4186360239982605, -0.38664907217025757, -0.35466212034225464, -0.3226751685142517, -0.2906881868839264, -0.25870123505592346, -0.22671428322792053, -0.1947273164987564, -0.16274034976959229, -0.13075339794158936, -0.09876643866300583, -0.0667794793844223, -0.034792520105838776, -0.002805560827255249, 0.02918139100074768, 0.061168357729911804, 0.09315532445907593, 0.12514227628707886, 0.1571292281150818, 0.1891161948442459, 0.22110316157341003, 0.25309011340141296, 0.2850770652294159, 0.3170640468597412, 0.34905099868774414, 0.38103795051574707]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 3.0, 5.0, 4.0, 10.0, 10.0, 15.0, 17.0, 18.0, 23.0, 23.0, 25.0, 19.0, 44.0, 38.0, 31.0, 26.0, 24.0, 37.0, 52.0, 26.0, 52.0, 37.0, 37.0, 33.0, 41.0, 35.0, 32.0, 28.0, 33.0, 20.0, 26.0, 28.0, 22.0, 18.0, 23.0, 16.0, 12.0, 18.0, 8.0, 7.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5250296592712402, -0.506401777267456, -0.48777392506599426, -0.46914607286453247, -0.4505181908607483, -0.4318903088569641, -0.4132624566555023, -0.3946346044540405, -0.37600672245025635, -0.35737884044647217, -0.3387509882450104, -0.3201231360435486, -0.3014952540397644, -0.2828673720359802, -0.26423951983451843, -0.24561165273189545, -0.22698378562927246, -0.20835591852664948, -0.1897280514240265, -0.1711001843214035, -0.15247231721878052, -0.13384445011615753, -0.11521658301353455, -0.09658871591091156, -0.07796084880828857, -0.05933298170566559, -0.0407051146030426, -0.022077247500419617, -0.003449380397796631, 0.015178486704826355, 0.03380635380744934, 0.05243422091007233, 0.07106208801269531, 0.0896899551153183, 0.10831782221794128, 0.12694568932056427, 0.14557355642318726, 0.16420142352581024, 0.18282929062843323, 0.2014571577310562, 0.2200850248336792, 0.23871289193630219, 0.25734075903892517, 0.27596861124038696, 0.29459649324417114, 0.3132243752479553, 0.3318522274494171, 0.3504800796508789, 0.3691079616546631, 0.38773584365844727, 0.40636369585990906, 0.42499154806137085, 0.44361943006515503, 0.4622473120689392, 0.480875164270401, 0.4995030164718628, 0.518130898475647, 0.5367587804794312, 0.5553866624832153, 0.5740144848823547, 0.5926423668861389, 0.6112702488899231, 0.6298980712890625, 0.6485259532928467, 0.6671538352966309]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 9.0, 4.0, 8.0, 26.0, 29.0, 32.0, 36.0, 78.0, 185.0, 287.0, 669.0, 1367.0, 3007.0, 8027.0, 33514.0, 824762.0, 3172936.0, 125468.0, 14961.0, 4919.0, 1973.0, 963.0, 464.0, 220.0, 116.0, 58.0, 51.0, 42.0, 16.0, 16.0, 12.0, 10.0, 7.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.66650390625, -0.6470489501953125, -0.627593994140625, -0.6081390380859375, -0.58868408203125, -0.5692291259765625, -0.549774169921875, -0.5303192138671875, -0.5108642578125, -0.4914093017578125, -0.471954345703125, -0.4524993896484375, -0.43304443359375, -0.4135894775390625, -0.394134521484375, -0.3746795654296875, -0.355224609375, -0.3357696533203125, -0.316314697265625, -0.2968597412109375, -0.27740478515625, -0.2579498291015625, -0.238494873046875, -0.2190399169921875, -0.1995849609375, -0.1801300048828125, -0.160675048828125, -0.1412200927734375, -0.12176513671875, -0.1023101806640625, -0.082855224609375, -0.0634002685546875, -0.0439453125, -0.0244903564453125, -0.005035400390625, 0.0144195556640625, 0.03387451171875, 0.0533294677734375, 0.072784423828125, 0.0922393798828125, 0.1116943359375, 0.1311492919921875, 0.150604248046875, 0.1700592041015625, 0.18951416015625, 0.2089691162109375, 0.228424072265625, 0.2478790283203125, 0.267333984375, 0.2867889404296875, 0.306243896484375, 0.3256988525390625, 0.34515380859375, 0.3646087646484375, 0.384063720703125, 0.4035186767578125, 0.4229736328125, 0.4424285888671875, 0.461883544921875, 0.4813385009765625, 0.50079345703125, 0.5202484130859375, 0.539703369140625, 0.5591583251953125, 0.57861328125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 7.0, 5.0, 7.0, 13.0, 17.0, 26.0, 27.0, 20.0, 21.0, 21.0, 33.0, 25.0, 31.0, 38.0, 57.0, 49.0, 44.0, 35.0, 44.0, 43.0, 43.0, 50.0, 42.0, 35.0, 25.0, 36.0, 28.0, 32.0, 25.0, 22.0, 16.0, 21.0, 14.0, 10.0, 7.0, 7.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.17726898193359375, -0.1708221435546875, -0.16437530517578125, -0.157928466796875, -0.15148162841796875, -0.1450347900390625, -0.13858795166015625, -0.13214111328125, -0.12569427490234375, -0.1192474365234375, -0.11280059814453125, -0.106353759765625, -0.09990692138671875, -0.0934600830078125, -0.08701324462890625, -0.08056640625, -0.07411956787109375, -0.0676727294921875, -0.06122589111328125, -0.054779052734375, -0.04833221435546875, -0.0418853759765625, -0.03543853759765625, -0.02899169921875, -0.02254486083984375, -0.0160980224609375, -0.00965118408203125, -0.003204345703125, 0.00324249267578125, 0.0096893310546875, 0.01613616943359375, 0.0225830078125, 0.02902984619140625, 0.0354766845703125, 0.04192352294921875, 0.048370361328125, 0.05481719970703125, 0.0612640380859375, 0.06771087646484375, 0.07415771484375, 0.08060455322265625, 0.0870513916015625, 0.09349822998046875, 0.099945068359375, 0.10639190673828125, 0.1128387451171875, 0.11928558349609375, 0.125732421875, 0.13217926025390625, 0.1386260986328125, 0.14507293701171875, 0.151519775390625, 0.15796661376953125, 0.1644134521484375, 0.17086029052734375, 0.17730712890625, 0.18375396728515625, 0.1902008056640625, 0.19664764404296875, 0.203094482421875, 0.20954132080078125, 0.2159881591796875, 0.22243499755859375, 0.2288818359375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 6.0, 22.0, 18.0, 46.0, 74.0, 179.0, 461.0, 1618.0, 8253.0, 134374.0, 3949160.0, 90920.0, 6915.0, 1446.0, 447.0, 161.0, 60.0, 46.0, 24.0, 18.0, 10.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88232421875, -0.8513107299804688, -0.8202972412109375, -0.7892837524414062, -0.758270263671875, -0.7272567749023438, -0.6962432861328125, -0.6652297973632812, -0.63421630859375, -0.6032028198242188, -0.5721893310546875, -0.5411758422851562, -0.510162353515625, -0.47914886474609375, -0.4481353759765625, -0.41712188720703125, -0.3861083984375, -0.35509490966796875, -0.3240814208984375, -0.29306793212890625, -0.262054443359375, -0.23104095458984375, -0.2000274658203125, -0.16901397705078125, -0.13800048828125, -0.10698699951171875, -0.0759735107421875, -0.04496002197265625, -0.013946533203125, 0.01706695556640625, 0.0480804443359375, 0.07909393310546875, 0.110107421875, 0.14112091064453125, 0.1721343994140625, 0.20314788818359375, 0.234161376953125, 0.26517486572265625, 0.2961883544921875, 0.32720184326171875, 0.35821533203125, 0.38922882080078125, 0.4202423095703125, 0.45125579833984375, 0.482269287109375, 0.5132827758789062, 0.5442962646484375, 0.5753097534179688, 0.6063232421875, 0.6373367309570312, 0.6683502197265625, 0.6993637084960938, 0.730377197265625, 0.7613906860351562, 0.7924041748046875, 0.8234176635742188, 0.85443115234375, 0.8854446411132812, 0.9164581298828125, 0.9474716186523438, 0.978485107421875, 1.0094985961914062, 1.0405120849609375, 1.0715255737304688, 1.1025390625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 7.0, 9.0, 16.0, 16.0, 17.0, 21.0, 32.0, 57.0, 89.0, 136.0, 214.0, 375.0, 607.0, 736.0, 652.0, 437.0, 251.0, 131.0, 83.0, 56.0, 34.0, 28.0, 21.0, 14.0, 12.0, 3.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.185302734375, -0.18037033081054688, -0.17543792724609375, -0.17050552368164062, -0.1655731201171875, -0.16064071655273438, -0.15570831298828125, -0.15077590942382812, -0.145843505859375, -0.14091110229492188, -0.13597869873046875, -0.13104629516601562, -0.1261138916015625, -0.12118148803710938, -0.11624908447265625, -0.11131668090820312, -0.10638427734375, -0.10145187377929688, -0.09651947021484375, -0.09158706665039062, -0.0866546630859375, -0.08172225952148438, -0.07678985595703125, -0.07185745239257812, -0.066925048828125, -0.061992645263671875, -0.05706024169921875, -0.052127838134765625, -0.0471954345703125, -0.042263031005859375, -0.03733062744140625, -0.032398223876953125, -0.0274658203125, -0.022533416748046875, -0.01760101318359375, -0.012668609619140625, -0.0077362060546875, -0.002803802490234375, 0.00212860107421875, 0.007061004638671875, 0.011993408203125, 0.016925811767578125, 0.02185821533203125, 0.026790618896484375, 0.0317230224609375, 0.036655426025390625, 0.04158782958984375, 0.046520233154296875, 0.05145263671875, 0.056385040283203125, 0.06131744384765625, 0.06624984741210938, 0.0711822509765625, 0.07611465454101562, 0.08104705810546875, 0.08597946166992188, 0.090911865234375, 0.09584426879882812, 0.10077667236328125, 0.10570907592773438, 0.1106414794921875, 0.11557388305664062, 0.12050628662109375, 0.12543869018554688, 0.13037109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 11.0, 12.0, 14.0, 15.0, 21.0, 25.0, 32.0, 38.0, 42.0, 54.0, 62.0, 70.0, 56.0, 70.0, 74.0, 64.0, 47.0, 56.0, 54.0, 41.0, 30.0, 17.0, 22.0, 17.0, 13.0, 12.0, 10.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29683399200439453, -0.2860824465751648, -0.27533093094825745, -0.2645793855190277, -0.25382786989212036, -0.24307632446289062, -0.2323247790336609, -0.22157324850559235, -0.2108217179775238, -0.20007018744945526, -0.18931865692138672, -0.17856711149215698, -0.16781558096408844, -0.1570640504360199, -0.14631250500679016, -0.13556097447872162, -0.12480944395065308, -0.11405791342258453, -0.1033063754439354, -0.09255483746528625, -0.08180330693721771, -0.07105177640914917, -0.06030023843050003, -0.04954870045185089, -0.03879716992378235, -0.028045635670423508, -0.017294101417064667, -0.006542567163705826, 0.004208967089653015, 0.014960501343011856, 0.025712035596370697, 0.036463573575019836, 0.04721510410308838, 0.05796663835644722, 0.06871817260980606, 0.0794697105884552, 0.09022124111652374, 0.10097277164459229, 0.11172430962324142, 0.12247584760189056, 0.1332273781299591, 0.14397890865802765, 0.1547304391860962, 0.16548198461532593, 0.17623351514339447, 0.186985045671463, 0.19773659110069275, 0.2084881216287613, 0.21923965215682983, 0.22999118268489838, 0.24074271321296692, 0.25149425864219666, 0.262245774269104, 0.27299731969833374, 0.2837488651275635, 0.2945004105567932, 0.30525192618370056, 0.3160034716129303, 0.32675498723983765, 0.3375065326690674, 0.3482580780982971, 0.35900959372520447, 0.3697611391544342, 0.38051265478134155, 0.3912642002105713]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 7.0, 11.0, 14.0, 15.0, 25.0, 19.0, 23.0, 24.0, 29.0, 33.0, 37.0, 31.0, 40.0, 41.0, 46.0, 41.0, 38.0, 41.0, 35.0, 47.0, 36.0, 34.0, 37.0, 36.0, 33.0, 30.0, 26.0, 26.0, 35.0, 17.0, 20.0, 14.0, 11.0, 7.0, 8.0, 9.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2376996874809265, -0.22973011434078217, -0.22176054120063782, -0.21379095315933228, -0.20582138001918793, -0.19785180687904358, -0.18988221883773804, -0.1819126456975937, -0.17394307255744934, -0.165973499417305, -0.15800392627716064, -0.1500343382358551, -0.14206476509571075, -0.1340951919555664, -0.12612560391426086, -0.11815603077411652, -0.11018645763397217, -0.10221688449382782, -0.09424730390310287, -0.08627772331237793, -0.07830815017223358, -0.07033857703208923, -0.06236899644136429, -0.05439941957592964, -0.046429842710494995, -0.03846026584506035, -0.030490688979625702, -0.022521112114191055, -0.014551535248756409, -0.006581958383321762, 0.0013876184821128845, 0.009357195347547531, 0.017326772212982178, 0.025296349078416824, 0.03326592594385147, 0.04123550280928612, 0.049205079674720764, 0.05717465654015541, 0.06514423340559006, 0.073113813996315, 0.08108338713645935, 0.0890529602766037, 0.09702254086732864, 0.10499212145805359, 0.11296169459819794, 0.12093126773834229, 0.12890085577964783, 0.13687042891979218, 0.14484000205993652, 0.15280957520008087, 0.16077914834022522, 0.16874873638153076, 0.1767183095216751, 0.18468788266181946, 0.192657470703125, 0.20062704384326935, 0.2085966169834137, 0.21656619012355804, 0.2245357632637024, 0.23250535130500793, 0.24047492444515228, 0.24844449758529663, 0.2564140856266022, 0.2643836438655853, 0.27235323190689087]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 6.0, 8.0, 14.0, 29.0, 38.0, 47.0, 67.0, 111.0, 152.0, 273.0, 458.0, 715.0, 1310.0, 2574.0, 4988.0, 10498.0, 25356.0, 115029.0, 594710.0, 226862.0, 38325.0, 13636.0, 6241.0, 3171.0, 1676.0, 906.0, 504.0, 287.0, 176.0, 115.0, 89.0, 46.0, 41.0, 34.0, 19.0, 12.0, 11.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0], "bins": [-0.1278076171875, -0.12441444396972656, -0.12102127075195312, -0.11762809753417969, -0.11423492431640625, -0.11084175109863281, -0.10744857788085938, -0.10405540466308594, -0.1006622314453125, -0.09726905822753906, -0.09387588500976562, -0.09048271179199219, -0.08708953857421875, -0.08369636535644531, -0.08030319213867188, -0.07691001892089844, -0.073516845703125, -0.07012367248535156, -0.06673049926757812, -0.06333732604980469, -0.05994415283203125, -0.05655097961425781, -0.053157806396484375, -0.04976463317871094, -0.0463714599609375, -0.04297828674316406, -0.039585113525390625, -0.03619194030761719, -0.03279876708984375, -0.029405593872070312, -0.026012420654296875, -0.022619247436523438, -0.01922607421875, -0.015832901000976562, -0.012439727783203125, -0.009046554565429688, -0.00565338134765625, -0.0022602081298828125, 0.001132965087890625, 0.0045261383056640625, 0.0079193115234375, 0.011312484741210938, 0.014705657958984375, 0.018098831176757812, 0.02149200439453125, 0.024885177612304688, 0.028278350830078125, 0.03167152404785156, 0.035064697265625, 0.03845787048339844, 0.041851043701171875, 0.04524421691894531, 0.04863739013671875, 0.05203056335449219, 0.055423736572265625, 0.05881690979003906, 0.0622100830078125, 0.06560325622558594, 0.06899642944335938, 0.07238960266113281, 0.07578277587890625, 0.07917594909667969, 0.08256912231445312, 0.08596229553222656, 0.08935546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 7.0, 11.0, 8.0, 20.0, 23.0, 25.0, 18.0, 24.0, 38.0, 29.0, 41.0, 38.0, 44.0, 41.0, 47.0, 42.0, 46.0, 43.0, 37.0, 44.0, 46.0, 33.0, 34.0, 32.0, 28.0, 28.0, 35.0, 32.0, 18.0, 19.0, 9.0, 14.0, 6.0, 5.0, 6.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1531982421875, -0.14783668518066406, -0.14247512817382812, -0.1371135711669922, -0.13175201416015625, -0.1263904571533203, -0.12102890014648438, -0.11566734313964844, -0.1103057861328125, -0.10494422912597656, -0.09958267211914062, -0.09422111511230469, -0.08885955810546875, -0.08349800109863281, -0.07813644409179688, -0.07277488708496094, -0.067413330078125, -0.06205177307128906, -0.056690216064453125, -0.05132865905761719, -0.04596710205078125, -0.04060554504394531, -0.035243988037109375, -0.029882431030273438, -0.0245208740234375, -0.019159317016601562, -0.013797760009765625, -0.008436203002929688, -0.00307464599609375, 0.0022869110107421875, 0.007648468017578125, 0.013010025024414062, 0.01837158203125, 0.023733139038085938, 0.029094696044921875, 0.03445625305175781, 0.03981781005859375, 0.04517936706542969, 0.050540924072265625, 0.05590248107910156, 0.0612640380859375, 0.06662559509277344, 0.07198715209960938, 0.07734870910644531, 0.08271026611328125, 0.08807182312011719, 0.09343338012695312, 0.09879493713378906, 0.104156494140625, 0.10951805114746094, 0.11487960815429688, 0.12024116516113281, 0.12560272216796875, 0.1309642791748047, 0.13632583618164062, 0.14168739318847656, 0.1470489501953125, 0.15241050720214844, 0.15777206420898438, 0.1631336212158203, 0.16849517822265625, 0.1738567352294922, 0.17921829223632812, 0.18457984924316406, 0.18994140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 10.0, 6.0, 16.0, 14.0, 27.0, 48.0, 84.0, 140.0, 240.0, 501.0, 1053.0, 2189.0, 5190.0, 14296.0, 45364.0, 193481.0, 526676.0, 190346.0, 45138.0, 14225.0, 5228.0, 2222.0, 957.0, 505.0, 251.0, 139.0, 92.0, 36.0, 35.0, 11.0, 12.0, 9.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0882568359375, -0.08569812774658203, -0.08313941955566406, -0.0805807113647461, -0.07802200317382812, -0.07546329498291016, -0.07290458679199219, -0.07034587860107422, -0.06778717041015625, -0.06522846221923828, -0.06266975402832031, -0.060111045837402344, -0.057552337646484375, -0.054993629455566406, -0.05243492126464844, -0.04987621307373047, -0.0473175048828125, -0.04475879669189453, -0.04220008850097656, -0.039641380310058594, -0.037082672119140625, -0.034523963928222656, -0.03196525573730469, -0.02940654754638672, -0.02684783935546875, -0.02428913116455078, -0.021730422973632812, -0.019171714782714844, -0.016613006591796875, -0.014054298400878906, -0.011495590209960938, -0.008936882019042969, -0.006378173828125, -0.0038194656372070312, -0.0012607574462890625, 0.0012979507446289062, 0.003856658935546875, 0.006415367126464844, 0.008974075317382812, 0.011532783508300781, 0.01409149169921875, 0.01665019989013672, 0.019208908081054688, 0.021767616271972656, 0.024326324462890625, 0.026885032653808594, 0.029443740844726562, 0.03200244903564453, 0.0345611572265625, 0.03711986541748047, 0.03967857360839844, 0.042237281799316406, 0.044795989990234375, 0.047354698181152344, 0.04991340637207031, 0.05247211456298828, 0.05503082275390625, 0.05758953094482422, 0.06014823913574219, 0.06270694732666016, 0.06526565551757812, 0.0678243637084961, 0.07038307189941406, 0.07294178009033203, 0.07550048828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 8.0, 4.0, 12.0, 15.0, 14.0, 15.0, 23.0, 26.0, 28.0, 24.0, 34.0, 41.0, 37.0, 25.0, 37.0, 40.0, 37.0, 27.0, 56.0, 35.0, 38.0, 50.0, 46.0, 34.0, 30.0, 31.0, 34.0, 24.0, 22.0, 23.0, 15.0, 18.0, 18.0, 12.0, 11.0, 9.0, 5.0, 4.0, 9.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.383056640625, -0.37109375, -0.359130859375, -0.34716796875, -0.335205078125, -0.3232421875, -0.311279296875, -0.29931640625, -0.287353515625, -0.275390625, -0.263427734375, -0.25146484375, -0.239501953125, -0.2275390625, -0.215576171875, -0.20361328125, -0.191650390625, -0.1796875, -0.167724609375, -0.15576171875, -0.143798828125, -0.1318359375, -0.119873046875, -0.10791015625, -0.095947265625, -0.083984375, -0.072021484375, -0.06005859375, -0.048095703125, -0.0361328125, -0.024169921875, -0.01220703125, -0.000244140625, 0.01171875, 0.023681640625, 0.03564453125, 0.047607421875, 0.0595703125, 0.071533203125, 0.08349609375, 0.095458984375, 0.107421875, 0.119384765625, 0.13134765625, 0.143310546875, 0.1552734375, 0.167236328125, 0.17919921875, 0.191162109375, 0.203125, 0.215087890625, 0.22705078125, 0.239013671875, 0.2509765625, 0.262939453125, 0.27490234375, 0.286865234375, 0.298828125, 0.310791015625, 0.32275390625, 0.334716796875, 0.3466796875, 0.358642578125, 0.37060546875, 0.382568359375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 15.0, 18.0, 32.0, 53.0, 79.0, 151.0, 283.0, 578.0, 1215.0, 2737.0, 7592.0, 27488.0, 201988.0, 662020.0, 114309.0, 19649.0, 6023.0, 2326.0, 942.0, 481.0, 242.0, 121.0, 72.0, 47.0, 28.0, 23.0, 11.0, 5.0, 4.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055145263671875, -0.05366992950439453, -0.05219459533691406, -0.050719261169433594, -0.049243927001953125, -0.047768592834472656, -0.04629325866699219, -0.04481792449951172, -0.04334259033203125, -0.04186725616455078, -0.04039192199707031, -0.038916587829589844, -0.037441253662109375, -0.035965919494628906, -0.03449058532714844, -0.03301525115966797, -0.0315399169921875, -0.03006458282470703, -0.028589248657226562, -0.027113914489746094, -0.025638580322265625, -0.024163246154785156, -0.022687911987304688, -0.02121257781982422, -0.01973724365234375, -0.01826190948486328, -0.016786575317382812, -0.015311241149902344, -0.013835906982421875, -0.012360572814941406, -0.010885238647460938, -0.009409904479980469, -0.0079345703125, -0.006459236145019531, -0.0049839019775390625, -0.0035085678100585938, -0.002033233642578125, -0.0005578994750976562, 0.0009174346923828125, 0.0023927688598632812, 0.00386810302734375, 0.005343437194824219, 0.0068187713623046875, 0.008294105529785156, 0.009769439697265625, 0.011244773864746094, 0.012720108032226562, 0.014195442199707031, 0.0156707763671875, 0.01714611053466797, 0.018621444702148438, 0.020096778869628906, 0.021572113037109375, 0.023047447204589844, 0.024522781372070312, 0.02599811553955078, 0.02747344970703125, 0.02894878387451172, 0.030424118041992188, 0.031899452209472656, 0.033374786376953125, 0.034850120544433594, 0.03632545471191406, 0.03780078887939453, 0.039276123046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 15.0, 11.0, 15.0, 37.0, 54.0, 86.0, 100.0, 138.0, 132.0, 123.0, 95.0, 48.0, 35.0, 37.0, 13.0, 14.0, 9.0, 9.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.9742717742919922e-05, -2.898741513490677e-05, -2.8232112526893616e-05, -2.7476809918880463e-05, -2.672150731086731e-05, -2.5966204702854156e-05, -2.5210902094841003e-05, -2.445559948682785e-05, -2.3700296878814697e-05, -2.2944994270801544e-05, -2.218969166278839e-05, -2.1434389054775238e-05, -2.0679086446762085e-05, -1.9923783838748932e-05, -1.916848123073578e-05, -1.8413178622722626e-05, -1.7657876014709473e-05, -1.690257340669632e-05, -1.6147270798683167e-05, -1.5391968190670013e-05, -1.463666558265686e-05, -1.3881362974643707e-05, -1.3126060366630554e-05, -1.2370757758617401e-05, -1.1615455150604248e-05, -1.0860152542591095e-05, -1.0104849934577942e-05, -9.349547326564789e-06, -8.594244718551636e-06, -7.838942110538483e-06, -7.08363950252533e-06, -6.3283368945121765e-06, -5.5730342864990234e-06, -4.81773167848587e-06, -4.062429070472717e-06, -3.307126462459564e-06, -2.551823854446411e-06, -1.796521246433258e-06, -1.041218638420105e-06, -2.859160304069519e-07, 4.6938657760620117e-07, 1.2246891856193542e-06, 1.9799917936325073e-06, 2.7352944016456604e-06, 3.4905970096588135e-06, 4.2458996176719666e-06, 5.00120222568512e-06, 5.756504833698273e-06, 6.511807441711426e-06, 7.267110049724579e-06, 8.022412657737732e-06, 8.777715265750885e-06, 9.533017873764038e-06, 1.0288320481777191e-05, 1.1043623089790344e-05, 1.1798925697803497e-05, 1.255422830581665e-05, 1.3309530913829803e-05, 1.4064833521842957e-05, 1.482013612985611e-05, 1.5575438737869263e-05, 1.6330741345882416e-05, 1.708604395389557e-05, 1.7841346561908722e-05, 1.8596649169921875e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 6.0, 17.0, 30.0, 36.0, 57.0, 70.0, 140.0, 220.0, 377.0, 687.0, 1265.0, 2394.0, 4867.0, 10008.0, 22005.0, 56288.0, 154796.0, 328586.0, 279248.0, 113680.0, 41739.0, 16743.0, 7605.0, 3605.0, 1810.0, 954.0, 543.0, 310.0, 190.0, 99.0, 64.0, 42.0, 21.0, 17.0, 8.0, 11.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0215606689453125, -0.02081298828125, -0.0200653076171875, -0.019317626953125, -0.0185699462890625, -0.017822265625, -0.0170745849609375, -0.016326904296875, -0.0155792236328125, -0.01483154296875, -0.0140838623046875, -0.013336181640625, -0.0125885009765625, -0.0118408203125, -0.0110931396484375, -0.010345458984375, -0.0095977783203125, -0.00885009765625, -0.0081024169921875, -0.007354736328125, -0.0066070556640625, -0.005859375, -0.0051116943359375, -0.004364013671875, -0.0036163330078125, -0.00286865234375, -0.0021209716796875, -0.001373291015625, -0.0006256103515625, 0.0001220703125, 0.0008697509765625, 0.001617431640625, 0.0023651123046875, 0.00311279296875, 0.0038604736328125, 0.004608154296875, 0.0053558349609375, 0.006103515625, 0.0068511962890625, 0.007598876953125, 0.0083465576171875, 0.00909423828125, 0.0098419189453125, 0.010589599609375, 0.0113372802734375, 0.0120849609375, 0.0128326416015625, 0.013580322265625, 0.0143280029296875, 0.01507568359375, 0.0158233642578125, 0.016571044921875, 0.0173187255859375, 0.01806640625, 0.0188140869140625, 0.019561767578125, 0.0203094482421875, 0.02105712890625, 0.0218048095703125, 0.022552490234375, 0.0233001708984375, 0.0240478515625, 0.0247955322265625, 0.025543212890625, 0.0262908935546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 5.0, 10.0, 4.0, 9.0, 19.0, 22.0, 15.0, 40.0, 50.0, 47.0, 70.0, 80.0, 81.0, 78.0, 87.0, 72.0, 58.0, 64.0, 40.0, 34.0, 22.0, 18.0, 18.0, 9.0, 13.0, 6.0, 5.0, 3.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01059722900390625, -0.010306000709533691, -0.010014772415161133, -0.009723544120788574, -0.009432315826416016, -0.009141087532043457, -0.008849859237670898, -0.00855863094329834, -0.008267402648925781, -0.007976174354553223, -0.007684946060180664, -0.0073937177658081055, -0.007102489471435547, -0.006811261177062988, -0.00652003288269043, -0.006228804588317871, -0.0059375762939453125, -0.005646347999572754, -0.005355119705200195, -0.005063891410827637, -0.004772663116455078, -0.0044814348220825195, -0.004190206527709961, -0.0038989782333374023, -0.0036077499389648438, -0.003316521644592285, -0.0030252933502197266, -0.002734065055847168, -0.0024428367614746094, -0.0021516084671020508, -0.0018603801727294922, -0.0015691518783569336, -0.001277923583984375, -0.0009866952896118164, -0.0006954669952392578, -0.0004042387008666992, -0.00011301040649414062, 0.00017821788787841797, 0.00046944618225097656, 0.0007606744766235352, 0.0010519027709960938, 0.0013431310653686523, 0.001634359359741211, 0.0019255876541137695, 0.002216815948486328, 0.0025080442428588867, 0.0027992725372314453, 0.003090500831604004, 0.0033817291259765625, 0.003672957420349121, 0.00396418571472168, 0.004255414009094238, 0.004546642303466797, 0.0048378705978393555, 0.005129098892211914, 0.005420327186584473, 0.005711555480957031, 0.00600278377532959, 0.0062940120697021484, 0.006585240364074707, 0.006876468658447266, 0.007167696952819824, 0.007458925247192383, 0.007750153541564941, 0.0080413818359375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 3.0, 13.0, 16.0, 14.0, 28.0, 34.0, 39.0, 37.0, 44.0, 48.0, 58.0, 60.0, 72.0, 64.0, 72.0, 62.0, 71.0, 50.0, 35.0, 42.0, 34.0, 22.0, 18.0, 15.0, 10.0, 9.0, 9.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1898532509803772, -0.18336260318756104, -0.17687194049358368, -0.17038129270076752, -0.16389063000679016, -0.157399982213974, -0.15090933442115784, -0.14441867172718048, -0.13792800903320312, -0.13143736124038696, -0.1249466985464096, -0.11845605075359344, -0.11196538805961609, -0.10547474026679993, -0.09898408502340317, -0.09249342978000641, -0.08600278198719025, -0.07951212674379349, -0.07302147150039673, -0.06653082370758057, -0.06004016473889351, -0.05354950949549675, -0.04705885797739029, -0.04056820273399353, -0.03407754749059677, -0.027586892247200012, -0.021096238866448402, -0.014605585485696793, -0.008114930242300034, -0.0016242749989032745, 0.004866376519203186, 0.011357031762599945, 0.017847701907157898, 0.024338357150554657, 0.030829010531306267, 0.03731966391205788, 0.043810319155454636, 0.050300974398851395, 0.056791625916957855, 0.06328228116035461, 0.06977293640375137, 0.07626359164714813, 0.08275424689054489, 0.08924490213394165, 0.09573554992675781, 0.10222621262073517, 0.10871686041355133, 0.11520751565694809, 0.12169817090034485, 0.128188818693161, 0.13467948138713837, 0.14117012917995453, 0.14766079187393188, 0.15415143966674805, 0.1606420874595642, 0.16713275015354156, 0.17362341284751892, 0.18011406064033508, 0.18660472333431244, 0.1930953711271286, 0.19958603382110596, 0.20607668161392212, 0.21256732940673828, 0.21905799210071564, 0.2255486398935318]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 8.0, 12.0, 14.0, 19.0, 19.0, 22.0, 30.0, 29.0, 34.0, 29.0, 52.0, 33.0, 54.0, 58.0, 35.0, 41.0, 44.0, 48.0, 42.0, 44.0, 41.0, 43.0, 38.0, 29.0, 36.0, 29.0, 26.0, 20.0, 18.0, 13.0, 9.0, 4.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16634730994701385, -0.16081269085407257, -0.1552780717611313, -0.14974345266819, -0.14420883357524872, -0.13867421448230743, -0.13313959538936615, -0.12760497629642487, -0.12207035720348358, -0.1165357381105423, -0.11100111901760101, -0.10546649992465973, -0.09993188083171844, -0.09439726173877716, -0.08886264264583588, -0.08332802355289459, -0.07779340445995331, -0.07225878536701202, -0.06672416627407074, -0.061189547181129456, -0.05565492808818817, -0.05012030899524689, -0.0445856899023056, -0.03905107080936432, -0.033516451716423035, -0.02798183262348175, -0.022447213530540466, -0.016912594437599182, -0.011377975344657898, -0.005843356251716614, -0.0003087371587753296, 0.005225881934165955, 0.010760486125946045, 0.01629510521888733, 0.021829724311828613, 0.027364343404769897, 0.03289896249771118, 0.038433581590652466, 0.04396820068359375, 0.049502819776535034, 0.05503743886947632, 0.0605720579624176, 0.06610667705535889, 0.07164129614830017, 0.07717591524124146, 0.08271053433418274, 0.08824515342712402, 0.09377977252006531, 0.09931439161300659, 0.10484901070594788, 0.11038362979888916, 0.11591824889183044, 0.12145286798477173, 0.126987487077713, 0.1325221061706543, 0.13805672526359558, 0.14359134435653687, 0.14912596344947815, 0.15466058254241943, 0.16019520163536072, 0.165729820728302, 0.1712644398212433, 0.17679905891418457, 0.18233367800712585, 0.18786829710006714]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 6.0, 15.0, 23.0, 25.0, 43.0, 102.0, 173.0, 309.0, 637.0, 1298.0, 3040.0, 7615.0, 23223.0, 96065.0, 396680.0, 389458.0, 93854.0, 22860.0, 7547.0, 3005.0, 1263.0, 616.0, 298.0, 158.0, 79.0, 57.0, 35.0, 22.0, 18.0, 8.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3655738830566406, -0.35150909423828125, -0.3374443054199219, -0.3233795166015625, -0.3093147277832031, -0.29524993896484375, -0.2811851501464844, -0.267120361328125, -0.2530555725097656, -0.23899078369140625, -0.22492599487304688, -0.2108612060546875, -0.19679641723632812, -0.18273162841796875, -0.16866683959960938, -0.15460205078125, -0.14053726196289062, -0.12647247314453125, -0.11240768432617188, -0.0983428955078125, -0.08427810668945312, -0.07021331787109375, -0.056148529052734375, -0.042083740234375, -0.028018951416015625, -0.01395416259765625, 0.000110626220703125, 0.0141754150390625, 0.028240203857421875, 0.04230499267578125, 0.056369781494140625, 0.0704345703125, 0.08449935913085938, 0.09856414794921875, 0.11262893676757812, 0.1266937255859375, 0.14075851440429688, 0.15482330322265625, 0.16888809204101562, 0.182952880859375, 0.19701766967773438, 0.21108245849609375, 0.22514724731445312, 0.2392120361328125, 0.2532768249511719, 0.26734161376953125, 0.2814064025878906, 0.29547119140625, 0.3095359802246094, 0.32360076904296875, 0.3376655578613281, 0.3517303466796875, 0.3657951354980469, 0.37985992431640625, 0.3939247131347656, 0.407989501953125, 0.4220542907714844, 0.43611907958984375, 0.4501838684082031, 0.4642486572265625, 0.4783134460449219, 0.49237823486328125, 0.5064430236816406, 0.5205078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 9.0, 25.0, 13.0, 22.0, 15.0, 32.0, 28.0, 40.0, 42.0, 42.0, 53.0, 47.0, 49.0, 61.0, 46.0, 59.0, 48.0, 48.0, 43.0, 36.0, 35.0, 39.0, 32.0, 30.0, 24.0, 17.0, 15.0, 13.0, 5.0, 7.0, 8.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.353271484375, -0.3416404724121094, -0.33000946044921875, -0.3183784484863281, -0.3067474365234375, -0.2951164245605469, -0.28348541259765625, -0.2718544006347656, -0.260223388671875, -0.24859237670898438, -0.23696136474609375, -0.22533035278320312, -0.2136993408203125, -0.20206832885742188, -0.19043731689453125, -0.17880630493164062, -0.16717529296875, -0.15554428100585938, -0.14391326904296875, -0.13228225708007812, -0.1206512451171875, -0.10902023315429688, -0.09738922119140625, -0.08575820922851562, -0.074127197265625, -0.062496185302734375, -0.05086517333984375, -0.039234161376953125, -0.0276031494140625, -0.015972137451171875, -0.00434112548828125, 0.007289886474609375, 0.0189208984375, 0.030551910400390625, 0.04218292236328125, 0.053813934326171875, 0.0654449462890625, 0.07707595825195312, 0.08870697021484375, 0.10033798217773438, 0.111968994140625, 0.12360000610351562, 0.13523101806640625, 0.14686203002929688, 0.1584930419921875, 0.17012405395507812, 0.18175506591796875, 0.19338607788085938, 0.20501708984375, 0.21664810180664062, 0.22827911376953125, 0.23991012573242188, 0.2515411376953125, 0.2631721496582031, 0.27480316162109375, 0.2864341735839844, 0.298065185546875, 0.3096961975097656, 0.32132720947265625, 0.3329582214355469, 0.3445892333984375, 0.3562202453613281, 0.36785125732421875, 0.3794822692871094, 0.39111328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 9.0, 19.0, 39.0, 47.0, 80.0, 120.0, 219.0, 339.0, 635.0, 1192.0, 2421.0, 5686.0, 15839.0, 53791.0, 214402.0, 482237.0, 196650.0, 49728.0, 14780.0, 5353.0, 2301.0, 1176.0, 627.0, 332.0, 187.0, 121.0, 72.0, 43.0, 19.0, 12.0, 22.0, 11.0, 9.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4619140625, -0.4485130310058594, -0.43511199951171875, -0.4217109680175781, -0.4083099365234375, -0.3949089050292969, -0.38150787353515625, -0.3681068420410156, -0.354705810546875, -0.3413047790527344, -0.32790374755859375, -0.3145027160644531, -0.3011016845703125, -0.2877006530761719, -0.27429962158203125, -0.2608985900878906, -0.24749755859375, -0.23409652709960938, -0.22069549560546875, -0.20729446411132812, -0.1938934326171875, -0.18049240112304688, -0.16709136962890625, -0.15369033813476562, -0.140289306640625, -0.12688827514648438, -0.11348724365234375, -0.10008621215820312, -0.0866851806640625, -0.07328414916992188, -0.05988311767578125, -0.046482086181640625, -0.0330810546875, -0.019680023193359375, -0.00627899169921875, 0.007122039794921875, 0.0205230712890625, 0.033924102783203125, 0.04732513427734375, 0.060726165771484375, 0.074127197265625, 0.08752822875976562, 0.10092926025390625, 0.11433029174804688, 0.1277313232421875, 0.14113235473632812, 0.15453338623046875, 0.16793441772460938, 0.18133544921875, 0.19473648071289062, 0.20813751220703125, 0.22153854370117188, 0.2349395751953125, 0.24834060668945312, 0.26174163818359375, 0.2751426696777344, 0.288543701171875, 0.3019447326660156, 0.31534576416015625, 0.3287467956542969, 0.3421478271484375, 0.3555488586425781, 0.36894989013671875, 0.3823509216308594, 0.395751953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 0.0, 6.0, 5.0, 15.0, 10.0, 9.0, 9.0, 16.0, 16.0, 24.0, 21.0, 27.0, 30.0, 27.0, 45.0, 50.0, 31.0, 60.0, 40.0, 39.0, 52.0, 46.0, 45.0, 39.0, 42.0, 36.0, 40.0, 43.0, 25.0, 18.0, 22.0, 24.0, 15.0, 15.0, 13.0, 10.0, 9.0, 6.0, 3.0, 3.0, 10.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335693359375, -0.3252449035644531, -0.31479644775390625, -0.3043479919433594, -0.2938995361328125, -0.2834510803222656, -0.27300262451171875, -0.2625541687011719, -0.252105712890625, -0.24165725708007812, -0.23120880126953125, -0.22076034545898438, -0.2103118896484375, -0.19986343383789062, -0.18941497802734375, -0.17896652221679688, -0.16851806640625, -0.15806961059570312, -0.14762115478515625, -0.13717269897460938, -0.1267242431640625, -0.11627578735351562, -0.10582733154296875, -0.09537887573242188, -0.084930419921875, -0.07448196411132812, -0.06403350830078125, -0.053585052490234375, -0.0431365966796875, -0.032688140869140625, -0.02223968505859375, -0.011791229248046875, -0.0013427734375, 0.009105682373046875, 0.01955413818359375, 0.030002593994140625, 0.0404510498046875, 0.050899505615234375, 0.06134796142578125, 0.07179641723632812, 0.082244873046875, 0.09269332885742188, 0.10314178466796875, 0.11359024047851562, 0.1240386962890625, 0.13448715209960938, 0.14493560791015625, 0.15538406372070312, 0.16583251953125, 0.17628097534179688, 0.18672943115234375, 0.19717788696289062, 0.2076263427734375, 0.21807479858398438, 0.22852325439453125, 0.23897171020507812, 0.249420166015625, 0.2598686218261719, 0.27031707763671875, 0.2807655334472656, 0.2912139892578125, 0.3016624450683594, 0.31211090087890625, 0.3225593566894531, 0.3330078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 11.0, 4.0, 7.0, 6.0, 4.0, 15.0, 19.0, 30.0, 29.0, 35.0, 60.0, 95.0, 129.0, 224.0, 351.0, 642.0, 1080.0, 1906.0, 3581.0, 6613.0, 13996.0, 32585.0, 82746.0, 211037.0, 394075.0, 177922.0, 68680.0, 27416.0, 12155.0, 5856.0, 3077.0, 1690.0, 966.0, 546.0, 342.0, 196.0, 150.0, 89.0, 52.0, 37.0, 23.0, 21.0, 9.0, 14.0, 14.0, 5.0, 5.0, 7.0, 7.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-0.06292724609375, -0.06109809875488281, -0.059268951416015625, -0.05743980407714844, -0.05561065673828125, -0.05378150939941406, -0.051952362060546875, -0.05012321472167969, -0.0482940673828125, -0.04646492004394531, -0.044635772705078125, -0.04280662536621094, -0.04097747802734375, -0.03914833068847656, -0.037319183349609375, -0.03549003601074219, -0.033660888671875, -0.03183174133300781, -0.030002593994140625, -0.028173446655273438, -0.02634429931640625, -0.024515151977539062, -0.022686004638671875, -0.020856857299804688, -0.0190277099609375, -0.017198562622070312, -0.015369415283203125, -0.013540267944335938, -0.01171112060546875, -0.009881973266601562, -0.008052825927734375, -0.0062236785888671875, -0.00439453125, -0.0025653839111328125, -0.000736236572265625, 0.0010929107666015625, 0.00292205810546875, 0.0047512054443359375, 0.006580352783203125, 0.008409500122070312, 0.0102386474609375, 0.012067794799804688, 0.013896942138671875, 0.015726089477539062, 0.01755523681640625, 0.019384384155273438, 0.021213531494140625, 0.023042678833007812, 0.024871826171875, 0.026700973510742188, 0.028530120849609375, 0.030359268188476562, 0.03218841552734375, 0.03401756286621094, 0.035846710205078125, 0.03767585754394531, 0.0395050048828125, 0.04133415222167969, 0.043163299560546875, 0.04499244689941406, 0.04682159423828125, 0.04865074157714844, 0.050479888916015625, 0.05230903625488281, 0.05413818359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 21.0, 26.0, 39.0, 57.0, 69.0, 72.0, 122.0, 183.0, 92.0, 88.0, 57.0, 54.0, 29.0, 18.0, 19.0, 12.0, 7.0, 10.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2411346435546875e-05, -2.1777115762233734e-05, -2.1142885088920593e-05, -2.0508654415607452e-05, -1.987442374229431e-05, -1.924019306898117e-05, -1.860596239566803e-05, -1.797173172235489e-05, -1.7337501049041748e-05, -1.6703270375728607e-05, -1.6069039702415466e-05, -1.5434809029102325e-05, -1.4800578355789185e-05, -1.4166347682476044e-05, -1.3532117009162903e-05, -1.2897886335849762e-05, -1.2263655662536621e-05, -1.162942498922348e-05, -1.099519431591034e-05, -1.0360963642597198e-05, -9.726732969284058e-06, -9.092502295970917e-06, -8.458271622657776e-06, -7.824040949344635e-06, -7.189810276031494e-06, -6.555579602718353e-06, -5.921348929405212e-06, -5.2871182560920715e-06, -4.652887582778931e-06, -4.01865690946579e-06, -3.384426236152649e-06, -2.750195562839508e-06, -2.115964889526367e-06, -1.4817342162132263e-06, -8.475035429000854e-07, -2.1327286958694458e-07, 4.209578037261963e-07, 1.0551884770393372e-06, 1.689419150352478e-06, 2.323649823665619e-06, 2.9578804969787598e-06, 3.5921111702919006e-06, 4.2263418436050415e-06, 4.860572516918182e-06, 5.494803190231323e-06, 6.129033863544464e-06, 6.763264536857605e-06, 7.397495210170746e-06, 8.031725883483887e-06, 8.665956556797028e-06, 9.300187230110168e-06, 9.93441790342331e-06, 1.056864857673645e-05, 1.1202879250049591e-05, 1.1837109923362732e-05, 1.2471340596675873e-05, 1.3105571269989014e-05, 1.3739801943302155e-05, 1.4374032616615295e-05, 1.5008263289928436e-05, 1.5642493963241577e-05, 1.6276724636554718e-05, 1.691095530986786e-05, 1.7545185983181e-05, 1.817941665649414e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 13.0, 29.0, 20.0, 34.0, 36.0, 70.0, 113.0, 158.0, 227.0, 339.0, 505.0, 842.0, 1465.0, 2611.0, 5404.0, 11781.0, 32163.0, 104408.0, 377768.0, 351455.0, 103623.0, 31882.0, 11857.0, 5120.0, 2545.0, 1511.0, 933.0, 556.0, 342.0, 212.0, 166.0, 115.0, 74.0, 39.0, 43.0, 30.0, 17.0, 10.0, 9.0, 12.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07281494140625, -0.07030391693115234, -0.06779289245605469, -0.06528186798095703, -0.06277084350585938, -0.06025981903076172, -0.05774879455566406, -0.055237770080566406, -0.05272674560546875, -0.050215721130371094, -0.04770469665527344, -0.04519367218017578, -0.042682647705078125, -0.04017162322998047, -0.03766059875488281, -0.035149574279785156, -0.0326385498046875, -0.030127525329589844, -0.027616500854492188, -0.02510547637939453, -0.022594451904296875, -0.02008342742919922, -0.017572402954101562, -0.015061378479003906, -0.01255035400390625, -0.010039329528808594, -0.0075283050537109375, -0.005017280578613281, -0.002506256103515625, 4.76837158203125e-06, 0.0025157928466796875, 0.005026817321777344, 0.007537841796875, 0.010048866271972656, 0.012559890747070312, 0.015070915222167969, 0.017581939697265625, 0.02009296417236328, 0.022603988647460938, 0.025115013122558594, 0.02762603759765625, 0.030137062072753906, 0.03264808654785156, 0.03515911102294922, 0.037670135498046875, 0.04018115997314453, 0.04269218444824219, 0.045203208923339844, 0.0477142333984375, 0.050225257873535156, 0.05273628234863281, 0.05524730682373047, 0.057758331298828125, 0.06026935577392578, 0.06278038024902344, 0.0652914047241211, 0.06780242919921875, 0.0703134536743164, 0.07282447814941406, 0.07533550262451172, 0.07784652709960938, 0.08035755157470703, 0.08286857604980469, 0.08537960052490234, 0.087890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 3.0, 5.0, 7.0, 9.0, 12.0, 24.0, 20.0, 28.0, 34.0, 52.0, 71.0, 88.0, 103.0, 148.0, 102.0, 82.0, 42.0, 44.0, 35.0, 27.0, 19.0, 17.0, 5.0, 6.0, 6.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05755615234375, -0.05576324462890625, -0.0539703369140625, -0.05217742919921875, -0.050384521484375, -0.04859161376953125, -0.0467987060546875, -0.04500579833984375, -0.043212890625, -0.04141998291015625, -0.0396270751953125, -0.03783416748046875, -0.036041259765625, -0.03424835205078125, -0.0324554443359375, -0.03066253662109375, -0.02886962890625, -0.02707672119140625, -0.0252838134765625, -0.02349090576171875, -0.021697998046875, -0.01990509033203125, -0.0181121826171875, -0.01631927490234375, -0.0145263671875, -0.01273345947265625, -0.0109405517578125, -0.00914764404296875, -0.007354736328125, -0.00556182861328125, -0.0037689208984375, -0.00197601318359375, -0.00018310546875, 0.00160980224609375, 0.0034027099609375, 0.00519561767578125, 0.006988525390625, 0.00878143310546875, 0.0105743408203125, 0.01236724853515625, 0.01416015625, 0.01595306396484375, 0.0177459716796875, 0.01953887939453125, 0.021331787109375, 0.02312469482421875, 0.0249176025390625, 0.02671051025390625, 0.02850341796875, 0.03029632568359375, 0.0320892333984375, 0.03388214111328125, 0.035675048828125, 0.03746795654296875, 0.0392608642578125, 0.04105377197265625, 0.0428466796875, 0.04463958740234375, 0.0464324951171875, 0.04822540283203125, 0.050018310546875, 0.05181121826171875, 0.0536041259765625, 0.05539703369140625, 0.05718994140625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 13.0, 17.0, 76.0, 145.0, 236.0, 245.0, 152.0, 70.0, 28.0, 9.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6368203163146973, -1.5886907577514648, -1.5405611991882324, -1.492431640625, -1.4443020820617676, -1.3961725234985352, -1.3480429649353027, -1.2999135255813599, -1.2517839670181274, -1.203654408454895, -1.1555248498916626, -1.1073952913284302, -1.0592657327651978, -1.0111362934112549, -0.9630066752433777, -0.91487717628479, -0.8667475581169128, -0.8186179995536804, -0.770488440990448, -0.7223589420318604, -0.6742293834686279, -0.6260998249053955, -0.5779702663421631, -0.5298407077789307, -0.48171117901802063, -0.4335816204547882, -0.3854520916938782, -0.33732253313064575, -0.28919297456741333, -0.2410634458065033, -0.19293388724327087, -0.14480435848236084, -0.09667479991912842, -0.04854525253176689, -0.000415705144405365, 0.04771384596824646, 0.09584338963031769, 0.14397293329238892, 0.19210249185562134, 0.24023202061653137, 0.2883615791797638, 0.3364911377429962, 0.38462066650390625, 0.43275022506713867, 0.4808797836303711, 0.5290093421936035, 0.5771389007568359, 0.6252683997154236, 0.673397958278656, 0.7215275168418884, 0.7696570754051208, 0.8177865743637085, 0.8659161329269409, 0.9140456914901733, 0.9621752500534058, 1.0103048086166382, 1.0584343671798706, 1.106563925743103, 1.1546934843063354, 1.2028230428695679, 1.2509526014328003, 1.2990820407867432, 1.3472115993499756, 1.395341157913208, 1.4434707164764404]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 9.0, 7.0, 5.0, 18.0, 10.0, 12.0, 11.0, 19.0, 28.0, 22.0, 32.0, 20.0, 31.0, 36.0, 26.0, 46.0, 52.0, 34.0, 45.0, 36.0, 38.0, 32.0, 44.0, 37.0, 42.0, 37.0, 37.0, 30.0, 33.0, 19.0, 17.0, 21.0, 15.0, 21.0, 12.0, 14.0, 12.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4828285574913025, -0.4659769833087921, -0.44912540912628174, -0.43227383494377136, -0.415422260761261, -0.398570716381073, -0.3817191421985626, -0.36486756801605225, -0.34801599383354187, -0.3311644196510315, -0.3143128454685211, -0.29746127128601074, -0.28060972690582275, -0.26375812292099, -0.246906578540802, -0.23005500435829163, -0.21320343017578125, -0.19635185599327087, -0.1795002818107605, -0.16264872252941132, -0.14579714834690094, -0.12894557416439056, -0.11209400743246078, -0.095242440700531, -0.07839086651802063, -0.06153929606080055, -0.044687725603580475, -0.027836155146360397, -0.01098458468914032, 0.005866989493370056, 0.022718556225299835, 0.039570122957229614, 0.056421756744384766, 0.07327333092689514, 0.09012489765882492, 0.1069764643907547, 0.12382803857326508, 0.14067961275577545, 0.15753117203712463, 0.174382746219635, 0.19123432040214539, 0.20808589458465576, 0.22493746876716614, 0.24178902804851532, 0.2586405873298645, 0.27549219131469727, 0.29234373569488525, 0.30919530987739563, 0.326046884059906, 0.3428984582424164, 0.35975003242492676, 0.37660160660743713, 0.3934531807899475, 0.4103047251701355, 0.4271562993526459, 0.44400787353515625, 0.4608594477176666, 0.477711021900177, 0.4945625960826874, 0.5114141702651978, 0.5282657146453857, 0.5451173186302185, 0.5619688630104065, 0.5788204669952393, 0.5956720113754272]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 5.0, 8.0, 5.0, 12.0, 8.0, 16.0, 22.0, 32.0, 35.0, 51.0, 62.0, 73.0, 94.0, 111.0, 150.0, 173.0, 235.0, 292.0, 358.0, 522.0, 656.0, 1075.0, 1762.0, 3424.0, 6230.0, 1022313.0, 5154.0, 2755.0, 1446.0, 897.0, 602.0, 418.0, 334.0, 250.0, 216.0, 154.0, 122.0, 109.0, 87.0, 78.0, 57.0, 44.0, 44.0, 25.0, 26.0, 11.0, 16.0, 13.0, 5.0, 7.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.5101166367530823, -0.49481111764907837, -0.47950559854507446, -0.46420007944107056, -0.44889456033706665, -0.43358904123306274, -0.41828352212905884, -0.40297800302505493, -0.387672483921051, -0.3723669648170471, -0.3570614457130432, -0.3417559266090393, -0.3264504075050354, -0.3111448884010315, -0.2958393692970276, -0.2805338501930237, -0.2652283310890198, -0.24992281198501587, -0.23461729288101196, -0.21931177377700806, -0.20400625467300415, -0.18870073556900024, -0.17339521646499634, -0.15808969736099243, -0.1427842080593109, -0.127478688955307, -0.1121731698513031, -0.0968676507472992, -0.08156213164329529, -0.06625661998987198, -0.05095110088586807, -0.035645581781864166, -0.020340055227279663, -0.0050345370545983315, 0.010270981118083, 0.025576498359441757, 0.04088201746344566, 0.05618753284215927, 0.07149305194616318, 0.08679857105016708, 0.10210409015417099, 0.1174096092581749, 0.1327151209115982, 0.1480206400156021, 0.16332615911960602, 0.17863167822360992, 0.19393719732761383, 0.20924271643161774, 0.22454823553562164, 0.23985375463962555, 0.25515925884246826, 0.27046477794647217, 0.2857702970504761, 0.30107581615448, 0.3163813352584839, 0.3316868543624878, 0.3469923734664917, 0.3622978925704956, 0.3776034116744995, 0.3929089307785034, 0.4082144498825073, 0.42351996898651123, 0.43882548809051514, 0.45413100719451904, 0.46943652629852295]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 14.0, 12.0, 44.0, 76.0, 134.0, 260.0, 440.0, 977.0, 3176.0, 51460712.0, 2589.0, 855.0, 459.0, 272.0, 129.0, 71.0, 44.0, 19.0, 8.0, 10.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.461135864257812, -13.101757049560547, -12.742379188537598, -12.383000373840332, -12.023622512817383, -11.664243698120117, -11.304864883422852, -10.945487022399902, -10.586109161376953, -10.226730346679688, -9.867352485656738, -9.507973670959473, -9.148595809936523, -8.789216995239258, -8.429838180541992, -8.070460319519043, -7.711081504821777, -7.35170316696167, -6.9923248291015625, -6.632946014404297, -6.273568153381348, -5.914189338684082, -5.554811000823975, -5.195432662963867, -4.83605432510376, -4.476675987243652, -4.117297649383545, -3.7579190731048584, -3.398540735244751, -3.0391623973846436, -2.679783821105957, -2.3204054832458496, -1.9610261917114258, -1.6016478538513184, -1.2422693967819214, -0.8828909397125244, -0.523512601852417, -0.16413426399230957, 0.19524431228637695, 0.5546226501464844, 0.9140009880065918, 1.2733793258666992, 1.6327577829360962, 1.9921362400054932, 2.3515145778656006, 2.710892915725708, 3.0702714920043945, 3.429649829864502, 3.7890281677246094, 4.148406505584717, 4.507784843444824, 4.86716365814209, 5.226541519165039, 5.585920333862305, 5.945298671722412, 6.3046770095825195, 6.664055347442627, 7.023433685302734, 7.382812023162842, 7.742190361022949, 8.101569175720215, 8.460947036743164, 8.82032585144043, 9.179704666137695, 9.539082527160645]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 8.0, 9.0, 10.0, 17.0, 31.0, 43.0, 69.0, 127.0, 175.0, 252.0, 448.0, 716.0, 1230.0, 2018.0, 3539.0, 5622.0, 9967.0, 17205.0, 30138.0, 53068.0, 93071.0, 159083.0, 257784.0, 382826.0, 1025818.0, 3044189.0, 445323.0, 301240.0, 190758.0, 113970.0, 65532.0, 37203.0, 20872.0, 12068.0, 6825.0, 4025.0, 2455.0, 1430.0, 885.0, 530.0, 328.0, 218.0, 123.0, 70.0, 41.0, 32.0, 20.0, 10.0, 8.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.47412109375, -0.45938873291015625, -0.4446563720703125, -0.42992401123046875, -0.415191650390625, -0.40045928955078125, -0.3857269287109375, -0.37099456787109375, -0.35626220703125, -0.34152984619140625, -0.3267974853515625, -0.31206512451171875, -0.297332763671875, -0.28260040283203125, -0.2678680419921875, -0.25313568115234375, -0.2384033203125, -0.22367095947265625, -0.2089385986328125, -0.19420623779296875, -0.179473876953125, -0.16474151611328125, -0.1500091552734375, -0.13527679443359375, -0.12054443359375, -0.10581207275390625, -0.0910797119140625, -0.07634735107421875, -0.061614990234375, -0.04688262939453125, -0.0321502685546875, -0.01741790771484375, -0.002685546875, 0.01204681396484375, 0.0267791748046875, 0.04151153564453125, 0.056243896484375, 0.07097625732421875, 0.0857086181640625, 0.10044097900390625, 0.11517333984375, 0.12990570068359375, 0.1446380615234375, 0.15937042236328125, 0.174102783203125, 0.18883514404296875, 0.2035675048828125, 0.21829986572265625, 0.2330322265625, 0.24776458740234375, 0.2624969482421875, 0.27722930908203125, 0.291961669921875, 0.30669403076171875, 0.3214263916015625, 0.33615875244140625, 0.35089111328125, 0.36562347412109375, 0.3803558349609375, 0.39508819580078125, 0.409820556640625, 0.42455291748046875, 0.4392852783203125, 0.45401763916015625, 0.46875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 2.0, 8.0, 8.0, 6.0, 14.0, 18.0, 23.0, 18.0, 25.0, 27.0, 29.0, 33.0, 46.0, 50.0, 47.0, 60.0, 260.0, 835.0, 92.0, 45.0, 61.0, 42.0, 58.0, 40.0, 32.0, 29.0, 22.0, 17.0, 14.0, 19.0, 12.0, 10.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.560546875, -3.430206298828125, -3.29986572265625, -3.169525146484375, -3.0391845703125, -2.908843994140625, -2.77850341796875, -2.648162841796875, -2.517822265625, -2.387481689453125, -2.25714111328125, -2.126800537109375, -1.9964599609375, -1.866119384765625, -1.73577880859375, -1.605438232421875, -1.47509765625, -1.344757080078125, -1.21441650390625, -1.084075927734375, -0.9537353515625, -0.823394775390625, -0.69305419921875, -0.562713623046875, -0.432373046875, -0.302032470703125, -0.17169189453125, -0.041351318359375, 0.0889892578125, 0.219329833984375, 0.34967041015625, 0.480010986328125, 0.6103515625, 0.740692138671875, 0.87103271484375, 1.001373291015625, 1.1317138671875, 1.262054443359375, 1.39239501953125, 1.522735595703125, 1.653076171875, 1.783416748046875, 1.91375732421875, 2.044097900390625, 2.1744384765625, 2.304779052734375, 2.43511962890625, 2.565460205078125, 2.69580078125, 2.826141357421875, 2.95648193359375, 3.086822509765625, 3.2171630859375, 3.347503662109375, 3.47784423828125, 3.608184814453125, 3.738525390625, 3.868865966796875, 3.99920654296875, 4.129547119140625, 4.2598876953125, 4.390228271484375, 4.52056884765625, 4.650909423828125, 4.78125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 7.0, 13.0, 31.0, 37.0, 51.0, 86.0, 143.0, 186.0, 360.0, 530.0, 811.0, 1267.0, 2002.0, 3169.0, 5327.0, 8052.0, 13148.0, 20268.0, 31999.0, 49602.0, 75519.0, 111304.0, 159323.0, 217196.0, 277324.0, 361737.0, 2876094.0, 919415.0, 310966.0, 250368.0, 190162.0, 136919.0, 93830.0, 62304.0, 40750.0, 26139.0, 16748.0, 10447.0, 6654.0, 4179.0, 2562.0, 1611.0, 1032.0, 622.0, 403.0, 264.0, 178.0, 107.0, 65.0, 44.0, 26.0, 19.0, 19.0, 8.0, 6.0, 4.0, 0.0, 2.0], "bins": [-0.284912109375, -0.2762184143066406, -0.26752471923828125, -0.2588310241699219, -0.2501373291015625, -0.24144363403320312, -0.23274993896484375, -0.22405624389648438, -0.215362548828125, -0.20666885375976562, -0.19797515869140625, -0.18928146362304688, -0.1805877685546875, -0.17189407348632812, -0.16320037841796875, -0.15450668334960938, -0.14581298828125, -0.13711929321289062, -0.12842559814453125, -0.11973190307617188, -0.1110382080078125, -0.10234451293945312, -0.09365081787109375, -0.08495712280273438, -0.076263427734375, -0.06756973266601562, -0.05887603759765625, -0.050182342529296875, -0.0414886474609375, -0.032794952392578125, -0.02410125732421875, -0.015407562255859375, -0.0067138671875, 0.001979827880859375, 0.01067352294921875, 0.019367218017578125, 0.0280609130859375, 0.036754608154296875, 0.04544830322265625, 0.054141998291015625, 0.062835693359375, 0.07152938842773438, 0.08022308349609375, 0.08891677856445312, 0.0976104736328125, 0.10630416870117188, 0.11499786376953125, 0.12369155883789062, 0.13238525390625, 0.14107894897460938, 0.14977264404296875, 0.15846633911132812, 0.1671600341796875, 0.17585372924804688, 0.18454742431640625, 0.19324111938476562, 0.201934814453125, 0.21062850952148438, 0.21932220458984375, 0.22801589965820312, 0.2367095947265625, 0.24540328979492188, 0.25409698486328125, 0.2627906799316406, 0.271484375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 5.0, 2.0, 8.0, 11.0, 17.0, 16.0, 14.0, 25.0, 19.0, 37.0, 38.0, 40.0, 37.0, 58.0, 65.0, 47.0, 194.0, 886.0, 101.0, 42.0, 50.0, 44.0, 51.0, 31.0, 27.0, 26.0, 30.0, 19.0, 18.0, 16.0, 13.0, 13.0, 6.0, 9.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.568359375, -3.46173095703125, -3.3551025390625, -3.24847412109375, -3.141845703125, -3.03521728515625, -2.9285888671875, -2.82196044921875, -2.71533203125, -2.60870361328125, -2.5020751953125, -2.39544677734375, -2.288818359375, -2.18218994140625, -2.0755615234375, -1.96893310546875, -1.8623046875, -1.75567626953125, -1.6490478515625, -1.54241943359375, -1.435791015625, -1.32916259765625, -1.2225341796875, -1.11590576171875, -1.00927734375, -0.90264892578125, -0.7960205078125, -0.68939208984375, -0.582763671875, -0.47613525390625, -0.3695068359375, -0.26287841796875, -0.15625, -0.04962158203125, 0.0570068359375, 0.16363525390625, 0.270263671875, 0.37689208984375, 0.4835205078125, 0.59014892578125, 0.69677734375, 0.80340576171875, 0.9100341796875, 1.01666259765625, 1.123291015625, 1.22991943359375, 1.3365478515625, 1.44317626953125, 1.5498046875, 1.65643310546875, 1.7630615234375, 1.86968994140625, 1.976318359375, 2.08294677734375, 2.1895751953125, 2.29620361328125, 2.40283203125, 2.50946044921875, 2.6160888671875, 2.72271728515625, 2.829345703125, 2.93597412109375, 3.0426025390625, 3.14923095703125, 3.255859375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 4.0, 6.0, 11.0, 10.0, 8.0, 9.0, 16.0, 29.0, 38.0, 58.0, 66.0, 78.0, 105.0, 128.0, 198.0, 243.0, 341.0, 510.0, 872.0, 1468.0, 2877.0, 5912.0, 14983.0, 42601.0, 117875.0, 5529323.0, 430905.0, 88615.0, 31591.0, 11684.0, 4864.0, 2333.0, 1267.0, 764.0, 494.0, 264.0, 218.0, 155.0, 124.0, 113.0, 68.0, 64.0, 35.0, 20.0, 20.0, 28.0, 12.0, 10.0, 4.0, 4.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-1.396484375, -1.3552398681640625, -1.313995361328125, -1.2727508544921875, -1.23150634765625, -1.1902618408203125, -1.149017333984375, -1.1077728271484375, -1.0665283203125, -1.0252838134765625, -0.984039306640625, -0.9427947998046875, -0.90155029296875, -0.8603057861328125, -0.819061279296875, -0.7778167724609375, -0.736572265625, -0.6953277587890625, -0.654083251953125, -0.6128387451171875, -0.57159423828125, -0.5303497314453125, -0.489105224609375, -0.4478607177734375, -0.4066162109375, -0.3653717041015625, -0.324127197265625, -0.2828826904296875, -0.24163818359375, -0.2003936767578125, -0.159149169921875, -0.1179046630859375, -0.07666015625, -0.0354156494140625, 0.005828857421875, 0.0470733642578125, 0.08831787109375, 0.1295623779296875, 0.170806884765625, 0.2120513916015625, 0.2532958984375, 0.2945404052734375, 0.335784912109375, 0.3770294189453125, 0.41827392578125, 0.4595184326171875, 0.500762939453125, 0.5420074462890625, 0.583251953125, 0.6244964599609375, 0.665740966796875, 0.7069854736328125, 0.74822998046875, 0.7894744873046875, 0.830718994140625, 0.8719635009765625, 0.9132080078125, 0.9544525146484375, 0.995697021484375, 1.0369415283203125, 1.07818603515625, 1.1194305419921875, 1.160675048828125, 1.2019195556640625, 1.2431640625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 9.0, 5.0, 11.0, 7.0, 9.0, 15.0, 19.0, 22.0, 22.0, 28.0, 26.0, 41.0, 22.0, 38.0, 30.0, 42.0, 41.0, 45.0, 294.0, 770.0, 77.0, 38.0, 37.0, 43.0, 32.0, 43.0, 35.0, 30.0, 30.0, 27.0, 23.0, 21.0, 11.0, 14.0, 8.0, 9.0, 9.0, 7.0, 6.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.787109375, -2.7034912109375, -2.619873046875, -2.5362548828125, -2.45263671875, -2.3690185546875, -2.285400390625, -2.2017822265625, -2.1181640625, -2.0345458984375, -1.950927734375, -1.8673095703125, -1.78369140625, -1.7000732421875, -1.616455078125, -1.5328369140625, -1.44921875, -1.3656005859375, -1.281982421875, -1.1983642578125, -1.11474609375, -1.0311279296875, -0.947509765625, -0.8638916015625, -0.7802734375, -0.6966552734375, -0.613037109375, -0.5294189453125, -0.44580078125, -0.3621826171875, -0.278564453125, -0.1949462890625, -0.111328125, -0.0277099609375, 0.055908203125, 0.1395263671875, 0.22314453125, 0.3067626953125, 0.390380859375, 0.4739990234375, 0.5576171875, 0.6412353515625, 0.724853515625, 0.8084716796875, 0.89208984375, 0.9757080078125, 1.059326171875, 1.1429443359375, 1.2265625, 1.3101806640625, 1.393798828125, 1.4774169921875, 1.56103515625, 1.6446533203125, 1.728271484375, 1.8118896484375, 1.8955078125, 1.9791259765625, 2.062744140625, 2.1463623046875, 2.22998046875, 2.3135986328125, 2.397216796875, 2.4808349609375, 2.564453125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 1.0, 7.0, 4.0, 18.0, 21.0, 30.0, 47.0, 66.0, 97.0, 215.0, 195.0, 98.0, 63.0, 46.0, 36.0, 31.0, 11.0, 3.0, 6.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.649308204650879, -13.836520195007324, -13.023733139038086, -12.210945129394531, -11.398158073425293, -10.585370063781738, -9.7725830078125, -8.959794998168945, -8.14700698852539, -7.334219455718994, -6.521431922912598, -5.708643913269043, -4.895856857299805, -4.08306884765625, -3.2702813148498535, -2.457493782043457, -1.6447067260742188, -0.8319191336631775, -0.01913154125213623, 0.7936561107635498, 1.6064436435699463, 2.419231414794922, 3.2320189476013184, 4.044806480407715, 4.857594013214111, 5.670381546020508, 6.483169078826904, 7.295956611633301, 8.108744621276855, 8.921531677246094, 9.734319686889648, 10.547107696533203, 11.359895706176758, 12.172683715820312, 12.98547077178955, 13.798258781433105, 14.611045837402344, 15.423833847045898, 16.236621856689453, 17.049407958984375, 17.86219596862793, 18.674983978271484, 19.48777198791504, 20.30055809020996, 21.113346099853516, 21.92613410949707, 22.738922119140625, 23.551708221435547, 24.364498138427734, 25.17728614807129, 25.990074157714844, 26.802860260009766, 27.61564826965332, 28.428436279296875, 29.24122428894043, 30.054012298583984, 30.866798400878906, 31.67958641052246, 32.492374420166016, 33.30516052246094, 34.117950439453125, 34.93073654174805, 35.74352264404297, 36.556312561035156, 37.36909866333008]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 4.0, 13.0, 12.0, 7.0, 15.0, 23.0, 23.0, 29.0, 25.0, 32.0, 58.0, 84.0, 91.0, 142.0, 106.0, 88.0, 48.0, 36.0, 28.0, 24.0, 19.0, 17.0, 19.0, 12.0, 9.0, 7.0, 4.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-43.04505157470703, -41.72314453125, -40.40123748779297, -39.0793342590332, -37.75742721557617, -36.43552017211914, -35.11361312866211, -33.79170608520508, -32.46980285644531, -31.14789581298828, -29.825990676879883, -28.50408363342285, -27.182178497314453, -25.860271453857422, -24.53836441040039, -23.21645736694336, -21.894550323486328, -20.572643280029297, -19.2507381439209, -17.928831100463867, -16.60692596435547, -15.285018920898438, -13.963111877441406, -12.641205787658691, -11.319299697875977, -9.997393608093262, -8.675487518310547, -7.353580474853516, -6.031674385070801, -4.709768295288086, -3.387861728668213, -2.06595516204834, -0.744049072265625, 0.577857255935669, 1.899763584136963, 3.221669912338257, 4.543576240539551, 5.865482330322266, 7.187388896942139, 8.509295463562012, 9.831201553344727, 11.153107643127441, 12.475013732910156, 13.796920776367188, 15.118826866149902, 16.440732955932617, 17.76263999938965, 19.084545135498047, 20.406452178955078, 21.72835922241211, 23.050264358520508, 24.37217140197754, 25.694076538085938, 27.01598358154297, 28.337890625, 29.65979766845703, 30.98170280456543, 32.30360794067383, 33.62551498413086, 34.94742202758789, 36.26932907104492, 37.59123229980469, 38.91313934326172, 40.23504638671875, 41.55695343017578]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 10.0, 7.0, 6.0, 22.0, 23.0, 23.0, 37.0, 41.0, 74.0, 91.0, 131.0, 194.0, 313.0, 497.0, 870.0, 1597.0, 3123.0, 6814.0, 18794.0, 77610.0, 3672268.0, 349515.0, 39735.0, 12243.0, 4860.0, 2307.0, 1128.0, 690.0, 416.0, 275.0, 161.0, 125.0, 77.0, 59.0, 33.0, 41.0, 23.0, 11.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.10150146484375, -0.09866523742675781, -0.09582901000976562, -0.09299278259277344, -0.09015655517578125, -0.08732032775878906, -0.08448410034179688, -0.08164787292480469, -0.0788116455078125, -0.07597541809082031, -0.07313919067382812, -0.07030296325683594, -0.06746673583984375, -0.06463050842285156, -0.061794281005859375, -0.05895805358886719, -0.056121826171875, -0.05328559875488281, -0.050449371337890625, -0.04761314392089844, -0.04477691650390625, -0.04194068908691406, -0.039104461669921875, -0.03626823425292969, -0.0334320068359375, -0.030595779418945312, -0.027759552001953125, -0.024923324584960938, -0.02208709716796875, -0.019250869750976562, -0.016414642333984375, -0.013578414916992188, -0.0107421875, -0.007905960083007812, -0.005069732666015625, -0.0022335052490234375, 0.00060272216796875, 0.0034389495849609375, 0.006275177001953125, 0.009111404418945312, 0.0119476318359375, 0.014783859252929688, 0.017620086669921875, 0.020456314086914062, 0.02329254150390625, 0.026128768920898438, 0.028964996337890625, 0.03180122375488281, 0.034637451171875, 0.03747367858886719, 0.040309906005859375, 0.04314613342285156, 0.04598236083984375, 0.04881858825683594, 0.051654815673828125, 0.05449104309082031, 0.0573272705078125, 0.06016349792480469, 0.06299972534179688, 0.06583595275878906, 0.06867218017578125, 0.07150840759277344, 0.07434463500976562, 0.07718086242675781, 0.08001708984375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 2.0, 4.0, 7.0, 10.0, 12.0, 12.0, 15.0, 17.0, 18.0, 26.0, 36.0, 59.0, 62.0, 163.0, 210.0, 85.0, 43.0, 44.0, 35.0, 22.0, 19.0, 20.0, 10.0, 9.0, 7.0, 7.0, 7.0, 5.0, 3.0, 3.0, 5.0, 5.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02532958984375, -0.024565696716308594, -0.023801803588867188, -0.02303791046142578, -0.022274017333984375, -0.02151012420654297, -0.020746231079101562, -0.019982337951660156, -0.01921844482421875, -0.018454551696777344, -0.017690658569335938, -0.01692676544189453, -0.016162872314453125, -0.015398979187011719, -0.014635086059570312, -0.013871192932128906, -0.0131072998046875, -0.012343406677246094, -0.011579513549804688, -0.010815620422363281, -0.010051727294921875, -0.009287834167480469, -0.008523941040039062, -0.007760047912597656, -0.00699615478515625, -0.006232261657714844, -0.0054683685302734375, -0.004704475402832031, -0.003940582275390625, -0.0031766891479492188, -0.0024127960205078125, -0.0016489028930664062, -0.000885009765625, -0.00012111663818359375, 0.0006427764892578125, 0.0014066696166992188, 0.002170562744140625, 0.0029344558715820312, 0.0036983489990234375, 0.004462242126464844, 0.00522613525390625, 0.005990028381347656, 0.0067539215087890625, 0.007517814636230469, 0.008281707763671875, 0.009045600891113281, 0.009809494018554688, 0.010573387145996094, 0.0113372802734375, 0.012101173400878906, 0.012865066528320312, 0.013628959655761719, 0.014392852783203125, 0.015156745910644531, 0.015920639038085938, 0.016684532165527344, 0.01744842529296875, 0.018212318420410156, 0.018976211547851562, 0.01974010467529297, 0.020503997802734375, 0.02126789093017578, 0.022031784057617188, 0.022795677185058594, 0.0235595703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 10.0, 13.0, 17.0, 22.0, 27.0, 61.0, 85.0, 170.0, 323.0, 954.0, 3051.0, 12367.0, 72813.0, 1129495.0, 2828733.0, 122123.0, 17846.0, 3958.0, 1254.0, 477.0, 203.0, 111.0, 63.0, 38.0, 23.0, 13.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1063232421875, -0.10329532623291016, -0.10026741027832031, -0.09723949432373047, -0.09421157836914062, -0.09118366241455078, -0.08815574645996094, -0.0851278305053711, -0.08209991455078125, -0.0790719985961914, -0.07604408264160156, -0.07301616668701172, -0.06998825073242188, -0.06696033477783203, -0.06393241882324219, -0.060904502868652344, -0.0578765869140625, -0.054848670959472656, -0.05182075500488281, -0.04879283905029297, -0.045764923095703125, -0.04273700714111328, -0.03970909118652344, -0.036681175231933594, -0.03365325927734375, -0.030625343322753906, -0.027597427368164062, -0.02456951141357422, -0.021541595458984375, -0.01851367950439453, -0.015485763549804688, -0.012457847595214844, -0.009429931640625, -0.006402015686035156, -0.0033740997314453125, -0.00034618377685546875, 0.002681732177734375, 0.005709648132324219, 0.008737564086914062, 0.011765480041503906, 0.01479339599609375, 0.017821311950683594, 0.020849227905273438, 0.02387714385986328, 0.026905059814453125, 0.02993297576904297, 0.03296089172363281, 0.035988807678222656, 0.0390167236328125, 0.042044639587402344, 0.04507255554199219, 0.04810047149658203, 0.051128387451171875, 0.05415630340576172, 0.05718421936035156, 0.060212135314941406, 0.06324005126953125, 0.0662679672241211, 0.06929588317871094, 0.07232379913330078, 0.07535171508789062, 0.07837963104248047, 0.08140754699707031, 0.08443546295166016, 0.08746337890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 7.0, 8.0, 8.0, 4.0, 19.0, 14.0, 22.0, 27.0, 31.0, 45.0, 52.0, 78.0, 124.0, 197.0, 347.0, 626.0, 985.0, 520.0, 314.0, 172.0, 123.0, 89.0, 86.0, 44.0, 38.0, 31.0, 20.0, 12.0, 11.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022186279296875, -0.02137613296508789, -0.02056598663330078, -0.019755840301513672, -0.018945693969726562, -0.018135547637939453, -0.017325401306152344, -0.016515254974365234, -0.015705108642578125, -0.014894962310791016, -0.014084815979003906, -0.013274669647216797, -0.012464523315429688, -0.011654376983642578, -0.010844230651855469, -0.01003408432006836, -0.00922393798828125, -0.00841379165649414, -0.007603645324707031, -0.006793498992919922, -0.0059833526611328125, -0.005173206329345703, -0.004363059997558594, -0.0035529136657714844, -0.002742767333984375, -0.0019326210021972656, -0.0011224746704101562, -0.0003123283386230469, 0.0004978179931640625, 0.0013079643249511719, 0.0021181106567382812, 0.0029282569885253906, 0.0037384033203125, 0.004548549652099609, 0.005358695983886719, 0.006168842315673828, 0.0069789886474609375, 0.007789134979248047, 0.008599281311035156, 0.009409427642822266, 0.010219573974609375, 0.011029720306396484, 0.011839866638183594, 0.012650012969970703, 0.013460159301757812, 0.014270305633544922, 0.015080451965332031, 0.01589059829711914, 0.01670074462890625, 0.01751089096069336, 0.01832103729248047, 0.019131183624267578, 0.019941329956054688, 0.020751476287841797, 0.021561622619628906, 0.022371768951416016, 0.023181915283203125, 0.023992061614990234, 0.024802207946777344, 0.025612354278564453, 0.026422500610351562, 0.027232646942138672, 0.02804279327392578, 0.02885293960571289, 0.0296630859375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 10.0, 31.0, 97.0, 258.0, 329.0, 173.0, 68.0, 20.0, 10.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2873302400112152, -0.277182936668396, -0.2670356333255768, -0.25688835978507996, -0.24674105644226074, -0.23659375309944153, -0.22644644975662231, -0.2162991613149643, -0.20615187287330627, -0.19600456953048706, -0.18585728108882904, -0.17570997774600983, -0.1655626893043518, -0.1554153859615326, -0.14526808261871338, -0.13512079417705536, -0.12497349083423615, -0.11482619494199753, -0.10467889904975891, -0.0945315957069397, -0.08438430726528168, -0.07423700392246246, -0.06408970803022385, -0.05394241213798523, -0.04379511624574661, -0.033647820353507996, -0.02350052259862423, -0.013353224843740463, -0.0032059289515018463, 0.006941366940736771, 0.017088666558265686, 0.027235962450504303, 0.03738325834274292, 0.04753055423498154, 0.057677850127220154, 0.06782515347003937, 0.07797244191169739, 0.0881197452545166, 0.09826704114675522, 0.10841433703899384, 0.11856163293123245, 0.12870892882347107, 0.13885623216629028, 0.1490035206079483, 0.15915082395076752, 0.16929811239242554, 0.17944541573524475, 0.18959271907806396, 0.19974000751972198, 0.2098873108625412, 0.22003459930419922, 0.23018190264701843, 0.24032919108867645, 0.2504764795303345, 0.2606237828731537, 0.2707710862159729, 0.2809183895587921, 0.29106569290161133, 0.30121299624443054, 0.31136026978492737, 0.3215075731277466, 0.3316548764705658, 0.341802179813385, 0.35194945335388184, 0.36209675669670105]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 2.0, 8.0, 3.0, 8.0, 8.0, 13.0, 16.0, 15.0, 22.0, 25.0, 38.0, 46.0, 46.0, 26.0, 47.0, 57.0, 48.0, 52.0, 65.0, 49.0, 56.0, 38.0, 44.0, 37.0, 31.0, 35.0, 23.0, 29.0, 29.0, 13.0, 22.0, 9.0, 8.0, 6.0, 6.0, 9.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.10206902027130127, -0.09882151335477829, -0.09557400643825531, -0.09232649207115173, -0.08907898515462875, -0.08583147823810577, -0.0825839638710022, -0.07933645695447922, -0.07608895003795624, -0.07284144312143326, -0.06959393620491028, -0.0663464218378067, -0.06309891492128372, -0.05985140800476074, -0.056603897362947464, -0.053356386721134186, -0.050108879804611206, -0.046861372888088226, -0.04361386224627495, -0.04036635160446167, -0.03711884468793869, -0.03387133777141571, -0.030623827129602432, -0.027376318350434303, -0.024128809571266174, -0.020881300792098045, -0.017633792012929916, -0.014386283233761787, -0.011138774454593658, -0.00789126567542553, -0.0046437568962574005, -0.0013962481170892715, 0.0018512606620788574, 0.005098769441246986, 0.008346278220415115, 0.011593786999583244, 0.014841295778751373, 0.018088804557919502, 0.02133631333708763, 0.02458382211625576, 0.02783133089542389, 0.031078839674592018, 0.03432634845376015, 0.037573859095573425, 0.040821366012096405, 0.044068872928619385, 0.04731638357043266, 0.05056389421224594, 0.05381140112876892, 0.0570589080452919, 0.06030641868710518, 0.06355392932891846, 0.06680143624544144, 0.07004894316196442, 0.073296457529068, 0.07654396444559097, 0.07979147136211395, 0.08303897827863693, 0.08628648519515991, 0.08953399956226349, 0.09278150647878647, 0.09602901339530945, 0.09927652776241302, 0.102524034678936, 0.10577154159545898]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 15.0, 22.0, 33.0, 46.0, 69.0, 95.0, 172.0, 217.0, 321.0, 485.0, 766.0, 1170.0, 1736.0, 2735.0, 4753.0, 7903.0, 14722.0, 29842.0, 71374.0, 331052.0, 431888.0, 79688.0, 32028.0, 15810.0, 8368.0, 4933.0, 2946.0, 1870.0, 1172.0, 763.0, 492.0, 354.0, 239.0, 150.0, 108.0, 69.0, 47.0, 31.0, 26.0, 11.0, 12.0, 7.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.08416748046875, -0.08176612854003906, -0.07936477661132812, -0.07696342468261719, -0.07456207275390625, -0.07216072082519531, -0.06975936889648438, -0.06735801696777344, -0.0649566650390625, -0.06255531311035156, -0.060153961181640625, -0.05775260925292969, -0.05535125732421875, -0.05294990539550781, -0.050548553466796875, -0.04814720153808594, -0.045745849609375, -0.04334449768066406, -0.040943145751953125, -0.03854179382324219, -0.03614044189453125, -0.03373908996582031, -0.031337738037109375, -0.028936386108398438, -0.0265350341796875, -0.024133682250976562, -0.021732330322265625, -0.019330978393554688, -0.01692962646484375, -0.014528274536132812, -0.012126922607421875, -0.009725570678710938, -0.00732421875, -0.0049228668212890625, -0.002521514892578125, -0.0001201629638671875, 0.00228118896484375, 0.0046825408935546875, 0.007083892822265625, 0.009485244750976562, 0.0118865966796875, 0.014287948608398438, 0.016689300537109375, 0.019090652465820312, 0.02149200439453125, 0.023893356323242188, 0.026294708251953125, 0.028696060180664062, 0.031097412109375, 0.03349876403808594, 0.035900115966796875, 0.03830146789550781, 0.04070281982421875, 0.04310417175292969, 0.045505523681640625, 0.04790687561035156, 0.0503082275390625, 0.05270957946777344, 0.055110931396484375, 0.05751228332519531, 0.05991363525390625, 0.06231498718261719, 0.06471633911132812, 0.06711769104003906, 0.06951904296875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 12.0, 18.0, 19.0, 18.0, 22.0, 33.0, 36.0, 50.0, 77.0, 205.0, 144.0, 79.0, 52.0, 45.0, 30.0, 19.0, 16.0, 12.0, 8.0, 21.0, 4.0, 6.0, 7.0, 7.0, 2.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.02667236328125, -0.02595043182373047, -0.025228500366210938, -0.024506568908691406, -0.023784637451171875, -0.023062705993652344, -0.022340774536132812, -0.02161884307861328, -0.02089691162109375, -0.02017498016357422, -0.019453048706054688, -0.018731117248535156, -0.018009185791015625, -0.017287254333496094, -0.016565322875976562, -0.01584339141845703, -0.0151214599609375, -0.014399528503417969, -0.013677597045898438, -0.012955665588378906, -0.012233734130859375, -0.011511802673339844, -0.010789871215820312, -0.010067939758300781, -0.00934600830078125, -0.008624076843261719, -0.007902145385742188, -0.007180213928222656, -0.006458282470703125, -0.005736351013183594, -0.0050144195556640625, -0.004292488098144531, -0.003570556640625, -0.0028486251831054688, -0.0021266937255859375, -0.0014047622680664062, -0.000682830810546875, 3.910064697265625e-05, 0.0007610321044921875, 0.0014829635620117188, 0.00220489501953125, 0.0029268264770507812, 0.0036487579345703125, 0.004370689392089844, 0.005092620849609375, 0.005814552307128906, 0.0065364837646484375, 0.007258415222167969, 0.0079803466796875, 0.008702278137207031, 0.009424209594726562, 0.010146141052246094, 0.010868072509765625, 0.011590003967285156, 0.012311935424804688, 0.013033866882324219, 0.01375579833984375, 0.014477729797363281, 0.015199661254882812, 0.015921592712402344, 0.016643524169921875, 0.017365455627441406, 0.018087387084960938, 0.01880931854248047, 0.01953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 10.0, 9.0, 14.0, 11.0, 26.0, 24.0, 40.0, 59.0, 80.0, 114.0, 182.0, 330.0, 615.0, 1298.0, 3199.0, 9195.0, 31794.0, 140352.0, 547163.0, 243017.0, 49557.0, 13439.0, 4491.0, 1685.0, 764.0, 410.0, 197.0, 144.0, 99.0, 60.0, 47.0, 37.0, 27.0, 11.0, 17.0, 14.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06927490234375, -0.0670156478881836, -0.06475639343261719, -0.06249713897705078, -0.060237884521484375, -0.05797863006591797, -0.05571937561035156, -0.053460121154785156, -0.05120086669921875, -0.048941612243652344, -0.04668235778808594, -0.04442310333251953, -0.042163848876953125, -0.03990459442138672, -0.03764533996582031, -0.035386085510253906, -0.0331268310546875, -0.030867576599121094, -0.028608322143554688, -0.02634906768798828, -0.024089813232421875, -0.02183055877685547, -0.019571304321289062, -0.017312049865722656, -0.01505279541015625, -0.012793540954589844, -0.010534286499023438, -0.008275032043457031, -0.006015777587890625, -0.0037565231323242188, -0.0014972686767578125, 0.0007619857788085938, 0.003021240234375, 0.005280494689941406, 0.0075397491455078125, 0.009799003601074219, 0.012058258056640625, 0.014317512512207031, 0.016576766967773438, 0.018836021423339844, 0.02109527587890625, 0.023354530334472656, 0.025613784790039062, 0.02787303924560547, 0.030132293701171875, 0.03239154815673828, 0.03465080261230469, 0.036910057067871094, 0.0391693115234375, 0.041428565979003906, 0.04368782043457031, 0.04594707489013672, 0.048206329345703125, 0.05046558380126953, 0.05272483825683594, 0.054984092712402344, 0.05724334716796875, 0.059502601623535156, 0.06176185607910156, 0.06402111053466797, 0.06628036499023438, 0.06853961944580078, 0.07079887390136719, 0.0730581283569336, 0.0753173828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 8.0, 5.0, 2.0, 7.0, 8.0, 15.0, 8.0, 10.0, 19.0, 28.0, 26.0, 25.0, 29.0, 38.0, 41.0, 56.0, 42.0, 47.0, 32.0, 46.0, 42.0, 49.0, 54.0, 35.0, 50.0, 43.0, 27.0, 24.0, 30.0, 31.0, 24.0, 18.0, 14.0, 21.0, 13.0, 12.0, 6.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.087646484375, -0.0846567153930664, -0.08166694641113281, -0.07867717742919922, -0.07568740844726562, -0.07269763946533203, -0.06970787048339844, -0.06671810150146484, -0.06372833251953125, -0.060738563537597656, -0.05774879455566406, -0.05475902557373047, -0.051769256591796875, -0.04877948760986328, -0.04578971862792969, -0.042799949645996094, -0.0398101806640625, -0.036820411682128906, -0.03383064270019531, -0.03084087371826172, -0.027851104736328125, -0.02486133575439453, -0.021871566772460938, -0.018881797790527344, -0.01589202880859375, -0.012902259826660156, -0.009912490844726562, -0.006922721862792969, -0.003932952880859375, -0.0009431838989257812, 0.0020465850830078125, 0.005036354064941406, 0.008026123046875, 0.011015892028808594, 0.014005661010742188, 0.01699542999267578, 0.019985198974609375, 0.02297496795654297, 0.025964736938476562, 0.028954505920410156, 0.03194427490234375, 0.034934043884277344, 0.03792381286621094, 0.04091358184814453, 0.043903350830078125, 0.04689311981201172, 0.04988288879394531, 0.052872657775878906, 0.0558624267578125, 0.058852195739746094, 0.06184196472167969, 0.06483173370361328, 0.06782150268554688, 0.07081127166748047, 0.07380104064941406, 0.07679080963134766, 0.07978057861328125, 0.08277034759521484, 0.08576011657714844, 0.08874988555908203, 0.09173965454101562, 0.09472942352294922, 0.09771919250488281, 0.1007089614868164, 0.10369873046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 8.0, 10.0, 15.0, 33.0, 45.0, 68.0, 100.0, 160.0, 293.0, 553.0, 1132.0, 2901.0, 9478.0, 56323.0, 754507.0, 196603.0, 18425.0, 4517.0, 1717.0, 723.0, 366.0, 215.0, 137.0, 73.0, 46.0, 34.0, 20.0, 13.0, 9.0, 11.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07305908203125, -0.07010364532470703, -0.06714820861816406, -0.0641927719116211, -0.061237335205078125, -0.058281898498535156, -0.05532646179199219, -0.05237102508544922, -0.04941558837890625, -0.04646015167236328, -0.04350471496582031, -0.040549278259277344, -0.037593841552734375, -0.034638404846191406, -0.03168296813964844, -0.02872753143310547, -0.0257720947265625, -0.02281665802001953, -0.019861221313476562, -0.016905784606933594, -0.013950347900390625, -0.010994911193847656, -0.008039474487304688, -0.005084037780761719, -0.00212860107421875, 0.0008268356323242188, 0.0037822723388671875, 0.006737709045410156, 0.009693145751953125, 0.012648582458496094, 0.015604019165039062, 0.01855945587158203, 0.021514892578125, 0.02447032928466797, 0.027425765991210938, 0.030381202697753906, 0.033336639404296875, 0.036292076110839844, 0.03924751281738281, 0.04220294952392578, 0.04515838623046875, 0.04811382293701172, 0.05106925964355469, 0.054024696350097656, 0.056980133056640625, 0.059935569763183594, 0.06289100646972656, 0.06584644317626953, 0.0688018798828125, 0.07175731658935547, 0.07471275329589844, 0.0776681900024414, 0.08062362670898438, 0.08357906341552734, 0.08653450012207031, 0.08948993682861328, 0.09244537353515625, 0.09540081024169922, 0.09835624694824219, 0.10131168365478516, 0.10426712036132812, 0.1072225570678711, 0.11017799377441406, 0.11313343048095703, 0.1160888671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 5.0, 5.0, 11.0, 12.0, 13.0, 21.0, 28.0, 33.0, 32.0, 51.0, 55.0, 63.0, 77.0, 59.0, 51.0, 71.0, 59.0, 60.0, 47.0, 46.0, 41.0, 28.0, 22.0, 22.0, 16.0, 14.0, 9.0, 6.0, 14.0, 5.0, 2.0, 3.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.1961669921875e-05, -4.0629878640174866e-05, -3.929808735847473e-05, -3.79662960767746e-05, -3.663450479507446e-05, -3.530271351337433e-05, -3.3970922231674194e-05, -3.263913094997406e-05, -3.1307339668273926e-05, -2.997554838657379e-05, -2.8643757104873657e-05, -2.7311965823173523e-05, -2.598017454147339e-05, -2.4648383259773254e-05, -2.331659197807312e-05, -2.1984800696372986e-05, -2.065300941467285e-05, -1.9321218132972717e-05, -1.7989426851272583e-05, -1.665763556957245e-05, -1.5325844287872314e-05, -1.399405300617218e-05, -1.2662261724472046e-05, -1.1330470442771912e-05, -9.998679161071777e-06, -8.666887879371643e-06, -7.335096597671509e-06, -6.0033053159713745e-06, -4.67151403427124e-06, -3.339722752571106e-06, -2.0079314708709717e-06, -6.761401891708374e-07, 6.556510925292969e-07, 1.987442374229431e-06, 3.3192336559295654e-06, 4.6510249376297e-06, 5.982816219329834e-06, 7.314607501029968e-06, 8.646398782730103e-06, 9.978190064430237e-06, 1.1309981346130371e-05, 1.2641772627830505e-05, 1.397356390953064e-05, 1.5305355191230774e-05, 1.6637146472930908e-05, 1.7968937754631042e-05, 1.9300729036331177e-05, 2.063252031803131e-05, 2.1964311599731445e-05, 2.329610288143158e-05, 2.4627894163131714e-05, 2.5959685444831848e-05, 2.7291476726531982e-05, 2.8623268008232117e-05, 2.995505928993225e-05, 3.1286850571632385e-05, 3.261864185333252e-05, 3.3950433135032654e-05, 3.528222441673279e-05, 3.661401569843292e-05, 3.794580698013306e-05, 3.927759826183319e-05, 4.0609389543533325e-05, 4.194118082523346e-05, 4.3272972106933594e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 0.0, 5.0, 7.0, 20.0, 19.0, 31.0, 49.0, 78.0, 137.0, 274.0, 509.0, 1241.0, 3416.0, 13541.0, 139384.0, 805082.0, 70595.0, 9544.0, 2710.0, 977.0, 445.0, 207.0, 113.0, 63.0, 27.0, 26.0, 12.0, 12.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1275634765625, -0.12415122985839844, -0.12073898315429688, -0.11732673645019531, -0.11391448974609375, -0.11050224304199219, -0.10708999633789062, -0.10367774963378906, -0.1002655029296875, -0.09685325622558594, -0.09344100952148438, -0.09002876281738281, -0.08661651611328125, -0.08320426940917969, -0.07979202270507812, -0.07637977600097656, -0.072967529296875, -0.06955528259277344, -0.06614303588867188, -0.06273078918457031, -0.05931854248046875, -0.05590629577636719, -0.052494049072265625, -0.04908180236816406, -0.0456695556640625, -0.04225730895996094, -0.038845062255859375, -0.03543281555175781, -0.03202056884765625, -0.028608322143554688, -0.025196075439453125, -0.021783828735351562, -0.01837158203125, -0.014959335327148438, -0.011547088623046875, -0.008134841918945312, -0.00472259521484375, -0.0013103485107421875, 0.002101898193359375, 0.0055141448974609375, 0.0089263916015625, 0.012338638305664062, 0.015750885009765625, 0.019163131713867188, 0.02257537841796875, 0.025987625122070312, 0.029399871826171875, 0.03281211853027344, 0.036224365234375, 0.03963661193847656, 0.043048858642578125, 0.04646110534667969, 0.04987335205078125, 0.05328559875488281, 0.056697845458984375, 0.06011009216308594, 0.0635223388671875, 0.06693458557128906, 0.07034683227539062, 0.07375907897949219, 0.07717132568359375, 0.08058357238769531, 0.08399581909179688, 0.08740806579589844, 0.0908203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 13.0, 5.0, 16.0, 10.0, 9.0, 17.0, 42.0, 51.0, 69.0, 82.0, 81.0, 101.0, 95.0, 89.0, 78.0, 60.0, 52.0, 32.0, 22.0, 24.0, 11.0, 9.0, 5.0, 5.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052581787109375, -0.05039072036743164, -0.04819965362548828, -0.04600858688354492, -0.04381752014160156, -0.0416264533996582, -0.039435386657714844, -0.037244319915771484, -0.035053253173828125, -0.032862186431884766, -0.030671119689941406, -0.028480052947998047, -0.026288986206054688, -0.024097919464111328, -0.02190685272216797, -0.01971578598022461, -0.01752471923828125, -0.01533365249633789, -0.013142585754394531, -0.010951519012451172, -0.008760452270507812, -0.006569385528564453, -0.004378318786621094, -0.0021872520446777344, 3.814697265625e-06, 0.0021948814392089844, 0.004385948181152344, 0.006577014923095703, 0.008768081665039062, 0.010959148406982422, 0.013150215148925781, 0.01534128189086914, 0.0175323486328125, 0.01972341537475586, 0.02191448211669922, 0.024105548858642578, 0.026296615600585938, 0.028487682342529297, 0.030678749084472656, 0.032869815826416016, 0.035060882568359375, 0.037251949310302734, 0.039443016052246094, 0.04163408279418945, 0.04382514953613281, 0.04601621627807617, 0.04820728302001953, 0.05039834976196289, 0.05258941650390625, 0.05478048324584961, 0.05697154998779297, 0.05916261672973633, 0.06135368347167969, 0.06354475021362305, 0.0657358169555664, 0.06792688369750977, 0.07011795043945312, 0.07230901718139648, 0.07450008392333984, 0.0766911506652832, 0.07888221740722656, 0.08107328414916992, 0.08326435089111328, 0.08545541763305664, 0.087646484375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 11.0, 17.0, 48.0, 95.0, 266.0, 287.0, 146.0, 61.0, 24.0, 16.0, 6.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5372573733329773, -0.503674328327179, -0.4700912833213806, -0.4365082383155823, -0.40292519330978394, -0.3693421483039856, -0.33575907349586487, -0.30217602849006653, -0.2685929834842682, -0.23500993847846985, -0.2014268934726715, -0.16784383356571198, -0.13426078855991364, -0.1006777435541153, -0.06709468364715576, -0.03351163864135742, 7.140636444091797e-05, 0.033654455095529556, 0.0672375038266182, 0.10082055628299713, 0.13440360128879547, 0.1679866462945938, 0.20156970620155334, 0.23515275120735168, 0.26873579621315, 0.30231884121894836, 0.3359018862247467, 0.36948496103286743, 0.40306800603866577, 0.4366510510444641, 0.47023409605026245, 0.5038171410560608, 0.5374002456665039, 0.5709832906723022, 0.6045663356781006, 0.6381493806838989, 0.6717324256896973, 0.7053154706954956, 0.738898515701294, 0.7724815607070923, 0.8060646057128906, 0.839647650718689, 0.8732306957244873, 0.9068137407302856, 0.940396785736084, 0.9739798307418823, 1.0075628757476807, 1.041145920753479, 1.0747289657592773, 1.1083120107650757, 1.141895055770874, 1.1754781007766724, 1.2090611457824707, 1.242644190788269, 1.2762272357940674, 1.3098102807998657, 1.3433934450149536, 1.376976490020752, 1.4105595350265503, 1.4441425800323486, 1.477725625038147, 1.5113086700439453, 1.5448917150497437, 1.578474760055542, 1.6120578050613403]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 1.0, 9.0, 4.0, 8.0, 8.0, 11.0, 19.0, 20.0, 45.0, 73.0, 88.0, 118.0, 147.0, 128.0, 96.0, 60.0, 49.0, 34.0, 14.0, 15.0, 12.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.849938988685608, -1.7947429418563843, -1.7395468950271606, -1.684350848197937, -1.6291548013687134, -1.5739587545394897, -1.5187625885009766, -1.463566541671753, -1.4083704948425293, -1.3531744480133057, -1.297978401184082, -1.2427823543548584, -1.1875863075256348, -1.1323902606964111, -1.0771942138671875, -1.0219981670379639, -0.9668021202087402, -0.9116060733795166, -0.856410026550293, -0.8012139797210693, -0.7460179328918457, -0.6908218860626221, -0.6356257796287537, -0.58042973279953, -0.5252336859703064, -0.47003763914108276, -0.41484159231185913, -0.3596455156803131, -0.3044494688510895, -0.24925342202186584, -0.19405734539031982, -0.1388612985610962, -0.08366537094116211, -0.02846931666135788, 0.02672673761844635, 0.08192279934883118, 0.1371188461780548, 0.19231489300727844, 0.24751096963882446, 0.3027070164680481, 0.35790306329727173, 0.41309911012649536, 0.468295156955719, 0.5234912633895874, 0.578687310218811, 0.6338833570480347, 0.6890794038772583, 0.7442754507064819, 0.7994714975357056, 0.8546675443649292, 0.9098635911941528, 0.9650596380233765, 1.0202556848526, 1.0754517316818237, 1.130647897720337, 1.1858439445495605, 1.2410399913787842, 1.2962360382080078, 1.3514320850372314, 1.406628131866455, 1.4618241786956787, 1.5170202255249023, 1.572216272354126, 1.6274123191833496, 1.6826083660125732]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 1.0, 17.0, 17.0, 23.0, 43.0, 61.0, 102.0, 134.0, 240.0, 372.0, 643.0, 1177.0, 2437.0, 5030.0, 12055.0, 37077.0, 204679.0, 3688597.0, 181115.0, 36960.0, 12484.0, 5346.0, 2466.0, 1249.0, 805.0, 464.0, 221.0, 151.0, 104.0, 72.0, 46.0, 39.0, 17.0, 13.0, 3.0, 7.0, 4.0, 0.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.198486328125, -0.1919727325439453, -0.18545913696289062, -0.17894554138183594, -0.17243194580078125, -0.16591835021972656, -0.15940475463867188, -0.1528911590576172, -0.1463775634765625, -0.1398639678955078, -0.13335037231445312, -0.12683677673339844, -0.12032318115234375, -0.11380958557128906, -0.10729598999023438, -0.10078239440917969, -0.094268798828125, -0.08775520324707031, -0.08124160766601562, -0.07472801208496094, -0.06821441650390625, -0.06170082092285156, -0.055187225341796875, -0.04867362976074219, -0.0421600341796875, -0.03564643859863281, -0.029132843017578125, -0.022619247436523438, -0.01610565185546875, -0.009592056274414062, -0.003078460693359375, 0.0034351348876953125, 0.00994873046875, 0.016462326049804688, 0.022975921630859375, 0.029489517211914062, 0.03600311279296875, 0.04251670837402344, 0.049030303955078125, 0.05554389953613281, 0.0620574951171875, 0.06857109069824219, 0.07508468627929688, 0.08159828186035156, 0.08811187744140625, 0.09462547302246094, 0.10113906860351562, 0.10765266418457031, 0.114166259765625, 0.12067985534667969, 0.12719345092773438, 0.13370704650878906, 0.14022064208984375, 0.14673423767089844, 0.15324783325195312, 0.1597614288330078, 0.1662750244140625, 0.1727886199951172, 0.17930221557617188, 0.18581581115722656, 0.19232940673828125, 0.19884300231933594, 0.20535659790039062, 0.2118701934814453, 0.2183837890625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 3.0, 6.0, 4.0, 7.0, 6.0, 9.0, 9.0, 29.0, 22.0, 30.0, 32.0, 49.0, 71.0, 132.0, 131.0, 117.0, 81.0, 56.0, 32.0, 29.0, 34.0, 20.0, 18.0, 11.0, 12.0, 4.0, 6.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0210723876953125, -0.020339012145996094, -0.019605636596679688, -0.01887226104736328, -0.018138885498046875, -0.01740550994873047, -0.016672134399414062, -0.015938758850097656, -0.01520538330078125, -0.014472007751464844, -0.013738632202148438, -0.013005256652832031, -0.012271881103515625, -0.011538505554199219, -0.010805130004882812, -0.010071754455566406, -0.00933837890625, -0.008605003356933594, -0.007871627807617188, -0.007138252258300781, -0.006404876708984375, -0.005671501159667969, -0.0049381256103515625, -0.004204750061035156, -0.00347137451171875, -0.0027379989624023438, -0.0020046234130859375, -0.0012712478637695312, -0.000537872314453125, 0.00019550323486328125, 0.0009288787841796875, 0.0016622543334960938, 0.0023956298828125, 0.0031290054321289062, 0.0038623809814453125, 0.004595756530761719, 0.005329132080078125, 0.006062507629394531, 0.0067958831787109375, 0.007529258728027344, 0.00826263427734375, 0.008996009826660156, 0.009729385375976562, 0.010462760925292969, 0.011196136474609375, 0.011929512023925781, 0.012662887573242188, 0.013396263122558594, 0.014129638671875, 0.014863014221191406, 0.015596389770507812, 0.01632976531982422, 0.017063140869140625, 0.01779651641845703, 0.018529891967773438, 0.019263267517089844, 0.01999664306640625, 0.020730018615722656, 0.021463394165039062, 0.02219676971435547, 0.022930145263671875, 0.02366352081298828, 0.024396896362304688, 0.025130271911621094, 0.0258636474609375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 1.0, 2.0, 9.0, 8.0, 12.0, 15.0, 27.0, 47.0, 61.0, 112.0, 163.0, 210.0, 405.0, 776.0, 1632.0, 4044.0, 11229.0, 39163.0, 201437.0, 3053336.0, 757107.0, 90818.0, 21507.0, 6930.0, 2693.0, 1138.0, 606.0, 308.0, 162.0, 101.0, 68.0, 43.0, 25.0, 19.0, 12.0, 13.0, 7.0, 6.0, 8.0, 3.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140625, -0.13590240478515625, -0.1311798095703125, -0.12645721435546875, -0.121734619140625, -0.11701202392578125, -0.1122894287109375, -0.10756683349609375, -0.10284423828125, -0.09812164306640625, -0.0933990478515625, -0.08867645263671875, -0.083953857421875, -0.07923126220703125, -0.0745086669921875, -0.06978607177734375, -0.0650634765625, -0.06034088134765625, -0.0556182861328125, -0.05089569091796875, -0.046173095703125, -0.04145050048828125, -0.0367279052734375, -0.03200531005859375, -0.02728271484375, -0.02256011962890625, -0.0178375244140625, -0.01311492919921875, -0.008392333984375, -0.00366973876953125, 0.0010528564453125, 0.00577545166015625, 0.010498046875, 0.01522064208984375, 0.0199432373046875, 0.02466583251953125, 0.029388427734375, 0.03411102294921875, 0.0388336181640625, 0.04355621337890625, 0.04827880859375, 0.05300140380859375, 0.0577239990234375, 0.06244659423828125, 0.067169189453125, 0.07189178466796875, 0.0766143798828125, 0.08133697509765625, 0.0860595703125, 0.09078216552734375, 0.0955047607421875, 0.10022735595703125, 0.104949951171875, 0.10967254638671875, 0.1143951416015625, 0.11911773681640625, 0.12384033203125, 0.12856292724609375, 0.1332855224609375, 0.13800811767578125, 0.142730712890625, 0.14745330810546875, 0.1521759033203125, 0.15689849853515625, 0.16162109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 9.0, 5.0, 7.0, 13.0, 21.0, 18.0, 39.0, 46.0, 47.0, 80.0, 123.0, 219.0, 392.0, 1174.0, 871.0, 341.0, 213.0, 138.0, 95.0, 64.0, 41.0, 27.0, 19.0, 16.0, 11.0, 6.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025604248046875, -0.024687767028808594, -0.023771286010742188, -0.02285480499267578, -0.021938323974609375, -0.02102184295654297, -0.020105361938476562, -0.019188880920410156, -0.01827239990234375, -0.017355918884277344, -0.016439437866210938, -0.015522956848144531, -0.014606475830078125, -0.013689994812011719, -0.012773513793945312, -0.011857032775878906, -0.0109405517578125, -0.010024070739746094, -0.009107589721679688, -0.008191108703613281, -0.007274627685546875, -0.006358146667480469, -0.0054416656494140625, -0.004525184631347656, -0.00360870361328125, -0.0026922225952148438, -0.0017757415771484375, -0.0008592605590820312, 5.7220458984375e-05, 0.0009737014770507812, 0.0018901824951171875, 0.0028066635131835938, 0.00372314453125, 0.004639625549316406, 0.0055561065673828125, 0.006472587585449219, 0.007389068603515625, 0.008305549621582031, 0.009222030639648438, 0.010138511657714844, 0.01105499267578125, 0.011971473693847656, 0.012887954711914062, 0.013804435729980469, 0.014720916748046875, 0.01563739776611328, 0.016553878784179688, 0.017470359802246094, 0.0183868408203125, 0.019303321838378906, 0.020219802856445312, 0.02113628387451172, 0.022052764892578125, 0.02296924591064453, 0.023885726928710938, 0.024802207946777344, 0.02571868896484375, 0.026635169982910156, 0.027551651000976562, 0.02846813201904297, 0.029384613037109375, 0.03030109405517578, 0.031217575073242188, 0.032134056091308594, 0.033050537109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 42.0, 109.0, 275.0, 292.0, 178.0, 60.0, 13.0, 6.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19298139214515686, -0.1829526126384735, -0.17292381823062897, -0.16289502382278442, -0.15286624431610107, -0.14283746480941772, -0.13280867040157318, -0.12277988344430923, -0.11275109648704529, -0.10272230952978134, -0.0926935225725174, -0.08266473561525345, -0.0726359486579895, -0.06260716170072556, -0.05257837474346161, -0.04254958778619766, -0.032520800828933716, -0.02249201387166977, -0.012463226914405823, -0.0024344399571418762, 0.00759434700012207, 0.017623133957386017, 0.027651920914649963, 0.03768070787191391, 0.047709494829177856, 0.0577382817864418, 0.06776706874370575, 0.0777958557009697, 0.08782464265823364, 0.09785342961549759, 0.10788221657276154, 0.11791100353002548, 0.12793979048728943, 0.13796856999397278, 0.14799736440181732, 0.15802615880966187, 0.16805493831634521, 0.17808371782302856, 0.1881125122308731, 0.19814130663871765, 0.208170086145401, 0.21819886565208435, 0.2282276600599289, 0.23825645446777344, 0.2482852339744568, 0.25831401348114014, 0.2683427929878235, 0.2783716022968292, 0.2884003818035126, 0.2984291613101959, 0.30845797061920166, 0.318486750125885, 0.32851552963256836, 0.3385443091392517, 0.34857308864593506, 0.3586018979549408, 0.36863067746162415, 0.3786594569683075, 0.38868826627731323, 0.3987170457839966, 0.40874582529067993, 0.4187746047973633, 0.42880338430404663, 0.43883219361305237, 0.4488609731197357]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 16.0, 17.0, 16.0, 22.0, 32.0, 36.0, 43.0, 59.0, 78.0, 66.0, 80.0, 92.0, 77.0, 56.0, 57.0, 46.0, 42.0, 31.0, 28.0, 23.0, 15.0, 14.0, 9.0, 7.0, 7.0, 3.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1550167202949524, -0.15049254894256592, -0.14596837759017944, -0.14144420623779297, -0.1369200348854065, -0.13239586353302002, -0.12787169218063354, -0.12334752082824707, -0.1188233494758606, -0.11429917812347412, -0.10977500677108765, -0.10525083541870117, -0.1007266640663147, -0.09620249271392822, -0.09167832136154175, -0.08715415000915527, -0.0826299786567688, -0.07810580730438232, -0.07358163595199585, -0.06905746459960938, -0.0645332932472229, -0.060009121894836426, -0.05548495054244995, -0.05096077919006348, -0.046436607837677, -0.04191243648529053, -0.03738826513290405, -0.03286409378051758, -0.028339922428131104, -0.02381575107574463, -0.019291579723358154, -0.01476740837097168, -0.010243237018585205, -0.0057190656661987305, -0.0011948943138122559, 0.0033292770385742188, 0.007853448390960693, 0.012377619743347168, 0.016901791095733643, 0.021425962448120117, 0.025950133800506592, 0.030474305152893066, 0.03499847650527954, 0.039522647857666016, 0.04404681921005249, 0.048570990562438965, 0.05309516191482544, 0.057619333267211914, 0.06214350461959839, 0.06666767597198486, 0.07119184732437134, 0.07571601867675781, 0.08024019002914429, 0.08476436138153076, 0.08928853273391724, 0.09381270408630371, 0.09833687543869019, 0.10286104679107666, 0.10738521814346313, 0.11190938949584961, 0.11643356084823608, 0.12095773220062256, 0.12548190355300903, 0.1300060749053955, 0.13453024625778198]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 4.0, 7.0, 14.0, 11.0, 17.0, 29.0, 30.0, 40.0, 88.0, 75.0, 135.0, 200.0, 348.0, 499.0, 755.0, 1241.0, 2062.0, 3452.0, 6255.0, 12144.0, 25351.0, 62115.0, 214958.0, 497036.0, 134698.0, 44945.0, 19446.0, 9660.0, 5190.0, 2965.0, 1751.0, 1076.0, 608.0, 423.0, 270.0, 214.0, 120.0, 80.0, 73.0, 41.0, 34.0, 23.0, 14.0, 16.0, 12.0, 4.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.10882568359375, -0.1055612564086914, -0.10229682922363281, -0.09903240203857422, -0.09576797485351562, -0.09250354766845703, -0.08923912048339844, -0.08597469329833984, -0.08271026611328125, -0.07944583892822266, -0.07618141174316406, -0.07291698455810547, -0.06965255737304688, -0.06638813018798828, -0.06312370300292969, -0.059859275817871094, -0.0565948486328125, -0.053330421447753906, -0.05006599426269531, -0.04680156707763672, -0.043537139892578125, -0.04027271270751953, -0.03700828552246094, -0.033743858337402344, -0.03047943115234375, -0.027215003967285156, -0.023950576782226562, -0.02068614959716797, -0.017421722412109375, -0.014157295227050781, -0.010892868041992188, -0.007628440856933594, -0.004364013671875, -0.0010995864868164062, 0.0021648406982421875, 0.005429267883300781, 0.008693695068359375, 0.011958122253417969, 0.015222549438476562, 0.018486976623535156, 0.02175140380859375, 0.025015830993652344, 0.028280258178710938, 0.03154468536376953, 0.034809112548828125, 0.03807353973388672, 0.04133796691894531, 0.044602394104003906, 0.0478668212890625, 0.051131248474121094, 0.05439567565917969, 0.05766010284423828, 0.060924530029296875, 0.06418895721435547, 0.06745338439941406, 0.07071781158447266, 0.07398223876953125, 0.07724666595458984, 0.08051109313964844, 0.08377552032470703, 0.08703994750976562, 0.09030437469482422, 0.09356880187988281, 0.0968332290649414, 0.10009765625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 4.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 13.0, 15.0, 14.0, 20.0, 28.0, 44.0, 43.0, 68.0, 100.0, 130.0, 120.0, 85.0, 54.0, 58.0, 35.0, 24.0, 21.0, 13.0, 20.0, 10.0, 12.0, 4.0, 3.0, 4.0, 8.0, 5.0, 1.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0231475830078125, -0.022467374801635742, -0.021787166595458984, -0.021106958389282227, -0.02042675018310547, -0.01974654197692871, -0.019066333770751953, -0.018386125564575195, -0.017705917358398438, -0.01702570915222168, -0.016345500946044922, -0.015665292739868164, -0.014985084533691406, -0.014304876327514648, -0.01362466812133789, -0.012944459915161133, -0.012264251708984375, -0.011584043502807617, -0.01090383529663086, -0.010223627090454102, -0.009543418884277344, -0.008863210678100586, -0.008183002471923828, -0.00750279426574707, -0.0068225860595703125, -0.006142377853393555, -0.005462169647216797, -0.004781961441040039, -0.004101753234863281, -0.0034215450286865234, -0.0027413368225097656, -0.002061128616333008, -0.00138092041015625, -0.0007007122039794922, -2.0503997802734375e-05, 0.0006597042083740234, 0.0013399124145507812, 0.002020120620727539, 0.002700328826904297, 0.0033805370330810547, 0.0040607452392578125, 0.00474095344543457, 0.005421161651611328, 0.006101369857788086, 0.006781578063964844, 0.0074617862701416016, 0.00814199447631836, 0.008822202682495117, 0.009502410888671875, 0.010182619094848633, 0.01086282730102539, 0.011543035507202148, 0.012223243713378906, 0.012903451919555664, 0.013583660125732422, 0.01426386833190918, 0.014944076538085938, 0.015624284744262695, 0.016304492950439453, 0.01698470115661621, 0.01766490936279297, 0.018345117568969727, 0.019025325775146484, 0.019705533981323242, 0.0203857421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 11.0, 9.0, 10.0, 17.0, 18.0, 40.0, 62.0, 82.0, 140.0, 217.0, 406.0, 749.0, 1468.0, 3274.0, 9272.0, 33653.0, 187660.0, 605458.0, 161643.0, 30181.0, 8129.0, 3005.0, 1385.0, 673.0, 375.0, 228.0, 145.0, 73.0, 53.0, 41.0, 20.0, 17.0, 5.0, 12.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097900390625, -0.09478759765625, -0.0916748046875, -0.08856201171875, -0.08544921875, -0.08233642578125, -0.0792236328125, -0.07611083984375, -0.072998046875, -0.06988525390625, -0.0667724609375, -0.06365966796875, -0.060546875, -0.05743408203125, -0.0543212890625, -0.05120849609375, -0.048095703125, -0.04498291015625, -0.0418701171875, -0.03875732421875, -0.03564453125, -0.03253173828125, -0.0294189453125, -0.02630615234375, -0.023193359375, -0.02008056640625, -0.0169677734375, -0.01385498046875, -0.0107421875, -0.00762939453125, -0.0045166015625, -0.00140380859375, 0.001708984375, 0.00482177734375, 0.0079345703125, 0.01104736328125, 0.01416015625, 0.01727294921875, 0.0203857421875, 0.02349853515625, 0.026611328125, 0.02972412109375, 0.0328369140625, 0.03594970703125, 0.0390625, 0.04217529296875, 0.0452880859375, 0.04840087890625, 0.051513671875, 0.05462646484375, 0.0577392578125, 0.06085205078125, 0.06396484375, 0.06707763671875, 0.0701904296875, 0.07330322265625, 0.076416015625, 0.07952880859375, 0.0826416015625, 0.08575439453125, 0.0888671875, 0.09197998046875, 0.0950927734375, 0.09820556640625, 0.101318359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 3.0, 3.0, 4.0, 5.0, 10.0, 13.0, 22.0, 19.0, 37.0, 28.0, 30.0, 41.0, 58.0, 46.0, 59.0, 50.0, 70.0, 56.0, 54.0, 49.0, 49.0, 49.0, 50.0, 36.0, 33.0, 32.0, 27.0, 21.0, 8.0, 13.0, 12.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.09783935546875, -0.09509849548339844, -0.09235763549804688, -0.08961677551269531, -0.08687591552734375, -0.08413505554199219, -0.08139419555664062, -0.07865333557128906, -0.0759124755859375, -0.07317161560058594, -0.07043075561523438, -0.06768989562988281, -0.06494903564453125, -0.06220817565917969, -0.059467315673828125, -0.05672645568847656, -0.053985595703125, -0.05124473571777344, -0.048503875732421875, -0.04576301574707031, -0.04302215576171875, -0.04028129577636719, -0.037540435791015625, -0.03479957580566406, -0.0320587158203125, -0.029317855834960938, -0.026576995849609375, -0.023836135864257812, -0.02109527587890625, -0.018354415893554688, -0.015613555908203125, -0.012872695922851562, -0.0101318359375, -0.0073909759521484375, -0.004650115966796875, -0.0019092559814453125, 0.00083160400390625, 0.0035724639892578125, 0.006313323974609375, 0.009054183959960938, 0.0117950439453125, 0.014535903930664062, 0.017276763916015625, 0.020017623901367188, 0.02275848388671875, 0.025499343872070312, 0.028240203857421875, 0.030981063842773438, 0.033721923828125, 0.03646278381347656, 0.039203643798828125, 0.04194450378417969, 0.04468536376953125, 0.04742622375488281, 0.050167083740234375, 0.05290794372558594, 0.0556488037109375, 0.05838966369628906, 0.061130523681640625, 0.06387138366699219, 0.06661224365234375, 0.06935310363769531, 0.07209396362304688, 0.07483482360839844, 0.07757568359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 11.0, 13.0, 20.0, 24.0, 32.0, 50.0, 87.0, 145.0, 220.0, 392.0, 816.0, 1822.0, 4952.0, 17845.0, 135905.0, 763815.0, 99894.0, 14932.0, 4301.0, 1616.0, 794.0, 339.0, 187.0, 108.0, 63.0, 54.0, 29.0, 29.0, 22.0, 8.0, 9.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.21875, -0.2134714126586914, -0.2081928253173828, -0.20291423797607422, -0.19763565063476562, -0.19235706329345703, -0.18707847595214844, -0.18179988861083984, -0.17652130126953125, -0.17124271392822266, -0.16596412658691406, -0.16068553924560547, -0.15540695190429688, -0.15012836456298828, -0.1448497772216797, -0.1395711898803711, -0.1342926025390625, -0.1290140151977539, -0.12373542785644531, -0.11845684051513672, -0.11317825317382812, -0.10789966583251953, -0.10262107849121094, -0.09734249114990234, -0.09206390380859375, -0.08678531646728516, -0.08150672912597656, -0.07622814178466797, -0.07094955444335938, -0.06567096710205078, -0.06039237976074219, -0.055113792419433594, -0.049835205078125, -0.044556617736816406, -0.03927803039550781, -0.03399944305419922, -0.028720855712890625, -0.02344226837158203, -0.018163681030273438, -0.012885093688964844, -0.00760650634765625, -0.0023279190063476562, 0.0029506683349609375, 0.008229255676269531, 0.013507843017578125, 0.01878643035888672, 0.024065017700195312, 0.029343605041503906, 0.0346221923828125, 0.039900779724121094, 0.04517936706542969, 0.05045795440673828, 0.055736541748046875, 0.06101512908935547, 0.06629371643066406, 0.07157230377197266, 0.07685089111328125, 0.08212947845458984, 0.08740806579589844, 0.09268665313720703, 0.09796524047851562, 0.10324382781982422, 0.10852241516113281, 0.1138010025024414, 0.11907958984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 6.0, 17.0, 25.0, 30.0, 49.0, 63.0, 84.0, 111.0, 123.0, 109.0, 106.0, 81.0, 57.0, 46.0, 32.0, 23.0, 16.0, 3.0, 5.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011849403381347656, -0.00011452659964561462, -0.00011055916547775269, -0.00010659173130989075, -0.00010262429714202881, -9.865686297416687e-05, -9.468942880630493e-05, -9.072199463844299e-05, -8.675456047058105e-05, -8.278712630271912e-05, -7.881969213485718e-05, -7.485225796699524e-05, -7.08848237991333e-05, -6.691738963127136e-05, -6.294995546340942e-05, -5.8982521295547485e-05, -5.501508712768555e-05, -5.104765295982361e-05, -4.708021879196167e-05, -4.311278462409973e-05, -3.914535045623779e-05, -3.5177916288375854e-05, -3.1210482120513916e-05, -2.7243047952651978e-05, -2.327561378479004e-05, -1.93081796169281e-05, -1.5340745449066162e-05, -1.1373311281204224e-05, -7.405877113342285e-06, -3.4384429454803467e-06, 5.289912223815918e-07, 4.49642539024353e-06, 8.463859558105469e-06, 1.2431293725967407e-05, 1.6398727893829346e-05, 2.0366162061691284e-05, 2.4333596229553223e-05, 2.830103039741516e-05, 3.22684645652771e-05, 3.623589873313904e-05, 4.0203332901000977e-05, 4.4170767068862915e-05, 4.8138201236724854e-05, 5.210563540458679e-05, 5.607306957244873e-05, 6.004050374031067e-05, 6.400793790817261e-05, 6.797537207603455e-05, 7.194280624389648e-05, 7.591024041175842e-05, 7.987767457962036e-05, 8.38451087474823e-05, 8.781254291534424e-05, 9.177997708320618e-05, 9.574741125106812e-05, 9.971484541893005e-05, 0.00010368227958679199, 0.00010764971375465393, 0.00011161714792251587, 0.00011558458209037781, 0.00011955201625823975, 0.00012351945042610168, 0.00012748688459396362, 0.00013145431876182556, 0.0001354217529296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 3.0, 4.0, 5.0, 7.0, 21.0, 22.0, 20.0, 26.0, 47.0, 68.0, 132.0, 197.0, 320.0, 614.0, 1446.0, 3277.0, 10297.0, 48882.0, 414320.0, 490756.0, 59444.0, 11965.0, 3557.0, 1467.0, 720.0, 337.0, 203.0, 130.0, 81.0, 40.0, 35.0, 28.0, 23.0, 16.0, 9.0, 9.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12548828125, -0.12157249450683594, -0.11765670776367188, -0.11374092102050781, -0.10982513427734375, -0.10590934753417969, -0.10199356079101562, -0.09807777404785156, -0.0941619873046875, -0.09024620056152344, -0.08633041381835938, -0.08241462707519531, -0.07849884033203125, -0.07458305358886719, -0.07066726684570312, -0.06675148010253906, -0.062835693359375, -0.05891990661621094, -0.055004119873046875, -0.05108833312988281, -0.04717254638671875, -0.04325675964355469, -0.039340972900390625, -0.03542518615722656, -0.0315093994140625, -0.027593612670898438, -0.023677825927734375, -0.019762039184570312, -0.01584625244140625, -0.011930465698242188, -0.008014678955078125, -0.0040988922119140625, -0.00018310546875, 0.0037326812744140625, 0.007648468017578125, 0.011564254760742188, 0.01548004150390625, 0.019395828247070312, 0.023311614990234375, 0.027227401733398438, 0.0311431884765625, 0.03505897521972656, 0.038974761962890625, 0.04289054870605469, 0.04680633544921875, 0.05072212219238281, 0.054637908935546875, 0.05855369567871094, 0.062469482421875, 0.06638526916503906, 0.07030105590820312, 0.07421684265136719, 0.07813262939453125, 0.08204841613769531, 0.08596420288085938, 0.08987998962402344, 0.0937957763671875, 0.09771156311035156, 0.10162734985351562, 0.10554313659667969, 0.10945892333984375, 0.11337471008300781, 0.11729049682617188, 0.12120628356933594, 0.1251220703125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 6.0, 12.0, 13.0, 20.0, 20.0, 20.0, 46.0, 57.0, 74.0, 104.0, 117.0, 89.0, 95.0, 72.0, 58.0, 42.0, 27.0, 32.0, 18.0, 22.0, 13.0, 5.0, 5.0, 9.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0653076171875, -0.06297492980957031, -0.060642242431640625, -0.05830955505371094, -0.05597686767578125, -0.05364418029785156, -0.051311492919921875, -0.04897880554199219, -0.0466461181640625, -0.04431343078613281, -0.041980743408203125, -0.03964805603027344, -0.03731536865234375, -0.03498268127441406, -0.032649993896484375, -0.030317306518554688, -0.027984619140625, -0.025651931762695312, -0.023319244384765625, -0.020986557006835938, -0.01865386962890625, -0.016321182250976562, -0.013988494873046875, -0.011655807495117188, -0.0093231201171875, -0.0069904327392578125, -0.004657745361328125, -0.0023250579833984375, 7.62939453125e-06, 0.0023403167724609375, 0.004673004150390625, 0.0070056915283203125, 0.00933837890625, 0.011671066284179688, 0.014003753662109375, 0.016336441040039062, 0.01866912841796875, 0.021001815795898438, 0.023334503173828125, 0.025667190551757812, 0.0279998779296875, 0.030332565307617188, 0.032665252685546875, 0.03499794006347656, 0.03733062744140625, 0.03966331481933594, 0.041996002197265625, 0.04432868957519531, 0.046661376953125, 0.04899406433105469, 0.051326751708984375, 0.05365943908691406, 0.05599212646484375, 0.05832481384277344, 0.060657501220703125, 0.06299018859863281, 0.0653228759765625, 0.06765556335449219, 0.06998825073242188, 0.07232093811035156, 0.07465362548828125, 0.07698631286621094, 0.07931900024414062, 0.08165168762207031, 0.083984375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 13.0, 40.0, 152.0, 438.0, 266.0, 65.0, 16.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.279052972793579, -1.2293123006820679, -1.1795716285705566, -1.1298309564590454, -1.0800902843475342, -1.030349612236023, -0.9806089997291565, -0.9308683276176453, -0.881127655506134, -0.8313869833946228, -0.7816463112831116, -0.7319056987762451, -0.6821650266647339, -0.6324243545532227, -0.5826836824417114, -0.5329430103302002, -0.48320233821868896, -0.43346166610717773, -0.3837209939956665, -0.33398035168647766, -0.28423967957496643, -0.2344990074634552, -0.18475836515426636, -0.13501769304275513, -0.0852770209312439, -0.03553635627031326, 0.01420430839061737, 0.06394496560096741, 0.11368563771247864, 0.16342630982398987, 0.2131669521331787, 0.26290762424468994, 0.3126484155654907, 0.36238908767700195, 0.4121297597885132, 0.461870402097702, 0.5116111040115356, 0.5613517761230469, 0.6110923886299133, 0.6608330607414246, 0.7105737328529358, 0.760314404964447, 0.8100550770759583, 0.8597956895828247, 0.9095363616943359, 0.9592770338058472, 1.0090177059173584, 1.0587583780288696, 1.1084990501403809, 1.158239722251892, 1.2079803943634033, 1.2577210664749146, 1.3074617385864258, 1.357202410697937, 1.4069430828094482, 1.45668363571167, 1.5064244270324707, 1.556165099143982, 1.6059057712554932, 1.6556464433670044, 1.7053871154785156, 1.7551277875900269, 1.804868459701538, 1.8546090126037598, 1.904349684715271]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 11.0, 12.0, 14.0, 15.0, 19.0, 27.0, 38.0, 47.0, 52.0, 60.0, 72.0, 68.0, 80.0, 63.0, 69.0, 63.0, 46.0, 53.0, 36.0, 32.0, 30.0, 17.0, 15.0, 11.0, 5.0, 2.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6587620973587036, -0.6381540894508362, -0.6175460815429688, -0.5969380736351013, -0.5763300657272339, -0.5557220578193665, -0.535114049911499, -0.5145059823989868, -0.4938980042934418, -0.47328999638557434, -0.4526819884777069, -0.4320739805698395, -0.41146594285964966, -0.3908579349517822, -0.3702499270439148, -0.34964191913604736, -0.32903391122817993, -0.3084259033203125, -0.28781789541244507, -0.26720988750457764, -0.246601864695549, -0.22599385678768158, -0.20538583397865295, -0.18477782607078552, -0.1641698181629181, -0.14356181025505066, -0.12295379489660263, -0.1023457795381546, -0.08173777163028717, -0.06112976372241974, -0.04052174836397171, -0.01991373300552368, 0.00069427490234375, 0.02130228653550148, 0.04191029816865921, 0.06251831352710724, 0.08312632143497467, 0.1037343293428421, 0.12434234470129013, 0.14495036005973816, 0.1655583679676056, 0.18616637587547302, 0.20677438378334045, 0.22738240659236908, 0.2479904145002365, 0.26859843730926514, 0.28920644521713257, 0.309814453125, 0.33042246103286743, 0.35103046894073486, 0.3716384768486023, 0.3922464847564697, 0.41285449266433716, 0.4334625005722046, 0.4540705382823944, 0.47467854619026184, 0.4952865540981293, 0.5158945918083191, 0.5365025997161865, 0.557110607624054, 0.5777186155319214, 0.5983266234397888, 0.6189346313476562, 0.6395426392555237, 0.6601506471633911]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 6.0, 15.0, 18.0, 36.0, 32.0, 52.0, 57.0, 67.0, 102.0, 147.0, 163.0, 273.0, 341.0, 421.0, 594.0, 940.0, 1339.0, 2120.0, 3652.0, 6864.0, 14459.0, 38972.0, 182900.0, 3590924.0, 265041.0, 47462.0, 17002.0, 8115.0, 4293.0, 2522.0, 1576.0, 1099.0, 778.0, 544.0, 387.0, 252.0, 173.0, 153.0, 98.0, 71.0, 49.0, 48.0, 40.0, 22.0, 17.0, 9.0, 22.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1978759765625, -0.19161033630371094, -0.18534469604492188, -0.1790790557861328, -0.17281341552734375, -0.1665477752685547, -0.16028213500976562, -0.15401649475097656, -0.1477508544921875, -0.14148521423339844, -0.13521957397460938, -0.1289539337158203, -0.12268829345703125, -0.11642265319824219, -0.11015701293945312, -0.10389137268066406, -0.097625732421875, -0.09136009216308594, -0.08509445190429688, -0.07882881164550781, -0.07256317138671875, -0.06629753112792969, -0.060031890869140625, -0.05376625061035156, -0.0475006103515625, -0.04123497009277344, -0.034969329833984375, -0.028703689575195312, -0.02243804931640625, -0.016172409057617188, -0.009906768798828125, -0.0036411285400390625, 0.00262451171875, 0.008890151977539062, 0.015155792236328125, 0.021421432495117188, 0.02768707275390625, 0.03395271301269531, 0.040218353271484375, 0.04648399353027344, 0.0527496337890625, 0.05901527404785156, 0.06528091430664062, 0.07154655456542969, 0.07781219482421875, 0.08407783508300781, 0.09034347534179688, 0.09660911560058594, 0.102874755859375, 0.10914039611816406, 0.11540603637695312, 0.12167167663574219, 0.12793731689453125, 0.1342029571533203, 0.14046859741210938, 0.14673423767089844, 0.1529998779296875, 0.15926551818847656, 0.16553115844726562, 0.1717967987060547, 0.17806243896484375, 0.1843280792236328, 0.19059371948242188, 0.19685935974121094, 0.203125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 8.0, 2.0, 7.0, 4.0, 5.0, 5.0, 9.0, 21.0, 15.0, 22.0, 47.0, 46.0, 49.0, 75.0, 104.0, 120.0, 109.0, 90.0, 47.0, 49.0, 33.0, 29.0, 23.0, 13.0, 15.0, 12.0, 6.0, 3.0, 9.0, 6.0, 7.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0202789306640625, -0.019596576690673828, -0.018914222717285156, -0.018231868743896484, -0.017549514770507812, -0.01686716079711914, -0.01618480682373047, -0.015502452850341797, -0.014820098876953125, -0.014137744903564453, -0.013455390930175781, -0.01277303695678711, -0.012090682983398438, -0.011408329010009766, -0.010725975036621094, -0.010043621063232422, -0.00936126708984375, -0.008678913116455078, -0.007996559143066406, -0.007314205169677734, -0.0066318511962890625, -0.005949497222900391, -0.005267143249511719, -0.004584789276123047, -0.003902435302734375, -0.003220081329345703, -0.0025377273559570312, -0.0018553733825683594, -0.0011730194091796875, -0.0004906654357910156, 0.00019168853759765625, 0.0008740425109863281, 0.001556396484375, 0.002238750457763672, 0.0029211044311523438, 0.0036034584045410156, 0.0042858123779296875, 0.004968166351318359, 0.005650520324707031, 0.006332874298095703, 0.007015228271484375, 0.007697582244873047, 0.008379936218261719, 0.00906229019165039, 0.009744644165039062, 0.010426998138427734, 0.011109352111816406, 0.011791706085205078, 0.01247406005859375, 0.013156414031982422, 0.013838768005371094, 0.014521121978759766, 0.015203475952148438, 0.01588582992553711, 0.01656818389892578, 0.017250537872314453, 0.017932891845703125, 0.018615245819091797, 0.01929759979248047, 0.01997995376586914, 0.020662307739257812, 0.021344661712646484, 0.022027015686035156, 0.022709369659423828, 0.0233917236328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 13.0, 28.0, 40.0, 70.0, 100.0, 187.0, 463.0, 1279.0, 4400.0, 21362.0, 225256.0, 3748624.0, 168311.0, 18094.0, 3897.0, 1200.0, 419.0, 212.0, 97.0, 68.0, 36.0, 36.0, 18.0, 12.0, 8.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.309326171875, -0.300079345703125, -0.29083251953125, -0.281585693359375, -0.2723388671875, -0.263092041015625, -0.25384521484375, -0.244598388671875, -0.2353515625, -0.226104736328125, -0.21685791015625, -0.207611083984375, -0.1983642578125, -0.189117431640625, -0.17987060546875, -0.170623779296875, -0.161376953125, -0.152130126953125, -0.14288330078125, -0.133636474609375, -0.1243896484375, -0.115142822265625, -0.10589599609375, -0.096649169921875, -0.08740234375, -0.078155517578125, -0.06890869140625, -0.059661865234375, -0.0504150390625, -0.041168212890625, -0.03192138671875, -0.022674560546875, -0.013427734375, -0.004180908203125, 0.00506591796875, 0.014312744140625, 0.0235595703125, 0.032806396484375, 0.04205322265625, 0.051300048828125, 0.060546875, 0.069793701171875, 0.07904052734375, 0.088287353515625, 0.0975341796875, 0.106781005859375, 0.11602783203125, 0.125274658203125, 0.134521484375, 0.143768310546875, 0.15301513671875, 0.162261962890625, 0.1715087890625, 0.180755615234375, 0.19000244140625, 0.199249267578125, 0.20849609375, 0.217742919921875, 0.22698974609375, 0.236236572265625, 0.2454833984375, 0.254730224609375, 0.26397705078125, 0.273223876953125, 0.282470703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 7.0, 14.0, 13.0, 25.0, 31.0, 42.0, 42.0, 108.0, 173.0, 330.0, 827.0, 1440.0, 438.0, 221.0, 115.0, 78.0, 50.0, 30.0, 24.0, 12.0, 8.0, 9.0, 12.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.034027099609375, -0.0327754020690918, -0.031523704528808594, -0.03027200698852539, -0.029020309448242188, -0.027768611907958984, -0.02651691436767578, -0.025265216827392578, -0.024013519287109375, -0.022761821746826172, -0.02151012420654297, -0.020258426666259766, -0.019006729125976562, -0.01775503158569336, -0.016503334045410156, -0.015251636505126953, -0.01399993896484375, -0.012748241424560547, -0.011496543884277344, -0.01024484634399414, -0.008993148803710938, -0.007741451263427734, -0.006489753723144531, -0.005238056182861328, -0.003986358642578125, -0.002734661102294922, -0.0014829635620117188, -0.00023126602172851562, 0.0010204315185546875, 0.0022721290588378906, 0.0035238265991210938, 0.004775524139404297, 0.0060272216796875, 0.007278919219970703, 0.008530616760253906, 0.00978231430053711, 0.011034011840820312, 0.012285709381103516, 0.013537406921386719, 0.014789104461669922, 0.016040802001953125, 0.017292499542236328, 0.01854419708251953, 0.019795894622802734, 0.021047592163085938, 0.02229928970336914, 0.023550987243652344, 0.024802684783935547, 0.02605438232421875, 0.027306079864501953, 0.028557777404785156, 0.02980947494506836, 0.031061172485351562, 0.032312870025634766, 0.03356456756591797, 0.03481626510620117, 0.036067962646484375, 0.03731966018676758, 0.03857135772705078, 0.039823055267333984, 0.04107475280761719, 0.04232645034790039, 0.043578147888183594, 0.0448298454284668, 0.04608154296875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 45.0, 253.0, 526.0, 146.0, 25.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17907801270484924, -0.15777893364429474, -0.13647985458374023, -0.11518077552318573, -0.09388169646263123, -0.07258261740207672, -0.05128353834152222, -0.029984459280967712, -0.008685380220413208, 0.012613698840141296, 0.0339127779006958, 0.055211856961250305, 0.07651093602180481, 0.09781001508235931, 0.11910909414291382, 0.14040817320346832, 0.16170725226402283, 0.18300633132457733, 0.20430541038513184, 0.22560448944568634, 0.24690356850624084, 0.26820266246795654, 0.28950172662734985, 0.31080079078674316, 0.33209988474845886, 0.35339897871017456, 0.37469804286956787, 0.3959971070289612, 0.4172962009906769, 0.4385952949523926, 0.4598943591117859, 0.4811934232711792, 0.5024925470352173, 0.5237916111946106, 0.5450906753540039, 0.566389799118042, 0.5876888632774353, 0.6089879274368286, 0.6302870512008667, 0.65158611536026, 0.6728851795196533, 0.6941842436790466, 0.7154833078384399, 0.736782431602478, 0.7580814957618713, 0.7793805599212646, 0.8006796836853027, 0.821978747844696, 0.8432778120040894, 0.8645768761634827, 0.885875940322876, 0.9071750640869141, 0.9284741282463074, 0.9497731924057007, 0.9710723161697388, 0.9923713803291321, 1.0136704444885254, 1.0349695682525635, 1.056268572807312, 1.07756769657135, 1.0988667011260986, 1.1201658248901367, 1.1414649486541748, 1.1627639532089233, 1.1840630769729614]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 9.0, 6.0, 8.0, 15.0, 17.0, 17.0, 29.0, 41.0, 47.0, 50.0, 51.0, 60.0, 67.0, 65.0, 76.0, 79.0, 68.0, 52.0, 47.0, 44.0, 40.0, 26.0, 26.0, 18.0, 13.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13987332582473755, -0.13462258875370026, -0.12937185168266296, -0.12412110716104507, -0.11887036263942719, -0.11361962556838989, -0.1083688884973526, -0.10311815142631531, -0.09786740690469742, -0.09261666983366013, -0.08736592531204224, -0.08211518824100494, -0.07686445116996765, -0.07161370664834976, -0.06636296957731247, -0.06111222878098488, -0.05586148798465729, -0.0506107471883297, -0.045360006392002106, -0.04010926932096481, -0.03485852852463722, -0.02960778772830963, -0.02435705065727234, -0.019106309860944748, -0.013855569064617157, -0.00860482919961214, -0.0033540893346071243, 0.0018966495990753174, 0.007147390395402908, 0.0123981311917305, 0.017648868262767792, 0.022899609059095383, 0.028150349855422974, 0.033401090651750565, 0.038651831448078156, 0.04390256851911545, 0.04915330931544304, 0.05440405011177063, 0.05965478718280792, 0.06490552425384521, 0.0701562687754631, 0.0754070058465004, 0.08065775036811829, 0.08590848743915558, 0.09115922451019287, 0.09640996903181076, 0.10166070610284805, 0.10691145062446594, 0.11216218769550323, 0.11741292476654053, 0.12266366928815842, 0.1279143989086151, 0.1331651508808136, 0.1384158879518509, 0.14366662502288818, 0.14891736209392548, 0.15416809916496277, 0.15941883623600006, 0.16466957330703735, 0.16992032527923584, 0.17517106235027313, 0.18042179942131042, 0.18567253649234772, 0.190923273563385, 0.1961740255355835]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 4.0, 4.0, 6.0, 7.0, 11.0, 29.0, 36.0, 33.0, 55.0, 84.0, 110.0, 195.0, 315.0, 525.0, 864.0, 1412.0, 2577.0, 5307.0, 12258.0, 32483.0, 111144.0, 457812.0, 308831.0, 72156.0, 23634.0, 9300.0, 4211.0, 2071.0, 1181.0, 684.0, 403.0, 283.0, 185.0, 107.0, 77.0, 54.0, 36.0, 22.0, 18.0, 11.0, 9.0, 5.0, 6.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1593017578125, -0.15459442138671875, -0.1498870849609375, -0.14517974853515625, -0.140472412109375, -0.13576507568359375, -0.1310577392578125, -0.12635040283203125, -0.12164306640625, -0.11693572998046875, -0.1122283935546875, -0.10752105712890625, -0.102813720703125, -0.09810638427734375, -0.0933990478515625, -0.08869171142578125, -0.083984375, -0.07927703857421875, -0.0745697021484375, -0.06986236572265625, -0.065155029296875, -0.06044769287109375, -0.0557403564453125, -0.05103302001953125, -0.04632568359375, -0.04161834716796875, -0.0369110107421875, -0.03220367431640625, -0.027496337890625, -0.02278900146484375, -0.0180816650390625, -0.01337432861328125, -0.0086669921875, -0.00395965576171875, 0.0007476806640625, 0.00545501708984375, 0.010162353515625, 0.01486968994140625, 0.0195770263671875, 0.02428436279296875, 0.02899169921875, 0.03369903564453125, 0.0384063720703125, 0.04311370849609375, 0.047821044921875, 0.05252838134765625, 0.0572357177734375, 0.06194305419921875, 0.066650390625, 0.07135772705078125, 0.0760650634765625, 0.08077239990234375, 0.085479736328125, 0.09018707275390625, 0.0948944091796875, 0.09960174560546875, 0.10430908203125, 0.10901641845703125, 0.1137237548828125, 0.11843109130859375, 0.123138427734375, 0.12784576416015625, 0.1325531005859375, 0.13726043701171875, 0.1419677734375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 5.0, 9.0, 15.0, 10.0, 14.0, 29.0, 19.0, 47.0, 79.0, 83.0, 96.0, 110.0, 97.0, 81.0, 78.0, 48.0, 42.0, 29.0, 22.0, 15.0, 13.0, 10.0, 7.0, 8.0, 2.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0192108154296875, -0.018521785736083984, -0.01783275604248047, -0.017143726348876953, -0.016454696655273438, -0.015765666961669922, -0.015076637268066406, -0.01438760757446289, -0.013698577880859375, -0.01300954818725586, -0.012320518493652344, -0.011631488800048828, -0.010942459106445312, -0.010253429412841797, -0.009564399719238281, -0.008875370025634766, -0.00818634033203125, -0.007497310638427734, -0.006808280944824219, -0.006119251251220703, -0.0054302215576171875, -0.004741191864013672, -0.004052162170410156, -0.0033631324768066406, -0.002674102783203125, -0.0019850730895996094, -0.0012960433959960938, -0.0006070137023925781, 8.20159912109375e-05, 0.0007710456848144531, 0.0014600753784179688, 0.0021491050720214844, 0.002838134765625, 0.0035271644592285156, 0.004216194152832031, 0.004905223846435547, 0.0055942535400390625, 0.006283283233642578, 0.006972312927246094, 0.007661342620849609, 0.008350372314453125, 0.00903940200805664, 0.009728431701660156, 0.010417461395263672, 0.011106491088867188, 0.011795520782470703, 0.012484550476074219, 0.013173580169677734, 0.01386260986328125, 0.014551639556884766, 0.015240669250488281, 0.015929698944091797, 0.016618728637695312, 0.017307758331298828, 0.017996788024902344, 0.01868581771850586, 0.019374847412109375, 0.02006387710571289, 0.020752906799316406, 0.021441936492919922, 0.022130966186523438, 0.022819995880126953, 0.02350902557373047, 0.024198055267333984, 0.0248870849609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 11.0, 6.0, 14.0, 16.0, 18.0, 27.0, 50.0, 58.0, 100.0, 129.0, 250.0, 390.0, 684.0, 1546.0, 4284.0, 19283.0, 126172.0, 615546.0, 236696.0, 32369.0, 6712.0, 2031.0, 884.0, 483.0, 281.0, 163.0, 101.0, 70.0, 48.0, 27.0, 23.0, 17.0, 15.0, 11.0, 7.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1739501953125, -0.16765975952148438, -0.16136932373046875, -0.15507888793945312, -0.1487884521484375, -0.14249801635742188, -0.13620758056640625, -0.12991714477539062, -0.123626708984375, -0.11733627319335938, -0.11104583740234375, -0.10475540161132812, -0.0984649658203125, -0.09217453002929688, -0.08588409423828125, -0.07959365844726562, -0.07330322265625, -0.06701278686523438, -0.06072235107421875, -0.054431915283203125, -0.0481414794921875, -0.041851043701171875, -0.03556060791015625, -0.029270172119140625, -0.022979736328125, -0.016689300537109375, -0.01039886474609375, -0.004108428955078125, 0.0021820068359375, 0.008472442626953125, 0.01476287841796875, 0.021053314208984375, 0.02734375, 0.033634185791015625, 0.03992462158203125, 0.046215057373046875, 0.0525054931640625, 0.058795928955078125, 0.06508636474609375, 0.07137680053710938, 0.077667236328125, 0.08395767211914062, 0.09024810791015625, 0.09653854370117188, 0.1028289794921875, 0.10911941528320312, 0.11540985107421875, 0.12170028686523438, 0.12799072265625, 0.13428115844726562, 0.14057159423828125, 0.14686203002929688, 0.1531524658203125, 0.15944290161132812, 0.16573333740234375, 0.17202377319335938, 0.178314208984375, 0.18460464477539062, 0.19089508056640625, 0.19718551635742188, 0.2034759521484375, 0.20976638793945312, 0.21605682373046875, 0.22234725952148438, 0.2286376953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 4.0, 9.0, 12.0, 29.0, 19.0, 26.0, 21.0, 32.0, 19.0, 34.0, 31.0, 37.0, 49.0, 46.0, 39.0, 48.0, 48.0, 52.0, 44.0, 32.0, 42.0, 36.0, 27.0, 33.0, 34.0, 33.0, 25.0, 19.0, 22.0, 8.0, 11.0, 9.0, 9.0, 9.0, 4.0, 5.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07415771484375, -0.07146263122558594, -0.06876754760742188, -0.06607246398925781, -0.06337738037109375, -0.06068229675292969, -0.057987213134765625, -0.05529212951660156, -0.0525970458984375, -0.04990196228027344, -0.047206878662109375, -0.04451179504394531, -0.04181671142578125, -0.03912162780761719, -0.036426544189453125, -0.03373146057128906, -0.031036376953125, -0.028341293334960938, -0.025646209716796875, -0.022951126098632812, -0.02025604248046875, -0.017560958862304688, -0.014865875244140625, -0.012170791625976562, -0.0094757080078125, -0.0067806243896484375, -0.004085540771484375, -0.0013904571533203125, 0.00130462646484375, 0.0039997100830078125, 0.006694793701171875, 0.009389877319335938, 0.0120849609375, 0.014780044555664062, 0.017475128173828125, 0.020170211791992188, 0.02286529541015625, 0.025560379028320312, 0.028255462646484375, 0.030950546264648438, 0.0336456298828125, 0.03634071350097656, 0.039035797119140625, 0.04173088073730469, 0.04442596435546875, 0.04712104797363281, 0.049816131591796875, 0.05251121520996094, 0.055206298828125, 0.05790138244628906, 0.060596466064453125, 0.06329154968261719, 0.06598663330078125, 0.06868171691894531, 0.07137680053710938, 0.07407188415527344, 0.0767669677734375, 0.07946205139160156, 0.08215713500976562, 0.08485221862792969, 0.08754730224609375, 0.09024238586425781, 0.09293746948242188, 0.09563255310058594, 0.09832763671875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 6.0, 5.0, 8.0, 11.0, 17.0, 29.0, 46.0, 62.0, 99.0, 172.0, 382.0, 636.0, 1248.0, 2794.0, 7011.0, 21499.0, 92707.0, 483973.0, 349325.0, 62457.0, 15881.0, 5567.0, 2272.0, 1087.0, 576.0, 272.0, 176.0, 83.0, 58.0, 28.0, 18.0, 17.0, 9.0, 6.0, 6.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11090087890625, -0.10730934143066406, -0.10371780395507812, -0.10012626647949219, -0.09653472900390625, -0.09294319152832031, -0.08935165405273438, -0.08576011657714844, -0.0821685791015625, -0.07857704162597656, -0.07498550415039062, -0.07139396667480469, -0.06780242919921875, -0.06421089172363281, -0.060619354248046875, -0.05702781677246094, -0.053436279296875, -0.04984474182128906, -0.046253204345703125, -0.04266166687011719, -0.03907012939453125, -0.03547859191894531, -0.031887054443359375, -0.028295516967773438, -0.0247039794921875, -0.021112442016601562, -0.017520904541015625, -0.013929367065429688, -0.01033782958984375, -0.0067462921142578125, -0.003154754638671875, 0.0004367828369140625, 0.0040283203125, 0.0076198577880859375, 0.011211395263671875, 0.014802932739257812, 0.01839447021484375, 0.021986007690429688, 0.025577545166015625, 0.029169082641601562, 0.0327606201171875, 0.03635215759277344, 0.039943695068359375, 0.04353523254394531, 0.04712677001953125, 0.05071830749511719, 0.054309844970703125, 0.05790138244628906, 0.061492919921875, 0.06508445739746094, 0.06867599487304688, 0.07226753234863281, 0.07585906982421875, 0.07945060729980469, 0.08304214477539062, 0.08663368225097656, 0.0902252197265625, 0.09381675720214844, 0.09740829467773438, 0.10099983215332031, 0.10459136962890625, 0.10818290710449219, 0.11177444458007812, 0.11536598205566406, 0.11895751953125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 9.0, 10.0, 16.0, 19.0, 42.0, 39.0, 42.0, 54.0, 74.0, 85.0, 96.0, 101.0, 90.0, 86.0, 56.0, 53.0, 41.0, 25.0, 26.0, 6.0, 10.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.654594421386719e-05, -8.392985910177231e-05, -8.131377398967743e-05, -7.869768887758255e-05, -7.608160376548767e-05, -7.346551865339279e-05, -7.084943354129791e-05, -6.823334842920303e-05, -6.561726331710815e-05, -6.300117820501328e-05, -6.0385093092918396e-05, -5.776900798082352e-05, -5.515292286872864e-05, -5.253683775663376e-05, -4.992075264453888e-05, -4.7304667532444e-05, -4.468858242034912e-05, -4.207249730825424e-05, -3.945641219615936e-05, -3.6840327084064484e-05, -3.4224241971969604e-05, -3.1608156859874725e-05, -2.8992071747779846e-05, -2.6375986635684967e-05, -2.3759901523590088e-05, -2.114381641149521e-05, -1.852773129940033e-05, -1.591164618730545e-05, -1.3295561075210571e-05, -1.0679475963115692e-05, -8.063390851020813e-06, -5.447305738925934e-06, -2.8312206268310547e-06, -2.1513551473617554e-07, 2.4009495973587036e-06, 5.017034709453583e-06, 7.633119821548462e-06, 1.0249204933643341e-05, 1.286529004573822e-05, 1.54813751578331e-05, 1.809746026992798e-05, 2.0713545382022858e-05, 2.3329630494117737e-05, 2.5945715606212616e-05, 2.8561800718307495e-05, 3.1177885830402374e-05, 3.3793970942497253e-05, 3.641005605459213e-05, 3.902614116668701e-05, 4.164222627878189e-05, 4.425831139087677e-05, 4.687439650297165e-05, 4.949048161506653e-05, 5.210656672716141e-05, 5.472265183925629e-05, 5.7338736951351166e-05, 5.9954822063446045e-05, 6.257090717554092e-05, 6.51869922876358e-05, 6.780307739973068e-05, 7.041916251182556e-05, 7.303524762392044e-05, 7.565133273601532e-05, 7.82674178481102e-05, 8.088350296020508e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 4.0, 5.0, 3.0, 7.0, 13.0, 10.0, 17.0, 29.0, 58.0, 61.0, 104.0, 167.0, 299.0, 551.0, 1192.0, 3179.0, 10573.0, 46612.0, 358577.0, 537408.0, 68261.0, 14362.0, 4106.0, 1444.0, 661.0, 341.0, 173.0, 113.0, 71.0, 58.0, 36.0, 25.0, 8.0, 11.0, 5.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.142578125, -0.1381378173828125, -0.133697509765625, -0.1292572021484375, -0.12481689453125, -0.1203765869140625, -0.115936279296875, -0.1114959716796875, -0.1070556640625, -0.1026153564453125, -0.098175048828125, -0.0937347412109375, -0.08929443359375, -0.0848541259765625, -0.080413818359375, -0.0759735107421875, -0.071533203125, -0.0670928955078125, -0.062652587890625, -0.0582122802734375, -0.05377197265625, -0.0493316650390625, -0.044891357421875, -0.0404510498046875, -0.0360107421875, -0.0315704345703125, -0.027130126953125, -0.0226898193359375, -0.01824951171875, -0.0138092041015625, -0.009368896484375, -0.0049285888671875, -0.00048828125, 0.0039520263671875, 0.008392333984375, 0.0128326416015625, 0.01727294921875, 0.0217132568359375, 0.026153564453125, 0.0305938720703125, 0.0350341796875, 0.0394744873046875, 0.043914794921875, 0.0483551025390625, 0.05279541015625, 0.0572357177734375, 0.061676025390625, 0.0661163330078125, 0.070556640625, 0.0749969482421875, 0.079437255859375, 0.0838775634765625, 0.08831787109375, 0.0927581787109375, 0.097198486328125, 0.1016387939453125, 0.1060791015625, 0.1105194091796875, 0.114959716796875, 0.1194000244140625, 0.12384033203125, 0.1282806396484375, 0.132720947265625, 0.1371612548828125, 0.1416015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 7.0, 6.0, 6.0, 5.0, 4.0, 8.0, 8.0, 6.0, 20.0, 13.0, 23.0, 24.0, 39.0, 27.0, 53.0, 61.0, 59.0, 71.0, 65.0, 66.0, 75.0, 50.0, 49.0, 49.0, 35.0, 27.0, 20.0, 18.0, 15.0, 14.0, 7.0, 14.0, 10.0, 11.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.05047607421875, -0.04904937744140625, -0.0476226806640625, -0.04619598388671875, -0.044769287109375, -0.04334259033203125, -0.0419158935546875, -0.04048919677734375, -0.0390625, -0.03763580322265625, -0.0362091064453125, -0.03478240966796875, -0.033355712890625, -0.03192901611328125, -0.0305023193359375, -0.02907562255859375, -0.02764892578125, -0.02622222900390625, -0.0247955322265625, -0.02336883544921875, -0.021942138671875, -0.02051544189453125, -0.0190887451171875, -0.01766204833984375, -0.0162353515625, -0.01480865478515625, -0.0133819580078125, -0.01195526123046875, -0.010528564453125, -0.00910186767578125, -0.0076751708984375, -0.00624847412109375, -0.00482177734375, -0.00339508056640625, -0.0019683837890625, -0.00054168701171875, 0.000885009765625, 0.00231170654296875, 0.0037384033203125, 0.00516510009765625, 0.006591796875, 0.00801849365234375, 0.0094451904296875, 0.01087188720703125, 0.012298583984375, 0.01372528076171875, 0.0151519775390625, 0.01657867431640625, 0.01800537109375, 0.01943206787109375, 0.0208587646484375, 0.02228546142578125, 0.023712158203125, 0.02513885498046875, 0.0265655517578125, 0.02799224853515625, 0.0294189453125, 0.03084564208984375, 0.0322723388671875, 0.03369903564453125, 0.035125732421875, 0.03655242919921875, 0.0379791259765625, 0.03940582275390625, 0.04083251953125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 23.0, 92.0, 238.0, 333.0, 188.0, 77.0, 30.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2105929851531982, -1.1513837575912476, -1.0921745300292969, -1.0329654216766357, -0.9737561345100403, -0.9145469665527344, -0.8553377389907837, -0.796128511428833, -0.7369192838668823, -0.6777100563049316, -0.6185008883476257, -0.559291660785675, -0.5000824332237244, -0.44087323546409607, -0.3816640377044678, -0.3224548101425171, -0.2632456421852112, -0.2040364295244217, -0.1448272168636322, -0.0856180191040039, -0.026408806443214417, 0.03280040621757507, 0.09200960397720337, 0.15121883153915405, 0.21042802929878235, 0.26963722705841064, 0.32884645462036133, 0.3880556523799896, 0.4472648501396179, 0.5064740777015686, 0.5656832456588745, 0.6248924732208252, 0.6841017007827759, 0.7433109283447266, 0.8025200963020325, 0.8617293238639832, 0.9209385514259338, 0.9801477193832397, 1.0393569469451904, 1.0985661745071411, 1.1577754020690918, 1.2169846296310425, 1.2761938571929932, 1.3354029655456543, 1.394612193107605, 1.4538214206695557, 1.5130306482315063, 1.572239875793457, 1.6314489841461182, 1.6906582117080688, 1.7498674392700195, 1.8090765476226807, 1.8682857751846313, 1.927495002746582, 1.9867042303085327, 2.0459134578704834, 2.1051228046417236, 2.1643319129943848, 2.223541259765625, 2.282750368118286, 2.3419597148895264, 2.4011688232421875, 2.4603781700134277, 2.519587278366089, 2.57879638671875]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 2.0, 8.0, 11.0, 8.0, 14.0, 24.0, 24.0, 33.0, 29.0, 52.0, 42.0, 57.0, 51.0, 46.0, 61.0, 72.0, 55.0, 63.0, 45.0, 44.0, 45.0, 29.0, 25.0, 37.0, 26.0, 25.0, 20.0, 12.0, 10.0, 8.0, 11.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8658173084259033, -0.8387893438339233, -0.8117614388465881, -0.7847334742546082, -0.757705569267273, -0.730677604675293, -0.703649640083313, -0.676621675491333, -0.6495937705039978, -0.6225658059120178, -0.5955379009246826, -0.5685099363327026, -0.5414819717407227, -0.5144540667533875, -0.48742610216140747, -0.4603981673717499, -0.4333702325820923, -0.4063422977924347, -0.3793143630027771, -0.3522863984107971, -0.3252584636211395, -0.29823052883148193, -0.27120256423950195, -0.24417462944984436, -0.21714669466018677, -0.19011875987052917, -0.1630908101797104, -0.1360628604888916, -0.10903492569923401, -0.08200699090957642, -0.05497904121875763, -0.027951091527938843, -0.00092315673828125, 0.02610478550195694, 0.05313272774219513, 0.08016066998243332, 0.10718861222267151, 0.1342165470123291, 0.1612444967031479, 0.18827244639396667, 0.21530038118362427, 0.24232831597328186, 0.26935625076293945, 0.29638421535491943, 0.323412150144577, 0.3504400849342346, 0.3774680495262146, 0.4044959843158722, 0.4315239191055298, 0.4585518538951874, 0.48557978868484497, 0.512607753276825, 0.5396356582641602, 0.5666636228561401, 0.5936915874481201, 0.6207195520401001, 0.6477474570274353, 0.6747754216194153, 0.7018033266067505, 0.7288312911987305, 0.7558592557907104, 0.7828871607780457, 0.8099151253700256, 0.8369430303573608, 0.8639709949493408]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 11.0, 16.0, 23.0, 44.0, 72.0, 160.0, 317.0, 807.0, 2650.0, 15186.0, 729545.0, 3420041.0, 20225.0, 3353.0, 966.0, 429.0, 190.0, 92.0, 45.0, 27.0, 32.0, 7.0, 7.0, 6.0, 8.0, 7.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43994140625, -0.42305755615234375, -0.4061737060546875, -0.38928985595703125, -0.372406005859375, -0.35552215576171875, -0.3386383056640625, -0.32175445556640625, -0.30487060546875, -0.28798675537109375, -0.2711029052734375, -0.25421905517578125, -0.237335205078125, -0.22045135498046875, -0.2035675048828125, -0.18668365478515625, -0.1697998046875, -0.15291595458984375, -0.1360321044921875, -0.11914825439453125, -0.102264404296875, -0.08538055419921875, -0.0684967041015625, -0.05161285400390625, -0.03472900390625, -0.01784515380859375, -0.0009613037109375, 0.01592254638671875, 0.032806396484375, 0.04969024658203125, 0.0665740966796875, 0.08345794677734375, 0.100341796875, 0.11722564697265625, 0.1341094970703125, 0.15099334716796875, 0.167877197265625, 0.18476104736328125, 0.2016448974609375, 0.21852874755859375, 0.23541259765625, 0.25229644775390625, 0.2691802978515625, 0.28606414794921875, 0.302947998046875, 0.31983184814453125, 0.3367156982421875, 0.35359954833984375, 0.3704833984375, 0.38736724853515625, 0.4042510986328125, 0.42113494873046875, 0.438018798828125, 0.45490264892578125, 0.4717864990234375, 0.48867034912109375, 0.50555419921875, 0.5224380493164062, 0.5393218994140625, 0.5562057495117188, 0.573089599609375, 0.5899734497070312, 0.6068572998046875, 0.6237411499023438, 0.640625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 8.0, 17.0, 34.0, 33.0, 60.0, 74.0, 81.0, 86.0, 97.0, 105.0, 80.0, 80.0, 50.0, 55.0, 40.0, 20.0, 15.0, 13.0, 6.0, 7.0, 2.0, 6.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0219879150390625, -0.021027803421020508, -0.020067691802978516, -0.019107580184936523, -0.01814746856689453, -0.01718735694885254, -0.016227245330810547, -0.015267133712768555, -0.014307022094726562, -0.01334691047668457, -0.012386798858642578, -0.011426687240600586, -0.010466575622558594, -0.009506464004516602, -0.00854635238647461, -0.007586240768432617, -0.006626129150390625, -0.005666017532348633, -0.004705905914306641, -0.0037457942962646484, -0.0027856826782226562, -0.001825571060180664, -0.0008654594421386719, 9.465217590332031e-05, 0.0010547637939453125, 0.0020148754119873047, 0.002974987030029297, 0.003935098648071289, 0.004895210266113281, 0.0058553218841552734, 0.006815433502197266, 0.007775545120239258, 0.00873565673828125, 0.009695768356323242, 0.010655879974365234, 0.011615991592407227, 0.012576103210449219, 0.013536214828491211, 0.014496326446533203, 0.015456438064575195, 0.016416549682617188, 0.01737666130065918, 0.018336772918701172, 0.019296884536743164, 0.020256996154785156, 0.02121710777282715, 0.02217721939086914, 0.023137331008911133, 0.024097442626953125, 0.025057554244995117, 0.02601766586303711, 0.0269777774810791, 0.027937889099121094, 0.028898000717163086, 0.029858112335205078, 0.03081822395324707, 0.03177833557128906, 0.032738447189331055, 0.03369855880737305, 0.03465867042541504, 0.03561878204345703, 0.03657889366149902, 0.037539005279541016, 0.03849911689758301, 0.039459228515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 6.0, 7.0, 12.0, 9.0, 23.0, 27.0, 59.0, 110.0, 189.0, 373.0, 1002.0, 3164.0, 14934.0, 151110.0, 3778657.0, 220913.0, 18511.0, 3430.0, 961.0, 370.0, 183.0, 99.0, 67.0, 20.0, 12.0, 15.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3955078125, -0.3857574462890625, -0.376007080078125, -0.3662567138671875, -0.35650634765625, -0.3467559814453125, -0.337005615234375, -0.3272552490234375, -0.3175048828125, -0.3077545166015625, -0.298004150390625, -0.2882537841796875, -0.27850341796875, -0.2687530517578125, -0.259002685546875, -0.2492523193359375, -0.239501953125, -0.2297515869140625, -0.220001220703125, -0.2102508544921875, -0.20050048828125, -0.1907501220703125, -0.180999755859375, -0.1712493896484375, -0.1614990234375, -0.1517486572265625, -0.141998291015625, -0.1322479248046875, -0.12249755859375, -0.1127471923828125, -0.102996826171875, -0.0932464599609375, -0.08349609375, -0.0737457275390625, -0.063995361328125, -0.0542449951171875, -0.04449462890625, -0.0347442626953125, -0.024993896484375, -0.0152435302734375, -0.0054931640625, 0.0042572021484375, 0.014007568359375, 0.0237579345703125, 0.03350830078125, 0.0432586669921875, 0.053009033203125, 0.0627593994140625, 0.072509765625, 0.0822601318359375, 0.092010498046875, 0.1017608642578125, 0.11151123046875, 0.1212615966796875, 0.131011962890625, 0.1407623291015625, 0.1505126953125, 0.1602630615234375, 0.170013427734375, 0.1797637939453125, 0.18951416015625, 0.1992645263671875, 0.209014892578125, 0.2187652587890625, 0.228515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 8.0, 5.0, 8.0, 19.0, 19.0, 31.0, 39.0, 70.0, 93.0, 118.0, 190.0, 431.0, 1492.0, 754.0, 286.0, 167.0, 113.0, 76.0, 36.0, 32.0, 22.0, 18.0, 10.0, 9.0, 8.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053497314453125, -0.05211925506591797, -0.05074119567871094, -0.049363136291503906, -0.047985076904296875, -0.046607017517089844, -0.04522895812988281, -0.04385089874267578, -0.04247283935546875, -0.04109477996826172, -0.03971672058105469, -0.038338661193847656, -0.036960601806640625, -0.035582542419433594, -0.03420448303222656, -0.03282642364501953, -0.0314483642578125, -0.03007030487060547, -0.028692245483398438, -0.027314186096191406, -0.025936126708984375, -0.024558067321777344, -0.023180007934570312, -0.02180194854736328, -0.02042388916015625, -0.01904582977294922, -0.017667770385742188, -0.016289710998535156, -0.014911651611328125, -0.013533592224121094, -0.012155532836914062, -0.010777473449707031, -0.0093994140625, -0.008021354675292969, -0.0066432952880859375, -0.005265235900878906, -0.003887176513671875, -0.0025091171264648438, -0.0011310577392578125, 0.00024700164794921875, 0.00162506103515625, 0.0030031204223632812, 0.0043811798095703125, 0.005759239196777344, 0.007137298583984375, 0.008515357971191406, 0.009893417358398438, 0.011271476745605469, 0.0126495361328125, 0.014027595520019531, 0.015405654907226562, 0.016783714294433594, 0.018161773681640625, 0.019539833068847656, 0.020917892456054688, 0.02229595184326172, 0.02367401123046875, 0.02505207061767578, 0.026430130004882812, 0.027808189392089844, 0.029186248779296875, 0.030564308166503906, 0.03194236755371094, 0.03332042694091797, 0.034698486328125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 19.0, 69.0, 267.0, 411.0, 174.0, 43.0, 14.0, 3.0, 1.0, 2.0], "bins": [-1.2653367519378662, -1.243304967880249, -1.2212731838226318, -1.1992413997650146, -1.1772096157073975, -1.1551779508590698, -1.1331461668014526, -1.1111143827438354, -1.0890825986862183, -1.067050814628601, -1.0450190305709839, -1.0229872465133667, -1.0009554624557495, -0.9789237380027771, -0.9568919539451599, -0.9348602294921875, -0.9128284454345703, -0.8907966613769531, -0.8687648773193359, -0.8467331528663635, -0.8247013688087463, -0.8026695847511292, -0.780637800693512, -0.7586060762405396, -0.7365742325782776, -0.7145424485206604, -0.6925106644630432, -0.6704789400100708, -0.6484471559524536, -0.6264153718948364, -0.6043835878372192, -0.582351803779602, -0.5603200793266296, -0.5382882952690125, -0.5162565112113953, -0.49422475695610046, -0.47219300270080566, -0.4501612186431885, -0.4281294345855713, -0.4060976803302765, -0.3840659260749817, -0.3620341420173645, -0.3400023877620697, -0.3179706037044525, -0.2959388494491577, -0.2739070653915405, -0.25187528133392334, -0.22984352707862854, -0.20781175792217255, -0.18577998876571655, -0.16374821960926056, -0.14171645045280457, -0.11968467384576797, -0.09765290468931198, -0.07562112808227539, -0.0535893589258194, -0.0315575897693634, -0.00952581875026226, 0.012505952268838882, 0.034537725150585175, 0.05656949430704117, 0.07860126346349716, 0.10063304007053375, 0.12266480922698975, 0.14469657838344574]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 3.0, 3.0, 7.0, 11.0, 17.0, 15.0, 13.0, 19.0, 14.0, 25.0, 22.0, 24.0, 25.0, 35.0, 39.0, 42.0, 49.0, 58.0, 44.0, 48.0, 56.0, 58.0, 39.0, 36.0, 33.0, 37.0, 36.0, 26.0, 24.0, 23.0, 22.0, 17.0, 9.0, 16.0, 13.0, 10.0, 9.0, 7.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.16236263513565063, -0.15772852301597595, -0.15309441089630127, -0.1484602838754654, -0.1438261717557907, -0.13919205963611603, -0.13455794751644135, -0.12992383539676666, -0.1252897083759308, -0.1206555962562561, -0.11602147668600082, -0.11138736456632614, -0.10675324499607086, -0.10211913287639618, -0.0974850207567215, -0.09285090863704681, -0.08821679651737213, -0.08358268439769745, -0.07894856482744217, -0.07431445270776749, -0.06968033313751221, -0.06504622101783752, -0.06041210889816284, -0.05577799305319786, -0.05114387720823288, -0.0465097613632679, -0.04187564551830292, -0.037241533398628235, -0.032607417553663254, -0.027973301708698273, -0.02333918772637844, -0.01870507374405861, -0.014070957899093628, -0.009436842985451221, -0.004802728071808815, -0.00016861315816640854, 0.004465501755475998, 0.009099617600440979, 0.01373373158276081, 0.018367845565080643, 0.023001961410045624, 0.027636077255010605, 0.032270193099975586, 0.03690430521965027, 0.04153842106461525, 0.04617253690958023, 0.05080664902925491, 0.055440764874219894, 0.060074880719184875, 0.06470899283885956, 0.06934311240911484, 0.07397722452878952, 0.0786113440990448, 0.08324545621871948, 0.08787956833839417, 0.09251368045806885, 0.09714780002832413, 0.10178191214799881, 0.10641603171825409, 0.11105014383792877, 0.11568425595760345, 0.12031837552785873, 0.12495248764753342, 0.1295866072177887, 0.13422071933746338]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 6.0, 10.0, 14.0, 13.0, 20.0, 42.0, 70.0, 86.0, 125.0, 195.0, 348.0, 607.0, 1094.0, 2044.0, 4445.0, 10525.0, 32480.0, 117342.0, 402597.0, 339840.0, 92984.0, 26756.0, 9094.0, 3691.0, 1852.0, 925.0, 517.0, 280.0, 195.0, 114.0, 81.0, 47.0, 35.0, 27.0, 16.0, 11.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1422119140625, -0.13761138916015625, -0.1330108642578125, -0.12841033935546875, -0.123809814453125, -0.11920928955078125, -0.1146087646484375, -0.11000823974609375, -0.10540771484375, -0.10080718994140625, -0.0962066650390625, -0.09160614013671875, -0.087005615234375, -0.08240509033203125, -0.0778045654296875, -0.07320404052734375, -0.068603515625, -0.06400299072265625, -0.0594024658203125, -0.05480194091796875, -0.050201416015625, -0.04560089111328125, -0.0410003662109375, -0.03639984130859375, -0.03179931640625, -0.02719879150390625, -0.0225982666015625, -0.01799774169921875, -0.013397216796875, -0.00879669189453125, -0.0041961669921875, 0.00040435791015625, 0.0050048828125, 0.00960540771484375, 0.0142059326171875, 0.01880645751953125, 0.023406982421875, 0.02800750732421875, 0.0326080322265625, 0.03720855712890625, 0.04180908203125, 0.04640960693359375, 0.0510101318359375, 0.05561065673828125, 0.060211181640625, 0.06481170654296875, 0.0694122314453125, 0.07401275634765625, 0.07861328125, 0.08321380615234375, 0.0878143310546875, 0.09241485595703125, 0.097015380859375, 0.10161590576171875, 0.1062164306640625, 0.11081695556640625, 0.11541748046875, 0.12001800537109375, 0.1246185302734375, 0.12921905517578125, 0.133819580078125, 0.13842010498046875, 0.1430206298828125, 0.14762115478515625, 0.1522216796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 5.0, 7.0, 12.0, 21.0, 33.0, 30.0, 60.0, 78.0, 78.0, 88.0, 90.0, 81.0, 91.0, 96.0, 51.0, 39.0, 32.0, 32.0, 21.0, 14.0, 11.0, 7.0, 6.0, 6.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0247039794921875, -0.023755311965942383, -0.022806644439697266, -0.02185797691345215, -0.02090930938720703, -0.019960641860961914, -0.019011974334716797, -0.01806330680847168, -0.017114639282226562, -0.016165971755981445, -0.015217304229736328, -0.014268636703491211, -0.013319969177246094, -0.012371301651000977, -0.01142263412475586, -0.010473966598510742, -0.009525299072265625, -0.008576631546020508, -0.007627964019775391, -0.0066792964935302734, -0.005730628967285156, -0.004781961441040039, -0.003833293914794922, -0.0028846263885498047, -0.0019359588623046875, -0.0009872913360595703, -3.8623809814453125e-05, 0.0009100437164306641, 0.0018587112426757812, 0.0028073787689208984, 0.0037560462951660156, 0.004704713821411133, 0.00565338134765625, 0.006602048873901367, 0.007550716400146484, 0.008499383926391602, 0.009448051452636719, 0.010396718978881836, 0.011345386505126953, 0.01229405403137207, 0.013242721557617188, 0.014191389083862305, 0.015140056610107422, 0.01608872413635254, 0.017037391662597656, 0.017986059188842773, 0.01893472671508789, 0.019883394241333008, 0.020832061767578125, 0.021780729293823242, 0.02272939682006836, 0.023678064346313477, 0.024626731872558594, 0.02557539939880371, 0.026524066925048828, 0.027472734451293945, 0.028421401977539062, 0.02937006950378418, 0.030318737030029297, 0.031267404556274414, 0.03221607208251953, 0.03316473960876465, 0.034113407135009766, 0.03506207466125488, 0.0360107421875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 10.0, 11.0, 15.0, 11.0, 29.0, 53.0, 83.0, 121.0, 177.0, 278.0, 426.0, 710.0, 1571.0, 4103.0, 15542.0, 82017.0, 456111.0, 397578.0, 69010.0, 13628.0, 3744.0, 1425.0, 706.0, 409.0, 256.0, 154.0, 125.0, 80.0, 42.0, 38.0, 22.0, 20.0, 10.0, 6.0, 10.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1727294921875, -0.1665496826171875, -0.160369873046875, -0.1541900634765625, -0.14801025390625, -0.1418304443359375, -0.135650634765625, -0.1294708251953125, -0.123291015625, -0.1171112060546875, -0.110931396484375, -0.1047515869140625, -0.09857177734375, -0.0923919677734375, -0.086212158203125, -0.0800323486328125, -0.0738525390625, -0.0676727294921875, -0.061492919921875, -0.0553131103515625, -0.04913330078125, -0.0429534912109375, -0.036773681640625, -0.0305938720703125, -0.0244140625, -0.0182342529296875, -0.012054443359375, -0.0058746337890625, 0.00030517578125, 0.0064849853515625, 0.012664794921875, 0.0188446044921875, 0.0250244140625, 0.0312042236328125, 0.037384033203125, 0.0435638427734375, 0.04974365234375, 0.0559234619140625, 0.062103271484375, 0.0682830810546875, 0.074462890625, 0.0806427001953125, 0.086822509765625, 0.0930023193359375, 0.09918212890625, 0.1053619384765625, 0.111541748046875, 0.1177215576171875, 0.1239013671875, 0.1300811767578125, 0.136260986328125, 0.1424407958984375, 0.14862060546875, 0.1548004150390625, 0.160980224609375, 0.1671600341796875, 0.17333984375, 0.1795196533203125, 0.185699462890625, 0.1918792724609375, 0.19805908203125, 0.2042388916015625, 0.210418701171875, 0.2165985107421875, 0.2227783203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 8.0, 0.0, 4.0, 7.0, 5.0, 11.0, 11.0, 14.0, 17.0, 18.0, 24.0, 25.0, 24.0, 31.0, 28.0, 33.0, 37.0, 47.0, 46.0, 48.0, 48.0, 46.0, 55.0, 43.0, 55.0, 30.0, 35.0, 33.0, 31.0, 37.0, 20.0, 25.0, 15.0, 16.0, 19.0, 10.0, 12.0, 10.0, 5.0, 11.0, 4.0, 0.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.105712890625, -0.1022186279296875, -0.098724365234375, -0.0952301025390625, -0.09173583984375, -0.0882415771484375, -0.084747314453125, -0.0812530517578125, -0.0777587890625, -0.0742645263671875, -0.070770263671875, -0.0672760009765625, -0.06378173828125, -0.0602874755859375, -0.056793212890625, -0.0532989501953125, -0.0498046875, -0.0463104248046875, -0.042816162109375, -0.0393218994140625, -0.03582763671875, -0.0323333740234375, -0.028839111328125, -0.0253448486328125, -0.0218505859375, -0.0183563232421875, -0.014862060546875, -0.0113677978515625, -0.00787353515625, -0.0043792724609375, -0.000885009765625, 0.0026092529296875, 0.006103515625, 0.0095977783203125, 0.013092041015625, 0.0165863037109375, 0.02008056640625, 0.0235748291015625, 0.027069091796875, 0.0305633544921875, 0.0340576171875, 0.0375518798828125, 0.041046142578125, 0.0445404052734375, 0.04803466796875, 0.0515289306640625, 0.055023193359375, 0.0585174560546875, 0.06201171875, 0.0655059814453125, 0.069000244140625, 0.0724945068359375, 0.07598876953125, 0.0794830322265625, 0.082977294921875, 0.0864715576171875, 0.0899658203125, 0.0934600830078125, 0.096954345703125, 0.1004486083984375, 0.10394287109375, 0.1074371337890625, 0.110931396484375, 0.1144256591796875, 0.117919921875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 6.0, 12.0, 14.0, 16.0, 23.0, 52.0, 80.0, 125.0, 175.0, 259.0, 505.0, 893.0, 1627.0, 3148.0, 6202.0, 14028.0, 33621.0, 91838.0, 308287.0, 392924.0, 119879.0, 42142.0, 17073.0, 7556.0, 3699.0, 1870.0, 1020.0, 553.0, 357.0, 214.0, 129.0, 73.0, 56.0, 20.0, 25.0, 19.0, 13.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06939697265625, -0.0670928955078125, -0.064788818359375, -0.0624847412109375, -0.0601806640625, -0.0578765869140625, -0.055572509765625, -0.0532684326171875, -0.05096435546875, -0.0486602783203125, -0.046356201171875, -0.0440521240234375, -0.041748046875, -0.0394439697265625, -0.037139892578125, -0.0348358154296875, -0.03253173828125, -0.0302276611328125, -0.027923583984375, -0.0256195068359375, -0.0233154296875, -0.0210113525390625, -0.018707275390625, -0.0164031982421875, -0.01409912109375, -0.0117950439453125, -0.009490966796875, -0.0071868896484375, -0.0048828125, -0.0025787353515625, -0.000274658203125, 0.0020294189453125, 0.00433349609375, 0.0066375732421875, 0.008941650390625, 0.0112457275390625, 0.0135498046875, 0.0158538818359375, 0.018157958984375, 0.0204620361328125, 0.02276611328125, 0.0250701904296875, 0.027374267578125, 0.0296783447265625, 0.031982421875, 0.0342864990234375, 0.036590576171875, 0.0388946533203125, 0.04119873046875, 0.0435028076171875, 0.045806884765625, 0.0481109619140625, 0.0504150390625, 0.0527191162109375, 0.055023193359375, 0.0573272705078125, 0.05963134765625, 0.0619354248046875, 0.064239501953125, 0.0665435791015625, 0.06884765625, 0.0711517333984375, 0.073455810546875, 0.0757598876953125, 0.07806396484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 13.0, 18.0, 41.0, 72.0, 74.0, 88.0, 123.0, 141.0, 93.0, 84.0, 76.0, 47.0, 42.0, 22.0, 11.0, 9.0, 8.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.465217590332031e-05, -9.172502905130386e-05, -8.879788219928741e-05, -8.587073534727097e-05, -8.294358849525452e-05, -8.001644164323807e-05, -7.708929479122162e-05, -7.416214793920517e-05, -7.123500108718872e-05, -6.830785423517227e-05, -6.538070738315582e-05, -6.245356053113937e-05, -5.9526413679122925e-05, -5.6599266827106476e-05, -5.367211997509003e-05, -5.074497312307358e-05, -4.781782627105713e-05, -4.489067941904068e-05, -4.196353256702423e-05, -3.903638571500778e-05, -3.610923886299133e-05, -3.3182092010974884e-05, -3.0254945158958435e-05, -2.7327798306941986e-05, -2.4400651454925537e-05, -2.1473504602909088e-05, -1.854635775089264e-05, -1.561921089887619e-05, -1.2692064046859741e-05, -9.764917194843292e-06, -6.837770342826843e-06, -3.910623490810394e-06, -9.834766387939453e-07, 1.9436702132225037e-06, 4.870817065238953e-06, 7.797963917255402e-06, 1.072511076927185e-05, 1.36522576212883e-05, 1.657940447330475e-05, 1.9506551325321198e-05, 2.2433698177337646e-05, 2.5360845029354095e-05, 2.8287991881370544e-05, 3.1215138733386993e-05, 3.414228558540344e-05, 3.706943243741989e-05, 3.999657928943634e-05, 4.292372614145279e-05, 4.585087299346924e-05, 4.877801984548569e-05, 5.1705166697502136e-05, 5.4632313549518585e-05, 5.7559460401535034e-05, 6.048660725355148e-05, 6.341375410556793e-05, 6.634090095758438e-05, 6.926804780960083e-05, 7.219519466161728e-05, 7.512234151363373e-05, 7.804948836565018e-05, 8.097663521766663e-05, 8.390378206968307e-05, 8.683092892169952e-05, 8.975807577371597e-05, 9.268522262573242e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 8.0, 16.0, 13.0, 20.0, 31.0, 37.0, 42.0, 83.0, 110.0, 183.0, 291.0, 476.0, 840.0, 1809.0, 4367.0, 13768.0, 54590.0, 311771.0, 541155.0, 87177.0, 20869.0, 6021.0, 2305.0, 1017.0, 573.0, 343.0, 193.0, 138.0, 83.0, 43.0, 41.0, 38.0, 22.0, 19.0, 11.0, 6.0, 6.0, 8.0, 3.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1197509765625, -0.1160268783569336, -0.11230278015136719, -0.10857868194580078, -0.10485458374023438, -0.10113048553466797, -0.09740638732910156, -0.09368228912353516, -0.08995819091796875, -0.08623409271240234, -0.08250999450683594, -0.07878589630126953, -0.07506179809570312, -0.07133769989013672, -0.06761360168457031, -0.0638895034790039, -0.0601654052734375, -0.056441307067871094, -0.05271720886230469, -0.04899311065673828, -0.045269012451171875, -0.04154491424560547, -0.03782081604003906, -0.034096717834472656, -0.03037261962890625, -0.026648521423339844, -0.022924423217773438, -0.01920032501220703, -0.015476226806640625, -0.011752128601074219, -0.008028030395507812, -0.004303932189941406, -0.000579833984375, 0.0031442642211914062, 0.0068683624267578125, 0.010592460632324219, 0.014316558837890625, 0.01804065704345703, 0.021764755249023438, 0.025488853454589844, 0.02921295166015625, 0.032937049865722656, 0.03666114807128906, 0.04038524627685547, 0.044109344482421875, 0.04783344268798828, 0.05155754089355469, 0.055281639099121094, 0.0590057373046875, 0.0627298355102539, 0.06645393371582031, 0.07017803192138672, 0.07390213012695312, 0.07762622833251953, 0.08135032653808594, 0.08507442474365234, 0.08879852294921875, 0.09252262115478516, 0.09624671936035156, 0.09997081756591797, 0.10369491577148438, 0.10741901397705078, 0.11114311218261719, 0.1148672103881836, 0.11859130859375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 10.0, 7.0, 19.0, 12.0, 12.0, 26.0, 34.0, 28.0, 46.0, 63.0, 106.0, 89.0, 107.0, 100.0, 65.0, 62.0, 44.0, 30.0, 27.0, 22.0, 19.0, 12.0, 14.0, 5.0, 7.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0689697265625, -0.06684303283691406, -0.06471633911132812, -0.06258964538574219, -0.06046295166015625, -0.05833625793457031, -0.056209564208984375, -0.05408287048339844, -0.0519561767578125, -0.04982948303222656, -0.047702789306640625, -0.04557609558105469, -0.04344940185546875, -0.04132270812988281, -0.039196014404296875, -0.03706932067871094, -0.034942626953125, -0.03281593322753906, -0.030689239501953125, -0.028562545776367188, -0.02643585205078125, -0.024309158325195312, -0.022182464599609375, -0.020055770874023438, -0.0179290771484375, -0.015802383422851562, -0.013675689697265625, -0.011548995971679688, -0.00942230224609375, -0.0072956085205078125, -0.005168914794921875, -0.0030422210693359375, -0.00091552734375, 0.0012111663818359375, 0.003337860107421875, 0.0054645538330078125, 0.00759124755859375, 0.009717941284179688, 0.011844635009765625, 0.013971328735351562, 0.0160980224609375, 0.018224716186523438, 0.020351409912109375, 0.022478103637695312, 0.02460479736328125, 0.026731491088867188, 0.028858184814453125, 0.030984878540039062, 0.033111572265625, 0.03523826599121094, 0.037364959716796875, 0.03949165344238281, 0.04161834716796875, 0.04374504089355469, 0.045871734619140625, 0.04799842834472656, 0.0501251220703125, 0.05225181579589844, 0.054378509521484375, 0.05650520324707031, 0.05863189697265625, 0.06075859069824219, 0.06288528442382812, 0.06501197814941406, 0.067138671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 5.0, 6.0, 11.0, 23.0, 35.0, 57.0, 87.0, 136.0, 166.0, 174.0, 118.0, 82.0, 38.0, 20.0, 13.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2780095338821411, -1.2444459199905396, -1.210882306098938, -1.1773186922073364, -1.1437550783157349, -1.1101914644241333, -1.0766278505325317, -1.0430642366409302, -1.0095006227493286, -0.975937008857727, -0.9423733949661255, -0.9088097810745239, -0.8752461671829224, -0.8416825532913208, -0.8081189393997192, -0.7745553255081177, -0.7409917116165161, -0.7074280977249146, -0.673864483833313, -0.6403008699417114, -0.6067372560501099, -0.5731736421585083, -0.5396100282669067, -0.5060464143753052, -0.4724828004837036, -0.43891918659210205, -0.4053555727005005, -0.3717919588088989, -0.33822834491729736, -0.3046647310256958, -0.27110111713409424, -0.23753750324249268, -0.2039739489555359, -0.17041033506393433, -0.13684672117233276, -0.1032831072807312, -0.06971949338912964, -0.036155879497528076, -0.0025922656059265137, 0.03097134828567505, 0.06453496217727661, 0.09809857606887817, 0.13166218996047974, 0.1652258038520813, 0.19878941774368286, 0.23235303163528442, 0.265916645526886, 0.29948025941848755, 0.3330438733100891, 0.3666074872016907, 0.40017110109329224, 0.4337347149848938, 0.46729832887649536, 0.5008619427680969, 0.5344255566596985, 0.5679891705513, 0.6015527844429016, 0.6351163983345032, 0.6686800122261047, 0.7022436261177063, 0.7358072400093079, 0.7693708539009094, 0.802934467792511, 0.8364980816841125, 0.8700616955757141]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 7.0, 5.0, 11.0, 13.0, 11.0, 13.0, 21.0, 24.0, 24.0, 17.0, 35.0, 29.0, 34.0, 39.0, 45.0, 43.0, 45.0, 46.0, 42.0, 38.0, 49.0, 37.0, 37.0, 35.0, 35.0, 29.0, 38.0, 22.0, 18.0, 21.0, 25.0, 21.0, 11.0, 10.0, 12.0, 9.0, 10.0, 6.0, 4.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6594053506851196, -0.6379721164703369, -0.6165388822555542, -0.5951056480407715, -0.5736724138259888, -0.552239179611206, -0.5308059453964233, -0.5093727111816406, -0.4879395067691803, -0.4665062725543976, -0.44507303833961487, -0.42363983392715454, -0.4022065997123718, -0.3807733654975891, -0.3593401312828064, -0.3379068970680237, -0.31647366285324097, -0.29504042863845825, -0.27360719442367554, -0.2521739602088928, -0.2307407408952713, -0.2093075066804886, -0.18787428736686707, -0.16644105315208435, -0.14500781893730164, -0.12357458472251892, -0.1021413579583168, -0.08070813119411469, -0.05927489697933197, -0.037841662764549255, -0.016408443450927734, 0.0050247907638549805, 0.02645808458328247, 0.04789131507277489, 0.0693245455622673, 0.09075777232646942, 0.11219100654125214, 0.13362424075603485, 0.15505746006965637, 0.1764906942844391, 0.1979239284992218, 0.21935716271400452, 0.24079039692878723, 0.26222360134124756, 0.2836568355560303, 0.305090069770813, 0.3265233039855957, 0.3479565382003784, 0.36938977241516113, 0.39082300662994385, 0.41225624084472656, 0.4336894750595093, 0.455122709274292, 0.4765559434890747, 0.49798914790153503, 0.5194224119186401, 0.5408556461334229, 0.5622888803482056, 0.5837221145629883, 0.605155348777771, 0.6265885829925537, 0.6480218172073364, 0.6694550514221191, 0.6908882856369019, 0.7123214602470398]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 13.0, 12.0, 15.0, 30.0, 45.0, 62.0, 99.0, 155.0, 192.0, 378.0, 630.0, 1106.0, 2273.0, 5360.0, 15761.0, 70049.0, 2651013.0, 1354962.0, 65962.0, 15461.0, 5448.0, 2368.0, 1180.0, 578.0, 397.0, 232.0, 154.0, 103.0, 68.0, 57.0, 28.0, 17.0, 16.0, 16.0, 11.0, 11.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.196533203125, -0.19038772583007812, -0.18424224853515625, -0.17809677124023438, -0.1719512939453125, -0.16580581665039062, -0.15966033935546875, -0.15351486206054688, -0.147369384765625, -0.14122390747070312, -0.13507843017578125, -0.12893295288085938, -0.1227874755859375, -0.11664199829101562, -0.11049652099609375, -0.10435104370117188, -0.09820556640625, -0.09206008911132812, -0.08591461181640625, -0.07976913452148438, -0.0736236572265625, -0.06747817993164062, -0.06133270263671875, -0.055187225341796875, -0.049041748046875, -0.042896270751953125, -0.03675079345703125, -0.030605316162109375, -0.0244598388671875, -0.018314361572265625, -0.01216888427734375, -0.006023406982421875, 0.0001220703125, 0.006267547607421875, 0.01241302490234375, 0.018558502197265625, 0.0247039794921875, 0.030849456787109375, 0.03699493408203125, 0.043140411376953125, 0.049285888671875, 0.055431365966796875, 0.06157684326171875, 0.06772232055664062, 0.0738677978515625, 0.08001327514648438, 0.08615875244140625, 0.09230422973632812, 0.09844970703125, 0.10459518432617188, 0.11074066162109375, 0.11688613891601562, 0.1230316162109375, 0.12917709350585938, 0.13532257080078125, 0.14146804809570312, 0.147613525390625, 0.15375900268554688, 0.15990447998046875, 0.16604995727539062, 0.1721954345703125, 0.17834091186523438, 0.18448638916015625, 0.19063186645507812, 0.19677734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 11.0, 11.0, 10.0, 19.0, 23.0, 34.0, 32.0, 49.0, 43.0, 57.0, 62.0, 62.0, 75.0, 64.0, 72.0, 64.0, 65.0, 49.0, 38.0, 35.0, 25.0, 21.0, 19.0, 11.0, 6.0, 15.0, 5.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0238037109375, -0.02289104461669922, -0.021978378295898438, -0.021065711975097656, -0.020153045654296875, -0.019240379333496094, -0.018327713012695312, -0.01741504669189453, -0.01650238037109375, -0.015589714050292969, -0.014677047729492188, -0.013764381408691406, -0.012851715087890625, -0.011939048767089844, -0.011026382446289062, -0.010113716125488281, -0.0092010498046875, -0.008288383483886719, -0.0073757171630859375, -0.006463050842285156, -0.005550384521484375, -0.004637718200683594, -0.0037250518798828125, -0.0028123855590820312, -0.00189971923828125, -0.0009870529174804688, -7.43865966796875e-05, 0.0008382797241210938, 0.001750946044921875, 0.0026636123657226562, 0.0035762786865234375, 0.004488945007324219, 0.005401611328125, 0.006314277648925781, 0.0072269439697265625, 0.008139610290527344, 0.009052276611328125, 0.009964942932128906, 0.010877609252929688, 0.011790275573730469, 0.01270294189453125, 0.013615608215332031, 0.014528274536132812, 0.015440940856933594, 0.016353607177734375, 0.017266273498535156, 0.018178939819335938, 0.01909160614013672, 0.0200042724609375, 0.02091693878173828, 0.021829605102539062, 0.022742271423339844, 0.023654937744140625, 0.024567604064941406, 0.025480270385742188, 0.02639293670654297, 0.02730560302734375, 0.02821826934814453, 0.029130935668945312, 0.030043601989746094, 0.030956268310546875, 0.031868934631347656, 0.03278160095214844, 0.03369426727294922, 0.03460693359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 7.0, 9.0, 6.0, 12.0, 25.0, 35.0, 59.0, 96.0, 153.0, 284.0, 517.0, 1005.0, 2167.0, 5221.0, 14986.0, 54312.0, 354763.0, 3409758.0, 280800.0, 46965.0, 13575.0, 5039.0, 2142.0, 1048.0, 540.0, 291.0, 159.0, 90.0, 79.0, 38.0, 23.0, 22.0, 13.0, 11.0, 8.0, 7.0, 8.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1531982421875, -0.14832687377929688, -0.14345550537109375, -0.13858413696289062, -0.1337127685546875, -0.12884140014648438, -0.12397003173828125, -0.11909866333007812, -0.114227294921875, -0.10935592651367188, -0.10448455810546875, -0.09961318969726562, -0.0947418212890625, -0.08987045288085938, -0.08499908447265625, -0.08012771606445312, -0.07525634765625, -0.07038497924804688, -0.06551361083984375, -0.060642242431640625, -0.0557708740234375, -0.050899505615234375, -0.04602813720703125, -0.041156768798828125, -0.036285400390625, -0.031414031982421875, -0.02654266357421875, -0.021671295166015625, -0.0167999267578125, -0.011928558349609375, -0.00705718994140625, -0.002185821533203125, 0.002685546875, 0.007556915283203125, 0.01242828369140625, 0.017299652099609375, 0.0221710205078125, 0.027042388916015625, 0.03191375732421875, 0.036785125732421875, 0.041656494140625, 0.046527862548828125, 0.05139923095703125, 0.056270599365234375, 0.0611419677734375, 0.06601333618164062, 0.07088470458984375, 0.07575607299804688, 0.08062744140625, 0.08549880981445312, 0.09037017822265625, 0.09524154663085938, 0.1001129150390625, 0.10498428344726562, 0.10985565185546875, 0.11472702026367188, 0.119598388671875, 0.12446975708007812, 0.12934112548828125, 0.13421249389648438, 0.1390838623046875, 0.14395523071289062, 0.14882659912109375, 0.15369796752929688, 0.1585693359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 1.0, 5.0, 10.0, 17.0, 26.0, 25.0, 37.0, 59.0, 82.0, 118.0, 183.0, 424.0, 1514.0, 763.0, 300.0, 181.0, 90.0, 58.0, 42.0, 24.0, 22.0, 22.0, 19.0, 8.0, 12.0, 7.0, 2.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035430908203125, -0.03410625457763672, -0.03278160095214844, -0.031456947326660156, -0.030132293701171875, -0.028807640075683594, -0.027482986450195312, -0.02615833282470703, -0.02483367919921875, -0.02350902557373047, -0.022184371948242188, -0.020859718322753906, -0.019535064697265625, -0.018210411071777344, -0.016885757446289062, -0.015561103820800781, -0.0142364501953125, -0.012911796569824219, -0.011587142944335938, -0.010262489318847656, -0.008937835693359375, -0.007613182067871094, -0.0062885284423828125, -0.004963874816894531, -0.00363922119140625, -0.0023145675659179688, -0.0009899139404296875, 0.00033473968505859375, 0.001659393310546875, 0.0029840469360351562, 0.0043087005615234375, 0.005633354187011719, 0.0069580078125, 0.008282661437988281, 0.009607315063476562, 0.010931968688964844, 0.012256622314453125, 0.013581275939941406, 0.014905929565429688, 0.01623058319091797, 0.01755523681640625, 0.01887989044189453, 0.020204544067382812, 0.021529197692871094, 0.022853851318359375, 0.024178504943847656, 0.025503158569335938, 0.02682781219482422, 0.0281524658203125, 0.02947711944580078, 0.030801773071289062, 0.032126426696777344, 0.033451080322265625, 0.034775733947753906, 0.03610038757324219, 0.03742504119873047, 0.03874969482421875, 0.04007434844970703, 0.04139900207519531, 0.042723655700683594, 0.044048309326171875, 0.045372962951660156, 0.04669761657714844, 0.04802227020263672, 0.049346923828125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 8.0, 16.0, 64.0, 295.0, 434.0, 148.0, 39.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5539562702178955, -0.5278787016868591, -0.5018011927604675, -0.47572362422943115, -0.4496460556983948, -0.4235685169696808, -0.3974909782409668, -0.3714134097099304, -0.34533587098121643, -0.31925833225250244, -0.29318076372146606, -0.2671032249927521, -0.2410256713628769, -0.2149481177330017, -0.18887057900428772, -0.16279302537441254, -0.13671547174453735, -0.11063791811466217, -0.08456037193536758, -0.058482825756073, -0.032405272126197815, -0.006327718496322632, 0.019749820232391357, 0.04582737386226654, 0.07190492749214172, 0.0979824811220169, 0.12406002730131149, 0.15013757348060608, 0.17621512711048126, 0.20229268074035645, 0.22837021946907043, 0.2544477581977844, 0.2805253267288208, 0.3066028654575348, 0.33268043398857117, 0.35875797271728516, 0.38483554124832153, 0.4109130799770355, 0.4369906187057495, 0.4630681872367859, 0.4891457259654999, 0.5152232646942139, 0.5413008332252502, 0.5673784017562866, 0.5934559106826782, 0.6195334792137146, 0.645611047744751, 0.6716885566711426, 0.697766125202179, 0.7238436937332153, 0.7499212026596069, 0.7759987711906433, 0.8020763397216797, 0.8281538486480713, 0.8542314171791077, 0.880308985710144, 0.9063864946365356, 0.932464063167572, 0.9585415720939636, 0.984619140625, 1.0106966495513916, 1.0367742776870728, 1.0628517866134644, 1.088929295539856, 1.115006923675537]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 7.0, 7.0, 9.0, 17.0, 16.0, 18.0, 25.0, 18.0, 12.0, 35.0, 39.0, 29.0, 36.0, 40.0, 52.0, 59.0, 48.0, 57.0, 46.0, 47.0, 51.0, 45.0, 44.0, 41.0, 29.0, 28.0, 26.0, 27.0, 22.0, 17.0, 12.0, 11.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15133535861968994, -0.1461365967988968, -0.14093783497810364, -0.1357390582561493, -0.13054029643535614, -0.125341534614563, -0.12014277279376984, -0.11494401097297668, -0.10974524170160294, -0.10454647988080978, -0.09934771060943604, -0.09414894878864288, -0.08895018696784973, -0.08375141769647598, -0.07855265587568283, -0.07335388660430908, -0.06815512478351593, -0.06295636296272278, -0.05775759369134903, -0.05255883187055588, -0.04736006632447243, -0.04216130077838898, -0.036962538957595825, -0.031763773411512375, -0.026565007865428925, -0.021366242319345474, -0.016167478635907173, -0.010968714021146297, -0.005769949406385422, -0.0005711838603019714, 0.00462757982313633, 0.00982634350657463, 0.015025109052658081, 0.02022387459874153, 0.025422638282179832, 0.030621401965618134, 0.035820167511701584, 0.041018933057785034, 0.046217694878578186, 0.051416460424661636, 0.05661522597074509, 0.06181399151682854, 0.06701275706291199, 0.07221151888370514, 0.07741028070449829, 0.08260904997587204, 0.08780781179666519, 0.09300658106803894, 0.09820534288883209, 0.10340410470962524, 0.10860287398099899, 0.11380163580179214, 0.1190004050731659, 0.12419916689395905, 0.1293979287147522, 0.13459669053554535, 0.1397954523563385, 0.14499421417713165, 0.1501929759979248, 0.15539175271987915, 0.1605905145406723, 0.16578927636146545, 0.1709880381822586, 0.17618680000305176, 0.1813855767250061]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 6.0, 9.0, 13.0, 26.0, 37.0, 47.0, 49.0, 91.0, 139.0, 192.0, 271.0, 471.0, 710.0, 1170.0, 1929.0, 3364.0, 6255.0, 11652.0, 23011.0, 46273.0, 98074.0, 202375.0, 299399.0, 181019.0, 86797.0, 41144.0, 20205.0, 10296.0, 5588.0, 3198.0, 1743.0, 1106.0, 668.0, 385.0, 258.0, 173.0, 119.0, 95.0, 55.0, 41.0, 31.0, 19.0, 15.0, 17.0, 9.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0789794921875, -0.07646560668945312, -0.07395172119140625, -0.07143783569335938, -0.0689239501953125, -0.06641006469726562, -0.06389617919921875, -0.061382293701171875, -0.058868408203125, -0.056354522705078125, -0.05384063720703125, -0.051326751708984375, -0.0488128662109375, -0.046298980712890625, -0.04378509521484375, -0.041271209716796875, -0.03875732421875, -0.036243438720703125, -0.03372955322265625, -0.031215667724609375, -0.0287017822265625, -0.026187896728515625, -0.02367401123046875, -0.021160125732421875, -0.018646240234375, -0.016132354736328125, -0.01361846923828125, -0.011104583740234375, -0.0085906982421875, -0.006076812744140625, -0.00356292724609375, -0.001049041748046875, 0.00146484375, 0.003978729248046875, 0.00649261474609375, 0.009006500244140625, 0.0115203857421875, 0.014034271240234375, 0.01654815673828125, 0.019062042236328125, 0.021575927734375, 0.024089813232421875, 0.02660369873046875, 0.029117584228515625, 0.0316314697265625, 0.034145355224609375, 0.03665924072265625, 0.039173126220703125, 0.04168701171875, 0.044200897216796875, 0.04671478271484375, 0.049228668212890625, 0.0517425537109375, 0.054256439208984375, 0.05677032470703125, 0.059284210205078125, 0.061798095703125, 0.06431198120117188, 0.06682586669921875, 0.06933975219726562, 0.0718536376953125, 0.07436752319335938, 0.07688140869140625, 0.07939529418945312, 0.0819091796875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 9.0, 11.0, 15.0, 15.0, 15.0, 13.0, 29.0, 34.0, 43.0, 42.0, 53.0, 64.0, 56.0, 63.0, 67.0, 66.0, 57.0, 43.0, 71.0, 43.0, 35.0, 38.0, 23.0, 17.0, 11.0, 13.0, 14.0, 9.0, 9.0, 5.0, 5.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0227203369140625, -0.021863698959350586, -0.021007061004638672, -0.020150423049926758, -0.019293785095214844, -0.01843714714050293, -0.017580509185791016, -0.0167238712310791, -0.015867233276367188, -0.015010595321655273, -0.01415395736694336, -0.013297319412231445, -0.012440681457519531, -0.011584043502807617, -0.010727405548095703, -0.009870767593383789, -0.009014129638671875, -0.008157491683959961, -0.007300853729248047, -0.006444215774536133, -0.005587577819824219, -0.004730939865112305, -0.0038743019104003906, -0.0030176639556884766, -0.0021610260009765625, -0.0013043880462646484, -0.0004477500915527344, 0.0004088878631591797, 0.0012655258178710938, 0.002122163772583008, 0.002978801727294922, 0.003835439682006836, 0.00469207763671875, 0.005548715591430664, 0.006405353546142578, 0.007261991500854492, 0.008118629455566406, 0.00897526741027832, 0.009831905364990234, 0.010688543319702148, 0.011545181274414062, 0.012401819229125977, 0.01325845718383789, 0.014115095138549805, 0.014971733093261719, 0.015828371047973633, 0.016685009002685547, 0.01754164695739746, 0.018398284912109375, 0.01925492286682129, 0.020111560821533203, 0.020968198776245117, 0.02182483673095703, 0.022681474685668945, 0.02353811264038086, 0.024394750595092773, 0.025251388549804688, 0.0261080265045166, 0.026964664459228516, 0.02782130241394043, 0.028677940368652344, 0.029534578323364258, 0.030391216278076172, 0.031247854232788086, 0.0321044921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 10.0, 19.0, 26.0, 28.0, 38.0, 69.0, 86.0, 114.0, 149.0, 243.0, 330.0, 534.0, 936.0, 1629.0, 3729.0, 9606.0, 30429.0, 110373.0, 366191.0, 365029.0, 110905.0, 30372.0, 9702.0, 3711.0, 1732.0, 885.0, 553.0, 330.0, 214.0, 174.0, 110.0, 75.0, 65.0, 33.0, 28.0, 22.0, 21.0, 8.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.122802734375, -0.11908149719238281, -0.11536026000976562, -0.11163902282714844, -0.10791778564453125, -0.10419654846191406, -0.10047531127929688, -0.09675407409667969, -0.0930328369140625, -0.08931159973144531, -0.08559036254882812, -0.08186912536621094, -0.07814788818359375, -0.07442665100097656, -0.07070541381835938, -0.06698417663574219, -0.063262939453125, -0.05954170227050781, -0.055820465087890625, -0.05209922790527344, -0.04837799072265625, -0.04465675354003906, -0.040935516357421875, -0.03721427917480469, -0.0334930419921875, -0.029771804809570312, -0.026050567626953125, -0.022329330444335938, -0.01860809326171875, -0.014886856079101562, -0.011165618896484375, -0.0074443817138671875, -0.00372314453125, -1.9073486328125e-06, 0.003719329833984375, 0.0074405670166015625, 0.01116180419921875, 0.014883041381835938, 0.018604278564453125, 0.022325515747070312, 0.0260467529296875, 0.029767990112304688, 0.033489227294921875, 0.03721046447753906, 0.04093170166015625, 0.04465293884277344, 0.048374176025390625, 0.05209541320800781, 0.055816650390625, 0.05953788757324219, 0.06325912475585938, 0.06698036193847656, 0.07070159912109375, 0.07442283630371094, 0.07814407348632812, 0.08186531066894531, 0.0855865478515625, 0.08930778503417969, 0.09302902221679688, 0.09675025939941406, 0.10047149658203125, 0.10419273376464844, 0.10791397094726562, 0.11163520812988281, 0.1153564453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 2.0, 7.0, 8.0, 12.0, 13.0, 14.0, 13.0, 12.0, 33.0, 28.0, 32.0, 29.0, 40.0, 38.0, 48.0, 57.0, 45.0, 54.0, 51.0, 55.0, 50.0, 47.0, 43.0, 38.0, 32.0, 33.0, 37.0, 21.0, 24.0, 16.0, 14.0, 13.0, 11.0, 5.0, 4.0, 7.0, 3.0, 4.0, 1.0, 6.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1390380859375, -0.13510990142822266, -0.1311817169189453, -0.12725353240966797, -0.12332534790039062, -0.11939716339111328, -0.11546897888183594, -0.1115407943725586, -0.10761260986328125, -0.1036844253540039, -0.09975624084472656, -0.09582805633544922, -0.09189987182617188, -0.08797168731689453, -0.08404350280761719, -0.08011531829833984, -0.0761871337890625, -0.07225894927978516, -0.06833076477050781, -0.06440258026123047, -0.060474395751953125, -0.05654621124267578, -0.05261802673339844, -0.048689842224121094, -0.04476165771484375, -0.040833473205566406, -0.03690528869628906, -0.03297710418701172, -0.029048919677734375, -0.02512073516845703, -0.021192550659179688, -0.017264366149902344, -0.013336181640625, -0.009407997131347656, -0.0054798126220703125, -0.0015516281127929688, 0.002376556396484375, 0.006304740905761719, 0.010232925415039062, 0.014161109924316406, 0.01808929443359375, 0.022017478942871094, 0.025945663452148438, 0.02987384796142578, 0.033802032470703125, 0.03773021697998047, 0.04165840148925781, 0.045586585998535156, 0.0495147705078125, 0.053442955017089844, 0.05737113952636719, 0.06129932403564453, 0.06522750854492188, 0.06915569305419922, 0.07308387756347656, 0.0770120620727539, 0.08094024658203125, 0.0848684310913086, 0.08879661560058594, 0.09272480010986328, 0.09665298461914062, 0.10058116912841797, 0.10450935363769531, 0.10843753814697266, 0.11236572265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 11.0, 15.0, 12.0, 24.0, 24.0, 43.0, 67.0, 109.0, 189.0, 397.0, 826.0, 1959.0, 5302.0, 16946.0, 69285.0, 380389.0, 457268.0, 85426.0, 20012.0, 6087.0, 2229.0, 923.0, 439.0, 238.0, 110.0, 78.0, 47.0, 23.0, 15.0, 8.0, 12.0, 12.0, 7.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07647705078125, -0.07423210144042969, -0.07198715209960938, -0.06974220275878906, -0.06749725341796875, -0.06525230407714844, -0.06300735473632812, -0.06076240539550781, -0.0585174560546875, -0.05627250671386719, -0.054027557373046875, -0.05178260803222656, -0.04953765869140625, -0.04729270935058594, -0.045047760009765625, -0.04280281066894531, -0.040557861328125, -0.03831291198730469, -0.036067962646484375, -0.03382301330566406, -0.03157806396484375, -0.029333114624023438, -0.027088165283203125, -0.024843215942382812, -0.0225982666015625, -0.020353317260742188, -0.018108367919921875, -0.015863418579101562, -0.01361846923828125, -0.011373519897460938, -0.009128570556640625, -0.0068836212158203125, -0.004638671875, -0.0023937225341796875, -0.000148773193359375, 0.0020961761474609375, 0.00434112548828125, 0.0065860748291015625, 0.008831024169921875, 0.011075973510742188, 0.0133209228515625, 0.015565872192382812, 0.017810821533203125, 0.020055770874023438, 0.02230072021484375, 0.024545669555664062, 0.026790618896484375, 0.029035568237304688, 0.031280517578125, 0.03352546691894531, 0.035770416259765625, 0.03801536560058594, 0.04026031494140625, 0.04250526428222656, 0.044750213623046875, 0.04699516296386719, 0.0492401123046875, 0.05148506164550781, 0.053730010986328125, 0.05597496032714844, 0.05821990966796875, 0.06046485900878906, 0.06270980834960938, 0.06495475769042969, 0.06719970703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 12.0, 14.0, 18.0, 23.0, 37.0, 44.0, 50.0, 48.0, 69.0, 66.0, 79.0, 85.0, 70.0, 67.0, 55.0, 50.0, 39.0, 36.0, 24.0, 21.0, 23.0, 8.0, 12.0, 6.0, 4.0, 5.0, 5.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.9723854064941406e-05, -5.8113597333431244e-05, -5.650334060192108e-05, -5.489308387041092e-05, -5.328282713890076e-05, -5.1672570407390594e-05, -5.006231367588043e-05, -4.845205694437027e-05, -4.684180021286011e-05, -4.5231543481349945e-05, -4.362128674983978e-05, -4.201103001832962e-05, -4.040077328681946e-05, -3.8790516555309296e-05, -3.718025982379913e-05, -3.557000309228897e-05, -3.395974636077881e-05, -3.2349489629268646e-05, -3.0739232897758484e-05, -2.912897616624832e-05, -2.751871943473816e-05, -2.5908462703227997e-05, -2.4298205971717834e-05, -2.2687949240207672e-05, -2.107769250869751e-05, -1.9467435777187347e-05, -1.7857179045677185e-05, -1.6246922314167023e-05, -1.463666558265686e-05, -1.3026408851146698e-05, -1.1416152119636536e-05, -9.805895388126373e-06, -8.195638656616211e-06, -6.585381925106049e-06, -4.975125193595886e-06, -3.364868462085724e-06, -1.7546117305755615e-06, -1.4435499906539917e-07, 1.4659017324447632e-06, 3.0761584639549255e-06, 4.686415195465088e-06, 6.29667192697525e-06, 7.906928658485413e-06, 9.517185389995575e-06, 1.1127442121505737e-05, 1.27376988530159e-05, 1.4347955584526062e-05, 1.5958212316036224e-05, 1.7568469047546387e-05, 1.917872577905655e-05, 2.078898251056671e-05, 2.2399239242076874e-05, 2.4009495973587036e-05, 2.56197527050972e-05, 2.723000943660736e-05, 2.8840266168117523e-05, 3.0450522899627686e-05, 3.206077963113785e-05, 3.367103636264801e-05, 3.528129309415817e-05, 3.6891549825668335e-05, 3.85018065571785e-05, 4.011206328868866e-05, 4.172232002019882e-05, 4.3332576751708984e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 3.0, 8.0, 13.0, 10.0, 21.0, 38.0, 60.0, 115.0, 236.0, 600.0, 1762.0, 7426.0, 57076.0, 749038.0, 210089.0, 17157.0, 3174.0, 967.0, 381.0, 177.0, 95.0, 45.0, 26.0, 12.0, 9.0, 9.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136474609375, -0.13265514373779297, -0.12883567810058594, -0.1250162124633789, -0.12119674682617188, -0.11737728118896484, -0.11355781555175781, -0.10973834991455078, -0.10591888427734375, -0.10209941864013672, -0.09827995300292969, -0.09446048736572266, -0.09064102172851562, -0.0868215560913086, -0.08300209045410156, -0.07918262481689453, -0.0753631591796875, -0.07154369354248047, -0.06772422790527344, -0.0639047622680664, -0.060085296630859375, -0.056265830993652344, -0.05244636535644531, -0.04862689971923828, -0.04480743408203125, -0.04098796844482422, -0.03716850280761719, -0.033349037170410156, -0.029529571533203125, -0.025710105895996094, -0.021890640258789062, -0.01807117462158203, -0.014251708984375, -0.010432243347167969, -0.0066127777099609375, -0.0027933120727539062, 0.001026153564453125, 0.004845619201660156, 0.008665084838867188, 0.012484550476074219, 0.01630401611328125, 0.02012348175048828, 0.023942947387695312, 0.027762413024902344, 0.031581878662109375, 0.035401344299316406, 0.03922080993652344, 0.04304027557373047, 0.0468597412109375, 0.05067920684814453, 0.05449867248535156, 0.058318138122558594, 0.062137603759765625, 0.06595706939697266, 0.06977653503417969, 0.07359600067138672, 0.07741546630859375, 0.08123493194580078, 0.08505439758300781, 0.08887386322021484, 0.09269332885742188, 0.0965127944946289, 0.10033226013183594, 0.10415172576904297, 0.10797119140625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 8.0, 9.0, 15.0, 9.0, 11.0, 21.0, 35.0, 40.0, 56.0, 83.0, 96.0, 134.0, 124.0, 92.0, 83.0, 57.0, 36.0, 26.0, 19.0, 14.0, 6.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04364013671875, -0.041728973388671875, -0.03981781005859375, -0.037906646728515625, -0.0359954833984375, -0.034084320068359375, -0.03217315673828125, -0.030261993408203125, -0.028350830078125, -0.026439666748046875, -0.02452850341796875, -0.022617340087890625, -0.0207061767578125, -0.018795013427734375, -0.01688385009765625, -0.014972686767578125, -0.0130615234375, -0.011150360107421875, -0.00923919677734375, -0.007328033447265625, -0.0054168701171875, -0.003505706787109375, -0.00159454345703125, 0.000316619873046875, 0.002227783203125, 0.004138946533203125, 0.00605010986328125, 0.007961273193359375, 0.0098724365234375, 0.011783599853515625, 0.01369476318359375, 0.015605926513671875, 0.01751708984375, 0.019428253173828125, 0.02133941650390625, 0.023250579833984375, 0.0251617431640625, 0.027072906494140625, 0.02898406982421875, 0.030895233154296875, 0.032806396484375, 0.034717559814453125, 0.03662872314453125, 0.038539886474609375, 0.0404510498046875, 0.042362213134765625, 0.04427337646484375, 0.046184539794921875, 0.048095703125, 0.050006866455078125, 0.05191802978515625, 0.053829193115234375, 0.0557403564453125, 0.057651519775390625, 0.05956268310546875, 0.061473846435546875, 0.063385009765625, 0.06529617309570312, 0.06720733642578125, 0.06911849975585938, 0.0710296630859375, 0.07294082641601562, 0.07485198974609375, 0.07676315307617188, 0.07867431640625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 5.0, 3.0, 11.0, 26.0, 34.0, 46.0, 85.0, 104.0, 149.0, 156.0, 119.0, 86.0, 68.0, 40.0, 24.0, 12.0, 7.0, 4.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5689632296562195, -0.5446256995201111, -0.5202881693840027, -0.4959506094455719, -0.4716130793094635, -0.4472755193710327, -0.4229379892349243, -0.3986004590988159, -0.3742629289627075, -0.3499253988265991, -0.32558783888816833, -0.30125030875205994, -0.27691277861595154, -0.25257521867752075, -0.22823768854141235, -0.20390015840530396, -0.17956259846687317, -0.15522505342960358, -0.13088752329349518, -0.10654997825622559, -0.08221244066953659, -0.057874903082847595, -0.033537358045578, -0.009199827909469604, 0.015137717127799988, 0.03947525471448898, 0.06381279230117798, 0.08815033733844757, 0.11248787492513657, 0.13682541251182556, 0.16116295754909515, 0.18550048768520355, 0.20983803272247314, 0.23417557775974274, 0.25851312279701233, 0.2828506529331207, 0.3071881830692291, 0.3315257430076599, 0.3558632731437683, 0.3802008032798767, 0.4045383334159851, 0.4288758635520935, 0.4532134234905243, 0.4775509536266327, 0.5018885135650635, 0.5262260437011719, 0.5505635738372803, 0.5749011039733887, 0.5992386341094971, 0.6235761642456055, 0.6479136943817139, 0.6722512245178223, 0.6965888142585754, 0.7209263443946838, 0.7452638745307922, 0.7696014046669006, 0.7939389944076538, 0.8182765245437622, 0.8426140546798706, 0.866951584815979, 0.8912891745567322, 0.9156267046928406, 0.939964234828949, 0.9643017649650574, 0.9886392951011658]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 2.0, 4.0, 7.0, 8.0, 9.0, 11.0, 11.0, 17.0, 22.0, 23.0, 19.0, 16.0, 32.0, 34.0, 28.0, 39.0, 33.0, 40.0, 40.0, 34.0, 38.0, 42.0, 44.0, 48.0, 45.0, 49.0, 29.0, 41.0, 31.0, 32.0, 28.0, 22.0, 17.0, 17.0, 11.0, 10.0, 12.0, 6.0, 9.0, 8.0, 5.0, 6.0, 3.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.6068695187568665, -0.5884832739830017, -0.5700969696044922, -0.5517107248306274, -0.5333244800567627, -0.5149381756782532, -0.4965519309043884, -0.4781656563282013, -0.45977938175201416, -0.441393107175827, -0.4230068624019623, -0.40462058782577515, -0.386234313249588, -0.3678480386734009, -0.34946179389953613, -0.331075519323349, -0.31268927454948425, -0.2943029999732971, -0.2759167551994324, -0.25753048062324524, -0.2391442060470581, -0.22075794637203217, -0.20237168669700623, -0.1839854121208191, -0.16559915244579315, -0.1472128927707672, -0.12882661819458008, -0.11044035851955414, -0.0920540913939476, -0.07366782426834106, -0.055281564593315125, -0.03689529001712799, -0.01850903034210205, -0.00012276507914066315, 0.018263500183820724, 0.03664976358413696, 0.0550360307097435, 0.07342229783535004, 0.09180855751037598, 0.11019483208656311, 0.12858109176158905, 0.146967351436615, 0.16535362601280212, 0.18373988568782806, 0.202126145362854, 0.22051241993904114, 0.23889867961406708, 0.257284939289093, 0.27567121386528015, 0.2940574884414673, 0.31244373321533203, 0.33083000779151917, 0.3492162823677063, 0.36760252714157104, 0.3859888017177582, 0.4043750762939453, 0.42276132106781006, 0.4411475956439972, 0.45953384041786194, 0.4779201149940491, 0.4963063895702362, 0.5146926641464233, 0.5330789089202881, 0.5514651536941528, 0.5698514580726624]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 8.0, 7.0, 11.0, 10.0, 20.0, 25.0, 46.0, 55.0, 110.0, 164.0, 282.0, 483.0, 886.0, 1504.0, 3277.0, 7949.0, 24573.0, 116143.0, 3633027.0, 339589.0, 43697.0, 12693.0, 4867.0, 2197.0, 1065.0, 636.0, 372.0, 230.0, 139.0, 81.0, 42.0, 34.0, 21.0, 17.0, 4.0, 3.0, 9.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.15860366821289062, -0.15375518798828125, -0.14890670776367188, -0.1440582275390625, -0.13920974731445312, -0.13436126708984375, -0.12951278686523438, -0.124664306640625, -0.11981582641601562, -0.11496734619140625, -0.11011886596679688, -0.1052703857421875, -0.10042190551757812, -0.09557342529296875, -0.09072494506835938, -0.08587646484375, -0.08102798461914062, -0.07617950439453125, -0.07133102416992188, -0.0664825439453125, -0.061634063720703125, -0.05678558349609375, -0.051937103271484375, -0.047088623046875, -0.042240142822265625, -0.03739166259765625, -0.032543182373046875, -0.0276947021484375, -0.022846221923828125, -0.01799774169921875, -0.013149261474609375, -0.00830078125, -0.003452301025390625, 0.00139617919921875, 0.006244659423828125, 0.0110931396484375, 0.015941619873046875, 0.02079010009765625, 0.025638580322265625, 0.030487060546875, 0.035335540771484375, 0.04018402099609375, 0.045032501220703125, 0.0498809814453125, 0.054729461669921875, 0.05957794189453125, 0.06442642211914062, 0.06927490234375, 0.07412338256835938, 0.07897186279296875, 0.08382034301757812, 0.0886688232421875, 0.09351730346679688, 0.09836578369140625, 0.10321426391601562, 0.108062744140625, 0.11291122436523438, 0.11775970458984375, 0.12260818481445312, 0.1274566650390625, 0.13230514526367188, 0.13715362548828125, 0.14200210571289062, 0.1468505859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 9.0, 10.0, 15.0, 14.0, 11.0, 17.0, 30.0, 28.0, 43.0, 32.0, 53.0, 42.0, 54.0, 59.0, 47.0, 62.0, 60.0, 59.0, 51.0, 47.0, 38.0, 40.0, 35.0, 30.0, 25.0, 18.0, 14.0, 14.0, 9.0, 8.0, 7.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0238189697265625, -0.023005962371826172, -0.022192955017089844, -0.021379947662353516, -0.020566940307617188, -0.01975393295288086, -0.01894092559814453, -0.018127918243408203, -0.017314910888671875, -0.016501903533935547, -0.01568889617919922, -0.01487588882446289, -0.014062881469726562, -0.013249874114990234, -0.012436866760253906, -0.011623859405517578, -0.01081085205078125, -0.009997844696044922, -0.009184837341308594, -0.008371829986572266, -0.0075588226318359375, -0.006745815277099609, -0.005932807922363281, -0.005119800567626953, -0.004306793212890625, -0.003493785858154297, -0.0026807785034179688, -0.0018677711486816406, -0.0010547637939453125, -0.00024175643920898438, 0.0005712509155273438, 0.0013842582702636719, 0.002197265625, 0.003010272979736328, 0.0038232803344726562, 0.004636287689208984, 0.0054492950439453125, 0.006262302398681641, 0.007075309753417969, 0.007888317108154297, 0.008701324462890625, 0.009514331817626953, 0.010327339172363281, 0.01114034652709961, 0.011953353881835938, 0.012766361236572266, 0.013579368591308594, 0.014392375946044922, 0.01520538330078125, 0.016018390655517578, 0.016831398010253906, 0.017644405364990234, 0.018457412719726562, 0.01927042007446289, 0.02008342742919922, 0.020896434783935547, 0.021709442138671875, 0.022522449493408203, 0.02333545684814453, 0.02414846420288086, 0.024961471557617188, 0.025774478912353516, 0.026587486267089844, 0.027400493621826172, 0.0282135009765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 10.0, 4.0, 11.0, 15.0, 22.0, 36.0, 38.0, 66.0, 84.0, 168.0, 424.0, 1838.0, 15464.0, 865479.0, 3283964.0, 22980.0, 2658.0, 574.0, 194.0, 94.0, 47.0, 32.0, 27.0, 14.0, 14.0, 7.0, 9.0, 5.0, 2.0, 4.0, 0.0, 5.0], "bins": [-0.5107421875, -0.49965476989746094, -0.4885673522949219, -0.4774799346923828, -0.46639251708984375, -0.4553050994873047, -0.4442176818847656, -0.43313026428222656, -0.4220428466796875, -0.41095542907714844, -0.3998680114746094, -0.3887805938720703, -0.37769317626953125, -0.3666057586669922, -0.3555183410644531, -0.34443092346191406, -0.333343505859375, -0.32225608825683594, -0.3111686706542969, -0.3000812530517578, -0.28899383544921875, -0.2779064178466797, -0.2668190002441406, -0.25573158264160156, -0.2446441650390625, -0.23355674743652344, -0.22246932983398438, -0.2113819122314453, -0.20029449462890625, -0.1892070770263672, -0.17811965942382812, -0.16703224182128906, -0.15594482421875, -0.14485740661621094, -0.13376998901367188, -0.12268257141113281, -0.11159515380859375, -0.10050773620605469, -0.08942031860351562, -0.07833290100097656, -0.0672454833984375, -0.05615806579589844, -0.045070648193359375, -0.03398323059082031, -0.02289581298828125, -0.011808395385742188, -0.000720977783203125, 0.010366439819335938, 0.021453857421875, 0.03254127502441406, 0.043628692626953125, 0.05471611022949219, 0.06580352783203125, 0.07689094543457031, 0.08797836303710938, 0.09906578063964844, 0.1101531982421875, 0.12124061584472656, 0.13232803344726562, 0.1434154510498047, 0.15450286865234375, 0.1655902862548828, 0.17667770385742188, 0.18776512145996094, 0.1988525390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 12.0, 31.0, 67.0, 110.0, 328.0, 1890.0, 1113.0, 253.0, 123.0, 50.0, 37.0, 16.0, 13.0, 8.0, 2.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.107177734375, -0.10473775863647461, -0.10229778289794922, -0.09985780715942383, -0.09741783142089844, -0.09497785568237305, -0.09253787994384766, -0.09009790420532227, -0.08765792846679688, -0.08521795272827148, -0.0827779769897461, -0.0803380012512207, -0.07789802551269531, -0.07545804977416992, -0.07301807403564453, -0.07057809829711914, -0.06813812255859375, -0.06569814682006836, -0.06325817108154297, -0.06081819534301758, -0.05837821960449219, -0.0559382438659668, -0.053498268127441406, -0.051058292388916016, -0.048618316650390625, -0.046178340911865234, -0.043738365173339844, -0.04129838943481445, -0.03885841369628906, -0.03641843795776367, -0.03397846221923828, -0.03153848648071289, -0.0290985107421875, -0.02665853500366211, -0.02421855926513672, -0.021778583526611328, -0.019338607788085938, -0.016898632049560547, -0.014458656311035156, -0.012018680572509766, -0.009578704833984375, -0.007138729095458984, -0.004698753356933594, -0.002258777618408203, 0.0001811981201171875, 0.002621173858642578, 0.005061149597167969, 0.007501125335693359, 0.00994110107421875, 0.01238107681274414, 0.014821052551269531, 0.017261028289794922, 0.019701004028320312, 0.022140979766845703, 0.024580955505371094, 0.027020931243896484, 0.029460906982421875, 0.031900882720947266, 0.034340858459472656, 0.03678083419799805, 0.03922080993652344, 0.04166078567504883, 0.04410076141357422, 0.04654073715209961, 0.048980712890625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 8.0, 14.0, 32.0, 69.0, 161.0, 241.0, 232.0, 138.0, 65.0, 31.0, 13.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2084607481956482, -0.19439680874347687, -0.18033288419246674, -0.1662689447402954, -0.15220502018928528, -0.13814108073711395, -0.12407714873552322, -0.1100132167339325, -0.09594928473234177, -0.08188535273075104, -0.06782142072916031, -0.05375748500227928, -0.03969355300068855, -0.025629617273807526, -0.011565685272216797, 0.002498246729373932, 0.01656217873096466, 0.03062611073255539, 0.04469004273414612, 0.058753978461027145, 0.07281790673732758, 0.0868818461894989, 0.10094577819108963, 0.11500971019268036, 0.12907364964485168, 0.143137589097023, 0.15720151364803314, 0.17126545310020447, 0.1853293776512146, 0.19939331710338593, 0.21345725655555725, 0.22752118110656738, 0.24158510565757751, 0.25564903020858765, 0.26971298456192017, 0.2837769091129303, 0.29784083366394043, 0.31190478801727295, 0.3259687125682831, 0.3400326371192932, 0.35409656167030334, 0.3681604862213135, 0.382224440574646, 0.39628836512565613, 0.41035228967666626, 0.4244162440299988, 0.4384801685810089, 0.45254409313201904, 0.46660804748535156, 0.4806719720363617, 0.4947359263896942, 0.5087998509407043, 0.5228638052940369, 0.5369277000427246, 0.5509916543960571, 0.5650556087493896, 0.5791195034980774, 0.5931834578514099, 0.6072473526000977, 0.6213113069534302, 0.6353752613067627, 0.6494391560554504, 0.663503110408783, 0.6775670051574707, 0.6916309595108032]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 7.0, 5.0, 8.0, 9.0, 14.0, 7.0, 15.0, 17.0, 15.0, 26.0, 24.0, 29.0, 28.0, 35.0, 34.0, 36.0, 48.0, 42.0, 40.0, 38.0, 33.0, 33.0, 39.0, 32.0, 42.0, 30.0, 46.0, 28.0, 35.0, 30.0, 24.0, 25.0, 23.0, 13.0, 19.0, 20.0, 10.0, 11.0, 10.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1454206109046936, -0.14092865586280823, -0.13643671572208405, -0.13194476068019867, -0.1274528205394745, -0.12296086549758911, -0.11846891045570374, -0.11397696286439896, -0.10948501527309418, -0.1049930676817894, -0.10050112009048462, -0.09600916504859924, -0.09151721745729446, -0.08702526986598969, -0.08253331482410431, -0.07804136723279953, -0.07354941964149475, -0.06905747205018997, -0.06456552445888519, -0.06007356941699982, -0.05558162182569504, -0.05108967423439026, -0.04659772291779518, -0.042105771601200104, -0.037613824009895325, -0.033121876418590546, -0.028629925101995468, -0.02413797564804554, -0.01964602619409561, -0.015154076740145683, -0.010662127286195755, -0.0061701759696006775, -0.0016782283782958984, 0.00281372107565403, 0.007305670529603958, 0.011797619983553886, 0.016289569437503815, 0.020781518891453743, 0.02527346834540367, 0.02976541966199875, 0.03425736725330353, 0.03874931484460831, 0.043241266161203384, 0.04773321747779846, 0.05222516506910324, 0.05671711266040802, 0.0612090639770031, 0.06570101529359818, 0.07019296288490295, 0.07468491047620773, 0.07917685806751251, 0.08366881310939789, 0.08816076070070267, 0.09265270829200745, 0.09714466333389282, 0.1016366109251976, 0.10612855851650238, 0.11062050610780716, 0.11511245369911194, 0.11960440874099731, 0.1240963563323021, 0.12858830392360687, 0.13308025896549225, 0.13757219910621643, 0.1420641541481018]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 10.0, 14.0, 24.0, 34.0, 39.0, 85.0, 146.0, 232.0, 400.0, 712.0, 1333.0, 2923.0, 6059.0, 13817.0, 33547.0, 88164.0, 229902.0, 366251.0, 186139.0, 69983.0, 27295.0, 11410.0, 4947.0, 2404.0, 1171.0, 652.0, 355.0, 209.0, 105.0, 84.0, 33.0, 27.0, 15.0, 9.0, 8.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.102294921875, -0.09923076629638672, -0.09616661071777344, -0.09310245513916016, -0.09003829956054688, -0.0869741439819336, -0.08390998840332031, -0.08084583282470703, -0.07778167724609375, -0.07471752166748047, -0.07165336608886719, -0.0685892105102539, -0.06552505493164062, -0.062460899353027344, -0.05939674377441406, -0.05633258819580078, -0.0532684326171875, -0.05020427703857422, -0.04714012145996094, -0.044075965881347656, -0.041011810302734375, -0.037947654724121094, -0.03488349914550781, -0.03181934356689453, -0.02875518798828125, -0.02569103240966797, -0.022626876831054688, -0.019562721252441406, -0.016498565673828125, -0.013434410095214844, -0.010370254516601562, -0.007306098937988281, -0.004241943359375, -0.0011777877807617188, 0.0018863677978515625, 0.004950523376464844, 0.008014678955078125, 0.011078834533691406, 0.014142990112304688, 0.01720714569091797, 0.02027130126953125, 0.02333545684814453, 0.026399612426757812, 0.029463768005371094, 0.032527923583984375, 0.035592079162597656, 0.03865623474121094, 0.04172039031982422, 0.0447845458984375, 0.04784870147705078, 0.05091285705566406, 0.053977012634277344, 0.057041168212890625, 0.060105323791503906, 0.06316947937011719, 0.06623363494873047, 0.06929779052734375, 0.07236194610595703, 0.07542610168457031, 0.0784902572631836, 0.08155441284179688, 0.08461856842041016, 0.08768272399902344, 0.09074687957763672, 0.09381103515625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 6.0, 7.0, 7.0, 8.0, 17.0, 19.0, 12.0, 22.0, 28.0, 42.0, 44.0, 41.0, 48.0, 44.0, 55.0, 50.0, 38.0, 55.0, 57.0, 65.0, 57.0, 44.0, 29.0, 29.0, 26.0, 35.0, 20.0, 23.0, 16.0, 13.0, 9.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0224761962890625, -0.021669626235961914, -0.020863056182861328, -0.020056486129760742, -0.019249916076660156, -0.01844334602355957, -0.017636775970458984, -0.0168302059173584, -0.016023635864257812, -0.015217065811157227, -0.01441049575805664, -0.013603925704956055, -0.012797355651855469, -0.011990785598754883, -0.011184215545654297, -0.010377645492553711, -0.009571075439453125, -0.008764505386352539, -0.007957935333251953, -0.007151365280151367, -0.006344795227050781, -0.005538225173950195, -0.004731655120849609, -0.0039250850677490234, -0.0031185150146484375, -0.0023119449615478516, -0.0015053749084472656, -0.0006988048553466797, 0.00010776519775390625, 0.0009143352508544922, 0.0017209053039550781, 0.002527475357055664, 0.00333404541015625, 0.004140615463256836, 0.004947185516357422, 0.005753755569458008, 0.006560325622558594, 0.00736689567565918, 0.008173465728759766, 0.008980035781860352, 0.009786605834960938, 0.010593175888061523, 0.01139974594116211, 0.012206315994262695, 0.013012886047363281, 0.013819456100463867, 0.014626026153564453, 0.015432596206665039, 0.016239166259765625, 0.01704573631286621, 0.017852306365966797, 0.018658876419067383, 0.01946544647216797, 0.020272016525268555, 0.02107858657836914, 0.021885156631469727, 0.022691726684570312, 0.0234982967376709, 0.024304866790771484, 0.02511143684387207, 0.025918006896972656, 0.026724576950073242, 0.027531147003173828, 0.028337717056274414, 0.029144287109375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 7.0, 7.0, 25.0, 49.0, 65.0, 75.0, 92.0, 112.0, 220.0, 345.0, 542.0, 897.0, 1972.0, 4789.0, 16474.0, 68894.0, 315020.0, 476619.0, 122181.0, 27266.0, 7213.0, 2580.0, 1235.0, 677.0, 403.0, 234.0, 167.0, 116.0, 83.0, 44.0, 44.0, 19.0, 20.0, 20.0, 10.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10650634765625, -0.10243892669677734, -0.09837150573730469, -0.09430408477783203, -0.09023666381835938, -0.08616924285888672, -0.08210182189941406, -0.0780344009399414, -0.07396697998046875, -0.0698995590209961, -0.06583213806152344, -0.06176471710205078, -0.057697296142578125, -0.05362987518310547, -0.04956245422363281, -0.045495033264160156, -0.0414276123046875, -0.037360191345214844, -0.03329277038574219, -0.02922534942626953, -0.025157928466796875, -0.02109050750732422, -0.017023086547851562, -0.012955665588378906, -0.00888824462890625, -0.004820823669433594, -0.0007534027099609375, 0.0033140182495117188, 0.007381439208984375, 0.011448860168457031, 0.015516281127929688, 0.019583702087402344, 0.023651123046875, 0.027718544006347656, 0.03178596496582031, 0.03585338592529297, 0.039920806884765625, 0.04398822784423828, 0.04805564880371094, 0.052123069763183594, 0.05619049072265625, 0.060257911682128906, 0.06432533264160156, 0.06839275360107422, 0.07246017456054688, 0.07652759552001953, 0.08059501647949219, 0.08466243743896484, 0.0887298583984375, 0.09279727935791016, 0.09686470031738281, 0.10093212127685547, 0.10499954223632812, 0.10906696319580078, 0.11313438415527344, 0.1172018051147461, 0.12126922607421875, 0.1253366470336914, 0.12940406799316406, 0.13347148895263672, 0.13753890991210938, 0.14160633087158203, 0.1456737518310547, 0.14974117279052734, 0.15380859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 8.0, 7.0, 11.0, 14.0, 14.0, 13.0, 13.0, 14.0, 19.0, 31.0, 28.0, 40.0, 27.0, 35.0, 42.0, 52.0, 33.0, 52.0, 44.0, 48.0, 39.0, 42.0, 37.0, 43.0, 54.0, 43.0, 27.0, 22.0, 21.0, 21.0, 20.0, 10.0, 20.0, 16.0, 5.0, 8.0, 6.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.089599609375, -0.0863351821899414, -0.08307075500488281, -0.07980632781982422, -0.07654190063476562, -0.07327747344970703, -0.07001304626464844, -0.06674861907958984, -0.06348419189453125, -0.060219764709472656, -0.05695533752441406, -0.05369091033935547, -0.050426483154296875, -0.04716205596923828, -0.04389762878417969, -0.040633201599121094, -0.0373687744140625, -0.034104347229003906, -0.030839920043945312, -0.02757549285888672, -0.024311065673828125, -0.02104663848876953, -0.017782211303710938, -0.014517784118652344, -0.01125335693359375, -0.007988929748535156, -0.0047245025634765625, -0.0014600753784179688, 0.001804351806640625, 0.005068778991699219, 0.008333206176757812, 0.011597633361816406, 0.014862060546875, 0.018126487731933594, 0.021390914916992188, 0.02465534210205078, 0.027919769287109375, 0.03118419647216797, 0.03444862365722656, 0.037713050842285156, 0.04097747802734375, 0.044241905212402344, 0.04750633239746094, 0.05077075958251953, 0.054035186767578125, 0.05729961395263672, 0.06056404113769531, 0.0638284683227539, 0.0670928955078125, 0.0703573226928711, 0.07362174987792969, 0.07688617706298828, 0.08015060424804688, 0.08341503143310547, 0.08667945861816406, 0.08994388580322266, 0.09320831298828125, 0.09647274017333984, 0.09973716735839844, 0.10300159454345703, 0.10626602172851562, 0.10953044891357422, 0.11279487609863281, 0.1160593032836914, 0.11932373046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 11.0, 16.0, 35.0, 34.0, 73.0, 195.0, 459.0, 1340.0, 5019.0, 25110.0, 199132.0, 685038.0, 111106.0, 15962.0, 3349.0, 996.0, 362.0, 148.0, 70.0, 33.0, 23.0, 16.0, 8.0, 3.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.085205078125, -0.082489013671875, -0.07977294921875, -0.077056884765625, -0.0743408203125, -0.071624755859375, -0.06890869140625, -0.066192626953125, -0.0634765625, -0.060760498046875, -0.05804443359375, -0.055328369140625, -0.0526123046875, -0.049896240234375, -0.04718017578125, -0.044464111328125, -0.041748046875, -0.039031982421875, -0.03631591796875, -0.033599853515625, -0.0308837890625, -0.028167724609375, -0.02545166015625, -0.022735595703125, -0.02001953125, -0.017303466796875, -0.01458740234375, -0.011871337890625, -0.0091552734375, -0.006439208984375, -0.00372314453125, -0.001007080078125, 0.001708984375, 0.004425048828125, 0.00714111328125, 0.009857177734375, 0.0125732421875, 0.015289306640625, 0.01800537109375, 0.020721435546875, 0.0234375, 0.026153564453125, 0.02886962890625, 0.031585693359375, 0.0343017578125, 0.037017822265625, 0.03973388671875, 0.042449951171875, 0.045166015625, 0.047882080078125, 0.05059814453125, 0.053314208984375, 0.0560302734375, 0.058746337890625, 0.06146240234375, 0.064178466796875, 0.06689453125, 0.069610595703125, 0.07232666015625, 0.075042724609375, 0.0777587890625, 0.080474853515625, 0.08319091796875, 0.085906982421875, 0.088623046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 13.0, 13.0, 18.0, 31.0, 48.0, 52.0, 76.0, 103.0, 130.0, 146.0, 101.0, 89.0, 61.0, 32.0, 31.0, 21.0, 13.0, 17.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.814168930053711e-05, -7.554329931735992e-05, -7.294490933418274e-05, -7.034651935100555e-05, -6.774812936782837e-05, -6.514973938465118e-05, -6.2551349401474e-05, -5.9952959418296814e-05, -5.735456943511963e-05, -5.4756179451942444e-05, -5.215778946876526e-05, -4.9559399485588074e-05, -4.696100950241089e-05, -4.4362619519233704e-05, -4.176422953605652e-05, -3.9165839552879333e-05, -3.656744956970215e-05, -3.396905958652496e-05, -3.137066960334778e-05, -2.8772279620170593e-05, -2.6173889636993408e-05, -2.3575499653816223e-05, -2.0977109670639038e-05, -1.8378719687461853e-05, -1.5780329704284668e-05, -1.3181939721107483e-05, -1.0583549737930298e-05, -7.985159754753113e-06, -5.386769771575928e-06, -2.7883797883987427e-06, -1.8998980522155762e-07, 2.4084001779556274e-06, 5.0067901611328125e-06, 7.6051801443099976e-06, 1.0203570127487183e-05, 1.2801960110664368e-05, 1.5400350093841553e-05, 1.7998740077018738e-05, 2.0597130060195923e-05, 2.3195520043373108e-05, 2.5793910026550293e-05, 2.8392300009727478e-05, 3.099068999290466e-05, 3.358907997608185e-05, 3.618746995925903e-05, 3.878585994243622e-05, 4.13842499256134e-05, 4.398263990879059e-05, 4.6581029891967773e-05, 4.917941987514496e-05, 5.1777809858322144e-05, 5.437619984149933e-05, 5.6974589824676514e-05, 5.95729798078537e-05, 6.217136979103088e-05, 6.476975977420807e-05, 6.736814975738525e-05, 6.996653974056244e-05, 7.256492972373962e-05, 7.516331970691681e-05, 7.7761709690094e-05, 8.036009967327118e-05, 8.295848965644836e-05, 8.555687963962555e-05, 8.815526962280273e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 6.0, 8.0, 9.0, 15.0, 12.0, 32.0, 45.0, 52.0, 74.0, 120.0, 187.0, 362.0, 659.0, 1309.0, 2793.0, 8148.0, 30201.0, 164490.0, 615813.0, 178234.0, 31843.0, 8223.0, 3007.0, 1299.0, 618.0, 381.0, 207.0, 118.0, 95.0, 51.0, 32.0, 18.0, 21.0, 19.0, 12.0, 5.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048858642578125, -0.04694414138793945, -0.045029640197753906, -0.04311513900756836, -0.04120063781738281, -0.039286136627197266, -0.03737163543701172, -0.03545713424682617, -0.033542633056640625, -0.03162813186645508, -0.02971363067626953, -0.027799129486083984, -0.025884628295898438, -0.02397012710571289, -0.022055625915527344, -0.020141124725341797, -0.01822662353515625, -0.016312122344970703, -0.014397621154785156, -0.01248311996459961, -0.010568618774414062, -0.008654117584228516, -0.006739616394042969, -0.004825115203857422, -0.002910614013671875, -0.0009961128234863281, 0.0009183883666992188, 0.0028328895568847656, 0.0047473907470703125, 0.006661891937255859, 0.008576393127441406, 0.010490894317626953, 0.0124053955078125, 0.014319896697998047, 0.016234397888183594, 0.01814889907836914, 0.020063400268554688, 0.021977901458740234, 0.02389240264892578, 0.025806903839111328, 0.027721405029296875, 0.029635906219482422, 0.03155040740966797, 0.033464908599853516, 0.03537940979003906, 0.03729391098022461, 0.039208412170410156, 0.0411229133605957, 0.04303741455078125, 0.0449519157409668, 0.046866416931152344, 0.04878091812133789, 0.05069541931152344, 0.052609920501708984, 0.05452442169189453, 0.05643892288208008, 0.058353424072265625, 0.06026792526245117, 0.06218242645263672, 0.06409692764282227, 0.06601142883300781, 0.06792593002319336, 0.0698404312133789, 0.07175493240356445, 0.07366943359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 8.0, 5.0, 8.0, 11.0, 19.0, 16.0, 25.0, 41.0, 44.0, 61.0, 65.0, 80.0, 97.0, 85.0, 90.0, 79.0, 55.0, 40.0, 48.0, 33.0, 23.0, 17.0, 12.0, 9.0, 7.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.038116455078125, -0.03685426712036133, -0.035592079162597656, -0.034329891204833984, -0.03306770324707031, -0.03180551528930664, -0.03054332733154297, -0.029281139373779297, -0.028018951416015625, -0.026756763458251953, -0.02549457550048828, -0.02423238754272461, -0.022970199584960938, -0.021708011627197266, -0.020445823669433594, -0.019183635711669922, -0.01792144775390625, -0.016659259796142578, -0.015397071838378906, -0.014134883880615234, -0.012872695922851562, -0.01161050796508789, -0.010348320007324219, -0.009086132049560547, -0.007823944091796875, -0.006561756134033203, -0.005299568176269531, -0.004037380218505859, -0.0027751922607421875, -0.0015130043029785156, -0.00025081634521484375, 0.0010113716125488281, 0.0022735595703125, 0.003535747528076172, 0.004797935485839844, 0.006060123443603516, 0.0073223114013671875, 0.00858449935913086, 0.009846687316894531, 0.011108875274658203, 0.012371063232421875, 0.013633251190185547, 0.014895439147949219, 0.01615762710571289, 0.017419815063476562, 0.018682003021240234, 0.019944190979003906, 0.021206378936767578, 0.02246856689453125, 0.023730754852294922, 0.024992942810058594, 0.026255130767822266, 0.027517318725585938, 0.02877950668334961, 0.03004169464111328, 0.03130388259887695, 0.032566070556640625, 0.0338282585144043, 0.03509044647216797, 0.03635263442993164, 0.03761482238769531, 0.038877010345458984, 0.040139198303222656, 0.04140138626098633, 0.04266357421875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 13.0, 29.0, 67.0, 109.0, 170.0, 202.0, 181.0, 121.0, 60.0, 27.0, 13.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740830421447754, -0.3383066654205322, -0.3025302588939667, -0.2667538821697235, -0.23097749054431915, -0.1952010989189148, -0.15942472219467163, -0.12364831566810608, -0.08787193894386292, -0.052095551043748856, -0.016319163143634796, 0.019457221031188965, 0.05523361265659332, 0.09101000428199768, 0.12678638100624084, 0.1625627875328064, 0.19833916425704956, 0.23411555588245392, 0.2698919475078583, 0.30566832423210144, 0.341444730758667, 0.37722110748291016, 0.4129974842071533, 0.44877389073371887, 0.48455026745796204, 0.5203266739845276, 0.5561030507087708, 0.5918794274330139, 0.6276558041572571, 0.663432240486145, 0.6992086172103882, 0.7349849939346313, 0.7707613706588745, 0.8065377473831177, 0.8423141241073608, 0.878090500831604, 0.9138669371604919, 0.9496433138847351, 0.9854196906089783, 1.0211961269378662, 1.0569725036621094, 1.0927488803863525, 1.1285252571105957, 1.1643016338348389, 1.200078010559082, 1.2358543872833252, 1.2716307640075684, 1.307407259941101, 1.3431835174560547, 1.3789598941802979, 1.414736270904541, 1.4505126476287842, 1.4862890243530273, 1.5220654010772705, 1.5578417778015137, 1.5936182737350464, 1.6293946504592896, 1.6651710271835327, 1.7009474039077759, 1.736723780632019, 1.7725001573562622, 1.808276653289795, 1.844053030014038, 1.8798294067382812, 1.9156057834625244]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 5.0, 5.0, 5.0, 10.0, 14.0, 12.0, 20.0, 20.0, 18.0, 34.0, 25.0, 33.0, 32.0, 35.0, 42.0, 38.0, 47.0, 43.0, 45.0, 46.0, 55.0, 41.0, 40.0, 47.0, 38.0, 30.0, 29.0, 24.0, 23.0, 31.0, 22.0, 16.0, 12.0, 11.0, 9.0, 13.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5758402347564697, -0.5574343800544739, -0.5390284657478333, -0.5206226110458374, -0.5022166967391968, -0.4838108420372009, -0.4654049575328827, -0.44699907302856445, -0.4285931885242462, -0.410187304019928, -0.39178141951560974, -0.3733755350112915, -0.35496968030929565, -0.33656376600265503, -0.3181579113006592, -0.29975202679634094, -0.2813461422920227, -0.26294025778770447, -0.24453437328338623, -0.2261285036802292, -0.20772261917591095, -0.1893167346715927, -0.17091086506843567, -0.15250498056411743, -0.1340990960597992, -0.11569321155548096, -0.09728733450174332, -0.07888145744800568, -0.06047557294368744, -0.0420696884393692, -0.02366381138563156, -0.005257934331893921, 0.013148009777069092, 0.03155389055609703, 0.04995977133512497, 0.06836564838886261, 0.08677153289318085, 0.10517741739749908, 0.12358329445123672, 0.14198917150497437, 0.1603950560092926, 0.17880094051361084, 0.19720682501792908, 0.21561269462108612, 0.23401857912540436, 0.2524244785308838, 0.27083033323287964, 0.2892362177371979, 0.3076421022415161, 0.32604798674583435, 0.3444538712501526, 0.3628597557544708, 0.38126564025878906, 0.3996714949607849, 0.41807737946510315, 0.4364832639694214, 0.4548891484737396, 0.47329503297805786, 0.4917009174823761, 0.5101068019866943, 0.5285126566886902, 0.5469185709953308, 0.5653244256973267, 0.5837303400039673, 0.6021361947059631]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 8.0, 8.0, 14.0, 26.0, 27.0, 35.0, 68.0, 68.0, 132.0, 205.0, 356.0, 543.0, 845.0, 1569.0, 2896.0, 5814.0, 13914.0, 39427.0, 170138.0, 3232404.0, 603934.0, 79945.0, 23270.0, 9081.0, 4316.0, 2251.0, 1193.0, 653.0, 411.0, 244.0, 159.0, 117.0, 57.0, 44.0, 32.0, 19.0, 17.0, 14.0, 7.0, 9.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1297607421875, -0.12602901458740234, -0.12229728698730469, -0.11856555938720703, -0.11483383178710938, -0.11110210418701172, -0.10737037658691406, -0.1036386489868164, -0.09990692138671875, -0.0961751937866211, -0.09244346618652344, -0.08871173858642578, -0.08498001098632812, -0.08124828338623047, -0.07751655578613281, -0.07378482818603516, -0.0700531005859375, -0.06632137298583984, -0.06258964538574219, -0.05885791778564453, -0.055126190185546875, -0.05139446258544922, -0.04766273498535156, -0.043931007385253906, -0.04019927978515625, -0.036467552185058594, -0.03273582458496094, -0.02900409698486328, -0.025272369384765625, -0.02154064178466797, -0.017808914184570312, -0.014077186584472656, -0.010345458984375, -0.006613731384277344, -0.0028820037841796875, 0.0008497238159179688, 0.004581451416015625, 0.008313179016113281, 0.012044906616210938, 0.015776634216308594, 0.01950836181640625, 0.023240089416503906, 0.026971817016601562, 0.03070354461669922, 0.034435272216796875, 0.03816699981689453, 0.04189872741699219, 0.045630455017089844, 0.0493621826171875, 0.053093910217285156, 0.05682563781738281, 0.06055736541748047, 0.06428909301757812, 0.06802082061767578, 0.07175254821777344, 0.0754842758178711, 0.07921600341796875, 0.0829477310180664, 0.08667945861816406, 0.09041118621826172, 0.09414291381835938, 0.09787464141845703, 0.10160636901855469, 0.10533809661865234, 0.10906982421875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 10.0, 7.0, 11.0, 13.0, 11.0, 11.0, 20.0, 27.0, 26.0, 35.0, 39.0, 47.0, 40.0, 46.0, 43.0, 52.0, 35.0, 50.0, 63.0, 37.0, 72.0, 38.0, 38.0, 44.0, 29.0, 25.0, 22.0, 16.0, 26.0, 10.0, 9.0, 10.0, 11.0, 4.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.020782470703125, -0.020015954971313477, -0.019249439239501953, -0.01848292350769043, -0.017716407775878906, -0.016949892044067383, -0.01618337631225586, -0.015416860580444336, -0.014650344848632812, -0.013883829116821289, -0.013117313385009766, -0.012350797653198242, -0.011584281921386719, -0.010817766189575195, -0.010051250457763672, -0.009284734725952148, -0.008518218994140625, -0.0077517032623291016, -0.006985187530517578, -0.006218671798706055, -0.005452156066894531, -0.004685640335083008, -0.003919124603271484, -0.003152608871459961, -0.0023860931396484375, -0.001619577407836914, -0.0008530616760253906, -8.654594421386719e-05, 0.0006799697875976562, 0.0014464855194091797, 0.002213001251220703, 0.0029795169830322266, 0.00374603271484375, 0.0045125484466552734, 0.005279064178466797, 0.00604557991027832, 0.006812095642089844, 0.007578611373901367, 0.00834512710571289, 0.009111642837524414, 0.009878158569335938, 0.010644674301147461, 0.011411190032958984, 0.012177705764770508, 0.012944221496582031, 0.013710737228393555, 0.014477252960205078, 0.015243768692016602, 0.016010284423828125, 0.01677680015563965, 0.017543315887451172, 0.018309831619262695, 0.01907634735107422, 0.019842863082885742, 0.020609378814697266, 0.02137589454650879, 0.022142410278320312, 0.022908926010131836, 0.02367544174194336, 0.024441957473754883, 0.025208473205566406, 0.02597498893737793, 0.026741504669189453, 0.027508020401000977, 0.0282745361328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 9.0, 12.0, 14.0, 21.0, 45.0, 83.0, 118.0, 219.0, 603.0, 2507.0, 21351.0, 1492518.0, 2647651.0, 25087.0, 2894.0, 643.0, 260.0, 102.0, 58.0, 38.0, 23.0, 15.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.423583984375, -0.41396331787109375, -0.4043426513671875, -0.39472198486328125, -0.385101318359375, -0.37548065185546875, -0.3658599853515625, -0.35623931884765625, -0.34661865234375, -0.33699798583984375, -0.3273773193359375, -0.31775665283203125, -0.308135986328125, -0.29851531982421875, -0.2888946533203125, -0.27927398681640625, -0.2696533203125, -0.26003265380859375, -0.2504119873046875, -0.24079132080078125, -0.231170654296875, -0.22154998779296875, -0.2119293212890625, -0.20230865478515625, -0.19268798828125, -0.18306732177734375, -0.1734466552734375, -0.16382598876953125, -0.154205322265625, -0.14458465576171875, -0.1349639892578125, -0.12534332275390625, -0.11572265625, -0.10610198974609375, -0.0964813232421875, -0.08686065673828125, -0.077239990234375, -0.06761932373046875, -0.0579986572265625, -0.04837799072265625, -0.03875732421875, -0.02913665771484375, -0.0195159912109375, -0.00989532470703125, -0.000274658203125, 0.00934600830078125, 0.0189666748046875, 0.02858734130859375, 0.0382080078125, 0.04782867431640625, 0.0574493408203125, 0.06707000732421875, 0.076690673828125, 0.08631134033203125, 0.0959320068359375, 0.10555267333984375, 0.11517333984375, 0.12479400634765625, 0.1344146728515625, 0.14403533935546875, 0.153656005859375, 0.16327667236328125, 0.1728973388671875, 0.18251800537109375, 0.192138671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 11.0, 39.0, 38.0, 72.0, 117.0, 299.0, 678.0, 1764.0, 548.0, 231.0, 111.0, 59.0, 30.0, 22.0, 15.0, 17.0, 5.0, 4.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1043701171875, -0.10172557830810547, -0.09908103942871094, -0.0964365005493164, -0.09379196166992188, -0.09114742279052734, -0.08850288391113281, -0.08585834503173828, -0.08321380615234375, -0.08056926727294922, -0.07792472839355469, -0.07528018951416016, -0.07263565063476562, -0.0699911117553711, -0.06734657287597656, -0.06470203399658203, -0.0620574951171875, -0.05941295623779297, -0.05676841735839844, -0.054123878479003906, -0.051479339599609375, -0.048834800720214844, -0.04619026184082031, -0.04354572296142578, -0.04090118408203125, -0.03825664520263672, -0.03561210632324219, -0.032967567443847656, -0.030323028564453125, -0.027678489685058594, -0.025033950805664062, -0.02238941192626953, -0.019744873046875, -0.01710033416748047, -0.014455795288085938, -0.011811256408691406, -0.009166717529296875, -0.006522178649902344, -0.0038776397705078125, -0.0012331008911132812, 0.00141143798828125, 0.004055976867675781, 0.0067005157470703125, 0.009345054626464844, 0.011989593505859375, 0.014634132385253906, 0.017278671264648438, 0.01992321014404297, 0.0225677490234375, 0.02521228790283203, 0.027856826782226562, 0.030501365661621094, 0.033145904541015625, 0.035790443420410156, 0.03843498229980469, 0.04107952117919922, 0.04372406005859375, 0.04636859893798828, 0.04901313781738281, 0.051657676696777344, 0.054302215576171875, 0.056946754455566406, 0.05959129333496094, 0.06223583221435547, 0.06488037109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 34.0, 55.0, 113.0, 167.0, 191.0, 184.0, 123.0, 61.0, 32.0, 18.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.887373685836792, -0.8696142435073853, -0.8518548607826233, -0.8340954780578613, -0.8163360357284546, -0.7985765933990479, -0.7808172106742859, -0.7630578279495239, -0.7452983856201172, -0.7275389432907104, -0.7097795605659485, -0.6920201778411865, -0.6742607355117798, -0.656501293182373, -0.6387419104576111, -0.6209825277328491, -0.6032230854034424, -0.5854636430740356, -0.5677042603492737, -0.5499448776245117, -0.532185435295105, -0.5144259929656982, -0.4966666102409363, -0.47890719771385193, -0.4611477851867676, -0.4433883726596832, -0.4256289601325989, -0.4078695476055145, -0.3901101350784302, -0.3723507225513458, -0.3545913100242615, -0.3368318974971771, -0.319072425365448, -0.30131301283836365, -0.2835536003112793, -0.26579418778419495, -0.2480347752571106, -0.23027536273002625, -0.2125159502029419, -0.19475653767585754, -0.1769971251487732, -0.15923771262168884, -0.1414783000946045, -0.12371888756752014, -0.10595947504043579, -0.08820006251335144, -0.07044064998626709, -0.05268123745918274, -0.03492182493209839, -0.017162412405014038, 0.0005970001220703125, 0.018356412649154663, 0.036115825176239014, 0.053875237703323364, 0.07163465023040771, 0.08939406275749207, 0.10715347528457642, 0.12491288781166077, 0.14267230033874512, 0.16043171286582947, 0.17819112539291382, 0.19595053791999817, 0.21370995044708252, 0.23146936297416687, 0.24922877550125122]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 7.0, 11.0, 16.0, 20.0, 26.0, 19.0, 27.0, 36.0, 31.0, 36.0, 39.0, 50.0, 43.0, 57.0, 55.0, 60.0, 55.0, 51.0, 45.0, 48.0, 38.0, 44.0, 36.0, 31.0, 26.0, 21.0, 20.0, 8.0, 12.0, 15.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.33886516094207764, -0.3301357924938202, -0.32140642404556274, -0.3126770555973053, -0.30394768714904785, -0.295218288898468, -0.28648892045021057, -0.2777595520019531, -0.2690301835536957, -0.26030081510543823, -0.2515714466571808, -0.24284206330776215, -0.2341126948595047, -0.22538332641124725, -0.2166539430618286, -0.20792457461357117, -0.19919520616531372, -0.19046583771705627, -0.18173646926879883, -0.1730070859193802, -0.16427771747112274, -0.1555483490228653, -0.14681896567344666, -0.1380895972251892, -0.12936022877693176, -0.12063086032867432, -0.11190148442983627, -0.10317210853099823, -0.09444274008274078, -0.08571337163448334, -0.0769839957356453, -0.06825461983680725, -0.059525251388549805, -0.05079587921500206, -0.042066507041454315, -0.03333713486790657, -0.024607762694358826, -0.01587839052081108, -0.007149018347263336, 0.0015803538262844086, 0.010309725999832153, 0.019039098173379898, 0.027768470346927643, 0.03649784252047539, 0.04522721469402313, 0.05395658686757088, 0.06268595904111862, 0.07141533493995667, 0.08014470338821411, 0.08887407183647156, 0.0976034477353096, 0.10633282363414764, 0.11506219208240509, 0.12379156053066254, 0.13252094388008118, 0.14125031232833862, 0.14997968077659607, 0.15870904922485352, 0.16743841767311096, 0.1761678010225296, 0.18489716947078705, 0.1936265379190445, 0.20235592126846313, 0.21108528971672058, 0.21981465816497803]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 12.0, 13.0, 20.0, 28.0, 42.0, 63.0, 143.0, 218.0, 455.0, 1057.0, 3155.0, 9534.0, 33429.0, 134208.0, 532904.0, 251313.0, 58331.0, 15764.0, 4794.0, 1723.0, 682.0, 283.0, 157.0, 79.0, 47.0, 30.0, 25.0, 14.0, 11.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.1582469940185547, -0.15291976928710938, -0.14759254455566406, -0.14226531982421875, -0.13693809509277344, -0.13161087036132812, -0.1262836456298828, -0.1209564208984375, -0.11562919616699219, -0.11030197143554688, -0.10497474670410156, -0.09964752197265625, -0.09432029724121094, -0.08899307250976562, -0.08366584777832031, -0.078338623046875, -0.07301139831542969, -0.06768417358398438, -0.06235694885253906, -0.05702972412109375, -0.05170249938964844, -0.046375274658203125, -0.04104804992675781, -0.0357208251953125, -0.030393600463867188, -0.025066375732421875, -0.019739151000976562, -0.01441192626953125, -0.009084701538085938, -0.003757476806640625, 0.0015697479248046875, 0.00689697265625, 0.012224197387695312, 0.017551422119140625, 0.022878646850585938, 0.02820587158203125, 0.03353309631347656, 0.038860321044921875, 0.04418754577636719, 0.0495147705078125, 0.05484199523925781, 0.060169219970703125, 0.06549644470214844, 0.07082366943359375, 0.07615089416503906, 0.08147811889648438, 0.08680534362792969, 0.092132568359375, 0.09745979309082031, 0.10278701782226562, 0.10811424255371094, 0.11344146728515625, 0.11876869201660156, 0.12409591674804688, 0.1294231414794922, 0.1347503662109375, 0.1400775909423828, 0.14540481567382812, 0.15073204040527344, 0.15605926513671875, 0.16138648986816406, 0.16671371459960938, 0.1720409393310547, 0.1773681640625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 1.0, 3.0, 5.0, 9.0, 9.0, 9.0, 21.0, 19.0, 24.0, 21.0, 31.0, 32.0, 32.0, 41.0, 42.0, 45.0, 64.0, 37.0, 50.0, 52.0, 57.0, 35.0, 43.0, 36.0, 42.0, 43.0, 29.0, 36.0, 29.0, 14.0, 20.0, 13.0, 13.0, 12.0, 10.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.022735595703125, -0.021979808807373047, -0.021224021911621094, -0.02046823501586914, -0.019712448120117188, -0.018956661224365234, -0.01820087432861328, -0.017445087432861328, -0.016689300537109375, -0.015933513641357422, -0.015177726745605469, -0.014421939849853516, -0.013666152954101562, -0.01291036605834961, -0.012154579162597656, -0.011398792266845703, -0.01064300537109375, -0.009887218475341797, -0.009131431579589844, -0.00837564468383789, -0.0076198577880859375, -0.006864070892333984, -0.006108283996582031, -0.005352497100830078, -0.004596710205078125, -0.003840923309326172, -0.0030851364135742188, -0.0023293495178222656, -0.0015735626220703125, -0.0008177757263183594, -6.198883056640625e-05, 0.0006937980651855469, 0.0014495849609375, 0.002205371856689453, 0.0029611587524414062, 0.0037169456481933594, 0.0044727325439453125, 0.005228519439697266, 0.005984306335449219, 0.006740093231201172, 0.007495880126953125, 0.008251667022705078, 0.009007453918457031, 0.009763240814208984, 0.010519027709960938, 0.01127481460571289, 0.012030601501464844, 0.012786388397216797, 0.01354217529296875, 0.014297962188720703, 0.015053749084472656, 0.01580953598022461, 0.016565322875976562, 0.017321109771728516, 0.01807689666748047, 0.018832683563232422, 0.019588470458984375, 0.020344257354736328, 0.02110004425048828, 0.021855831146240234, 0.022611618041992188, 0.02336740493774414, 0.024123191833496094, 0.024878978729248047, 0.025634765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 12.0, 9.0, 13.0, 19.0, 36.0, 49.0, 79.0, 143.0, 204.0, 393.0, 663.0, 1198.0, 2698.0, 7775.0, 30163.0, 160099.0, 600739.0, 194326.0, 35498.0, 8427.0, 2953.0, 1334.0, 723.0, 399.0, 222.0, 132.0, 83.0, 42.0, 31.0, 26.0, 19.0, 12.0, 11.0, 6.0, 4.0, 2.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1611328125, -0.15618324279785156, -0.15123367309570312, -0.1462841033935547, -0.14133453369140625, -0.1363849639892578, -0.13143539428710938, -0.12648582458496094, -0.1215362548828125, -0.11658668518066406, -0.11163711547851562, -0.10668754577636719, -0.10173797607421875, -0.09678840637207031, -0.09183883666992188, -0.08688926696777344, -0.081939697265625, -0.07699012756347656, -0.07204055786132812, -0.06709098815917969, -0.06214141845703125, -0.05719184875488281, -0.052242279052734375, -0.04729270935058594, -0.0423431396484375, -0.03739356994628906, -0.032444000244140625, -0.027494430541992188, -0.02254486083984375, -0.017595291137695312, -0.012645721435546875, -0.0076961517333984375, -0.00274658203125, 0.0022029876708984375, 0.007152557373046875, 0.012102127075195312, 0.01705169677734375, 0.022001266479492188, 0.026950836181640625, 0.03190040588378906, 0.0368499755859375, 0.04179954528808594, 0.046749114990234375, 0.05169868469238281, 0.05664825439453125, 0.06159782409667969, 0.06654739379882812, 0.07149696350097656, 0.076446533203125, 0.08139610290527344, 0.08634567260742188, 0.09129524230957031, 0.09624481201171875, 0.10119438171386719, 0.10614395141601562, 0.11109352111816406, 0.1160430908203125, 0.12099266052246094, 0.12594223022460938, 0.1308917999267578, 0.13584136962890625, 0.1407909393310547, 0.14574050903320312, 0.15069007873535156, 0.1556396484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 5.0, 8.0, 7.0, 12.0, 19.0, 25.0, 27.0, 34.0, 44.0, 53.0, 59.0, 57.0, 60.0, 50.0, 65.0, 64.0, 74.0, 44.0, 36.0, 49.0, 57.0, 35.0, 27.0, 18.0, 15.0, 14.0, 14.0, 9.0, 6.0, 8.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1534423828125, -0.14836692810058594, -0.14329147338867188, -0.1382160186767578, -0.13314056396484375, -0.1280651092529297, -0.12298965454101562, -0.11791419982910156, -0.1128387451171875, -0.10776329040527344, -0.10268783569335938, -0.09761238098144531, -0.09253692626953125, -0.08746147155761719, -0.08238601684570312, -0.07731056213378906, -0.072235107421875, -0.06715965270996094, -0.062084197998046875, -0.05700874328613281, -0.05193328857421875, -0.04685783386230469, -0.041782379150390625, -0.03670692443847656, -0.0316314697265625, -0.026556015014648438, -0.021480560302734375, -0.016405105590820312, -0.01132965087890625, -0.0062541961669921875, -0.001178741455078125, 0.0038967132568359375, 0.00897216796875, 0.014047622680664062, 0.019123077392578125, 0.024198532104492188, 0.02927398681640625, 0.03434944152832031, 0.039424896240234375, 0.04450035095214844, 0.0495758056640625, 0.05465126037597656, 0.059726715087890625, 0.06480216979980469, 0.06987762451171875, 0.07495307922363281, 0.08002853393554688, 0.08510398864746094, 0.090179443359375, 0.09525489807128906, 0.10033035278320312, 0.10540580749511719, 0.11048126220703125, 0.11555671691894531, 0.12063217163085938, 0.12570762634277344, 0.1307830810546875, 0.13585853576660156, 0.14093399047851562, 0.1460094451904297, 0.15108489990234375, 0.1561603546142578, 0.16123580932617188, 0.16631126403808594, 0.17138671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 8.0, 15.0, 12.0, 24.0, 43.0, 54.0, 86.0, 129.0, 200.0, 302.0, 549.0, 1008.0, 2048.0, 4927.0, 15675.0, 84839.0, 700337.0, 199235.0, 26005.0, 7247.0, 2726.0, 1306.0, 660.0, 404.0, 216.0, 144.0, 100.0, 67.0, 60.0, 28.0, 24.0, 23.0, 13.0, 11.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.088623046875, -0.08488082885742188, -0.08113861083984375, -0.07739639282226562, -0.0736541748046875, -0.06991195678710938, -0.06616973876953125, -0.062427520751953125, -0.058685302734375, -0.054943084716796875, -0.05120086669921875, -0.047458648681640625, -0.0437164306640625, -0.039974212646484375, -0.03623199462890625, -0.032489776611328125, -0.02874755859375, -0.025005340576171875, -0.02126312255859375, -0.017520904541015625, -0.0137786865234375, -0.010036468505859375, -0.00629425048828125, -0.002552032470703125, 0.001190185546875, 0.004932403564453125, 0.00867462158203125, 0.012416839599609375, 0.0161590576171875, 0.019901275634765625, 0.02364349365234375, 0.027385711669921875, 0.0311279296875, 0.034870147705078125, 0.03861236572265625, 0.042354583740234375, 0.0460968017578125, 0.049839019775390625, 0.05358123779296875, 0.057323455810546875, 0.061065673828125, 0.06480789184570312, 0.06855010986328125, 0.07229232788085938, 0.0760345458984375, 0.07977676391601562, 0.08351898193359375, 0.08726119995117188, 0.09100341796875, 0.09474563598632812, 0.09848785400390625, 0.10223007202148438, 0.1059722900390625, 0.10971450805664062, 0.11345672607421875, 0.11719894409179688, 0.120941162109375, 0.12468338012695312, 0.12842559814453125, 0.13216781616210938, 0.1359100341796875, 0.13965225219726562, 0.14339447021484375, 0.14713668823242188, 0.15087890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 11.0, 8.0, 7.0, 16.0, 11.0, 12.0, 25.0, 31.0, 41.0, 60.0, 67.0, 74.0, 87.0, 65.0, 72.0, 68.0, 68.0, 64.0, 47.0, 37.0, 32.0, 19.0, 16.0, 15.0, 10.0, 5.0, 9.0, 3.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.319450378417969e-05, -7.109809666872025e-05, -6.90016895532608e-05, -6.690528243780136e-05, -6.480887532234192e-05, -6.271246820688248e-05, -6.0616061091423035e-05, -5.851965397596359e-05, -5.642324686050415e-05, -5.432683974504471e-05, -5.2230432629585266e-05, -5.0134025514125824e-05, -4.803761839866638e-05, -4.594121128320694e-05, -4.38448041677475e-05, -4.1748397052288055e-05, -3.965198993682861e-05, -3.755558282136917e-05, -3.545917570590973e-05, -3.336276859045029e-05, -3.1266361474990845e-05, -2.9169954359531403e-05, -2.707354724407196e-05, -2.497714012861252e-05, -2.2880733013153076e-05, -2.0784325897693634e-05, -1.8687918782234192e-05, -1.659151166677475e-05, -1.4495104551315308e-05, -1.2398697435855865e-05, -1.0302290320396423e-05, -8.205883204936981e-06, -6.109476089477539e-06, -4.013068974018097e-06, -1.9166618585586548e-06, 1.7974525690078735e-07, 2.2761523723602295e-06, 4.372559487819672e-06, 6.468966603279114e-06, 8.565373718738556e-06, 1.0661780834197998e-05, 1.275818794965744e-05, 1.4854595065116882e-05, 1.6951002180576324e-05, 1.9047409296035767e-05, 2.114381641149521e-05, 2.324022352695465e-05, 2.5336630642414093e-05, 2.7433037757873535e-05, 2.9529444873332977e-05, 3.162585198879242e-05, 3.372225910425186e-05, 3.5818666219711304e-05, 3.7915073335170746e-05, 4.001148045063019e-05, 4.210788756608963e-05, 4.420429468154907e-05, 4.6300701797008514e-05, 4.8397108912467957e-05, 5.04935160279274e-05, 5.258992314338684e-05, 5.468633025884628e-05, 5.6782737374305725e-05, 5.887914448976517e-05, 6.097555160522461e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 6.0, 3.0, 7.0, 3.0, 11.0, 11.0, 14.0, 30.0, 26.0, 48.0, 84.0, 131.0, 214.0, 330.0, 658.0, 1352.0, 3177.0, 8565.0, 33503.0, 361351.0, 573787.0, 47590.0, 10603.0, 3760.0, 1535.0, 719.0, 403.0, 211.0, 143.0, 95.0, 57.0, 39.0, 23.0, 17.0, 8.0, 14.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11639404296875, -0.11287689208984375, -0.1093597412109375, -0.10584259033203125, -0.102325439453125, -0.09880828857421875, -0.0952911376953125, -0.09177398681640625, -0.0882568359375, -0.08473968505859375, -0.0812225341796875, -0.07770538330078125, -0.074188232421875, -0.07067108154296875, -0.0671539306640625, -0.06363677978515625, -0.06011962890625, -0.05660247802734375, -0.0530853271484375, -0.04956817626953125, -0.046051025390625, -0.04253387451171875, -0.0390167236328125, -0.03549957275390625, -0.031982421875, -0.02846527099609375, -0.0249481201171875, -0.02143096923828125, -0.017913818359375, -0.01439666748046875, -0.0108795166015625, -0.00736236572265625, -0.00384521484375, -0.00032806396484375, 0.0031890869140625, 0.00670623779296875, 0.010223388671875, 0.01374053955078125, 0.0172576904296875, 0.02077484130859375, 0.0242919921875, 0.02780914306640625, 0.0313262939453125, 0.03484344482421875, 0.038360595703125, 0.04187774658203125, 0.0453948974609375, 0.04891204833984375, 0.05242919921875, 0.05594635009765625, 0.0594635009765625, 0.06298065185546875, 0.066497802734375, 0.07001495361328125, 0.0735321044921875, 0.07704925537109375, 0.08056640625, 0.08408355712890625, 0.0876007080078125, 0.09111785888671875, 0.094635009765625, 0.09815216064453125, 0.1016693115234375, 0.10518646240234375, 0.10870361328125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 11.0, 6.0, 19.0, 27.0, 25.0, 66.0, 67.0, 121.0, 173.0, 146.0, 94.0, 71.0, 45.0, 29.0, 28.0, 17.0, 13.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08807373046875, -0.085479736328125, -0.0828857421875, -0.080291748046875, -0.07769775390625, -0.075103759765625, -0.072509765625, -0.069915771484375, -0.06732177734375, -0.064727783203125, -0.0621337890625, -0.059539794921875, -0.05694580078125, -0.054351806640625, -0.0517578125, -0.049163818359375, -0.04656982421875, -0.043975830078125, -0.0413818359375, -0.038787841796875, -0.03619384765625, -0.033599853515625, -0.031005859375, -0.028411865234375, -0.02581787109375, -0.023223876953125, -0.0206298828125, -0.018035888671875, -0.01544189453125, -0.012847900390625, -0.01025390625, -0.007659912109375, -0.00506591796875, -0.002471923828125, 0.0001220703125, 0.002716064453125, 0.00531005859375, 0.007904052734375, 0.010498046875, 0.013092041015625, 0.01568603515625, 0.018280029296875, 0.0208740234375, 0.023468017578125, 0.02606201171875, 0.028656005859375, 0.03125, 0.033843994140625, 0.03643798828125, 0.039031982421875, 0.0416259765625, 0.044219970703125, 0.04681396484375, 0.049407958984375, 0.052001953125, 0.054595947265625, 0.05718994140625, 0.059783935546875, 0.0623779296875, 0.064971923828125, 0.06756591796875, 0.070159912109375, 0.07275390625, 0.075347900390625, 0.07794189453125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 13.0, 25.0, 64.0, 111.0, 207.0, 193.0, 175.0, 94.0, 62.0, 28.0, 13.0, 8.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2362054586410522, -1.1895357370376587, -1.1428661346435547, -1.0961964130401611, -1.0495268106460571, -1.0028570890426636, -0.9561874270439148, -0.909517765045166, -0.8628481030464172, -0.8161784410476685, -0.7695087790489197, -0.7228391170501709, -0.6761693954467773, -0.6294997930526733, -0.5828300714492798, -0.536160409450531, -0.4894907474517822, -0.44282108545303345, -0.39615142345428467, -0.3494817316532135, -0.3028120696544647, -0.25614240765571594, -0.20947271585464478, -0.162803053855896, -0.11613339185714722, -0.06946372240781784, -0.022794052958488464, 0.02387562394142151, 0.07054528594017029, 0.11721494793891907, 0.16388463973999023, 0.210554301738739, 0.2572239637374878, 0.3038936257362366, 0.35056328773498535, 0.3972329795360565, 0.4439026415348053, 0.4905723035335541, 0.5372419953346252, 0.583911657333374, 0.6305813193321228, 0.6772509813308716, 0.7239206433296204, 0.7705903053283691, 0.8172600269317627, 0.8639296293258667, 0.9105993509292603, 0.957269012928009, 1.0039386749267578, 1.0506083965301514, 1.0972779989242554, 1.143947720527649, 1.190617322921753, 1.2372870445251465, 1.28395676612854, 1.330626368522644, 1.377295970916748, 1.4239656925201416, 1.4706352949142456, 1.5173050165176392, 1.5639746189117432, 1.6106443405151367, 1.6573140621185303, 1.7039836645126343, 1.7506533861160278]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 14.0, 7.0, 22.0, 15.0, 22.0, 34.0, 26.0, 22.0, 31.0, 31.0, 35.0, 42.0, 39.0, 41.0, 56.0, 50.0, 43.0, 54.0, 49.0, 37.0, 42.0, 30.0, 34.0, 27.0, 24.0, 27.0, 28.0, 12.0, 12.0, 14.0, 16.0, 6.0, 10.0, 10.0, 7.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.763144314289093, -0.741420567035675, -0.7196968197822571, -0.6979730725288391, -0.6762493848800659, -0.654525637626648, -0.63280189037323, -0.611078143119812, -0.589354395866394, -0.5676306486129761, -0.5459069013595581, -0.5241831541061401, -0.5024594068527222, -0.4807356894016266, -0.459011971950531, -0.43728822469711304, -0.41556447744369507, -0.3938407301902771, -0.37211698293685913, -0.35039326548576355, -0.3286695182323456, -0.3069457709789276, -0.28522205352783203, -0.26349830627441406, -0.2417745590209961, -0.22005081176757812, -0.19832707941532135, -0.17660334706306458, -0.1548795998096466, -0.13315585255622864, -0.11143212020397186, -0.08970838785171509, -0.06798464059829712, -0.04626090079545975, -0.024537160992622375, -0.0028134211897850037, 0.018910318613052368, 0.04063405841588974, 0.06235779821872711, 0.08408153057098389, 0.10580527782440186, 0.12752902507781982, 0.1492527574300766, 0.17097648978233337, 0.19270023703575134, 0.2144239842891693, 0.2361477166414261, 0.25787144899368286, 0.27959519624710083, 0.3013189435005188, 0.32304269075393677, 0.34476640820503235, 0.3664901554584503, 0.3882139027118683, 0.40993762016296387, 0.43166136741638184, 0.4533851146697998, 0.4751088619232178, 0.49683260917663574, 0.5185563564300537, 0.5402801036834717, 0.5620037913322449, 0.5837275385856628, 0.6054512858390808, 0.6271750330924988]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 11.0, 6.0, 11.0, 9.0, 12.0, 15.0, 24.0, 20.0, 57.0, 59.0, 77.0, 133.0, 169.0, 251.0, 370.0, 543.0, 828.0, 1466.0, 2372.0, 4175.0, 8034.0, 16961.0, 43740.0, 178132.0, 3435755.0, 388248.0, 66754.0, 23066.0, 10170.0, 5115.0, 2908.0, 1689.0, 1053.0, 655.0, 409.0, 307.0, 173.0, 151.0, 98.0, 83.0, 47.0, 33.0, 23.0, 23.0, 14.0, 9.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.107421875, -0.10391998291015625, -0.1004180908203125, -0.09691619873046875, -0.093414306640625, -0.08991241455078125, -0.0864105224609375, -0.08290863037109375, -0.07940673828125, -0.07590484619140625, -0.0724029541015625, -0.06890106201171875, -0.065399169921875, -0.06189727783203125, -0.0583953857421875, -0.05489349365234375, -0.0513916015625, -0.04788970947265625, -0.0443878173828125, -0.04088592529296875, -0.037384033203125, -0.03388214111328125, -0.0303802490234375, -0.02687835693359375, -0.02337646484375, -0.01987457275390625, -0.0163726806640625, -0.01287078857421875, -0.009368896484375, -0.00586700439453125, -0.0023651123046875, 0.00113677978515625, 0.004638671875, 0.00814056396484375, 0.0116424560546875, 0.01514434814453125, 0.018646240234375, 0.02214813232421875, 0.0256500244140625, 0.02915191650390625, 0.03265380859375, 0.03615570068359375, 0.0396575927734375, 0.04315948486328125, 0.046661376953125, 0.05016326904296875, 0.0536651611328125, 0.05716705322265625, 0.0606689453125, 0.06417083740234375, 0.0676727294921875, 0.07117462158203125, 0.074676513671875, 0.07817840576171875, 0.0816802978515625, 0.08518218994140625, 0.08868408203125, 0.09218597412109375, 0.0956878662109375, 0.09918975830078125, 0.102691650390625, 0.10619354248046875, 0.1096954345703125, 0.11319732666015625, 0.11669921875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 13.0, 6.0, 8.0, 10.0, 18.0, 27.0, 20.0, 28.0, 37.0, 27.0, 22.0, 34.0, 53.0, 55.0, 53.0, 50.0, 58.0, 29.0, 43.0, 41.0, 51.0, 49.0, 41.0, 40.0, 34.0, 25.0, 21.0, 22.0, 10.0, 11.0, 12.0, 10.0, 11.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.023895263671875, -0.023090362548828125, -0.02228546142578125, -0.021480560302734375, -0.0206756591796875, -0.019870758056640625, -0.01906585693359375, -0.018260955810546875, -0.0174560546875, -0.016651153564453125, -0.01584625244140625, -0.015041351318359375, -0.0142364501953125, -0.013431549072265625, -0.01262664794921875, -0.011821746826171875, -0.011016845703125, -0.010211944580078125, -0.00940704345703125, -0.008602142333984375, -0.0077972412109375, -0.006992340087890625, -0.00618743896484375, -0.005382537841796875, -0.00457763671875, -0.003772735595703125, -0.00296783447265625, -0.002162933349609375, -0.0013580322265625, -0.000553131103515625, 0.00025177001953125, 0.001056671142578125, 0.001861572265625, 0.002666473388671875, 0.00347137451171875, 0.004276275634765625, 0.0050811767578125, 0.005886077880859375, 0.00669097900390625, 0.007495880126953125, 0.00830078125, 0.009105682373046875, 0.00991058349609375, 0.010715484619140625, 0.0115203857421875, 0.012325286865234375, 0.01313018798828125, 0.013935089111328125, 0.014739990234375, 0.015544891357421875, 0.01634979248046875, 0.017154693603515625, 0.0179595947265625, 0.018764495849609375, 0.01956939697265625, 0.020374298095703125, 0.02117919921875, 0.021984100341796875, 0.02278900146484375, 0.023593902587890625, 0.0243988037109375, 0.025203704833984375, 0.02600860595703125, 0.026813507080078125, 0.027618408203125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 8.0, 7.0, 22.0, 27.0, 33.0, 47.0, 100.0, 171.0, 311.0, 716.0, 1989.0, 8170.0, 56427.0, 3529340.0, 559708.0, 29017.0, 5372.0, 1566.0, 559.0, 288.0, 172.0, 88.0, 51.0, 27.0, 23.0, 17.0, 8.0, 7.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.3244457244873047, -0.3153953552246094, -0.30634498596191406, -0.29729461669921875, -0.28824424743652344, -0.2791938781738281, -0.2701435089111328, -0.2610931396484375, -0.2520427703857422, -0.24299240112304688, -0.23394203186035156, -0.22489166259765625, -0.21584129333496094, -0.20679092407226562, -0.1977405548095703, -0.188690185546875, -0.1796398162841797, -0.17058944702148438, -0.16153907775878906, -0.15248870849609375, -0.14343833923339844, -0.13438796997070312, -0.1253376007080078, -0.1162872314453125, -0.10723686218261719, -0.09818649291992188, -0.08913612365722656, -0.08008575439453125, -0.07103538513183594, -0.061985015869140625, -0.05293464660644531, -0.04388427734375, -0.03483390808105469, -0.025783538818359375, -0.016733169555664062, -0.00768280029296875, 0.0013675689697265625, 0.010417938232421875, 0.019468307495117188, 0.0285186767578125, 0.03756904602050781, 0.046619415283203125, 0.05566978454589844, 0.06472015380859375, 0.07377052307128906, 0.08282089233398438, 0.09187126159667969, 0.100921630859375, 0.10997200012207031, 0.11902236938476562, 0.12807273864746094, 0.13712310791015625, 0.14617347717285156, 0.15522384643554688, 0.1642742156982422, 0.1733245849609375, 0.1823749542236328, 0.19142532348632812, 0.20047569274902344, 0.20952606201171875, 0.21857643127441406, 0.22762680053710938, 0.2366771697998047, 0.2457275390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 12.0, 16.0, 44.0, 68.0, 107.0, 257.0, 1304.0, 1639.0, 310.0, 141.0, 64.0, 36.0, 26.0, 14.0, 10.0, 2.0, 6.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10064697265625, -0.09750652313232422, -0.09436607360839844, -0.09122562408447266, -0.08808517456054688, -0.0849447250366211, -0.08180427551269531, -0.07866382598876953, -0.07552337646484375, -0.07238292694091797, -0.06924247741699219, -0.0661020278930664, -0.06296157836914062, -0.059821128845214844, -0.05668067932128906, -0.05354022979736328, -0.0503997802734375, -0.04725933074951172, -0.04411888122558594, -0.040978431701660156, -0.037837982177734375, -0.034697532653808594, -0.03155708312988281, -0.02841663360595703, -0.02527618408203125, -0.02213573455810547, -0.018995285034179688, -0.015854835510253906, -0.012714385986328125, -0.009573936462402344, -0.0064334869384765625, -0.0032930374145507812, -0.000152587890625, 0.0029878616333007812, 0.0061283111572265625, 0.009268760681152344, 0.012409210205078125, 0.015549659729003906, 0.018690109252929688, 0.02183055877685547, 0.02497100830078125, 0.02811145782470703, 0.03125190734863281, 0.034392356872558594, 0.037532806396484375, 0.040673255920410156, 0.04381370544433594, 0.04695415496826172, 0.0500946044921875, 0.05323505401611328, 0.05637550354003906, 0.059515953063964844, 0.06265640258789062, 0.0657968521118164, 0.06893730163574219, 0.07207775115966797, 0.07521820068359375, 0.07835865020751953, 0.08149909973144531, 0.0846395492553711, 0.08777999877929688, 0.09092044830322266, 0.09406089782714844, 0.09720134735107422, 0.100341796875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 11.0, 23.0, 29.0, 55.0, 88.0, 152.0, 185.0, 155.0, 124.0, 81.0, 52.0, 24.0, 12.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548175573348999, -0.5317947864532471, -0.5154139995574951, -0.49903321266174316, -0.4826524257659912, -0.46627163887023926, -0.4498908817768097, -0.43351009488105774, -0.4171293079853058, -0.40074852108955383, -0.3843677341938019, -0.3679869472980499, -0.35160619020462036, -0.3352254033088684, -0.31884461641311646, -0.3024638295173645, -0.28608304262161255, -0.2697022557258606, -0.25332146883010864, -0.23694069683551788, -0.22055990993976593, -0.20417912304401398, -0.18779835104942322, -0.17141756415367126, -0.1550367772579193, -0.13865599036216736, -0.122275210916996, -0.10589443147182465, -0.08951364457607269, -0.07313285768032074, -0.056752078235149384, -0.04037129878997803, -0.0239904522895813, -0.007609669119119644, 0.00877111405134201, 0.025151897221803665, 0.04153268039226532, 0.05791346728801727, 0.07429424673318863, 0.09067502617835999, 0.10705581307411194, 0.12343659996986389, 0.13981738686561584, 0.1561981588602066, 0.17257894575595856, 0.1889597326517105, 0.20534050464630127, 0.22172129154205322, 0.23810207843780518, 0.25448286533355713, 0.2708636522293091, 0.28724443912506104, 0.303625226020813, 0.32000601291656494, 0.3363867700099945, 0.35276755690574646, 0.3691483438014984, 0.38552913069725037, 0.4019099175930023, 0.4182907044887543, 0.43467146158218384, 0.4510522484779358, 0.46743303537368774, 0.4838138222694397, 0.5001946091651917]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 10.0, 10.0, 9.0, 18.0, 15.0, 21.0, 16.0, 12.0, 21.0, 18.0, 25.0, 25.0, 21.0, 22.0, 30.0, 39.0, 35.0, 26.0, 32.0, 31.0, 36.0, 35.0, 25.0, 29.0, 24.0, 33.0, 30.0, 41.0, 31.0, 32.0, 34.0, 27.0, 13.0, 18.0, 15.0, 14.0, 13.0, 14.0, 16.0, 12.0, 13.0, 6.0, 3.0, 6.0, 4.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.17574048042297363, -0.1703668087720871, -0.16499315202236176, -0.15961948037147522, -0.15424582362174988, -0.14887215197086334, -0.1434984803199768, -0.13812482357025146, -0.13275116682052612, -0.1273774951696396, -0.12200383841991425, -0.11663016676902771, -0.11125651001930237, -0.10588283836841583, -0.1005091741681099, -0.09513550996780396, -0.08976183831691742, -0.08438817411661148, -0.07901450991630554, -0.073640838265419, -0.06826718151569366, -0.06289350986480713, -0.05751984566450119, -0.05214618146419525, -0.04677251726388931, -0.041398853063583374, -0.036025188863277435, -0.030651520937681198, -0.02527785673737526, -0.01990419253706932, -0.014530524611473083, -0.009156860411167145, -0.003783196210861206, 0.0015904689207673073, 0.006964134052395821, 0.012337800115346909, 0.017711464315652847, 0.023085128515958786, 0.028458796441555023, 0.03383246064186096, 0.0392061248421669, 0.04457978904247284, 0.04995345324277878, 0.055327121168375015, 0.060700785368680954, 0.0660744458436966, 0.07144811749458313, 0.07682178169488907, 0.08219544589519501, 0.08756911009550095, 0.09294277429580688, 0.09831644594669342, 0.10369010269641876, 0.1090637743473053, 0.11443743854761124, 0.11981110274791718, 0.1251847743988037, 0.13055844604969025, 0.1359321027994156, 0.14130577445030212, 0.14667943120002747, 0.152053102850914, 0.15742677450180054, 0.16280043125152588, 0.16817408800125122]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 12.0, 10.0, 14.0, 19.0, 49.0, 58.0, 68.0, 98.0, 148.0, 229.0, 373.0, 528.0, 868.0, 1283.0, 2076.0, 3251.0, 5304.0, 8896.0, 14797.0, 25464.0, 44707.0, 80797.0, 151192.0, 257682.0, 202762.0, 107315.0, 58898.0, 33389.0, 19409.0, 11096.0, 6666.0, 4072.0, 2494.0, 1550.0, 994.0, 637.0, 456.0, 266.0, 177.0, 148.0, 95.0, 53.0, 43.0, 23.0, 31.0, 14.0, 15.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0748291015625, -0.07239437103271484, -0.06995964050292969, -0.06752490997314453, -0.06509017944335938, -0.06265544891357422, -0.06022071838378906, -0.057785987854003906, -0.05535125732421875, -0.052916526794433594, -0.05048179626464844, -0.04804706573486328, -0.045612335205078125, -0.04317760467529297, -0.04074287414550781, -0.038308143615722656, -0.0358734130859375, -0.033438682556152344, -0.031003952026367188, -0.02856922149658203, -0.026134490966796875, -0.02369976043701172, -0.021265029907226562, -0.018830299377441406, -0.01639556884765625, -0.013960838317871094, -0.011526107788085938, -0.009091377258300781, -0.006656646728515625, -0.004221916198730469, -0.0017871856689453125, 0.0006475448608398438, 0.003082275390625, 0.005517005920410156, 0.007951736450195312, 0.010386466979980469, 0.012821197509765625, 0.015255928039550781, 0.017690658569335938, 0.020125389099121094, 0.02256011962890625, 0.024994850158691406, 0.027429580688476562, 0.02986431121826172, 0.032299041748046875, 0.03473377227783203, 0.03716850280761719, 0.039603233337402344, 0.0420379638671875, 0.044472694396972656, 0.04690742492675781, 0.04934215545654297, 0.051776885986328125, 0.05421161651611328, 0.05664634704589844, 0.059081077575683594, 0.06151580810546875, 0.0639505386352539, 0.06638526916503906, 0.06881999969482422, 0.07125473022460938, 0.07368946075439453, 0.07612419128417969, 0.07855892181396484, 0.08099365234375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 6.0, 13.0, 5.0, 12.0, 17.0, 25.0, 17.0, 36.0, 34.0, 36.0, 38.0, 38.0, 45.0, 42.0, 59.0, 64.0, 52.0, 48.0, 41.0, 51.0, 38.0, 43.0, 33.0, 34.0, 27.0, 26.0, 19.0, 19.0, 16.0, 9.0, 19.0, 10.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0289764404296875, -0.028099775314331055, -0.02722311019897461, -0.026346445083618164, -0.02546977996826172, -0.024593114852905273, -0.023716449737548828, -0.022839784622192383, -0.021963119506835938, -0.021086454391479492, -0.020209789276123047, -0.0193331241607666, -0.018456459045410156, -0.01757979393005371, -0.016703128814697266, -0.01582646369934082, -0.014949798583984375, -0.01407313346862793, -0.013196468353271484, -0.012319803237915039, -0.011443138122558594, -0.010566473007202148, -0.009689807891845703, -0.008813142776489258, -0.007936477661132812, -0.007059812545776367, -0.006183147430419922, -0.0053064823150634766, -0.004429817199707031, -0.003553152084350586, -0.0026764869689941406, -0.0017998218536376953, -0.00092315673828125, -4.649162292480469e-05, 0.0008301734924316406, 0.001706838607788086, 0.0025835037231445312, 0.0034601688385009766, 0.004336833953857422, 0.005213499069213867, 0.0060901641845703125, 0.006966829299926758, 0.007843494415283203, 0.008720159530639648, 0.009596824645996094, 0.010473489761352539, 0.011350154876708984, 0.01222681999206543, 0.013103485107421875, 0.01398015022277832, 0.014856815338134766, 0.01573348045349121, 0.016610145568847656, 0.0174868106842041, 0.018363475799560547, 0.019240140914916992, 0.020116806030273438, 0.020993471145629883, 0.021870136260986328, 0.022746801376342773, 0.02362346649169922, 0.024500131607055664, 0.02537679672241211, 0.026253461837768555, 0.027130126953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 8.0, 6.0, 19.0, 21.0, 34.0, 30.0, 56.0, 63.0, 87.0, 114.0, 119.0, 215.0, 307.0, 486.0, 719.0, 1236.0, 2518.0, 6826.0, 23396.0, 99421.0, 451407.0, 356800.0, 75475.0, 18092.0, 5508.0, 2227.0, 1116.0, 674.0, 444.0, 309.0, 219.0, 168.0, 107.0, 72.0, 59.0, 55.0, 26.0, 31.0, 20.0, 14.0, 12.0, 8.0, 8.0, 10.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1510009765625, -0.1462688446044922, -0.14153671264648438, -0.13680458068847656, -0.13207244873046875, -0.12734031677246094, -0.12260818481445312, -0.11787605285644531, -0.1131439208984375, -0.10841178894042969, -0.10367965698242188, -0.09894752502441406, -0.09421539306640625, -0.08948326110839844, -0.08475112915039062, -0.08001899719238281, -0.075286865234375, -0.07055473327636719, -0.06582260131835938, -0.06109046936035156, -0.05635833740234375, -0.05162620544433594, -0.046894073486328125, -0.04216194152832031, -0.0374298095703125, -0.03269767761230469, -0.027965545654296875, -0.023233413696289062, -0.01850128173828125, -0.013769149780273438, -0.009037017822265625, -0.0043048858642578125, 0.00042724609375, 0.0051593780517578125, 0.009891510009765625, 0.014623641967773438, 0.01935577392578125, 0.024087905883789062, 0.028820037841796875, 0.03355216979980469, 0.0382843017578125, 0.04301643371582031, 0.047748565673828125, 0.05248069763183594, 0.05721282958984375, 0.06194496154785156, 0.06667709350585938, 0.07140922546386719, 0.076141357421875, 0.08087348937988281, 0.08560562133789062, 0.09033775329589844, 0.09506988525390625, 0.09980201721191406, 0.10453414916992188, 0.10926628112792969, 0.1139984130859375, 0.11873054504394531, 0.12346267700195312, 0.12819480895996094, 0.13292694091796875, 0.13765907287597656, 0.14239120483398438, 0.1471233367919922, 0.15185546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 7.0, 7.0, 7.0, 13.0, 16.0, 12.0, 18.0, 17.0, 18.0, 23.0, 20.0, 30.0, 25.0, 38.0, 41.0, 34.0, 33.0, 41.0, 52.0, 42.0, 37.0, 38.0, 43.0, 38.0, 46.0, 36.0, 31.0, 30.0, 28.0, 30.0, 30.0, 23.0, 17.0, 13.0, 12.0, 9.0, 16.0, 7.0, 7.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.127197265625, -0.12349224090576172, -0.11978721618652344, -0.11608219146728516, -0.11237716674804688, -0.1086721420288086, -0.10496711730957031, -0.10126209259033203, -0.09755706787109375, -0.09385204315185547, -0.09014701843261719, -0.0864419937133789, -0.08273696899414062, -0.07903194427490234, -0.07532691955566406, -0.07162189483642578, -0.0679168701171875, -0.06421184539794922, -0.06050682067871094, -0.056801795959472656, -0.053096771240234375, -0.049391746520996094, -0.04568672180175781, -0.04198169708251953, -0.03827667236328125, -0.03457164764404297, -0.030866622924804688, -0.027161598205566406, -0.023456573486328125, -0.019751548767089844, -0.016046524047851562, -0.012341499328613281, -0.008636474609375, -0.004931449890136719, -0.0012264251708984375, 0.0024785995483398438, 0.006183624267578125, 0.009888648986816406, 0.013593673706054688, 0.01729869842529297, 0.02100372314453125, 0.02470874786376953, 0.028413772583007812, 0.032118797302246094, 0.035823822021484375, 0.039528846740722656, 0.04323387145996094, 0.04693889617919922, 0.0506439208984375, 0.05434894561767578, 0.05805397033691406, 0.061758995056152344, 0.06546401977539062, 0.0691690444946289, 0.07287406921386719, 0.07657909393310547, 0.08028411865234375, 0.08398914337158203, 0.08769416809082031, 0.0913991928100586, 0.09510421752929688, 0.09880924224853516, 0.10251426696777344, 0.10621929168701172, 0.10992431640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 14.0, 18.0, 26.0, 58.0, 84.0, 147.0, 243.0, 463.0, 897.0, 1927.0, 4495.0, 11791.0, 37726.0, 168259.0, 557905.0, 199515.0, 42744.0, 13151.0, 4863.0, 2108.0, 976.0, 508.0, 263.0, 145.0, 75.0, 48.0, 35.0, 15.0, 8.0, 12.0, 11.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07574462890625, -0.07309150695800781, -0.07043838500976562, -0.06778526306152344, -0.06513214111328125, -0.06247901916503906, -0.059825897216796875, -0.05717277526855469, -0.0545196533203125, -0.05186653137207031, -0.049213409423828125, -0.04656028747558594, -0.04390716552734375, -0.04125404357910156, -0.038600921630859375, -0.03594779968261719, -0.033294677734375, -0.030641555786132812, -0.027988433837890625, -0.025335311889648438, -0.02268218994140625, -0.020029067993164062, -0.017375946044921875, -0.014722824096679688, -0.0120697021484375, -0.009416580200195312, -0.006763458251953125, -0.0041103363037109375, -0.00145721435546875, 0.0011959075927734375, 0.003849029541015625, 0.0065021514892578125, 0.0091552734375, 0.011808395385742188, 0.014461517333984375, 0.017114639282226562, 0.01976776123046875, 0.022420883178710938, 0.025074005126953125, 0.027727127075195312, 0.0303802490234375, 0.03303337097167969, 0.035686492919921875, 0.03833961486816406, 0.04099273681640625, 0.04364585876464844, 0.046298980712890625, 0.04895210266113281, 0.051605224609375, 0.05425834655761719, 0.056911468505859375, 0.05956459045410156, 0.06221771240234375, 0.06487083435058594, 0.06752395629882812, 0.07017707824707031, 0.0728302001953125, 0.07548332214355469, 0.07813644409179688, 0.08078956604003906, 0.08344268798828125, 0.08609580993652344, 0.08874893188476562, 0.09140205383300781, 0.09405517578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 6.0, 8.0, 14.0, 18.0, 18.0, 22.0, 37.0, 39.0, 50.0, 51.0, 57.0, 63.0, 64.0, 82.0, 60.0, 60.0, 63.0, 48.0, 47.0, 38.0, 20.0, 30.0, 30.0, 19.0, 11.0, 10.0, 5.0, 3.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.220008850097656e-05, -4.048086702823639e-05, -3.8761645555496216e-05, -3.704242408275604e-05, -3.532320261001587e-05, -3.3603981137275696e-05, -3.188475966453552e-05, -3.016553819179535e-05, -2.8446316719055176e-05, -2.6727095246315002e-05, -2.500787377357483e-05, -2.3288652300834656e-05, -2.1569430828094482e-05, -1.985020935535431e-05, -1.8130987882614136e-05, -1.6411766409873962e-05, -1.4692544937133789e-05, -1.2973323464393616e-05, -1.1254101991653442e-05, -9.534880518913269e-06, -7.815659046173096e-06, -6.096437573432922e-06, -4.377216100692749e-06, -2.6579946279525757e-06, -9.387731552124023e-07, 7.80448317527771e-07, 2.4996697902679443e-06, 4.218891263008118e-06, 5.938112735748291e-06, 7.657334208488464e-06, 9.376555681228638e-06, 1.1095777153968811e-05, 1.2814998626708984e-05, 1.4534220099449158e-05, 1.625344157218933e-05, 1.7972663044929504e-05, 1.9691884517669678e-05, 2.141110599040985e-05, 2.3130327463150024e-05, 2.4849548935890198e-05, 2.656877040863037e-05, 2.8287991881370544e-05, 3.0007213354110718e-05, 3.172643482685089e-05, 3.3445656299591064e-05, 3.516487777233124e-05, 3.688409924507141e-05, 3.8603320717811584e-05, 4.032254219055176e-05, 4.204176366329193e-05, 4.3760985136032104e-05, 4.548020660877228e-05, 4.719942808151245e-05, 4.8918649554252625e-05, 5.06378710269928e-05, 5.235709249973297e-05, 5.4076313972473145e-05, 5.579553544521332e-05, 5.751475691795349e-05, 5.9233978390693665e-05, 6.095319986343384e-05, 6.267242133617401e-05, 6.439164280891418e-05, 6.611086428165436e-05, 6.783008575439453e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 4.0, 10.0, 12.0, 19.0, 32.0, 35.0, 53.0, 75.0, 129.0, 164.0, 267.0, 470.0, 877.0, 1814.0, 4547.0, 13858.0, 54879.0, 348403.0, 511859.0, 81789.0, 18717.0, 5866.0, 2240.0, 1019.0, 521.0, 304.0, 201.0, 123.0, 74.0, 55.0, 41.0, 32.0, 20.0, 12.0, 7.0, 4.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07958984375, -0.07685661315917969, -0.07412338256835938, -0.07139015197753906, -0.06865692138671875, -0.06592369079589844, -0.06319046020507812, -0.06045722961425781, -0.0577239990234375, -0.05499076843261719, -0.052257537841796875, -0.04952430725097656, -0.04679107666015625, -0.04405784606933594, -0.041324615478515625, -0.03859138488769531, -0.035858154296875, -0.03312492370605469, -0.030391693115234375, -0.027658462524414062, -0.02492523193359375, -0.022192001342773438, -0.019458770751953125, -0.016725540161132812, -0.0139923095703125, -0.011259078979492188, -0.008525848388671875, -0.0057926177978515625, -0.00305938720703125, -0.0003261566162109375, 0.002407073974609375, 0.0051403045654296875, 0.00787353515625, 0.010606765747070312, 0.013339996337890625, 0.016073226928710938, 0.01880645751953125, 0.021539688110351562, 0.024272918701171875, 0.027006149291992188, 0.0297393798828125, 0.03247261047363281, 0.035205841064453125, 0.03793907165527344, 0.04067230224609375, 0.04340553283691406, 0.046138763427734375, 0.04887199401855469, 0.051605224609375, 0.05433845520019531, 0.057071685791015625, 0.05980491638183594, 0.06253814697265625, 0.06527137756347656, 0.06800460815429688, 0.07073783874511719, 0.0734710693359375, 0.07620429992675781, 0.07893753051757812, 0.08167076110839844, 0.08440399169921875, 0.08713722229003906, 0.08987045288085938, 0.09260368347167969, 0.0953369140625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 1.0, 13.0, 8.0, 8.0, 8.0, 19.0, 21.0, 35.0, 31.0, 35.0, 63.0, 79.0, 78.0, 92.0, 105.0, 79.0, 78.0, 49.0, 49.0, 38.0, 19.0, 15.0, 12.0, 15.0, 9.0, 5.0, 4.0, 3.0, 4.0, 5.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.059661865234375, -0.05780172348022461, -0.05594158172607422, -0.05408143997192383, -0.05222129821777344, -0.05036115646362305, -0.048501014709472656, -0.046640872955322266, -0.044780731201171875, -0.042920589447021484, -0.041060447692871094, -0.0392003059387207, -0.03734016418457031, -0.03548002243041992, -0.03361988067626953, -0.03175973892211914, -0.02989959716796875, -0.02803945541381836, -0.02617931365966797, -0.024319171905517578, -0.022459030151367188, -0.020598888397216797, -0.018738746643066406, -0.016878604888916016, -0.015018463134765625, -0.013158321380615234, -0.011298179626464844, -0.009438037872314453, -0.0075778961181640625, -0.005717754364013672, -0.0038576126098632812, -0.0019974708557128906, -0.0001373291015625, 0.0017228126525878906, 0.0035829544067382812, 0.005443096160888672, 0.0073032379150390625, 0.009163379669189453, 0.011023521423339844, 0.012883663177490234, 0.014743804931640625, 0.016603946685791016, 0.018464088439941406, 0.020324230194091797, 0.022184371948242188, 0.024044513702392578, 0.02590465545654297, 0.02776479721069336, 0.02962493896484375, 0.03148508071899414, 0.03334522247314453, 0.03520536422729492, 0.03706550598144531, 0.0389256477355957, 0.040785789489746094, 0.042645931243896484, 0.044506072998046875, 0.046366214752197266, 0.048226356506347656, 0.05008649826049805, 0.05194664001464844, 0.05380678176879883, 0.05566692352294922, 0.05752706527709961, 0.05938720703125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 26.0, 52.0, 100.0, 178.0, 189.0, 187.0, 125.0, 70.0, 36.0, 13.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8133844137191772, -1.7654263973236084, -1.717468500137329, -1.6695106029510498, -1.621552586555481, -1.573594570159912, -1.5256366729736328, -1.4776787757873535, -1.4297207593917847, -1.3817627429962158, -1.3338048458099365, -1.2858469486236572, -1.2378889322280884, -1.1899309158325195, -1.1419730186462402, -1.094015121459961, -1.046057105064392, -0.998099148273468, -0.950141191482544, -0.9021832346916199, -0.8542252779006958, -0.8062673211097717, -0.7583093643188477, -0.7103514075279236, -0.6623934507369995, -0.6144354939460754, -0.5664775371551514, -0.5185195803642273, -0.4705616235733032, -0.42260366678237915, -0.3746457099914551, -0.326687753200531, -0.2787296772003174, -0.2307717204093933, -0.18281376361846924, -0.13485580682754517, -0.0868978500366211, -0.03893989324569702, 0.00901806354522705, 0.05697602033615112, 0.1049339771270752, 0.15289193391799927, 0.20084989070892334, 0.2488078474998474, 0.2967658042907715, 0.34472376108169556, 0.39268171787261963, 0.4406396746635437, 0.4885976314544678, 0.5365555882453918, 0.5845135450363159, 0.63247150182724, 0.6804294586181641, 0.7283874154090881, 0.7763453722000122, 0.8243033289909363, 0.8722612857818604, 0.9202192425727844, 0.9681771993637085, 1.0161352157592773, 1.0640931129455566, 1.112051010131836, 1.1600090265274048, 1.2079670429229736, 1.255924940109253]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 7.0, 7.0, 7.0, 9.0, 5.0, 16.0, 14.0, 23.0, 16.0, 22.0, 29.0, 19.0, 29.0, 29.0, 34.0, 54.0, 32.0, 24.0, 39.0, 41.0, 39.0, 43.0, 42.0, 42.0, 40.0, 31.0, 43.0, 25.0, 23.0, 29.0, 21.0, 31.0, 16.0, 22.0, 15.0, 16.0, 7.0, 14.0, 5.0, 7.0, 6.0, 4.0, 2.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.646960437297821, -0.6269792914390564, -0.6069981455802917, -0.5870169997215271, -0.5670359134674072, -0.5470547676086426, -0.5270736217498779, -0.5070924758911133, -0.48711133003234863, -0.467130184173584, -0.44714903831481934, -0.4271679222583771, -0.4071867763996124, -0.3872056305408478, -0.3672245144844055, -0.34724336862564087, -0.3272622227668762, -0.3072810769081116, -0.2872999310493469, -0.26731881499290466, -0.24733766913414001, -0.22735652327537537, -0.2073753923177719, -0.18739426136016846, -0.1674131155014038, -0.14743196964263916, -0.1274508386850357, -0.10746970027685165, -0.0874885618686676, -0.06750742346048355, -0.0475262850522995, -0.027545154094696045, -0.007563948631286621, 0.01241718977689743, 0.03239832818508148, 0.05237946659326553, 0.07236060500144958, 0.09234174340963364, 0.11232288181781769, 0.13230401277542114, 0.1522851586341858, 0.17226630449295044, 0.1922474354505539, 0.21222856640815735, 0.232209712266922, 0.25219085812568665, 0.2721719741821289, 0.29215312004089355, 0.3121342658996582, 0.33211541175842285, 0.3520965576171875, 0.37207767367362976, 0.3920588195323944, 0.41203996539115906, 0.4320210814476013, 0.45200222730636597, 0.4719833731651306, 0.49196451902389526, 0.5119456648826599, 0.5319268107414246, 0.5519078969955444, 0.5718890428543091, 0.5918701887130737, 0.6118513345718384, 0.631832480430603]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 7.0, 13.0, 15.0, 14.0, 29.0, 33.0, 64.0, 71.0, 137.0, 170.0, 265.0, 436.0, 704.0, 1161.0, 2074.0, 3739.0, 7716.0, 18809.0, 52989.0, 232675.0, 3371801.0, 387146.0, 70670.0, 23130.0, 9610.0, 4602.0, 2451.0, 1366.0, 862.0, 463.0, 312.0, 232.0, 154.0, 95.0, 86.0, 56.0, 42.0, 30.0, 17.0, 8.0, 6.0, 4.0, 5.0, 2.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.114990234375, -0.11123466491699219, -0.10747909545898438, -0.10372352600097656, -0.09996795654296875, -0.09621238708496094, -0.09245681762695312, -0.08870124816894531, -0.0849456787109375, -0.08119010925292969, -0.07743453979492188, -0.07367897033691406, -0.06992340087890625, -0.06616783142089844, -0.062412261962890625, -0.05865669250488281, -0.054901123046875, -0.05114555358886719, -0.047389984130859375, -0.04363441467285156, -0.03987884521484375, -0.03612327575683594, -0.032367706298828125, -0.028612136840820312, -0.0248565673828125, -0.021100997924804688, -0.017345428466796875, -0.013589859008789062, -0.00983428955078125, -0.0060787200927734375, -0.002323150634765625, 0.0014324188232421875, 0.00518798828125, 0.008943557739257812, 0.012699127197265625, 0.016454696655273438, 0.02021026611328125, 0.023965835571289062, 0.027721405029296875, 0.03147697448730469, 0.0352325439453125, 0.03898811340332031, 0.042743682861328125, 0.04649925231933594, 0.05025482177734375, 0.05401039123535156, 0.057765960693359375, 0.06152153015136719, 0.065277099609375, 0.06903266906738281, 0.07278823852539062, 0.07654380798339844, 0.08029937744140625, 0.08405494689941406, 0.08781051635742188, 0.09156608581542969, 0.0953216552734375, 0.09907722473144531, 0.10283279418945312, 0.10658836364746094, 0.11034393310546875, 0.11409950256347656, 0.11785507202148438, 0.12161064147949219, 0.1253662109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 6.0, 11.0, 13.0, 19.0, 23.0, 31.0, 18.0, 41.0, 49.0, 40.0, 65.0, 60.0, 53.0, 54.0, 44.0, 63.0, 47.0, 56.0, 41.0, 45.0, 42.0, 31.0, 32.0, 26.0, 13.0, 16.0, 12.0, 15.0, 10.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0243072509765625, -0.023263216018676758, -0.022219181060791016, -0.021175146102905273, -0.02013111114501953, -0.01908707618713379, -0.018043041229248047, -0.016999006271362305, -0.015954971313476562, -0.01491093635559082, -0.013866901397705078, -0.012822866439819336, -0.011778831481933594, -0.010734796524047852, -0.00969076156616211, -0.008646726608276367, -0.007602691650390625, -0.006558656692504883, -0.005514621734619141, -0.0044705867767333984, -0.0034265518188476562, -0.002382516860961914, -0.0013384819030761719, -0.0002944469451904297, 0.0007495880126953125, 0.0017936229705810547, 0.002837657928466797, 0.003881692886352539, 0.004925727844238281, 0.0059697628021240234, 0.007013797760009766, 0.008057832717895508, 0.00910186767578125, 0.010145902633666992, 0.011189937591552734, 0.012233972549438477, 0.013278007507324219, 0.014322042465209961, 0.015366077423095703, 0.016410112380981445, 0.017454147338867188, 0.01849818229675293, 0.019542217254638672, 0.020586252212524414, 0.021630287170410156, 0.0226743221282959, 0.02371835708618164, 0.024762392044067383, 0.025806427001953125, 0.026850461959838867, 0.02789449691772461, 0.02893853187561035, 0.029982566833496094, 0.031026601791381836, 0.03207063674926758, 0.03311467170715332, 0.03415870666503906, 0.035202741622924805, 0.03624677658081055, 0.03729081153869629, 0.03833484649658203, 0.03937888145446777, 0.040422916412353516, 0.04146695137023926, 0.042510986328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 8.0, 7.0, 16.0, 24.0, 32.0, 63.0, 101.0, 159.0, 323.0, 591.0, 1485.0, 4545.0, 22073.0, 230034.0, 3750998.0, 159739.0, 17547.0, 3881.0, 1369.0, 564.0, 327.0, 157.0, 98.0, 63.0, 36.0, 18.0, 11.0, 2.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2359619140625, -0.22736167907714844, -0.21876144409179688, -0.2101612091064453, -0.20156097412109375, -0.1929607391357422, -0.18436050415039062, -0.17576026916503906, -0.1671600341796875, -0.15855979919433594, -0.14995956420898438, -0.1413593292236328, -0.13275909423828125, -0.12415885925292969, -0.11555862426757812, -0.10695838928222656, -0.098358154296875, -0.08975791931152344, -0.08115768432617188, -0.07255744934082031, -0.06395721435546875, -0.05535697937011719, -0.046756744384765625, -0.03815650939941406, -0.0295562744140625, -0.020956039428710938, -0.012355804443359375, -0.0037555694580078125, 0.00484466552734375, 0.013444900512695312, 0.022045135498046875, 0.030645370483398438, 0.03924560546875, 0.04784584045410156, 0.056446075439453125, 0.06504631042480469, 0.07364654541015625, 0.08224678039550781, 0.09084701538085938, 0.09944725036621094, 0.1080474853515625, 0.11664772033691406, 0.12524795532226562, 0.1338481903076172, 0.14244842529296875, 0.1510486602783203, 0.15964889526367188, 0.16824913024902344, 0.176849365234375, 0.18544960021972656, 0.19404983520507812, 0.2026500701904297, 0.21125030517578125, 0.2198505401611328, 0.22845077514648438, 0.23705101013183594, 0.2456512451171875, 0.25425148010253906, 0.2628517150878906, 0.2714519500732422, 0.28005218505859375, 0.2886524200439453, 0.2972526550292969, 0.30585289001464844, 0.314453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 9.0, 15.0, 13.0, 19.0, 36.0, 32.0, 61.0, 96.0, 146.0, 326.0, 897.0, 1385.0, 454.0, 201.0, 131.0, 76.0, 47.0, 47.0, 19.0, 18.0, 11.0, 10.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07666015625, -0.07394027709960938, -0.07122039794921875, -0.06850051879882812, -0.0657806396484375, -0.06306076049804688, -0.06034088134765625, -0.057621002197265625, -0.054901123046875, -0.052181243896484375, -0.04946136474609375, -0.046741485595703125, -0.0440216064453125, -0.041301727294921875, -0.03858184814453125, -0.035861968994140625, -0.03314208984375, -0.030422210693359375, -0.02770233154296875, -0.024982452392578125, -0.0222625732421875, -0.019542694091796875, -0.01682281494140625, -0.014102935791015625, -0.011383056640625, -0.008663177490234375, -0.00594329833984375, -0.003223419189453125, -0.0005035400390625, 0.002216339111328125, 0.00493621826171875, 0.007656097412109375, 0.0103759765625, 0.013095855712890625, 0.01581573486328125, 0.018535614013671875, 0.0212554931640625, 0.023975372314453125, 0.02669525146484375, 0.029415130615234375, 0.032135009765625, 0.034854888916015625, 0.03757476806640625, 0.040294647216796875, 0.0430145263671875, 0.045734405517578125, 0.04845428466796875, 0.051174163818359375, 0.05389404296875, 0.056613922119140625, 0.05933380126953125, 0.062053680419921875, 0.0647735595703125, 0.06749343872070312, 0.07021331787109375, 0.07293319702148438, 0.075653076171875, 0.07837295532226562, 0.08109283447265625, 0.08381271362304688, 0.0865325927734375, 0.08925247192382812, 0.09197235107421875, 0.09469223022460938, 0.097412109375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 8.0, 46.0, 224.0, 376.0, 252.0, 73.0, 19.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3516697883605957, -1.3043086528778076, -1.256947636604309, -1.209586501121521, -1.1622254848480225, -1.1148643493652344, -1.0675033330917358, -1.0201421976089478, -0.9727811813354492, -0.9254201054573059, -0.8780590295791626, -0.8306979537010193, -0.783336877822876, -0.7359758019447327, -0.6886147260665894, -0.6412535905838013, -0.593892514705658, -0.5465314388275146, -0.49917036294937134, -0.451809287071228, -0.4044482111930847, -0.3570871353149414, -0.3097260296344757, -0.2623649537563324, -0.2150038778781891, -0.16764280200004578, -0.12028171867132187, -0.07292063534259796, -0.02555955946445465, 0.02180151641368866, 0.06916260719299316, 0.11652368307113647, 0.16388475894927979, 0.2112458348274231, 0.2586069107055664, 0.3059679865837097, 0.353329062461853, 0.40069013833999634, 0.44805124402046204, 0.49541231989860535, 0.5427733659744263, 0.5901344418525696, 0.6374955177307129, 0.6848565936088562, 0.7322176694869995, 0.7795787453651428, 0.8269398212432861, 0.8743009567260742, 0.9216620326042175, 0.9690231084823608, 1.016384243965149, 1.0637452602386475, 1.1111063957214355, 1.158467411994934, 1.2058285474777222, 1.2531895637512207, 1.3005506992340088, 1.3479118347167969, 1.3952728509902954, 1.4426339864730835, 1.489995002746582, 1.5373561382293701, 1.5847171545028687, 1.6320782899856567, 1.6794393062591553]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 10.0, 12.0, 17.0, 19.0, 16.0, 24.0, 33.0, 28.0, 29.0, 42.0, 46.0, 30.0, 46.0, 50.0, 50.0, 46.0, 40.0, 55.0, 42.0, 48.0, 41.0, 48.0, 40.0, 19.0, 37.0, 14.0, 19.0, 18.0, 18.0, 10.0, 13.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.3421061038970947, -0.3330096900463104, -0.3239132761955261, -0.31481683254241943, -0.30572041869163513, -0.29662400484085083, -0.28752759099006653, -0.2784311771392822, -0.26933473348617554, -0.26023831963539124, -0.25114190578460693, -0.24204547703266144, -0.23294904828071594, -0.22385263442993164, -0.21475622057914734, -0.20565979182720184, -0.19656337797641754, -0.18746696412563324, -0.17837053537368774, -0.16927412152290344, -0.16017769277095795, -0.15108127892017365, -0.14198485016822815, -0.13288843631744385, -0.12379201501607895, -0.11469559371471405, -0.10559917241334915, -0.09650275111198425, -0.08740633726119995, -0.07830990850925446, -0.06921349465847015, -0.060117073357105255, -0.051020652055740356, -0.04192423075437546, -0.03282780945301056, -0.02373139187693596, -0.01463497057557106, -0.0055385492742061615, 0.0035578683018684387, 0.012654289603233337, 0.021750710904598236, 0.030847132205963135, 0.03994355350732803, 0.049039971083402634, 0.05813639238476753, 0.06723281741142273, 0.07632923126220703, 0.08542565256357193, 0.09452207386493683, 0.10361849516630173, 0.11271491646766663, 0.12181133031845093, 0.13090775907039642, 0.14000417292118073, 0.14910060167312622, 0.15819701552391052, 0.16729342937469482, 0.17638984322547913, 0.18548627197742462, 0.19458268582820892, 0.20367911458015442, 0.21277552843093872, 0.22187194228172302, 0.23096837103366852, 0.240064799785614]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 11.0, 16.0, 10.0, 36.0, 25.0, 69.0, 84.0, 122.0, 180.0, 257.0, 421.0, 690.0, 1123.0, 1903.0, 3245.0, 6077.0, 11504.0, 24368.0, 55263.0, 170549.0, 532327.0, 144193.0, 49640.0, 22167.0, 10742.0, 5745.0, 3070.0, 1768.0, 1072.0, 638.0, 401.0, 264.0, 185.0, 114.0, 86.0, 54.0, 35.0, 31.0, 19.0, 19.0, 6.0, 7.0, 8.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.130126953125, -0.1262359619140625, -0.122344970703125, -0.1184539794921875, -0.11456298828125, -0.1106719970703125, -0.106781005859375, -0.1028900146484375, -0.0989990234375, -0.0951080322265625, -0.091217041015625, -0.0873260498046875, -0.08343505859375, -0.0795440673828125, -0.075653076171875, -0.0717620849609375, -0.06787109375, -0.0639801025390625, -0.060089111328125, -0.0561981201171875, -0.05230712890625, -0.0484161376953125, -0.044525146484375, -0.0406341552734375, -0.0367431640625, -0.0328521728515625, -0.028961181640625, -0.0250701904296875, -0.02117919921875, -0.0172882080078125, -0.013397216796875, -0.0095062255859375, -0.005615234375, -0.0017242431640625, 0.002166748046875, 0.0060577392578125, 0.00994873046875, 0.0138397216796875, 0.017730712890625, 0.0216217041015625, 0.0255126953125, 0.0294036865234375, 0.033294677734375, 0.0371856689453125, 0.04107666015625, 0.0449676513671875, 0.048858642578125, 0.0527496337890625, 0.056640625, 0.0605316162109375, 0.064422607421875, 0.0683135986328125, 0.07220458984375, 0.0760955810546875, 0.079986572265625, 0.0838775634765625, 0.0877685546875, 0.0916595458984375, 0.095550537109375, 0.0994415283203125, 0.10333251953125, 0.1072235107421875, 0.111114501953125, 0.1150054931640625, 0.118896484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 5.0, 11.0, 11.0, 17.0, 17.0, 19.0, 22.0, 21.0, 39.0, 26.0, 39.0, 31.0, 50.0, 45.0, 43.0, 58.0, 56.0, 38.0, 49.0, 47.0, 52.0, 44.0, 37.0, 40.0, 27.0, 22.0, 25.0, 21.0, 19.0, 10.0, 14.0, 10.0, 10.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0289306640625, -0.02801990509033203, -0.027109146118164062, -0.026198387145996094, -0.025287628173828125, -0.024376869201660156, -0.023466110229492188, -0.02255535125732422, -0.02164459228515625, -0.02073383331298828, -0.019823074340820312, -0.018912315368652344, -0.018001556396484375, -0.017090797424316406, -0.016180038452148438, -0.015269279479980469, -0.0143585205078125, -0.013447761535644531, -0.012537002563476562, -0.011626243591308594, -0.010715484619140625, -0.009804725646972656, -0.008893966674804688, -0.007983207702636719, -0.00707244873046875, -0.006161689758300781, -0.0052509307861328125, -0.004340171813964844, -0.003429412841796875, -0.0025186538696289062, -0.0016078948974609375, -0.0006971359252929688, 0.000213623046875, 0.0011243820190429688, 0.0020351409912109375, 0.0029458999633789062, 0.003856658935546875, 0.004767417907714844, 0.0056781768798828125, 0.006588935852050781, 0.00749969482421875, 0.008410453796386719, 0.009321212768554688, 0.010231971740722656, 0.011142730712890625, 0.012053489685058594, 0.012964248657226562, 0.013875007629394531, 0.0147857666015625, 0.01569652557373047, 0.016607284545898438, 0.017518043518066406, 0.018428802490234375, 0.019339561462402344, 0.020250320434570312, 0.02116107940673828, 0.02207183837890625, 0.02298259735107422, 0.023893356323242188, 0.024804115295410156, 0.025714874267578125, 0.026625633239746094, 0.027536392211914062, 0.02844715118408203, 0.02935791015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 3.0, 9.0, 8.0, 17.0, 13.0, 20.0, 28.0, 40.0, 48.0, 93.0, 100.0, 121.0, 170.0, 268.0, 339.0, 582.0, 858.0, 1686.0, 3811.0, 10707.0, 42327.0, 253634.0, 620608.0, 82761.0, 19013.0, 5672.0, 2255.0, 1182.0, 678.0, 409.0, 308.0, 219.0, 156.0, 101.0, 91.0, 52.0, 36.0, 40.0, 24.0, 17.0, 16.0, 5.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.16259765625, -0.15738868713378906, -0.15217971801757812, -0.1469707489013672, -0.14176177978515625, -0.1365528106689453, -0.13134384155273438, -0.12613487243652344, -0.1209259033203125, -0.11571693420410156, -0.11050796508789062, -0.10529899597167969, -0.10009002685546875, -0.09488105773925781, -0.08967208862304688, -0.08446311950683594, -0.079254150390625, -0.07404518127441406, -0.06883621215820312, -0.06362724304199219, -0.05841827392578125, -0.05320930480957031, -0.048000335693359375, -0.04279136657714844, -0.0375823974609375, -0.03237342834472656, -0.027164459228515625, -0.021955490112304688, -0.01674652099609375, -0.011537551879882812, -0.006328582763671875, -0.0011196136474609375, 0.00408935546875, 0.009298324584960938, 0.014507293701171875, 0.019716262817382812, 0.02492523193359375, 0.030134201049804688, 0.035343170166015625, 0.04055213928222656, 0.0457611083984375, 0.05097007751464844, 0.056179046630859375, 0.06138801574707031, 0.06659698486328125, 0.07180595397949219, 0.07701492309570312, 0.08222389221191406, 0.087432861328125, 0.09264183044433594, 0.09785079956054688, 0.10305976867675781, 0.10826873779296875, 0.11347770690917969, 0.11868667602539062, 0.12389564514160156, 0.1291046142578125, 0.13431358337402344, 0.13952255249023438, 0.1447315216064453, 0.14994049072265625, 0.1551494598388672, 0.16035842895507812, 0.16556739807128906, 0.1707763671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 9.0, 15.0, 13.0, 21.0, 23.0, 27.0, 23.0, 33.0, 35.0, 34.0, 43.0, 44.0, 48.0, 49.0, 58.0, 62.0, 64.0, 62.0, 42.0, 34.0, 42.0, 26.0, 36.0, 26.0, 26.0, 20.0, 20.0, 13.0, 14.0, 10.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.140380859375, -0.13614463806152344, -0.13190841674804688, -0.1276721954345703, -0.12343597412109375, -0.11919975280761719, -0.11496353149414062, -0.11072731018066406, -0.1064910888671875, -0.10225486755371094, -0.09801864624023438, -0.09378242492675781, -0.08954620361328125, -0.08530998229980469, -0.08107376098632812, -0.07683753967285156, -0.072601318359375, -0.06836509704589844, -0.06412887573242188, -0.05989265441894531, -0.05565643310546875, -0.05142021179199219, -0.047183990478515625, -0.04294776916503906, -0.0387115478515625, -0.03447532653808594, -0.030239105224609375, -0.026002883911132812, -0.02176666259765625, -0.017530441284179688, -0.013294219970703125, -0.009057998657226562, -0.00482177734375, -0.0005855560302734375, 0.003650665283203125, 0.007886886596679688, 0.01212310791015625, 0.016359329223632812, 0.020595550537109375, 0.024831771850585938, 0.0290679931640625, 0.03330421447753906, 0.037540435791015625, 0.04177665710449219, 0.04601287841796875, 0.05024909973144531, 0.054485321044921875, 0.05872154235839844, 0.062957763671875, 0.06719398498535156, 0.07143020629882812, 0.07566642761230469, 0.07990264892578125, 0.08413887023925781, 0.08837509155273438, 0.09261131286621094, 0.0968475341796875, 0.10108375549316406, 0.10531997680664062, 0.10955619812011719, 0.11379241943359375, 0.11802864074707031, 0.12226486206054688, 0.12650108337402344, 0.1307373046875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 13.0, 12.0, 18.0, 34.0, 58.0, 71.0, 124.0, 275.0, 500.0, 1265.0, 3686.0, 12594.0, 61200.0, 796465.0, 141542.0, 21616.0, 5669.0, 1849.0, 759.0, 337.0, 182.0, 99.0, 63.0, 41.0, 22.0, 13.0, 11.0, 6.0, 8.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1558837890625, -0.15139007568359375, -0.1468963623046875, -0.14240264892578125, -0.137908935546875, -0.13341522216796875, -0.1289215087890625, -0.12442779541015625, -0.11993408203125, -0.11544036865234375, -0.1109466552734375, -0.10645294189453125, -0.101959228515625, -0.09746551513671875, -0.0929718017578125, -0.08847808837890625, -0.083984375, -0.07949066162109375, -0.0749969482421875, -0.07050323486328125, -0.066009521484375, -0.06151580810546875, -0.0570220947265625, -0.05252838134765625, -0.04803466796875, -0.04354095458984375, -0.0390472412109375, -0.03455352783203125, -0.030059814453125, -0.02556610107421875, -0.0210723876953125, -0.01657867431640625, -0.0120849609375, -0.00759124755859375, -0.0030975341796875, 0.00139617919921875, 0.005889892578125, 0.01038360595703125, 0.0148773193359375, 0.01937103271484375, 0.02386474609375, 0.02835845947265625, 0.0328521728515625, 0.03734588623046875, 0.041839599609375, 0.04633331298828125, 0.0508270263671875, 0.05532073974609375, 0.059814453125, 0.06430816650390625, 0.0688018798828125, 0.07329559326171875, 0.077789306640625, 0.08228302001953125, 0.0867767333984375, 0.09127044677734375, 0.09576416015625, 0.10025787353515625, 0.1047515869140625, 0.10924530029296875, 0.113739013671875, 0.11823272705078125, 0.1227264404296875, 0.12722015380859375, 0.1317138671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 16.0, 22.0, 27.0, 44.0, 63.0, 84.0, 108.0, 116.0, 146.0, 103.0, 75.0, 43.0, 43.0, 25.0, 21.0, 19.0, 9.0, 4.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.00011807680130004883, -0.00011532846838235855, -0.00011258013546466827, -0.000109831802546978, -0.00010708346962928772, -0.00010433513671159744, -0.00010158680379390717, -9.883847087621689e-05, -9.609013795852661e-05, -9.334180504083633e-05, -9.059347212314606e-05, -8.784513920545578e-05, -8.50968062877655e-05, -8.234847337007523e-05, -7.960014045238495e-05, -7.685180753469467e-05, -7.41034746170044e-05, -7.135514169931412e-05, -6.860680878162384e-05, -6.585847586393356e-05, -6.311014294624329e-05, -6.036181002855301e-05, -5.761347711086273e-05, -5.4865144193172455e-05, -5.211681127548218e-05, -4.93684783577919e-05, -4.6620145440101624e-05, -4.3871812522411346e-05, -4.112347960472107e-05, -3.837514668703079e-05, -3.5626813769340515e-05, -3.287848085165024e-05, -3.013014793395996e-05, -2.7381815016269684e-05, -2.4633482098579407e-05, -2.188514918088913e-05, -1.9136816263198853e-05, -1.6388483345508575e-05, -1.3640150427818298e-05, -1.0891817510128021e-05, -8.143484592437744e-06, -5.395151674747467e-06, -2.64681875705719e-06, 1.0151416063308716e-07, 2.8498470783233643e-06, 5.598179996013641e-06, 8.346512913703918e-06, 1.1094845831394196e-05, 1.3843178749084473e-05, 1.659151166677475e-05, 1.9339844584465027e-05, 2.2088177502155304e-05, 2.483651041984558e-05, 2.7584843337535858e-05, 3.0333176255226135e-05, 3.308150917291641e-05, 3.582984209060669e-05, 3.8578175008296967e-05, 4.1326507925987244e-05, 4.407484084367752e-05, 4.68231737613678e-05, 4.9571506679058075e-05, 5.231983959674835e-05, 5.506817251443863e-05, 5.7816505432128906e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 7.0, 15.0, 11.0, 23.0, 20.0, 35.0, 44.0, 81.0, 102.0, 185.0, 278.0, 454.0, 841.0, 1839.0, 4911.0, 16165.0, 71741.0, 778610.0, 136304.0, 24936.0, 7018.0, 2433.0, 1059.0, 520.0, 283.0, 166.0, 137.0, 84.0, 67.0, 48.0, 33.0, 19.0, 19.0, 11.0, 11.0, 4.0, 11.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.090087890625, -0.08657646179199219, -0.08306503295898438, -0.07955360412597656, -0.07604217529296875, -0.07253074645996094, -0.06901931762695312, -0.06550788879394531, -0.0619964599609375, -0.05848503112792969, -0.054973602294921875, -0.05146217346191406, -0.04795074462890625, -0.04443931579589844, -0.040927886962890625, -0.03741645812988281, -0.033905029296875, -0.030393600463867188, -0.026882171630859375, -0.023370742797851562, -0.01985931396484375, -0.016347885131835938, -0.012836456298828125, -0.009325027465820312, -0.0058135986328125, -0.0023021697998046875, 0.001209259033203125, 0.0047206878662109375, 0.00823211669921875, 0.011743545532226562, 0.015254974365234375, 0.018766403198242188, 0.02227783203125, 0.025789260864257812, 0.029300689697265625, 0.03281211853027344, 0.03632354736328125, 0.03983497619628906, 0.043346405029296875, 0.04685783386230469, 0.0503692626953125, 0.05388069152832031, 0.057392120361328125, 0.06090354919433594, 0.06441497802734375, 0.06792640686035156, 0.07143783569335938, 0.07494926452636719, 0.078460693359375, 0.08197212219238281, 0.08548355102539062, 0.08899497985839844, 0.09250640869140625, 0.09601783752441406, 0.09952926635742188, 0.10304069519042969, 0.1065521240234375, 0.11006355285644531, 0.11357498168945312, 0.11708641052246094, 0.12059783935546875, 0.12410926818847656, 0.12762069702148438, 0.1311321258544922, 0.1346435546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 7.0, 5.0, 3.0, 2.0, 7.0, 10.0, 13.0, 17.0, 16.0, 30.0, 38.0, 65.0, 146.0, 193.0, 163.0, 91.0, 55.0, 37.0, 20.0, 7.0, 13.0, 13.0, 14.0, 5.0, 5.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.07171630859375, -0.0693807601928711, -0.06704521179199219, -0.06470966339111328, -0.062374114990234375, -0.06003856658935547, -0.05770301818847656, -0.055367469787597656, -0.05303192138671875, -0.050696372985839844, -0.04836082458496094, -0.04602527618408203, -0.043689727783203125, -0.04135417938232422, -0.03901863098144531, -0.036683082580566406, -0.0343475341796875, -0.032011985778808594, -0.029676437377929688, -0.02734088897705078, -0.025005340576171875, -0.02266979217529297, -0.020334243774414062, -0.017998695373535156, -0.01566314697265625, -0.013327598571777344, -0.010992050170898438, -0.008656501770019531, -0.006320953369140625, -0.003985404968261719, -0.0016498565673828125, 0.0006856918334960938, 0.003021240234375, 0.005356788635253906, 0.0076923370361328125, 0.010027885437011719, 0.012363433837890625, 0.014698982238769531, 0.017034530639648438, 0.019370079040527344, 0.02170562744140625, 0.024041175842285156, 0.026376724243164062, 0.02871227264404297, 0.031047821044921875, 0.03338336944580078, 0.03571891784667969, 0.038054466247558594, 0.0403900146484375, 0.042725563049316406, 0.04506111145019531, 0.04739665985107422, 0.049732208251953125, 0.05206775665283203, 0.05440330505371094, 0.056738853454589844, 0.05907440185546875, 0.061409950256347656, 0.06374549865722656, 0.06608104705810547, 0.06841659545898438, 0.07075214385986328, 0.07308769226074219, 0.0754232406616211, 0.0777587890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 11.0, 42.0, 104.0, 167.0, 219.0, 215.0, 131.0, 67.0, 26.0, 5.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9758763313293457, -1.9248700141906738, -1.873863697052002, -1.82285737991333, -1.7718510627746582, -1.7208447456359863, -1.6698384284973145, -1.6188321113586426, -1.5678257942199707, -1.5168194770812988, -1.465813159942627, -1.414806842803955, -1.3638005256652832, -1.3127942085266113, -1.2617878913879395, -1.2107815742492676, -1.1597752571105957, -1.1087689399719238, -1.057762622833252, -1.00675630569458, -0.9557499885559082, -0.9047436714172363, -0.8537373542785645, -0.8027310371398926, -0.7517248392105103, -0.7007185220718384, -0.6497122049331665, -0.5987058877944946, -0.5476995706558228, -0.49669328331947327, -0.4456869661808014, -0.3946806490421295, -0.34367430210113525, -0.2926679849624634, -0.2416616678237915, -0.19065536558628082, -0.13964904844760895, -0.08864274621009827, -0.03763642907142639, 0.013369888067245483, 0.06437620520591736, 0.11538252234458923, 0.1663888394832611, 0.2173951417207718, 0.26840144395828247, 0.31940776109695435, 0.3704140782356262, 0.4214203953742981, 0.47242671251296997, 0.5234330296516418, 0.5744393467903137, 0.6254456639289856, 0.6764519810676575, 0.7274582386016846, 0.7784645557403564, 0.8294708728790283, 0.8804771900177002, 0.9314835071563721, 0.982489824295044, 1.0334961414337158, 1.0845024585723877, 1.1355087757110596, 1.1865150928497314, 1.2375214099884033, 1.2885277271270752]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 6.0, 5.0, 2.0, 11.0, 11.0, 5.0, 7.0, 7.0, 18.0, 15.0, 15.0, 22.0, 22.0, 21.0, 36.0, 41.0, 36.0, 38.0, 34.0, 34.0, 38.0, 45.0, 41.0, 36.0, 23.0, 43.0, 39.0, 37.0, 27.0, 26.0, 29.0, 24.0, 27.0, 30.0, 23.0, 20.0, 17.0, 15.0, 11.0, 11.0, 13.0, 11.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.4881681203842163, -0.47227415442466736, -0.4563801884651184, -0.44048619270324707, -0.4245922267436981, -0.40869826078414917, -0.39280426502227783, -0.3769102990627289, -0.36101633310317993, -0.345122367143631, -0.32922840118408203, -0.3133344054222107, -0.29744043946266174, -0.2815464735031128, -0.26565247774124146, -0.2497585117816925, -0.23386454582214355, -0.2179705798625946, -0.20207659900188446, -0.18618261814117432, -0.17028865218162537, -0.15439468622207642, -0.13850070536136627, -0.12260673195123672, -0.10671275854110718, -0.09081878513097763, -0.07492481172084808, -0.059030838310718536, -0.04313686490058899, -0.027242891490459442, -0.011348918080329895, 0.004545055329799652, 0.0204390287399292, 0.036333002150058746, 0.05222697556018829, 0.06812094897031784, 0.08401492238044739, 0.09990889579057693, 0.11580286920070648, 0.13169685006141663, 0.14759081602096558, 0.16348478198051453, 0.17937876284122467, 0.19527274370193481, 0.21116670966148376, 0.22706067562103271, 0.24295465648174286, 0.258848637342453, 0.27474260330200195, 0.2906365692615509, 0.30653053522109985, 0.3224245309829712, 0.33831849694252014, 0.3542124629020691, 0.37010645866394043, 0.3860004246234894, 0.40189439058303833, 0.4177883565425873, 0.43368232250213623, 0.44957631826400757, 0.4654702842235565, 0.48136425018310547, 0.4972582459449768, 0.5131521821022034, 0.5290461778640747]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 11.0, 5.0, 15.0, 25.0, 43.0, 48.0, 77.0, 94.0, 150.0, 334.0, 540.0, 1260.0, 2668.0, 6349.0, 18458.0, 75574.0, 2718853.0, 1274535.0, 67522.0, 16782.0, 5928.0, 2470.0, 1155.0, 571.0, 303.0, 155.0, 117.0, 57.0, 58.0, 27.0, 27.0, 16.0, 14.0, 8.0, 6.0, 7.0, 3.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17581939697265625, -0.1704864501953125, -0.16515350341796875, -0.159820556640625, -0.15448760986328125, -0.1491546630859375, -0.14382171630859375, -0.13848876953125, -0.13315582275390625, -0.1278228759765625, -0.12248992919921875, -0.117156982421875, -0.11182403564453125, -0.1064910888671875, -0.10115814208984375, -0.0958251953125, -0.09049224853515625, -0.0851593017578125, -0.07982635498046875, -0.074493408203125, -0.06916046142578125, -0.0638275146484375, -0.05849456787109375, -0.05316162109375, -0.04782867431640625, -0.0424957275390625, -0.03716278076171875, -0.031829833984375, -0.02649688720703125, -0.0211639404296875, -0.01583099365234375, -0.010498046875, -0.00516510009765625, 0.0001678466796875, 0.00550079345703125, 0.010833740234375, 0.01616668701171875, 0.0214996337890625, 0.02683258056640625, 0.03216552734375, 0.03749847412109375, 0.0428314208984375, 0.04816436767578125, 0.053497314453125, 0.05883026123046875, 0.0641632080078125, 0.06949615478515625, 0.0748291015625, 0.08016204833984375, 0.0854949951171875, 0.09082794189453125, 0.096160888671875, 0.10149383544921875, 0.1068267822265625, 0.11215972900390625, 0.11749267578125, 0.12282562255859375, 0.1281585693359375, 0.13349151611328125, 0.138824462890625, 0.14415740966796875, 0.1494903564453125, 0.15482330322265625, 0.16015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 4.0, 5.0, 3.0, 3.0, 9.0, 11.0, 10.0, 19.0, 21.0, 21.0, 18.0, 24.0, 32.0, 42.0, 40.0, 44.0, 38.0, 41.0, 44.0, 37.0, 55.0, 58.0, 46.0, 51.0, 48.0, 42.0, 37.0, 36.0, 26.0, 28.0, 14.0, 18.0, 17.0, 18.0, 7.0, 9.0, 9.0, 4.0, 0.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0295867919921875, -0.028638839721679688, -0.027690887451171875, -0.026742935180664062, -0.02579498291015625, -0.024847030639648438, -0.023899078369140625, -0.022951126098632812, -0.022003173828125, -0.021055221557617188, -0.020107269287109375, -0.019159317016601562, -0.01821136474609375, -0.017263412475585938, -0.016315460205078125, -0.015367507934570312, -0.0144195556640625, -0.013471603393554688, -0.012523651123046875, -0.011575698852539062, -0.01062774658203125, -0.009679794311523438, -0.008731842041015625, -0.0077838897705078125, -0.0068359375, -0.0058879852294921875, -0.004940032958984375, -0.0039920806884765625, -0.00304412841796875, -0.0020961761474609375, -0.001148223876953125, -0.0002002716064453125, 0.0007476806640625, 0.0016956329345703125, 0.002643585205078125, 0.0035915374755859375, 0.00453948974609375, 0.0054874420166015625, 0.006435394287109375, 0.0073833465576171875, 0.008331298828125, 0.009279251098632812, 0.010227203369140625, 0.011175155639648438, 0.01212310791015625, 0.013071060180664062, 0.014019012451171875, 0.014966964721679688, 0.0159149169921875, 0.016862869262695312, 0.017810821533203125, 0.018758773803710938, 0.01970672607421875, 0.020654678344726562, 0.021602630615234375, 0.022550582885742188, 0.02349853515625, 0.024446487426757812, 0.025394439697265625, 0.026342391967773438, 0.02729034423828125, 0.028238296508789062, 0.029186248779296875, 0.030134201049804688, 0.0310821533203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 12.0, 14.0, 19.0, 35.0, 42.0, 72.0, 123.0, 205.0, 395.0, 890.0, 2873.0, 18266.0, 703775.0, 3433722.0, 28182.0, 3659.0, 1028.0, 400.0, 208.0, 113.0, 83.0, 54.0, 34.0, 20.0, 18.0, 14.0, 5.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.4900627136230469, -0.47719573974609375, -0.4643287658691406, -0.4514617919921875, -0.4385948181152344, -0.42572784423828125, -0.4128608703613281, -0.399993896484375, -0.3871269226074219, -0.37425994873046875, -0.3613929748535156, -0.3485260009765625, -0.3356590270996094, -0.32279205322265625, -0.3099250793457031, -0.29705810546875, -0.2841911315917969, -0.27132415771484375, -0.2584571838378906, -0.2455902099609375, -0.23272323608398438, -0.21985626220703125, -0.20698928833007812, -0.194122314453125, -0.18125534057617188, -0.16838836669921875, -0.15552139282226562, -0.1426544189453125, -0.12978744506835938, -0.11692047119140625, -0.10405349731445312, -0.0911865234375, -0.07831954956054688, -0.06545257568359375, -0.052585601806640625, -0.0397186279296875, -0.026851654052734375, -0.01398468017578125, -0.001117706298828125, 0.011749267578125, 0.024616241455078125, 0.03748321533203125, 0.050350189208984375, 0.0632171630859375, 0.07608413696289062, 0.08895111083984375, 0.10181808471679688, 0.11468505859375, 0.12755203247070312, 0.14041900634765625, 0.15328598022460938, 0.1661529541015625, 0.17901992797851562, 0.19188690185546875, 0.20475387573242188, 0.217620849609375, 0.23048782348632812, 0.24335479736328125, 0.2562217712402344, 0.2690887451171875, 0.2819557189941406, 0.29482269287109375, 0.3076896667480469, 0.320556640625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 11.0, 13.0, 25.0, 60.0, 104.0, 319.0, 1926.0, 1123.0, 244.0, 112.0, 44.0, 36.0, 15.0, 11.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1856689453125, -0.1814422607421875, -0.177215576171875, -0.1729888916015625, -0.16876220703125, -0.1645355224609375, -0.160308837890625, -0.1560821533203125, -0.15185546875, -0.1476287841796875, -0.143402099609375, -0.1391754150390625, -0.13494873046875, -0.1307220458984375, -0.126495361328125, -0.1222686767578125, -0.1180419921875, -0.1138153076171875, -0.109588623046875, -0.1053619384765625, -0.10113525390625, -0.0969085693359375, -0.092681884765625, -0.0884552001953125, -0.084228515625, -0.0800018310546875, -0.075775146484375, -0.0715484619140625, -0.06732177734375, -0.0630950927734375, -0.058868408203125, -0.0546417236328125, -0.0504150390625, -0.0461883544921875, -0.041961669921875, -0.0377349853515625, -0.03350830078125, -0.0292816162109375, -0.025054931640625, -0.0208282470703125, -0.0166015625, -0.0123748779296875, -0.008148193359375, -0.0039215087890625, 0.00030517578125, 0.0045318603515625, 0.008758544921875, 0.0129852294921875, 0.0172119140625, 0.0214385986328125, 0.025665283203125, 0.0298919677734375, 0.03411865234375, 0.0383453369140625, 0.042572021484375, 0.0467987060546875, 0.051025390625, 0.0552520751953125, 0.059478759765625, 0.0637054443359375, 0.06793212890625, 0.0721588134765625, 0.076385498046875, 0.0806121826171875, 0.0848388671875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 9.0, 3.0, 7.0, 12.0, 28.0, 59.0, 168.0, 333.0, 262.0, 101.0, 22.0, 7.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.1944665908813477, -2.155172109603882, -2.115877628326416, -2.07658314704895, -2.0372886657714844, -1.9979941844940186, -1.9586997032165527, -1.919405221939087, -1.880110740661621, -1.8408162593841553, -1.8015217781066895, -1.7622272968292236, -1.7229328155517578, -1.683638334274292, -1.6443438529968262, -1.6050493717193604, -1.565755009651184, -1.5264605283737183, -1.4871660470962524, -1.4478715658187866, -1.4085770845413208, -1.369282603263855, -1.3299881219863892, -1.290693759918213, -1.251399278640747, -1.2121047973632812, -1.1728103160858154, -1.1335158348083496, -1.0942213535308838, -1.054926872253418, -1.0156323909759521, -0.9763379693031311, -0.9370435476303101, -0.8977490663528442, -0.8584545850753784, -0.8191601037979126, -0.7798656225204468, -0.740571141242981, -0.7012767195701599, -0.6619822382926941, -0.6226877570152283, -0.5833932757377625, -0.5440987944602966, -0.5048043131828308, -0.4655098617076874, -0.42621538043022156, -0.3869209289550781, -0.3476264476776123, -0.3083319664001465, -0.26903748512268066, -0.22974301874637604, -0.1904485523700714, -0.1511540710926056, -0.11185958981513977, -0.07256512343883514, -0.03327065706253052, 0.006023824214935303, 0.045318298041820526, 0.08461277186870575, 0.12390724569559097, 0.1632017195224762, 0.20249620079994202, 0.24179066717624664, 0.28108513355255127, 0.3203796148300171]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 4.0, 9.0, 7.0, 16.0, 16.0, 16.0, 24.0, 23.0, 18.0, 44.0, 35.0, 36.0, 41.0, 36.0, 48.0, 42.0, 50.0, 40.0, 50.0, 57.0, 39.0, 41.0, 39.0, 44.0, 24.0, 38.0, 21.0, 21.0, 28.0, 15.0, 19.0, 14.0, 12.0, 7.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.3971271514892578, -0.3860683739185333, -0.37500959634780884, -0.36395084857940674, -0.35289207100868225, -0.34183329343795776, -0.33077454566955566, -0.3197157680988312, -0.3086569905281067, -0.2975982129573822, -0.2865394353866577, -0.2754806876182556, -0.26442191004753113, -0.25336313247680664, -0.24230436980724335, -0.23124560713768005, -0.22018682956695557, -0.20912805199623108, -0.19806928932666779, -0.1870105266571045, -0.17595174908638, -0.16489297151565552, -0.15383420884609222, -0.14277544617652893, -0.13171666860580444, -0.12065789848566055, -0.10959912836551666, -0.09854035824537277, -0.08748158812522888, -0.07642281800508499, -0.0653640478849411, -0.05430527776479721, -0.04324650764465332, -0.03218773752450943, -0.02112896740436554, -0.01007019728422165, 0.0009885728359222412, 0.012047342956066132, 0.023106113076210022, 0.03416488319635391, 0.0452236533164978, 0.05628242343664169, 0.06734119355678558, 0.07839996367692947, 0.08945873379707336, 0.10051750391721725, 0.11157627403736115, 0.12263504415750504, 0.13369381427764893, 0.1447525918483734, 0.1558113545179367, 0.1668701171875, 0.1779288947582245, 0.18898767232894897, 0.20004643499851227, 0.21110519766807556, 0.22216397523880005, 0.23322275280952454, 0.24428151547908783, 0.2553402781486511, 0.2663990557193756, 0.2774578332901001, 0.2885165810585022, 0.2995753586292267, 0.31063413619995117]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 1.0, 8.0, 3.0, 5.0, 9.0, 11.0, 19.0, 22.0, 23.0, 37.0, 43.0, 67.0, 92.0, 135.0, 223.0, 355.0, 542.0, 995.0, 1666.0, 3079.0, 5930.0, 11402.0, 23915.0, 56239.0, 180791.0, 477148.0, 180985.0, 56369.0, 23867.0, 11454.0, 5783.0, 3050.0, 1742.0, 934.0, 563.0, 344.0, 216.0, 138.0, 88.0, 61.0, 48.0, 41.0, 21.0, 22.0, 14.0, 11.0, 8.0, 9.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.10113525390625, -0.0980234146118164, -0.09491157531738281, -0.09179973602294922, -0.08868789672851562, -0.08557605743408203, -0.08246421813964844, -0.07935237884521484, -0.07624053955078125, -0.07312870025634766, -0.07001686096191406, -0.06690502166748047, -0.06379318237304688, -0.06068134307861328, -0.05756950378417969, -0.054457664489746094, -0.0513458251953125, -0.048233985900878906, -0.04512214660644531, -0.04201030731201172, -0.038898468017578125, -0.03578662872314453, -0.03267478942871094, -0.029562950134277344, -0.02645111083984375, -0.023339271545410156, -0.020227432250976562, -0.01711559295654297, -0.014003753662109375, -0.010891914367675781, -0.0077800750732421875, -0.004668235778808594, -0.001556396484375, 0.0015554428100585938, 0.0046672821044921875, 0.007779121398925781, 0.010890960693359375, 0.014002799987792969, 0.017114639282226562, 0.020226478576660156, 0.02333831787109375, 0.026450157165527344, 0.029561996459960938, 0.03267383575439453, 0.035785675048828125, 0.03889751434326172, 0.04200935363769531, 0.045121192932128906, 0.0482330322265625, 0.051344871520996094, 0.05445671081542969, 0.05756855010986328, 0.060680389404296875, 0.06379222869873047, 0.06690406799316406, 0.07001590728759766, 0.07312774658203125, 0.07623958587646484, 0.07935142517089844, 0.08246326446533203, 0.08557510375976562, 0.08868694305419922, 0.09179878234863281, 0.0949106216430664, 0.0980224609375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 2.0, 9.0, 5.0, 14.0, 10.0, 11.0, 15.0, 14.0, 15.0, 19.0, 30.0, 27.0, 27.0, 29.0, 30.0, 34.0, 28.0, 35.0, 30.0, 43.0, 36.0, 46.0, 36.0, 46.0, 47.0, 43.0, 37.0, 31.0, 25.0, 27.0, 24.0, 27.0, 20.0, 16.0, 18.0, 15.0, 14.0, 10.0, 12.0, 8.0, 7.0, 6.0, 4.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.02996826171875, -0.029040813446044922, -0.028113365173339844, -0.027185916900634766, -0.026258468627929688, -0.02533102035522461, -0.02440357208251953, -0.023476123809814453, -0.022548675537109375, -0.021621227264404297, -0.02069377899169922, -0.01976633071899414, -0.018838882446289062, -0.017911434173583984, -0.016983985900878906, -0.016056537628173828, -0.01512908935546875, -0.014201641082763672, -0.013274192810058594, -0.012346744537353516, -0.011419296264648438, -0.01049184799194336, -0.009564399719238281, -0.008636951446533203, -0.007709503173828125, -0.006782054901123047, -0.005854606628417969, -0.004927158355712891, -0.0039997100830078125, -0.0030722618103027344, -0.0021448135375976562, -0.0012173652648925781, -0.0002899169921875, 0.0006375312805175781, 0.0015649795532226562, 0.0024924278259277344, 0.0034198760986328125, 0.004347324371337891, 0.005274772644042969, 0.006202220916748047, 0.007129669189453125, 0.008057117462158203, 0.008984565734863281, 0.00991201400756836, 0.010839462280273438, 0.011766910552978516, 0.012694358825683594, 0.013621807098388672, 0.01454925537109375, 0.015476703643798828, 0.016404151916503906, 0.017331600189208984, 0.018259048461914062, 0.01918649673461914, 0.02011394500732422, 0.021041393280029297, 0.021968841552734375, 0.022896289825439453, 0.02382373809814453, 0.02475118637084961, 0.025678634643554688, 0.026606082916259766, 0.027533531188964844, 0.028460979461669922, 0.029388427734375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 10.0, 7.0, 13.0, 19.0, 15.0, 17.0, 25.0, 41.0, 66.0, 88.0, 182.0, 262.0, 449.0, 901.0, 1929.0, 5260.0, 17451.0, 78168.0, 807341.0, 104741.0, 20841.0, 6043.0, 2334.0, 1056.0, 489.0, 313.0, 143.0, 111.0, 60.0, 46.0, 36.0, 29.0, 11.0, 10.0, 11.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.2418212890625, -0.2346172332763672, -0.22741317749023438, -0.22020912170410156, -0.21300506591796875, -0.20580101013183594, -0.19859695434570312, -0.1913928985595703, -0.1841888427734375, -0.1769847869873047, -0.16978073120117188, -0.16257667541503906, -0.15537261962890625, -0.14816856384277344, -0.14096450805664062, -0.1337604522705078, -0.126556396484375, -0.11935234069824219, -0.11214828491210938, -0.10494422912597656, -0.09774017333984375, -0.09053611755371094, -0.08333206176757812, -0.07612800598144531, -0.0689239501953125, -0.06171989440917969, -0.054515838623046875, -0.04731178283691406, -0.04010772705078125, -0.03290367126464844, -0.025699615478515625, -0.018495559692382812, -0.01129150390625, -0.0040874481201171875, 0.003116607666015625, 0.010320663452148438, 0.01752471923828125, 0.024728775024414062, 0.031932830810546875, 0.03913688659667969, 0.0463409423828125, 0.05354499816894531, 0.060749053955078125, 0.06795310974121094, 0.07515716552734375, 0.08236122131347656, 0.08956527709960938, 0.09676933288574219, 0.103973388671875, 0.11117744445800781, 0.11838150024414062, 0.12558555603027344, 0.13278961181640625, 0.13999366760253906, 0.14719772338867188, 0.1544017791748047, 0.1616058349609375, 0.1688098907470703, 0.17601394653320312, 0.18321800231933594, 0.19042205810546875, 0.19762611389160156, 0.20483016967773438, 0.2120342254638672, 0.21923828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 2.0, 0.0, 3.0, 8.0, 6.0, 7.0, 5.0, 10.0, 15.0, 33.0, 44.0, 66.0, 48.0, 67.0, 78.0, 82.0, 90.0, 76.0, 81.0, 75.0, 55.0, 36.0, 39.0, 14.0, 13.0, 9.0, 7.0, 7.0, 9.0, 6.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.271240234375, -0.26287841796875, -0.2545166015625, -0.24615478515625, -0.23779296875, -0.22943115234375, -0.2210693359375, -0.21270751953125, -0.204345703125, -0.19598388671875, -0.1876220703125, -0.17926025390625, -0.1708984375, -0.16253662109375, -0.1541748046875, -0.14581298828125, -0.137451171875, -0.12908935546875, -0.1207275390625, -0.11236572265625, -0.10400390625, -0.09564208984375, -0.0872802734375, -0.07891845703125, -0.070556640625, -0.06219482421875, -0.0538330078125, -0.04547119140625, -0.037109375, -0.02874755859375, -0.0203857421875, -0.01202392578125, -0.003662109375, 0.00469970703125, 0.0130615234375, 0.02142333984375, 0.02978515625, 0.03814697265625, 0.0465087890625, 0.05487060546875, 0.063232421875, 0.07159423828125, 0.0799560546875, 0.08831787109375, 0.0966796875, 0.10504150390625, 0.1134033203125, 0.12176513671875, 0.130126953125, 0.13848876953125, 0.1468505859375, 0.15521240234375, 0.16357421875, 0.17193603515625, 0.1802978515625, 0.18865966796875, 0.197021484375, 0.20538330078125, 0.2137451171875, 0.22210693359375, 0.23046875, 0.23883056640625, 0.2471923828125, 0.25555419921875, 0.263916015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 7.0, 7.0, 6.0, 16.0, 20.0, 35.0, 33.0, 61.0, 108.0, 172.0, 249.0, 477.0, 771.0, 1286.0, 2311.0, 4561.0, 10911.0, 34098.0, 262206.0, 653270.0, 51444.0, 14343.0, 5643.0, 2770.0, 1489.0, 884.0, 504.0, 313.0, 213.0, 120.0, 74.0, 40.0, 38.0, 23.0, 14.0, 8.0, 11.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.10986328125, -0.10664558410644531, -0.10342788696289062, -0.10021018981933594, -0.09699249267578125, -0.09377479553222656, -0.09055709838867188, -0.08733940124511719, -0.0841217041015625, -0.08090400695800781, -0.07768630981445312, -0.07446861267089844, -0.07125091552734375, -0.06803321838378906, -0.06481552124023438, -0.06159782409667969, -0.058380126953125, -0.05516242980957031, -0.051944732666015625, -0.04872703552246094, -0.04550933837890625, -0.04229164123535156, -0.039073944091796875, -0.03585624694824219, -0.0326385498046875, -0.029420852661132812, -0.026203155517578125, -0.022985458374023438, -0.01976776123046875, -0.016550064086914062, -0.013332366943359375, -0.010114669799804688, -0.00689697265625, -0.0036792755126953125, -0.000461578369140625, 0.0027561187744140625, 0.00597381591796875, 0.009191513061523438, 0.012409210205078125, 0.015626907348632812, 0.0188446044921875, 0.022062301635742188, 0.025279998779296875, 0.028497695922851562, 0.03171539306640625, 0.03493309020996094, 0.038150787353515625, 0.04136848449707031, 0.044586181640625, 0.04780387878417969, 0.051021575927734375, 0.05423927307128906, 0.05745697021484375, 0.06067466735839844, 0.06389236450195312, 0.06711006164550781, 0.0703277587890625, 0.07354545593261719, 0.07676315307617188, 0.07998085021972656, 0.08319854736328125, 0.08641624450683594, 0.08963394165039062, 0.09285163879394531, 0.0960693359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 6.0, 6.0, 2.0, 11.0, 19.0, 19.0, 32.0, 24.0, 47.0, 47.0, 51.0, 83.0, 81.0, 73.0, 90.0, 82.0, 61.0, 56.0, 51.0, 43.0, 28.0, 20.0, 21.0, 11.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.252527236938477e-05, -6.0549937188625336e-05, -5.8574602007865906e-05, -5.6599266827106476e-05, -5.4623931646347046e-05, -5.2648596465587616e-05, -5.0673261284828186e-05, -4.8697926104068756e-05, -4.6722590923309326e-05, -4.4747255742549896e-05, -4.2771920561790466e-05, -4.0796585381031036e-05, -3.8821250200271606e-05, -3.6845915019512177e-05, -3.4870579838752747e-05, -3.289524465799332e-05, -3.091990947723389e-05, -2.8944574296474457e-05, -2.6969239115715027e-05, -2.4993903934955597e-05, -2.3018568754196167e-05, -2.1043233573436737e-05, -1.9067898392677307e-05, -1.7092563211917877e-05, -1.5117228031158447e-05, -1.3141892850399017e-05, -1.1166557669639587e-05, -9.191222488880157e-06, -7.2158873081207275e-06, -5.240552127361298e-06, -3.2652169466018677e-06, -1.2898817658424377e-06, 6.854534149169922e-07, 2.660788595676422e-06, 4.636123776435852e-06, 6.611458957195282e-06, 8.586794137954712e-06, 1.0562129318714142e-05, 1.2537464499473572e-05, 1.4512799680233002e-05, 1.648813486099243e-05, 1.846347004175186e-05, 2.043880522251129e-05, 2.241414040327072e-05, 2.438947558403015e-05, 2.636481076478958e-05, 2.834014594554901e-05, 3.031548112630844e-05, 3.229081630706787e-05, 3.42661514878273e-05, 3.624148666858673e-05, 3.821682184934616e-05, 4.019215703010559e-05, 4.216749221086502e-05, 4.414282739162445e-05, 4.611816257238388e-05, 4.809349775314331e-05, 5.006883293390274e-05, 5.204416811466217e-05, 5.40195032954216e-05, 5.599483847618103e-05, 5.797017365694046e-05, 5.994550883769989e-05, 6.192084401845932e-05, 6.389617919921875e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 4.0, 10.0, 11.0, 19.0, 18.0, 24.0, 37.0, 51.0, 82.0, 154.0, 209.0, 404.0, 711.0, 1455.0, 2973.0, 7242.0, 22237.0, 112134.0, 802762.0, 70029.0, 16652.0, 5965.0, 2582.0, 1208.0, 635.0, 336.0, 180.0, 120.0, 86.0, 58.0, 44.0, 33.0, 22.0, 12.0, 5.0, 5.0, 10.0, 2.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.1033935546875, -0.10009956359863281, -0.09680557250976562, -0.09351158142089844, -0.09021759033203125, -0.08692359924316406, -0.08362960815429688, -0.08033561706542969, -0.0770416259765625, -0.07374763488769531, -0.07045364379882812, -0.06715965270996094, -0.06386566162109375, -0.06057167053222656, -0.057277679443359375, -0.05398368835449219, -0.050689697265625, -0.04739570617675781, -0.044101715087890625, -0.04080772399902344, -0.03751373291015625, -0.03421974182128906, -0.030925750732421875, -0.027631759643554688, -0.0243377685546875, -0.021043777465820312, -0.017749786376953125, -0.014455795288085938, -0.01116180419921875, -0.007867813110351562, -0.004573822021484375, -0.0012798309326171875, 0.00201416015625, 0.0053081512451171875, 0.008602142333984375, 0.011896133422851562, 0.01519012451171875, 0.018484115600585938, 0.021778106689453125, 0.025072097778320312, 0.0283660888671875, 0.03166007995605469, 0.034954071044921875, 0.03824806213378906, 0.04154205322265625, 0.04483604431152344, 0.048130035400390625, 0.05142402648925781, 0.054718017578125, 0.05801200866699219, 0.061305999755859375, 0.06459999084472656, 0.06789398193359375, 0.07118797302246094, 0.07448196411132812, 0.07777595520019531, 0.0810699462890625, 0.08436393737792969, 0.08765792846679688, 0.09095191955566406, 0.09424591064453125, 0.09753990173339844, 0.10083389282226562, 0.10412788391113281, 0.107421875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 7.0, 2.0, 6.0, 5.0, 3.0, 6.0, 7.0, 7.0, 9.0, 20.0, 15.0, 22.0, 48.0, 106.0, 209.0, 224.0, 123.0, 59.0, 31.0, 14.0, 13.0, 9.0, 13.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.096923828125, -0.09407806396484375, -0.0912322998046875, -0.08838653564453125, -0.085540771484375, -0.08269500732421875, -0.0798492431640625, -0.07700347900390625, -0.07415771484375, -0.07131195068359375, -0.0684661865234375, -0.06562042236328125, -0.062774658203125, -0.05992889404296875, -0.0570831298828125, -0.05423736572265625, -0.0513916015625, -0.04854583740234375, -0.0457000732421875, -0.04285430908203125, -0.040008544921875, -0.03716278076171875, -0.0343170166015625, -0.03147125244140625, -0.02862548828125, -0.02577972412109375, -0.0229339599609375, -0.02008819580078125, -0.017242431640625, -0.01439666748046875, -0.0115509033203125, -0.00870513916015625, -0.005859375, -0.00301361083984375, -0.0001678466796875, 0.00267791748046875, 0.005523681640625, 0.00836944580078125, 0.0112152099609375, 0.01406097412109375, 0.01690673828125, 0.01975250244140625, 0.0225982666015625, 0.02544403076171875, 0.028289794921875, 0.03113555908203125, 0.0339813232421875, 0.03682708740234375, 0.0396728515625, 0.04251861572265625, 0.0453643798828125, 0.04821014404296875, 0.051055908203125, 0.05390167236328125, 0.0567474365234375, 0.05959320068359375, 0.06243896484375, 0.06528472900390625, 0.0681304931640625, 0.07097625732421875, 0.073822021484375, 0.07666778564453125, 0.0795135498046875, 0.08235931396484375, 0.085205078125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 29.0, 114.0, 293.0, 311.0, 163.0, 59.0, 16.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9813679456710815, -0.9007859230041504, -0.8202039003372192, -0.7396219372749329, -0.6590399146080017, -0.5784578919410706, -0.4978758990764618, -0.417293906211853, -0.3367118835449219, -0.2561298608779907, -0.17554786801338196, -0.094965860247612, -0.014383852481842041, 0.06619817018508911, 0.14678016304969788, 0.22736215591430664, 0.3079441785812378, 0.38852620124816895, 0.4691081941127777, 0.5496901869773865, 0.6302722096443176, 0.7108542323112488, 0.7914361953735352, 0.8720182180404663, 0.9526002407073975, 1.0331822633743286, 1.1137642860412598, 1.194346308708191, 1.274928331375122, 1.3555102348327637, 1.4360922574996948, 1.516674280166626, 1.5972561836242676, 1.6778382062911987, 1.7584202289581299, 1.839002251625061, 1.9195842742919922, 2.000166177749634, 2.0807483196258545, 2.161330223083496, 2.241912364959717, 2.3224942684173584, 2.403076410293579, 2.4836583137512207, 2.5642404556274414, 2.644822359085083, 2.7254045009613037, 2.8059864044189453, 2.886568307876587, 2.9671502113342285, 3.047732353210449, 3.128314256668091, 3.2088963985443115, 3.289478302001953, 3.370060443878174, 3.4506423473358154, 3.531224250793457, 3.6118061542510986, 3.6923882961273193, 3.772970199584961, 3.8535523414611816, 3.9341342449188232, 4.014716148376465, 4.0952982902526855, 4.175880432128906]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 2.0, 6.0, 12.0, 16.0, 14.0, 7.0, 22.0, 13.0, 15.0, 25.0, 20.0, 19.0, 24.0, 18.0, 22.0, 32.0, 29.0, 41.0, 36.0, 42.0, 45.0, 27.0, 38.0, 40.0, 48.0, 37.0, 41.0, 30.0, 34.0, 24.0, 15.0, 19.0, 26.0, 30.0, 20.0, 12.0, 19.0, 10.0, 17.0, 9.0, 12.0, 9.0, 5.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6211733818054199, -0.6012370586395264, -0.5813007354736328, -0.5613644123077393, -0.5414280891418457, -0.5214917659759521, -0.5015554428100586, -0.4816191494464874, -0.46168282628059387, -0.4417465031147003, -0.42181017994880676, -0.4018738567829132, -0.38193756341934204, -0.3620012402534485, -0.34206491708755493, -0.3221285939216614, -0.3021922707557678, -0.28225594758987427, -0.2623196244239807, -0.24238331615924835, -0.2224469929933548, -0.20251066982746124, -0.18257436156272888, -0.16263803839683533, -0.14270171523094177, -0.12276539206504822, -0.10282907634973526, -0.0828927606344223, -0.06295643746852875, -0.04302011430263519, -0.023083798587322235, -0.0031474828720092773, 0.016788840293884277, 0.036725159734487534, 0.05666147917509079, 0.07659779489040375, 0.0965341180562973, 0.11647044122219086, 0.13640674948692322, 0.15634307265281677, 0.17627939581871033, 0.19621571898460388, 0.21615204215049744, 0.2360883504152298, 0.25602465867996216, 0.2759609818458557, 0.29589730501174927, 0.3158336281776428, 0.3357699513435364, 0.35570627450942993, 0.3756425976753235, 0.39557892084121704, 0.4155152440071106, 0.43545156717300415, 0.4553878605365753, 0.47532418370246887, 0.4952605068683624, 0.5151968002319336, 0.5351331233978271, 0.5550694465637207, 0.5750057697296143, 0.5949420928955078, 0.6148784160614014, 0.6348147392272949, 0.6547510623931885]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 8.0, 5.0, 10.0, 25.0, 28.0, 52.0, 73.0, 122.0, 180.0, 341.0, 594.0, 1037.0, 1771.0, 3311.0, 6697.0, 15294.0, 45056.0, 274311.0, 3626938.0, 160182.0, 33887.0, 12305.0, 5557.0, 2807.0, 1516.0, 892.0, 544.0, 276.0, 174.0, 105.0, 70.0, 51.0, 15.0, 19.0, 10.0, 10.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.25537109375, -0.24920082092285156, -0.24303054809570312, -0.2368602752685547, -0.23069000244140625, -0.2245197296142578, -0.21834945678710938, -0.21217918395996094, -0.2060089111328125, -0.19983863830566406, -0.19366836547851562, -0.1874980926513672, -0.18132781982421875, -0.1751575469970703, -0.16898727416992188, -0.16281700134277344, -0.156646728515625, -0.15047645568847656, -0.14430618286132812, -0.1381359100341797, -0.13196563720703125, -0.1257953643798828, -0.11962509155273438, -0.11345481872558594, -0.1072845458984375, -0.10111427307128906, -0.09494400024414062, -0.08877372741699219, -0.08260345458984375, -0.07643318176269531, -0.07026290893554688, -0.06409263610839844, -0.05792236328125, -0.05175209045410156, -0.045581817626953125, -0.03941154479980469, -0.03324127197265625, -0.027070999145507812, -0.020900726318359375, -0.014730453491210938, -0.0085601806640625, -0.0023899078369140625, 0.003780364990234375, 0.009950637817382812, 0.01612091064453125, 0.022291183471679688, 0.028461456298828125, 0.03463172912597656, 0.040802001953125, 0.04697227478027344, 0.053142547607421875, 0.05931282043457031, 0.06548309326171875, 0.07165336608886719, 0.07782363891601562, 0.08399391174316406, 0.0901641845703125, 0.09633445739746094, 0.10250473022460938, 0.10867500305175781, 0.11484527587890625, 0.12101554870605469, 0.12718582153320312, 0.13335609436035156, 0.1395263671875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 15.0, 12.0, 17.0, 19.0, 21.0, 24.0, 17.0, 24.0, 19.0, 32.0, 31.0, 33.0, 34.0, 38.0, 42.0, 37.0, 43.0, 34.0, 38.0, 42.0, 43.0, 35.0, 29.0, 35.0, 32.0, 24.0, 29.0, 24.0, 28.0, 16.0, 17.0, 22.0, 14.0, 8.0, 15.0, 7.0, 6.0, 2.0, 1.0, 2.0, 6.0, 1.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.032196044921875, -0.03123307228088379, -0.030270099639892578, -0.029307126998901367, -0.028344154357910156, -0.027381181716918945, -0.026418209075927734, -0.025455236434936523, -0.024492263793945312, -0.0235292911529541, -0.02256631851196289, -0.02160334587097168, -0.02064037322998047, -0.019677400588989258, -0.018714427947998047, -0.017751455307006836, -0.016788482666015625, -0.015825510025024414, -0.014862537384033203, -0.013899564743041992, -0.012936592102050781, -0.01197361946105957, -0.01101064682006836, -0.010047674179077148, -0.009084701538085938, -0.008121728897094727, -0.007158756256103516, -0.006195783615112305, -0.005232810974121094, -0.004269838333129883, -0.003306865692138672, -0.002343893051147461, -0.00138092041015625, -0.00041794776916503906, 0.0005450248718261719, 0.0015079975128173828, 0.0024709701538085938, 0.0034339427947998047, 0.004396915435791016, 0.0053598880767822266, 0.0063228607177734375, 0.0072858333587646484, 0.00824880599975586, 0.00921177864074707, 0.010174751281738281, 0.011137723922729492, 0.012100696563720703, 0.013063669204711914, 0.014026641845703125, 0.014989614486694336, 0.015952587127685547, 0.016915559768676758, 0.01787853240966797, 0.01884150505065918, 0.01980447769165039, 0.0207674503326416, 0.021730422973632812, 0.022693395614624023, 0.023656368255615234, 0.024619340896606445, 0.025582313537597656, 0.026545286178588867, 0.027508258819580078, 0.02847123146057129, 0.0294342041015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 12.0, 7.0, 31.0, 40.0, 32.0, 54.0, 102.0, 255.0, 727.0, 2937.0, 35754.0, 4089469.0, 59573.0, 3796.0, 832.0, 263.0, 125.0, 82.0, 50.0, 41.0, 26.0, 21.0, 9.0, 14.0, 0.0, 11.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6267013549804688, -0.5976409912109375, -0.5685806274414062, -0.539520263671875, -0.5104598999023438, -0.4813995361328125, -0.45233917236328125, -0.42327880859375, -0.39421844482421875, -0.3651580810546875, -0.33609771728515625, -0.307037353515625, -0.27797698974609375, -0.2489166259765625, -0.21985626220703125, -0.1907958984375, -0.16173553466796875, -0.1326751708984375, -0.10361480712890625, -0.074554443359375, -0.04549407958984375, -0.0164337158203125, 0.01262664794921875, 0.04168701171875, 0.07074737548828125, 0.0998077392578125, 0.12886810302734375, 0.157928466796875, 0.18698883056640625, 0.2160491943359375, 0.24510955810546875, 0.274169921875, 0.30323028564453125, 0.3322906494140625, 0.36135101318359375, 0.390411376953125, 0.41947174072265625, 0.4485321044921875, 0.47759246826171875, 0.50665283203125, 0.5357131958007812, 0.5647735595703125, 0.5938339233398438, 0.622894287109375, 0.6519546508789062, 0.6810150146484375, 0.7100753784179688, 0.7391357421875, 0.7681961059570312, 0.7972564697265625, 0.8263168334960938, 0.855377197265625, 0.8844375610351562, 0.9134979248046875, 0.9425582885742188, 0.97161865234375, 1.0006790161132812, 1.0297393798828125, 1.0587997436523438, 1.087860107421875, 1.1169204711914062, 1.1459808349609375, 1.1750411987304688, 1.2041015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 12.0, 24.0, 35.0, 97.0, 352.0, 2965.0, 394.0, 100.0, 40.0, 19.0, 19.0, 6.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.1458415985107422, -0.13702011108398438, -0.12819862365722656, -0.11937713623046875, -0.11055564880371094, -0.10173416137695312, -0.09291267395019531, -0.0840911865234375, -0.07526969909667969, -0.06644821166992188, -0.05762672424316406, -0.04880523681640625, -0.03998374938964844, -0.031162261962890625, -0.022340774536132812, -0.013519287109375, -0.0046977996826171875, 0.004123687744140625, 0.012945175170898438, 0.02176666259765625, 0.030588150024414062, 0.039409637451171875, 0.04823112487792969, 0.0570526123046875, 0.06587409973144531, 0.07469558715820312, 0.08351707458496094, 0.09233856201171875, 0.10116004943847656, 0.10998153686523438, 0.11880302429199219, 0.12762451171875, 0.1364459991455078, 0.14526748657226562, 0.15408897399902344, 0.16291046142578125, 0.17173194885253906, 0.18055343627929688, 0.1893749237060547, 0.1981964111328125, 0.2070178985595703, 0.21583938598632812, 0.22466087341308594, 0.23348236083984375, 0.24230384826660156, 0.2511253356933594, 0.2599468231201172, 0.268768310546875, 0.2775897979736328, 0.2864112854003906, 0.29523277282714844, 0.30405426025390625, 0.31287574768066406, 0.3216972351074219, 0.3305187225341797, 0.3393402099609375, 0.3481616973876953, 0.3569831848144531, 0.36580467224121094, 0.37462615966796875, 0.38344764709472656, 0.3922691345214844, 0.4010906219482422, 0.409912109375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 22.0, 24.0, 40.0, 86.0, 119.0, 208.0, 171.0, 125.0, 76.0, 49.0, 28.0, 16.0, 8.0, 4.0, 2.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1639801263809204, -1.1332707405090332, -1.1025614738464355, -1.0718520879745483, -1.0411428213119507, -1.0104334354400635, -0.979724109172821, -0.9490147829055786, -0.9183054566383362, -0.8875961303710938, -0.8568868041038513, -0.8261774778366089, -0.7954680919647217, -0.764758825302124, -0.7340494394302368, -0.7033401131629944, -0.672630786895752, -0.6419214606285095, -0.6112121343612671, -0.5805028080940247, -0.5497934818267822, -0.519084095954895, -0.4883747696876526, -0.45766544342041016, -0.4269561171531677, -0.3962467908859253, -0.36553746461868286, -0.33482810854911804, -0.3041187822818756, -0.2734094560146332, -0.24270011484622955, -0.21199077367782593, -0.18128150701522827, -0.15057218074798584, -0.11986283957958221, -0.08915350586175919, -0.05844417214393616, -0.027734845876693726, 0.0029744952917099, 0.033683836460113525, 0.06439316272735596, 0.09510249644517899, 0.12581183016300201, 0.15652117133140564, 0.18723049759864807, 0.2179398238658905, 0.24864916503429413, 0.27935850620269775, 0.3100678324699402, 0.3407771587371826, 0.37148648500442505, 0.40219584107398987, 0.4329051673412323, 0.46361449360847473, 0.49432384967803955, 0.525033175945282, 0.5557425022125244, 0.5864518284797668, 0.6171611547470093, 0.6478704810142517, 0.6785798072814941, 0.7092891931533813, 0.7399985194206238, 0.7707078456878662, 0.8014171719551086]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 9.0, 12.0, 8.0, 8.0, 15.0, 20.0, 16.0, 21.0, 25.0, 24.0, 30.0, 38.0, 38.0, 44.0, 41.0, 47.0, 35.0, 33.0, 59.0, 50.0, 46.0, 42.0, 42.0, 41.0, 24.0, 41.0, 28.0, 30.0, 22.0, 14.0, 15.0, 18.0, 14.0, 6.0, 6.0, 8.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4577382802963257, -0.44301486015319824, -0.4282914698123932, -0.41356804966926575, -0.3988446295261383, -0.38412123918533325, -0.3693978190422058, -0.35467439889907837, -0.3399509787559509, -0.3252275586128235, -0.31050416827201843, -0.295780748128891, -0.28105732798576355, -0.2663339376449585, -0.25161051750183105, -0.2368870973587036, -0.22216370701789856, -0.2074403017759323, -0.19271688163280487, -0.17799347639083862, -0.16327005624771118, -0.14854665100574493, -0.1338232457637787, -0.11909983307123184, -0.104376420378685, -0.08965300768613815, -0.07492959499359131, -0.06020618975162506, -0.04548277705907822, -0.030759364366531372, -0.016035959124565125, -0.00131254643201828, 0.013410866260528564, 0.02813427709043026, 0.042857687920331955, 0.0575810968875885, 0.07230450958013535, 0.08702792227268219, 0.10175132751464844, 0.11647474020719528, 0.13119815289974213, 0.14592155814170837, 0.16064497828483582, 0.17536838352680206, 0.1900917887687683, 0.20481520891189575, 0.219538614153862, 0.23426201939582825, 0.2489854395389557, 0.26370885968208313, 0.2784322500228882, 0.2931556701660156, 0.30787909030914307, 0.3226025104522705, 0.33732590079307556, 0.352049320936203, 0.36677271127700806, 0.3814961314201355, 0.39621952176094055, 0.410942941904068, 0.42566636204719543, 0.4403897523880005, 0.45511317253112793, 0.46983659267425537, 0.4845600128173828]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 7.0, 4.0, 14.0, 14.0, 43.0, 50.0, 91.0, 186.0, 317.0, 592.0, 1261.0, 2903.0, 7308.0, 19841.0, 62455.0, 214376.0, 493058.0, 168203.0, 50396.0, 16575.0, 6107.0, 2452.0, 1123.0, 536.0, 280.0, 156.0, 78.0, 44.0, 38.0, 17.0, 5.0, 10.0, 8.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1715087890625, -0.16475868225097656, -0.15800857543945312, -0.1512584686279297, -0.14450836181640625, -0.1377582550048828, -0.13100814819335938, -0.12425804138183594, -0.1175079345703125, -0.11075782775878906, -0.10400772094726562, -0.09725761413574219, -0.09050750732421875, -0.08375740051269531, -0.07700729370117188, -0.07025718688964844, -0.063507080078125, -0.05675697326660156, -0.050006866455078125, -0.04325675964355469, -0.03650665283203125, -0.029756546020507812, -0.023006439208984375, -0.016256332397460938, -0.0095062255859375, -0.0027561187744140625, 0.003993988037109375, 0.010744094848632812, 0.01749420166015625, 0.024244308471679688, 0.030994415283203125, 0.03774452209472656, 0.04449462890625, 0.05124473571777344, 0.057994842529296875, 0.06474494934082031, 0.07149505615234375, 0.07824516296386719, 0.08499526977539062, 0.09174537658691406, 0.0984954833984375, 0.10524559020996094, 0.11199569702148438, 0.11874580383300781, 0.12549591064453125, 0.1322460174560547, 0.13899612426757812, 0.14574623107910156, 0.152496337890625, 0.15924644470214844, 0.16599655151367188, 0.1727466583251953, 0.17949676513671875, 0.1862468719482422, 0.19299697875976562, 0.19974708557128906, 0.2064971923828125, 0.21324729919433594, 0.21999740600585938, 0.2267475128173828, 0.23349761962890625, 0.2402477264404297, 0.24699783325195312, 0.25374794006347656, 0.260498046875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 5.0, 5.0, 7.0, 9.0, 9.0, 12.0, 10.0, 19.0, 18.0, 22.0, 23.0, 27.0, 29.0, 33.0, 27.0, 34.0, 26.0, 34.0, 33.0, 48.0, 34.0, 38.0, 42.0, 37.0, 42.0, 38.0, 36.0, 36.0, 33.0, 37.0, 28.0, 22.0, 24.0, 21.0, 14.0, 17.0, 16.0, 13.0, 7.0, 7.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.042266845703125, -0.04100465774536133, -0.039742469787597656, -0.038480281829833984, -0.03721809387207031, -0.03595590591430664, -0.03469371795654297, -0.0334315299987793, -0.032169342041015625, -0.030907154083251953, -0.02964496612548828, -0.02838277816772461, -0.027120590209960938, -0.025858402252197266, -0.024596214294433594, -0.023334026336669922, -0.02207183837890625, -0.020809650421142578, -0.019547462463378906, -0.018285274505615234, -0.017023086547851562, -0.01576089859008789, -0.014498710632324219, -0.013236522674560547, -0.011974334716796875, -0.010712146759033203, -0.009449958801269531, -0.00818777084350586, -0.0069255828857421875, -0.005663394927978516, -0.004401206970214844, -0.003139019012451172, -0.0018768310546875, -0.0006146430969238281, 0.0006475448608398438, 0.0019097328186035156, 0.0031719207763671875, 0.004434108734130859, 0.005696296691894531, 0.006958484649658203, 0.008220672607421875, 0.009482860565185547, 0.010745048522949219, 0.01200723648071289, 0.013269424438476562, 0.014531612396240234, 0.015793800354003906, 0.017055988311767578, 0.01831817626953125, 0.019580364227294922, 0.020842552185058594, 0.022104740142822266, 0.023366928100585938, 0.02462911605834961, 0.02589130401611328, 0.027153491973876953, 0.028415679931640625, 0.029677867889404297, 0.03094005584716797, 0.03220224380493164, 0.03346443176269531, 0.034726619720458984, 0.035988807678222656, 0.03725099563598633, 0.03851318359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 6.0, 5.0, 11.0, 13.0, 17.0, 25.0, 39.0, 41.0, 69.0, 84.0, 118.0, 191.0, 236.0, 346.0, 600.0, 915.0, 1724.0, 3799.0, 10789.0, 44075.0, 250974.0, 606974.0, 95703.0, 20062.0, 5963.0, 2439.0, 1264.0, 688.0, 416.0, 264.0, 208.0, 137.0, 109.0, 63.0, 49.0, 27.0, 24.0, 31.0, 20.0, 6.0, 10.0, 4.0, 8.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283935546875, -0.2748451232910156, -0.26575469970703125, -0.2566642761230469, -0.2475738525390625, -0.23848342895507812, -0.22939300537109375, -0.22030258178710938, -0.211212158203125, -0.20212173461914062, -0.19303131103515625, -0.18394088745117188, -0.1748504638671875, -0.16576004028320312, -0.15666961669921875, -0.14757919311523438, -0.13848876953125, -0.12939834594726562, -0.12030792236328125, -0.11121749877929688, -0.1021270751953125, -0.09303665161132812, -0.08394622802734375, -0.07485580444335938, -0.065765380859375, -0.056674957275390625, -0.04758453369140625, -0.038494110107421875, -0.0294036865234375, -0.020313262939453125, -0.01122283935546875, -0.002132415771484375, 0.0069580078125, 0.016048431396484375, 0.02513885498046875, 0.034229278564453125, 0.0433197021484375, 0.052410125732421875, 0.06150054931640625, 0.07059097290039062, 0.079681396484375, 0.08877182006835938, 0.09786224365234375, 0.10695266723632812, 0.1160430908203125, 0.12513351440429688, 0.13422393798828125, 0.14331436157226562, 0.15240478515625, 0.16149520874023438, 0.17058563232421875, 0.17967605590820312, 0.1887664794921875, 0.19785690307617188, 0.20694732666015625, 0.21603775024414062, 0.225128173828125, 0.23421859741210938, 0.24330902099609375, 0.2523994445800781, 0.2614898681640625, 0.2705802917480469, 0.27967071533203125, 0.2887611389160156, 0.2978515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 15.0, 9.0, 15.0, 13.0, 19.0, 26.0, 25.0, 34.0, 40.0, 48.0, 37.0, 47.0, 61.0, 55.0, 70.0, 58.0, 55.0, 51.0, 42.0, 35.0, 30.0, 29.0, 31.0, 27.0, 21.0, 14.0, 15.0, 12.0, 13.0, 12.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23681640625, -0.22795486450195312, -0.21909332275390625, -0.21023178100585938, -0.2013702392578125, -0.19250869750976562, -0.18364715576171875, -0.17478561401367188, -0.165924072265625, -0.15706253051757812, -0.14820098876953125, -0.13933944702148438, -0.1304779052734375, -0.12161636352539062, -0.11275482177734375, -0.10389328002929688, -0.09503173828125, -0.08617019653320312, -0.07730865478515625, -0.06844711303710938, -0.0595855712890625, -0.050724029541015625, -0.04186248779296875, -0.033000946044921875, -0.024139404296875, -0.015277862548828125, -0.00641632080078125, 0.002445220947265625, 0.0113067626953125, 0.020168304443359375, 0.02902984619140625, 0.037891387939453125, 0.0467529296875, 0.055614471435546875, 0.06447601318359375, 0.07333755493164062, 0.0821990966796875, 0.09106063842773438, 0.09992218017578125, 0.10878372192382812, 0.117645263671875, 0.12650680541992188, 0.13536834716796875, 0.14422988891601562, 0.1530914306640625, 0.16195297241210938, 0.17081451416015625, 0.17967605590820312, 0.18853759765625, 0.19739913940429688, 0.20626068115234375, 0.21512222290039062, 0.2239837646484375, 0.23284530639648438, 0.24170684814453125, 0.2505683898925781, 0.259429931640625, 0.2682914733886719, 0.27715301513671875, 0.2860145568847656, 0.2948760986328125, 0.3037376403808594, 0.31259918212890625, 0.3214607238769531, 0.330322265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 3.0, 16.0, 20.0, 27.0, 56.0, 81.0, 167.0, 345.0, 808.0, 2554.0, 20841.0, 997900.0, 21743.0, 2493.0, 791.0, 311.0, 160.0, 102.0, 46.0, 34.0, 17.0, 9.0, 7.0, 6.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8583984375, -0.8342208862304688, -0.8100433349609375, -0.7858657836914062, -0.761688232421875, -0.7375106811523438, -0.7133331298828125, -0.6891555786132812, -0.66497802734375, -0.6408004760742188, -0.6166229248046875, -0.5924453735351562, -0.568267822265625, -0.5440902709960938, -0.5199127197265625, -0.49573516845703125, -0.4715576171875, -0.44738006591796875, -0.4232025146484375, -0.39902496337890625, -0.374847412109375, -0.35066986083984375, -0.3264923095703125, -0.30231475830078125, -0.27813720703125, -0.25395965576171875, -0.2297821044921875, -0.20560455322265625, -0.181427001953125, -0.15724945068359375, -0.1330718994140625, -0.10889434814453125, -0.084716796875, -0.06053924560546875, -0.0363616943359375, -0.01218414306640625, 0.011993408203125, 0.03617095947265625, 0.0603485107421875, 0.08452606201171875, 0.10870361328125, 0.13288116455078125, 0.1570587158203125, 0.18123626708984375, 0.205413818359375, 0.22959136962890625, 0.2537689208984375, 0.27794647216796875, 0.3021240234375, 0.32630157470703125, 0.3504791259765625, 0.37465667724609375, 0.398834228515625, 0.42301177978515625, 0.4471893310546875, 0.47136688232421875, 0.49554443359375, 0.5197219848632812, 0.5438995361328125, 0.5680770874023438, 0.592254638671875, 0.6164321899414062, 0.6406097412109375, 0.6647872924804688, 0.68896484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 10.0, 15.0, 32.0, 33.0, 44.0, 46.0, 80.0, 107.0, 103.0, 107.0, 126.0, 87.0, 75.0, 35.0, 29.0, 27.0, 17.0, 9.0, 4.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0001227855682373047, -0.00011971313506364822, -0.00011664070188999176, -0.0001135682687163353, -0.00011049583554267883, -0.00010742340236902237, -0.0001043509691953659, -0.00010127853602170944, -9.820610284805298e-05, -9.513366967439651e-05, -9.206123650074005e-05, -8.898880332708359e-05, -8.591637015342712e-05, -8.284393697977066e-05, -7.97715038061142e-05, -7.669907063245773e-05, -7.362663745880127e-05, -7.05542042851448e-05, -6.748177111148834e-05, -6.440933793783188e-05, -6.133690476417542e-05, -5.826447159051895e-05, -5.519203841686249e-05, -5.2119605243206024e-05, -4.904717206954956e-05, -4.59747388958931e-05, -4.290230572223663e-05, -3.982987254858017e-05, -3.6757439374923706e-05, -3.368500620126724e-05, -3.061257302761078e-05, -2.7540139853954315e-05, -2.446770668029785e-05, -2.1395273506641388e-05, -1.8322840332984924e-05, -1.525040715932846e-05, -1.2177973985671997e-05, -9.105540812015533e-06, -6.03310763835907e-06, -2.960674464702606e-06, 1.1175870895385742e-07, 3.184191882610321e-06, 6.256625056266785e-06, 9.329058229923248e-06, 1.2401491403579712e-05, 1.5473924577236176e-05, 1.854635775089264e-05, 2.1618790924549103e-05, 2.4691224098205566e-05, 2.776365727186203e-05, 3.0836090445518494e-05, 3.390852361917496e-05, 3.698095679283142e-05, 4.0053389966487885e-05, 4.312582314014435e-05, 4.619825631380081e-05, 4.9270689487457275e-05, 5.234312266111374e-05, 5.54155558347702e-05, 5.8487989008426666e-05, 6.156042218208313e-05, 6.46328553557396e-05, 6.770528852939606e-05, 7.077772170305252e-05, 7.385015487670898e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 12.0, 21.0, 21.0, 41.0, 45.0, 87.0, 135.0, 235.0, 410.0, 1018.0, 2820.0, 11485.0, 326860.0, 685081.0, 14716.0, 3247.0, 1170.0, 488.0, 268.0, 134.0, 76.0, 59.0, 24.0, 21.0, 18.0, 19.0, 10.0, 3.0, 4.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.430908203125, -0.4165763854980469, -0.40224456787109375, -0.3879127502441406, -0.3735809326171875, -0.3592491149902344, -0.34491729736328125, -0.3305854797363281, -0.316253662109375, -0.3019218444824219, -0.28759002685546875, -0.2732582092285156, -0.2589263916015625, -0.24459457397460938, -0.23026275634765625, -0.21593093872070312, -0.20159912109375, -0.18726730346679688, -0.17293548583984375, -0.15860366821289062, -0.1442718505859375, -0.12994003295898438, -0.11560821533203125, -0.10127639770507812, -0.086944580078125, -0.07261276245117188, -0.05828094482421875, -0.043949127197265625, -0.0296173095703125, -0.015285491943359375, -0.00095367431640625, 0.013378143310546875, 0.0277099609375, 0.042041778564453125, 0.05637359619140625, 0.07070541381835938, 0.0850372314453125, 0.09936904907226562, 0.11370086669921875, 0.12803268432617188, 0.142364501953125, 0.15669631958007812, 0.17102813720703125, 0.18535995483398438, 0.1996917724609375, 0.21402359008789062, 0.22835540771484375, 0.24268722534179688, 0.25701904296875, 0.2713508605957031, 0.28568267822265625, 0.3000144958496094, 0.3143463134765625, 0.3286781311035156, 0.34300994873046875, 0.3573417663574219, 0.371673583984375, 0.3860054016113281, 0.40033721923828125, 0.4146690368652344, 0.4290008544921875, 0.4433326721191406, 0.45766448974609375, 0.4719963073730469, 0.486328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 5.0, 4.0, 7.0, 6.0, 2.0, 9.0, 16.0, 22.0, 47.0, 62.0, 132.0, 215.0, 190.0, 107.0, 67.0, 44.0, 25.0, 16.0, 1.0, 5.0, 3.0, 3.0, 0.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.310791015625, -0.3018836975097656, -0.29297637939453125, -0.2840690612792969, -0.2751617431640625, -0.2662544250488281, -0.25734710693359375, -0.24843978881835938, -0.239532470703125, -0.23062515258789062, -0.22171783447265625, -0.21281051635742188, -0.2039031982421875, -0.19499588012695312, -0.18608856201171875, -0.17718124389648438, -0.16827392578125, -0.15936660766601562, -0.15045928955078125, -0.14155197143554688, -0.1326446533203125, -0.12373733520507812, -0.11483001708984375, -0.10592269897460938, -0.097015380859375, -0.08810806274414062, -0.07920074462890625, -0.07029342651367188, -0.0613861083984375, -0.052478790283203125, -0.04357147216796875, -0.034664154052734375, -0.0257568359375, -0.016849517822265625, -0.00794219970703125, 0.000965118408203125, 0.0098724365234375, 0.018779754638671875, 0.02768707275390625, 0.036594390869140625, 0.045501708984375, 0.054409027099609375, 0.06331634521484375, 0.07222366333007812, 0.0811309814453125, 0.09003829956054688, 0.09894561767578125, 0.10785293579101562, 0.11676025390625, 0.12566757202148438, 0.13457489013671875, 0.14348220825195312, 0.1523895263671875, 0.16129684448242188, 0.17020416259765625, 0.17911148071289062, 0.188018798828125, 0.19692611694335938, 0.20583343505859375, 0.21474075317382812, 0.2236480712890625, 0.23255538940429688, 0.24146270751953125, 0.2503700256347656, 0.25927734375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 16.0, 18.0, 36.0, 88.0, 143.0, 191.0, 182.0, 129.0, 85.0, 55.0, 24.0, 11.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7615129947662354, -2.662475347518921, -2.5634377002716064, -2.464400053024292, -2.3653626441955566, -2.266324996948242, -2.1672873497009277, -2.0682497024536133, -1.9692120552062988, -1.8701744079589844, -1.77113676071167, -1.672099232673645, -1.5730615854263306, -1.4740239381790161, -1.3749864101409912, -1.2759487628936768, -1.1769111156463623, -1.0778734683990479, -0.9788358807563782, -0.8797982931137085, -0.780760645866394, -0.6817229986190796, -0.5826854109764099, -0.48364782333374023, -0.3846101760864258, -0.2855725586414337, -0.18653494119644165, -0.08749732375144958, 0.01154029369354248, 0.11057791113853455, 0.2096155285835266, 0.3086531162261963, 0.40769052505493164, 0.5067281723022461, 0.6057657599449158, 0.7048033475875854, 0.8038409948348999, 0.9028786420822144, 1.0019161701202393, 1.1009538173675537, 1.1999914646148682, 1.2990291118621826, 1.398066759109497, 1.497104287147522, 1.5961419343948364, 1.6951795816421509, 1.7942171096801758, 1.8932547569274902, 1.9922924041748047, 2.091330051422119, 2.1903676986694336, 2.289405345916748, 2.3884429931640625, 2.487480401992798, 2.5865180492401123, 2.6855556964874268, 2.784593343734741, 2.8836309909820557, 2.98266863822937, 3.0817062854766846, 3.18074369430542, 3.2797813415527344, 3.378818988800049, 3.4778566360473633, 3.5768942832946777]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 6.0, 13.0, 14.0, 15.0, 10.0, 14.0, 19.0, 17.0, 23.0, 33.0, 22.0, 31.0, 34.0, 26.0, 48.0, 39.0, 44.0, 42.0, 34.0, 41.0, 45.0, 45.0, 41.0, 44.0, 40.0, 40.0, 35.0, 19.0, 23.0, 19.0, 18.0, 14.0, 11.0, 6.0, 7.0, 8.0, 8.0, 9.0, 14.0, 4.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0], "bins": [-1.4417780637741089, -1.4001396894454956, -1.3585011959075928, -1.3168628215789795, -1.2752244472503662, -1.2335859537124634, -1.19194757938385, -1.1503090858459473, -1.108670711517334, -1.0670323371887207, -1.0253938436508179, -0.9837554693222046, -0.9421170353889465, -0.9004786014556885, -0.8588402271270752, -0.8172017931938171, -0.7755633592605591, -0.733924925327301, -0.692286491394043, -0.6506481170654297, -0.6090096831321716, -0.5673712491989136, -0.5257328748703003, -0.48409444093704224, -0.4424560070037842, -0.4008175730705261, -0.35917916893959045, -0.3175407648086548, -0.27590233087539673, -0.23426391184329987, -0.192625492811203, -0.15098708868026733, -0.10934877395629883, -0.06771035492420197, -0.026071935892105103, 0.01556648313999176, 0.05720490217208862, 0.09884332120418549, 0.14048174023628235, 0.18212014436721802, 0.22375857830047607, 0.26539701223373413, 0.3070354163646698, 0.34867382049560547, 0.3903122544288635, 0.4319506883621216, 0.47358909249305725, 0.5152274966239929, 0.556865930557251, 0.598504364490509, 0.6401427984237671, 0.6817811727523804, 0.7234196066856384, 0.7650580406188965, 0.8066964149475098, 0.8483348488807678, 0.8899732828140259, 0.9316117167472839, 0.973250150680542, 1.0148885250091553, 1.0565268993377686, 1.0981653928756714, 1.1398037672042847, 1.1814422607421875, 1.2230806350708008]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 8.0, 10.0, 8.0, 19.0, 27.0, 45.0, 41.0, 90.0, 113.0, 189.0, 268.0, 353.0, 615.0, 1126.0, 2172.0, 4697.0, 12432.0, 37876.0, 188206.0, 3652982.0, 227306.0, 41797.0, 13156.0, 5222.0, 2369.0, 1188.0, 692.0, 454.0, 249.0, 173.0, 121.0, 82.0, 64.0, 45.0, 24.0, 24.0, 16.0, 9.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.27392578125, -0.2659950256347656, -0.25806427001953125, -0.2501335144042969, -0.2422027587890625, -0.23427200317382812, -0.22634124755859375, -0.21841049194335938, -0.210479736328125, -0.20254898071289062, -0.19461822509765625, -0.18668746948242188, -0.1787567138671875, -0.17082595825195312, -0.16289520263671875, -0.15496444702148438, -0.14703369140625, -0.13910293579101562, -0.13117218017578125, -0.12324142456054688, -0.1153106689453125, -0.10737991333007812, -0.09944915771484375, -0.09151840209960938, -0.083587646484375, -0.07565689086914062, -0.06772613525390625, -0.059795379638671875, -0.0518646240234375, -0.043933868408203125, -0.03600311279296875, -0.028072357177734375, -0.0201416015625, -0.012210845947265625, -0.00428009033203125, 0.003650665283203125, 0.0115814208984375, 0.019512176513671875, 0.02744293212890625, 0.035373687744140625, 0.043304443359375, 0.051235198974609375, 0.05916595458984375, 0.06709671020507812, 0.0750274658203125, 0.08295822143554688, 0.09088897705078125, 0.09881973266601562, 0.10675048828125, 0.11468124389648438, 0.12261199951171875, 0.13054275512695312, 0.1384735107421875, 0.14640426635742188, 0.15433502197265625, 0.16226577758789062, 0.170196533203125, 0.17812728881835938, 0.18605804443359375, 0.19398880004882812, 0.2019195556640625, 0.20985031127929688, 0.21778106689453125, 0.22571182250976562, 0.233642578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 2.0, 10.0, 10.0, 9.0, 12.0, 11.0, 13.0, 25.0, 20.0, 29.0, 25.0, 40.0, 25.0, 39.0, 40.0, 44.0, 48.0, 38.0, 39.0, 26.0, 37.0, 41.0, 33.0, 34.0, 43.0, 36.0, 35.0, 29.0, 30.0, 18.0, 23.0, 15.0, 21.0, 19.0, 11.0, 8.0, 15.0, 10.0, 5.0, 5.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0404052734375, -0.03900623321533203, -0.03760719299316406, -0.036208152770996094, -0.034809112548828125, -0.033410072326660156, -0.03201103210449219, -0.03061199188232422, -0.02921295166015625, -0.02781391143798828, -0.026414871215820312, -0.025015830993652344, -0.023616790771484375, -0.022217750549316406, -0.020818710327148438, -0.01941967010498047, -0.0180206298828125, -0.01662158966064453, -0.015222549438476562, -0.013823509216308594, -0.012424468994140625, -0.011025428771972656, -0.009626388549804688, -0.008227348327636719, -0.00682830810546875, -0.005429267883300781, -0.0040302276611328125, -0.0026311874389648438, -0.001232147216796875, 0.00016689300537109375, 0.0015659332275390625, 0.0029649734497070312, 0.004364013671875, 0.005763053894042969, 0.0071620941162109375, 0.008561134338378906, 0.009960174560546875, 0.011359214782714844, 0.012758255004882812, 0.014157295227050781, 0.01555633544921875, 0.01695537567138672, 0.018354415893554688, 0.019753456115722656, 0.021152496337890625, 0.022551536560058594, 0.023950576782226562, 0.02534961700439453, 0.0267486572265625, 0.02814769744873047, 0.029546737670898438, 0.030945777893066406, 0.032344818115234375, 0.033743858337402344, 0.03514289855957031, 0.03654193878173828, 0.03794097900390625, 0.03934001922607422, 0.04073905944824219, 0.042138099670410156, 0.043537139892578125, 0.044936180114746094, 0.04633522033691406, 0.04773426055908203, 0.04913330078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 7.0, 13.0, 12.0, 40.0, 36.0, 86.0, 162.0, 264.0, 512.0, 1115.0, 2626.0, 8396.0, 37852.0, 601028.0, 3454243.0, 69087.0, 12425.0, 3665.0, 1353.0, 641.0, 291.0, 188.0, 105.0, 53.0, 34.0, 18.0, 19.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47314453125, -0.45795440673828125, -0.4427642822265625, -0.42757415771484375, -0.412384033203125, -0.39719390869140625, -0.3820037841796875, -0.36681365966796875, -0.35162353515625, -0.33643341064453125, -0.3212432861328125, -0.30605316162109375, -0.290863037109375, -0.27567291259765625, -0.2604827880859375, -0.24529266357421875, -0.2301025390625, -0.21491241455078125, -0.1997222900390625, -0.18453216552734375, -0.169342041015625, -0.15415191650390625, -0.1389617919921875, -0.12377166748046875, -0.10858154296875, -0.09339141845703125, -0.0782012939453125, -0.06301116943359375, -0.047821044921875, -0.03263092041015625, -0.0174407958984375, -0.00225067138671875, 0.012939453125, 0.02812957763671875, 0.0433197021484375, 0.05850982666015625, 0.073699951171875, 0.08889007568359375, 0.1040802001953125, 0.11927032470703125, 0.13446044921875, 0.14965057373046875, 0.1648406982421875, 0.18003082275390625, 0.195220947265625, 0.21041107177734375, 0.2256011962890625, 0.24079132080078125, 0.2559814453125, 0.27117156982421875, 0.2863616943359375, 0.30155181884765625, 0.316741943359375, 0.33193206787109375, 0.3471221923828125, 0.36231231689453125, 0.37750244140625, 0.39269256591796875, 0.4078826904296875, 0.42307281494140625, 0.438262939453125, 0.45345306396484375, 0.4686431884765625, 0.48383331298828125, 0.4990234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 12.0, 6.0, 11.0, 14.0, 22.0, 42.0, 64.0, 89.0, 224.0, 566.0, 2131.0, 457.0, 180.0, 94.0, 52.0, 32.0, 21.0, 15.0, 7.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1810302734375, -0.1746501922607422, -0.16827011108398438, -0.16189002990722656, -0.15550994873046875, -0.14912986755371094, -0.14274978637695312, -0.1363697052001953, -0.1299896240234375, -0.12360954284667969, -0.11722946166992188, -0.11084938049316406, -0.10446929931640625, -0.09808921813964844, -0.09170913696289062, -0.08532905578613281, -0.078948974609375, -0.07256889343261719, -0.06618881225585938, -0.05980873107910156, -0.05342864990234375, -0.04704856872558594, -0.040668487548828125, -0.03428840637207031, -0.0279083251953125, -0.021528244018554688, -0.015148162841796875, -0.008768081665039062, -0.00238800048828125, 0.0039920806884765625, 0.010372161865234375, 0.016752243041992188, 0.02313232421875, 0.029512405395507812, 0.035892486572265625, 0.04227256774902344, 0.04865264892578125, 0.05503273010253906, 0.061412811279296875, 0.06779289245605469, 0.0741729736328125, 0.08055305480957031, 0.08693313598632812, 0.09331321716308594, 0.09969329833984375, 0.10607337951660156, 0.11245346069335938, 0.11883354187011719, 0.125213623046875, 0.1315937042236328, 0.13797378540039062, 0.14435386657714844, 0.15073394775390625, 0.15711402893066406, 0.16349411010742188, 0.1698741912841797, 0.1762542724609375, 0.1826343536376953, 0.18901443481445312, 0.19539451599121094, 0.20177459716796875, 0.20815467834472656, 0.21453475952148438, 0.2209148406982422, 0.227294921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 11.0, 22.0, 39.0, 93.0, 192.0, 281.0, 195.0, 104.0, 44.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6991891860961914, -2.6360106468200684, -2.5728321075439453, -2.509653329849243, -2.44647479057312, -2.383296251296997, -2.320117712020874, -2.256938934326172, -2.193760395050049, -2.130581855773926, -2.0674033164978027, -2.0042245388031006, -1.9410459995269775, -1.8778674602508545, -1.8146889209747314, -1.7515102624893188, -1.6883317232131958, -1.6251531839370728, -1.5619745254516602, -1.498795986175537, -1.4356173276901245, -1.3724387884140015, -1.3092601299285889, -1.2460815906524658, -1.1829030513763428, -1.1197245121002197, -1.0565458536148071, -0.9933673143386841, -0.9301886558532715, -0.8670101165771484, -0.8038315176963806, -0.7406529188156128, -0.6774741411209106, -0.6142955422401428, -0.551116943359375, -0.48793837428092957, -0.42475977540016174, -0.3615811765193939, -0.2984026074409485, -0.23522400856018066, -0.17204540967941284, -0.10886681824922562, -0.04568822681903839, 0.017490357160568237, 0.08066895604133606, 0.14384755492210388, 0.20702612400054932, 0.27020472288131714, 0.33338332176208496, 0.3965619206428528, 0.4597405195236206, 0.5229190587997437, 0.5860977172851562, 0.6492762565612793, 0.7124548554420471, 0.7756334543228149, 0.8388120532035828, 0.9019906520843506, 0.9651692509651184, 1.0283478498458862, 1.0915263891220093, 1.1547050476074219, 1.217883586883545, 1.281062126159668, 1.3442407846450806]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 9.0, 8.0, 3.0, 7.0, 9.0, 11.0, 11.0, 17.0, 19.0, 22.0, 21.0, 32.0, 39.0, 27.0, 34.0, 30.0, 37.0, 35.0, 48.0, 42.0, 41.0, 41.0, 52.0, 47.0, 43.0, 31.0, 35.0, 31.0, 39.0, 18.0, 32.0, 17.0, 20.0, 14.0, 15.0, 16.0, 15.0, 12.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5356293320655823, -0.5192423462867737, -0.5028553605079651, -0.4864684045314789, -0.4700814485549927, -0.4536944627761841, -0.4373074769973755, -0.4209204912185669, -0.4045335352420807, -0.3881465494632721, -0.3717595934867859, -0.3553726077079773, -0.3389856219291687, -0.3225986659526825, -0.3062116801738739, -0.2898247241973877, -0.2734377384185791, -0.2570507526397705, -0.2406637966632843, -0.2242768108844757, -0.2078898400068283, -0.1915028691291809, -0.17511588335037231, -0.15872891247272491, -0.14234194159507751, -0.12595497071743011, -0.10956799238920212, -0.09318101406097412, -0.07679404318332672, -0.06040707230567932, -0.044020093977451324, -0.027633115649223328, -0.011246144771575928, 0.005140829831361771, 0.02152780443429947, 0.03791477903723717, 0.054301753640174866, 0.07068872451782227, 0.08707570284605026, 0.10346268117427826, 0.11984965205192566, 0.13623662292957306, 0.15262359380722046, 0.16901057958602905, 0.18539755046367645, 0.20178452134132385, 0.21817150712013245, 0.23455847799777985, 0.25094544887542725, 0.26733243465423584, 0.28371939063072205, 0.30010637640953064, 0.31649333238601685, 0.33288031816482544, 0.34926730394363403, 0.3656542897224426, 0.38204124569892883, 0.3984282314777374, 0.41481518745422363, 0.4312021732330322, 0.4475891590118408, 0.463976114988327, 0.4803631007671356, 0.4967500567436218, 0.5131370425224304]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 7.0, 11.0, 11.0, 24.0, 56.0, 72.0, 137.0, 234.0, 458.0, 967.0, 2085.0, 4656.0, 10878.0, 27256.0, 70405.0, 180527.0, 340878.0, 244586.0, 100176.0, 38469.0, 15067.0, 6299.0, 2796.0, 1220.0, 597.0, 300.0, 154.0, 82.0, 80.0, 21.0, 19.0, 11.0, 11.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1949462890625, -0.18932533264160156, -0.18370437622070312, -0.1780834197998047, -0.17246246337890625, -0.1668415069580078, -0.16122055053710938, -0.15559959411621094, -0.1499786376953125, -0.14435768127441406, -0.13873672485351562, -0.1331157684326172, -0.12749481201171875, -0.12187385559082031, -0.11625289916992188, -0.11063194274902344, -0.105010986328125, -0.09939002990722656, -0.09376907348632812, -0.08814811706542969, -0.08252716064453125, -0.07690620422363281, -0.07128524780273438, -0.06566429138183594, -0.0600433349609375, -0.05442237854003906, -0.048801422119140625, -0.04318046569824219, -0.03755950927734375, -0.03193855285644531, -0.026317596435546875, -0.020696640014648438, -0.01507568359375, -0.009454727172851562, -0.003833770751953125, 0.0017871856689453125, 0.00740814208984375, 0.013029098510742188, 0.018650054931640625, 0.024271011352539062, 0.0298919677734375, 0.03551292419433594, 0.041133880615234375, 0.04675483703613281, 0.05237579345703125, 0.05799674987792969, 0.06361770629882812, 0.06923866271972656, 0.074859619140625, 0.08048057556152344, 0.08610153198242188, 0.09172248840332031, 0.09734344482421875, 0.10296440124511719, 0.10858535766601562, 0.11420631408691406, 0.1198272705078125, 0.12544822692871094, 0.13106918334960938, 0.1366901397705078, 0.14231109619140625, 0.1479320526123047, 0.15355300903320312, 0.15917396545410156, 0.164794921875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 4.0, 5.0, 10.0, 8.0, 13.0, 17.0, 17.0, 22.0, 22.0, 26.0, 20.0, 35.0, 33.0, 37.0, 30.0, 39.0, 24.0, 45.0, 38.0, 44.0, 56.0, 40.0, 48.0, 38.0, 43.0, 31.0, 42.0, 22.0, 25.0, 22.0, 24.0, 19.0, 19.0, 11.0, 13.0, 10.0, 8.0, 15.0, 3.0, 4.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.052001953125, -0.0504145622253418, -0.048827171325683594, -0.04723978042602539, -0.04565238952636719, -0.044064998626708984, -0.04247760772705078, -0.04089021682739258, -0.039302825927734375, -0.03771543502807617, -0.03612804412841797, -0.034540653228759766, -0.03295326232910156, -0.03136587142944336, -0.029778480529785156, -0.028191089630126953, -0.02660369873046875, -0.025016307830810547, -0.023428916931152344, -0.02184152603149414, -0.020254135131835938, -0.018666744232177734, -0.01707935333251953, -0.015491962432861328, -0.013904571533203125, -0.012317180633544922, -0.010729789733886719, -0.009142398834228516, -0.0075550079345703125, -0.005967617034912109, -0.004380226135253906, -0.002792835235595703, -0.0012054443359375, 0.0003819465637207031, 0.0019693374633789062, 0.0035567283630371094, 0.0051441192626953125, 0.006731510162353516, 0.008318901062011719, 0.009906291961669922, 0.011493682861328125, 0.013081073760986328, 0.014668464660644531, 0.016255855560302734, 0.017843246459960938, 0.01943063735961914, 0.021018028259277344, 0.022605419158935547, 0.02419281005859375, 0.025780200958251953, 0.027367591857910156, 0.02895498275756836, 0.030542373657226562, 0.032129764556884766, 0.03371715545654297, 0.03530454635620117, 0.036891937255859375, 0.03847932815551758, 0.04006671905517578, 0.041654109954833984, 0.04324150085449219, 0.04482889175415039, 0.046416282653808594, 0.0480036735534668, 0.049591064453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 7.0, 7.0, 17.0, 17.0, 26.0, 22.0, 33.0, 51.0, 63.0, 93.0, 158.0, 238.0, 376.0, 599.0, 1177.0, 3036.0, 11928.0, 78351.0, 591133.0, 314209.0, 35799.0, 6744.0, 2109.0, 872.0, 535.0, 298.0, 215.0, 124.0, 92.0, 49.0, 42.0, 33.0, 24.0, 19.0, 9.0, 9.0, 3.0, 8.0, 5.0, 5.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.383544921875, -0.37023162841796875, -0.3569183349609375, -0.34360504150390625, -0.330291748046875, -0.31697845458984375, -0.3036651611328125, -0.29035186767578125, -0.27703857421875, -0.26372528076171875, -0.2504119873046875, -0.23709869384765625, -0.223785400390625, -0.21047210693359375, -0.1971588134765625, -0.18384552001953125, -0.1705322265625, -0.15721893310546875, -0.1439056396484375, -0.13059234619140625, -0.117279052734375, -0.10396575927734375, -0.0906524658203125, -0.07733917236328125, -0.06402587890625, -0.05071258544921875, -0.0373992919921875, -0.02408599853515625, -0.010772705078125, 0.00254058837890625, 0.0158538818359375, 0.02916717529296875, 0.04248046875, 0.05579376220703125, 0.0691070556640625, 0.08242034912109375, 0.095733642578125, 0.10904693603515625, 0.1223602294921875, 0.13567352294921875, 0.14898681640625, 0.16230010986328125, 0.1756134033203125, 0.18892669677734375, 0.202239990234375, 0.21555328369140625, 0.2288665771484375, 0.24217987060546875, 0.2554931640625, 0.26880645751953125, 0.2821197509765625, 0.29543304443359375, 0.308746337890625, 0.32205963134765625, 0.3353729248046875, 0.34868621826171875, 0.36199951171875, 0.37531280517578125, 0.3886260986328125, 0.40193939208984375, 0.415252685546875, 0.42856597900390625, 0.4418792724609375, 0.45519256591796875, 0.468505859375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 1.0, 8.0, 11.0, 9.0, 12.0, 11.0, 28.0, 27.0, 28.0, 23.0, 29.0, 41.0, 42.0, 40.0, 41.0, 50.0, 49.0, 66.0, 53.0, 39.0, 35.0, 48.0, 47.0, 37.0, 32.0, 42.0, 25.0, 29.0, 21.0, 16.0, 14.0, 6.0, 10.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.339599609375, -0.32884979248046875, -0.3180999755859375, -0.30735015869140625, -0.296600341796875, -0.28585052490234375, -0.2751007080078125, -0.26435089111328125, -0.25360107421875, -0.24285125732421875, -0.2321014404296875, -0.22135162353515625, -0.210601806640625, -0.19985198974609375, -0.1891021728515625, -0.17835235595703125, -0.1676025390625, -0.15685272216796875, -0.1461029052734375, -0.13535308837890625, -0.124603271484375, -0.11385345458984375, -0.1031036376953125, -0.09235382080078125, -0.08160400390625, -0.07085418701171875, -0.0601043701171875, -0.04935455322265625, -0.038604736328125, -0.02785491943359375, -0.0171051025390625, -0.00635528564453125, 0.00439453125, 0.01514434814453125, 0.0258941650390625, 0.03664398193359375, 0.047393798828125, 0.05814361572265625, 0.0688934326171875, 0.07964324951171875, 0.09039306640625, 0.10114288330078125, 0.1118927001953125, 0.12264251708984375, 0.133392333984375, 0.14414215087890625, 0.1548919677734375, 0.16564178466796875, 0.1763916015625, 0.18714141845703125, 0.1978912353515625, 0.20864105224609375, 0.219390869140625, 0.23014068603515625, 0.2408905029296875, 0.25164031982421875, 0.26239013671875, 0.27313995361328125, 0.2838897705078125, 0.29463958740234375, 0.305389404296875, 0.31613922119140625, 0.3268890380859375, 0.33763885498046875, 0.348388671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 14.0, 13.0, 19.0, 30.0, 51.0, 88.0, 127.0, 299.0, 762.0, 2808.0, 18151.0, 499875.0, 503819.0, 18265.0, 2815.0, 805.0, 286.0, 142.0, 72.0, 38.0, 27.0, 25.0, 14.0, 4.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.54443359375, -0.5314712524414062, -0.5185089111328125, -0.5055465698242188, -0.492584228515625, -0.47962188720703125, -0.4666595458984375, -0.45369720458984375, -0.44073486328125, -0.42777252197265625, -0.4148101806640625, -0.40184783935546875, -0.388885498046875, -0.37592315673828125, -0.3629608154296875, -0.34999847412109375, -0.3370361328125, -0.32407379150390625, -0.3111114501953125, -0.29814910888671875, -0.285186767578125, -0.27222442626953125, -0.2592620849609375, -0.24629974365234375, -0.23333740234375, -0.22037506103515625, -0.2074127197265625, -0.19445037841796875, -0.181488037109375, -0.16852569580078125, -0.1555633544921875, -0.14260101318359375, -0.129638671875, -0.11667633056640625, -0.1037139892578125, -0.09075164794921875, -0.077789306640625, -0.06482696533203125, -0.0518646240234375, -0.03890228271484375, -0.02593994140625, -0.01297760009765625, -1.52587890625e-05, 0.01294708251953125, 0.025909423828125, 0.03887176513671875, 0.0518341064453125, 0.06479644775390625, 0.0777587890625, 0.09072113037109375, 0.1036834716796875, 0.11664581298828125, 0.129608154296875, 0.14257049560546875, 0.1555328369140625, 0.16849517822265625, 0.18145751953125, 0.19441986083984375, 0.2073822021484375, 0.22034454345703125, 0.233306884765625, 0.24626922607421875, 0.2592315673828125, 0.27219390869140625, 0.28515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 8.0, 14.0, 17.0, 23.0, 38.0, 40.0, 47.0, 59.0, 66.0, 75.0, 91.0, 84.0, 82.0, 71.0, 51.0, 50.0, 39.0, 36.0, 23.0, 25.0, 17.0, 13.0, 6.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00010460615158081055, -0.00010221637785434723, -9.982660412788391e-05, -9.74368304014206e-05, -9.504705667495728e-05, -9.265728294849396e-05, -9.026750922203064e-05, -8.787773549556732e-05, -8.5487961769104e-05, -8.309818804264069e-05, -8.070841431617737e-05, -7.831864058971405e-05, -7.592886686325073e-05, -7.353909313678741e-05, -7.11493194103241e-05, -6.875954568386078e-05, -6.636977195739746e-05, -6.397999823093414e-05, -6.159022450447083e-05, -5.920045077800751e-05, -5.681067705154419e-05, -5.442090332508087e-05, -5.2031129598617554e-05, -4.9641355872154236e-05, -4.725158214569092e-05, -4.48618084192276e-05, -4.247203469276428e-05, -4.0082260966300964e-05, -3.7692487239837646e-05, -3.530271351337433e-05, -3.291293978691101e-05, -3.052316606044769e-05, -2.8133392333984375e-05, -2.5743618607521057e-05, -2.335384488105774e-05, -2.096407115459442e-05, -1.8574297428131104e-05, -1.6184523701667786e-05, -1.3794749975204468e-05, -1.140497624874115e-05, -9.015202522277832e-06, -6.625428795814514e-06, -4.235655069351196e-06, -1.8458813428878784e-06, 5.438923835754395e-07, 2.9336661100387573e-06, 5.323439836502075e-06, 7.713213562965393e-06, 1.0102987289428711e-05, 1.2492761015892029e-05, 1.4882534742355347e-05, 1.7272308468818665e-05, 1.9662082195281982e-05, 2.20518559217453e-05, 2.4441629648208618e-05, 2.6831403374671936e-05, 2.9221177101135254e-05, 3.161095082759857e-05, 3.400072455406189e-05, 3.639049828052521e-05, 3.8780272006988525e-05, 4.117004573345184e-05, 4.355981945991516e-05, 4.594959318637848e-05, 4.83393669128418e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 8.0, 6.0, 14.0, 22.0, 30.0, 47.0, 78.0, 109.0, 204.0, 405.0, 957.0, 2346.0, 7318.0, 38546.0, 560956.0, 398654.0, 28938.0, 6211.0, 1990.0, 824.0, 373.0, 220.0, 111.0, 58.0, 42.0, 27.0, 17.0, 13.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27490234375, -0.2653999328613281, -0.25589752197265625, -0.24639511108398438, -0.2368927001953125, -0.22739028930664062, -0.21788787841796875, -0.20838546752929688, -0.198883056640625, -0.18938064575195312, -0.17987823486328125, -0.17037582397460938, -0.1608734130859375, -0.15137100219726562, -0.14186859130859375, -0.13236618041992188, -0.12286376953125, -0.11336135864257812, -0.10385894775390625, -0.09435653686523438, -0.0848541259765625, -0.07535171508789062, -0.06584930419921875, -0.056346893310546875, -0.046844482421875, -0.037342071533203125, -0.02783966064453125, -0.018337249755859375, -0.0088348388671875, 0.000667572021484375, 0.01016998291015625, 0.019672393798828125, 0.0291748046875, 0.038677215576171875, 0.04817962646484375, 0.057682037353515625, 0.0671844482421875, 0.07668685913085938, 0.08618927001953125, 0.09569168090820312, 0.105194091796875, 0.11469650268554688, 0.12419891357421875, 0.13370132446289062, 0.1432037353515625, 0.15270614624023438, 0.16220855712890625, 0.17171096801757812, 0.18121337890625, 0.19071578979492188, 0.20021820068359375, 0.20972061157226562, 0.2192230224609375, 0.22872543334960938, 0.23822784423828125, 0.24773025512695312, 0.257232666015625, 0.2667350769042969, 0.27623748779296875, 0.2857398986816406, 0.2952423095703125, 0.3047447204589844, 0.31424713134765625, 0.3237495422363281, 0.333251953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 3.0, 6.0, 6.0, 5.0, 11.0, 15.0, 26.0, 35.0, 31.0, 53.0, 53.0, 71.0, 78.0, 96.0, 102.0, 85.0, 58.0, 66.0, 52.0, 29.0, 30.0, 19.0, 19.0, 9.0, 6.0, 5.0, 4.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.154052734375, -0.148712158203125, -0.14337158203125, -0.138031005859375, -0.1326904296875, -0.127349853515625, -0.12200927734375, -0.116668701171875, -0.111328125, -0.105987548828125, -0.10064697265625, -0.095306396484375, -0.0899658203125, -0.084625244140625, -0.07928466796875, -0.073944091796875, -0.068603515625, -0.063262939453125, -0.05792236328125, -0.052581787109375, -0.0472412109375, -0.041900634765625, -0.03656005859375, -0.031219482421875, -0.02587890625, -0.020538330078125, -0.01519775390625, -0.009857177734375, -0.0045166015625, 0.000823974609375, 0.00616455078125, 0.011505126953125, 0.016845703125, 0.022186279296875, 0.02752685546875, 0.032867431640625, 0.0382080078125, 0.043548583984375, 0.04888916015625, 0.054229736328125, 0.0595703125, 0.064910888671875, 0.07025146484375, 0.075592041015625, 0.0809326171875, 0.086273193359375, 0.09161376953125, 0.096954345703125, 0.102294921875, 0.107635498046875, 0.11297607421875, 0.118316650390625, 0.1236572265625, 0.128997802734375, 0.13433837890625, 0.139678955078125, 0.14501953125, 0.150360107421875, 0.15570068359375, 0.161041259765625, 0.1663818359375, 0.171722412109375, 0.17706298828125, 0.182403564453125, 0.187744140625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 25.0, 94.0, 198.0, 304.0, 236.0, 85.0, 39.0, 8.0, 5.0, 1.0, 0.0, 3.0, 2.0], "bins": [-9.819957733154297, -9.640528678894043, -9.461099624633789, -9.281670570373535, -9.102241516113281, -8.922812461853027, -8.743383407592773, -8.563955307006836, -8.384526252746582, -8.205097198486328, -8.025668144226074, -7.84623908996582, -7.666810512542725, -7.487381458282471, -7.307952404022217, -7.128523349761963, -6.949093818664551, -6.769664764404297, -6.590235710144043, -6.410806655883789, -6.231378078460693, -6.0519490242004395, -5.8725199699401855, -5.693090915679932, -5.513662338256836, -5.334233283996582, -5.154804229736328, -4.975375175476074, -4.7959465980529785, -4.616517543792725, -4.437088489532471, -4.257659435272217, -4.078230381011963, -3.898801326751709, -3.719372510910034, -3.5399434566497803, -3.3605144023895264, -3.1810855865478516, -3.0016565322875977, -2.8222274780273438, -2.64279842376709, -2.463369369506836, -2.283940553665161, -2.1045114994049072, -1.9250824451446533, -1.745653510093689, -1.5662245750427246, -1.3867955207824707, -1.207366704940796, -1.0279377698898315, -0.8485087156295776, -0.6690797805786133, -0.48965078592300415, -0.310221791267395, -0.13079285621643066, 0.04863619804382324, 0.2280651330947876, 0.40749412775039673, 0.5869231224060059, 0.7663520574569702, 0.9457810521125793, 1.1252100467681885, 1.3046389818191528, 1.4840680360794067, 1.663496971130371]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 9.0, 10.0, 14.0, 12.0, 8.0, 13.0, 21.0, 16.0, 22.0, 30.0, 34.0, 24.0, 28.0, 29.0, 41.0, 39.0, 56.0, 43.0, 53.0, 45.0, 39.0, 43.0, 51.0, 34.0, 33.0, 41.0, 34.0, 38.0, 30.0, 20.0, 15.0, 13.0, 12.0, 7.0, 7.0, 10.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6344897747039795, -1.5825459957122803, -1.530602216720581, -1.4786584377288818, -1.4267146587371826, -1.3747708797454834, -1.3228269815444946, -1.2708832025527954, -1.2189394235610962, -1.166995644569397, -1.1150518655776978, -1.0631080865859985, -1.0111641883850098, -0.9592204689979553, -0.9072766304016113, -0.8553328514099121, -0.8033890724182129, -0.7514452934265137, -0.6995015144348145, -0.6475576758384705, -0.5956138968467712, -0.543670117855072, -0.4917263090610504, -0.4397825002670288, -0.3878387212753296, -0.33589494228363037, -0.28395113348960876, -0.23200733959674835, -0.18006354570388794, -0.12811976671218872, -0.07617595791816711, -0.024232149124145508, 0.02771151065826416, 0.07965530455112457, 0.13159909844398499, 0.1835428923368454, 0.2354866862297058, 0.28743046522140503, 0.33937427401542664, 0.39131808280944824, 0.44326186180114746, 0.4952056407928467, 0.5471494197845459, 0.5990932583808899, 0.6510370373725891, 0.7029808163642883, 0.7549246549606323, 0.8068684339523315, 0.8588122129440308, 0.91075599193573, 0.9626997709274292, 1.0146435499191284, 1.0665874481201172, 1.1185312271118164, 1.1704750061035156, 1.2224187850952148, 1.274362564086914, 1.3263063430786133, 1.3782501220703125, 1.4301939010620117, 1.482137680053711, 1.5340814590454102, 1.586025357246399, 1.6379691362380981, 1.6899129152297974]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 2.0, 10.0, 8.0, 7.0, 12.0, 35.0, 23.0, 59.0, 70.0, 91.0, 131.0, 182.0, 263.0, 341.0, 574.0, 844.0, 1394.0, 2487.0, 5183.0, 14126.0, 85795.0, 4011490.0, 50093.0, 10967.0, 4217.0, 2177.0, 1255.0, 761.0, 505.0, 333.0, 219.0, 166.0, 112.0, 90.0, 58.0, 48.0, 37.0, 35.0, 15.0, 27.0, 7.0, 7.0, 8.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2872352600097656, -0.27808380126953125, -0.2689323425292969, -0.2597808837890625, -0.2506294250488281, -0.24147796630859375, -0.23232650756835938, -0.223175048828125, -0.21402359008789062, -0.20487213134765625, -0.19572067260742188, -0.1865692138671875, -0.17741775512695312, -0.16826629638671875, -0.15911483764648438, -0.14996337890625, -0.14081192016601562, -0.13166046142578125, -0.12250900268554688, -0.1133575439453125, -0.10420608520507812, -0.09505462646484375, -0.08590316772460938, -0.076751708984375, -0.06760025024414062, -0.05844879150390625, -0.049297332763671875, -0.0401458740234375, -0.030994415283203125, -0.02184295654296875, -0.012691497802734375, -0.0035400390625, 0.005611419677734375, 0.01476287841796875, 0.023914337158203125, 0.0330657958984375, 0.042217254638671875, 0.05136871337890625, 0.060520172119140625, 0.069671630859375, 0.07882308959960938, 0.08797454833984375, 0.09712600708007812, 0.1062774658203125, 0.11542892456054688, 0.12458038330078125, 0.13373184204101562, 0.14288330078125, 0.15203475952148438, 0.16118621826171875, 0.17033767700195312, 0.1794891357421875, 0.18864059448242188, 0.19779205322265625, 0.20694351196289062, 0.216094970703125, 0.22524642944335938, 0.23439788818359375, 0.24354934692382812, 0.2527008056640625, 0.2618522644042969, 0.27100372314453125, 0.2801551818847656, 0.289306640625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 6.0, 11.0, 12.0, 11.0, 27.0, 27.0, 29.0, 39.0, 51.0, 56.0, 65.0, 69.0, 76.0, 82.0, 72.0, 56.0, 68.0, 57.0, 35.0, 38.0, 25.0, 27.0, 14.0, 15.0, 11.0, 7.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07501220703125, -0.07204246520996094, -0.06907272338867188, -0.06610298156738281, -0.06313323974609375, -0.06016349792480469, -0.057193756103515625, -0.05422401428222656, -0.0512542724609375, -0.04828453063964844, -0.045314788818359375, -0.04234504699707031, -0.03937530517578125, -0.03640556335449219, -0.033435821533203125, -0.030466079711914062, -0.027496337890625, -0.024526596069335938, -0.021556854248046875, -0.018587112426757812, -0.01561737060546875, -0.012647628784179688, -0.009677886962890625, -0.0067081451416015625, -0.0037384033203125, -0.0007686614990234375, 0.002201080322265625, 0.0051708221435546875, 0.00814056396484375, 0.011110305786132812, 0.014080047607421875, 0.017049789428710938, 0.02001953125, 0.022989273071289062, 0.025959014892578125, 0.028928756713867188, 0.03189849853515625, 0.03486824035644531, 0.037837982177734375, 0.04080772399902344, 0.0437774658203125, 0.04674720764160156, 0.049716949462890625, 0.05268669128417969, 0.05565643310546875, 0.05862617492675781, 0.061595916748046875, 0.06456565856933594, 0.067535400390625, 0.07050514221191406, 0.07347488403320312, 0.07644462585449219, 0.07941436767578125, 0.08238410949707031, 0.08535385131835938, 0.08832359313964844, 0.0912933349609375, 0.09426307678222656, 0.09723281860351562, 0.10020256042480469, 0.10317230224609375, 0.10614204406738281, 0.10911178588867188, 0.11208152770996094, 0.11505126953125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 8.0, 17.0, 16.0, 37.0, 55.0, 69.0, 81.0, 132.0, 225.0, 482.0, 1191.0, 5659.0, 3658408.0, 520271.0, 5464.0, 1092.0, 393.0, 229.0, 132.0, 100.0, 61.0, 41.0, 27.0, 21.0, 18.0, 22.0, 4.0, 10.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.322265625, -1.2821807861328125, -1.242095947265625, -1.2020111083984375, -1.16192626953125, -1.1218414306640625, -1.081756591796875, -1.0416717529296875, -1.0015869140625, -0.9615020751953125, -0.921417236328125, -0.8813323974609375, -0.84124755859375, -0.8011627197265625, -0.761077880859375, -0.7209930419921875, -0.680908203125, -0.6408233642578125, -0.600738525390625, -0.5606536865234375, -0.52056884765625, -0.4804840087890625, -0.440399169921875, -0.4003143310546875, -0.3602294921875, -0.3201446533203125, -0.280059814453125, -0.2399749755859375, -0.19989013671875, -0.1598052978515625, -0.119720458984375, -0.0796356201171875, -0.03955078125, 0.0005340576171875, 0.040618896484375, 0.0807037353515625, 0.12078857421875, 0.1608734130859375, 0.200958251953125, 0.2410430908203125, 0.2811279296875, 0.3212127685546875, 0.361297607421875, 0.4013824462890625, 0.44146728515625, 0.4815521240234375, 0.521636962890625, 0.5617218017578125, 0.601806640625, 0.6418914794921875, 0.681976318359375, 0.7220611572265625, 0.76214599609375, 0.8022308349609375, 0.842315673828125, 0.8824005126953125, 0.9224853515625, 0.9625701904296875, 1.002655029296875, 1.0427398681640625, 1.08282470703125, 1.1229095458984375, 1.162994384765625, 1.2030792236328125, 1.2431640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 20.0, 41.0, 237.0, 3658.0, 76.0, 29.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.233154296875, -0.22516250610351562, -0.21717071533203125, -0.20917892456054688, -0.2011871337890625, -0.19319534301757812, -0.18520355224609375, -0.17721176147460938, -0.169219970703125, -0.16122817993164062, -0.15323638916015625, -0.14524459838867188, -0.1372528076171875, -0.12926101684570312, -0.12126922607421875, -0.11327743530273438, -0.10528564453125, -0.09729385375976562, -0.08930206298828125, -0.08131027221679688, -0.0733184814453125, -0.06532669067382812, -0.05733489990234375, -0.049343109130859375, -0.041351318359375, -0.033359527587890625, -0.02536773681640625, -0.017375946044921875, -0.0093841552734375, -0.001392364501953125, 0.00659942626953125, 0.014591217041015625, 0.0225830078125, 0.030574798583984375, 0.03856658935546875, 0.046558380126953125, 0.0545501708984375, 0.06254196166992188, 0.07053375244140625, 0.07852554321289062, 0.086517333984375, 0.09450912475585938, 0.10250091552734375, 0.11049270629882812, 0.1184844970703125, 0.12647628784179688, 0.13446807861328125, 0.14245986938476562, 0.15045166015625, 0.15844345092773438, 0.16643524169921875, 0.17442703247070312, 0.1824188232421875, 0.19041061401367188, 0.19840240478515625, 0.20639419555664062, 0.214385986328125, 0.22237777709960938, 0.23036956787109375, 0.23836135864257812, 0.2463531494140625, 0.2543449401855469, 0.26233673095703125, 0.2703285217285156, 0.2783203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 17.0, 10.0, 33.0, 45.0, 72.0, 104.0, 141.0, 157.0, 148.0, 103.0, 63.0, 45.0, 26.0, 12.0, 11.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2764352560043335, -0.26142966747283936, -0.24642407894134521, -0.23141850531101227, -0.21641291677951813, -0.201407328248024, -0.18640175461769104, -0.1713961660861969, -0.15639057755470276, -0.14138498902320862, -0.12637940049171448, -0.11137382686138153, -0.09636823832988739, -0.08136264979839325, -0.0663570687174797, -0.05135148763656616, -0.03634589910507202, -0.02134031429886818, -0.006334729492664337, 0.008670855313539505, 0.023676440119743347, 0.03868202865123749, 0.05368760973215103, 0.06869319081306458, 0.08369877934455872, 0.09870436787605286, 0.1137099489569664, 0.12871553003787994, 0.14372111856937408, 0.15872670710086823, 0.17373228073120117, 0.1887378692626953, 0.20374345779418945, 0.2187490463256836, 0.23375463485717773, 0.24876020848751068, 0.263765811920166, 0.27877140045166016, 0.2937769591808319, 0.30878254771232605, 0.3237881362438202, 0.33879372477531433, 0.35379931330680847, 0.3688049018383026, 0.38381046056747437, 0.3988160490989685, 0.41382163763046265, 0.4288272261619568, 0.4438328146934509, 0.45883840322494507, 0.4738439917564392, 0.48884958028793335, 0.5038551688194275, 0.5188607573509216, 0.5338663458824158, 0.5488718748092651, 0.5638774633407593, 0.5788830518722534, 0.5938886404037476, 0.6088942289352417, 0.6238998174667358, 0.63890540599823, 0.6539109945297241, 0.6689165830612183, 0.6839221715927124]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 3.0, 7.0, 10.0, 9.0, 16.0, 16.0, 19.0, 12.0, 13.0, 31.0, 31.0, 38.0, 31.0, 43.0, 38.0, 34.0, 46.0, 57.0, 49.0, 43.0, 53.0, 49.0, 42.0, 39.0, 39.0, 38.0, 22.0, 22.0, 30.0, 20.0, 17.0, 14.0, 11.0, 13.0, 12.0, 9.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.23510068655014038, -0.22808532416820526, -0.22106997668743134, -0.21405461430549622, -0.2070392519235611, -0.20002388954162598, -0.19300854206085205, -0.18599317967891693, -0.1789778172969818, -0.1719624549150467, -0.16494710743427277, -0.15793174505233765, -0.15091638267040253, -0.1439010202884674, -0.13688567280769348, -0.12987031042575836, -0.12285496294498444, -0.11583960801362991, -0.1088242456316948, -0.10180889070034027, -0.09479352831840515, -0.08777817338705063, -0.0807628184556961, -0.07374745607376099, -0.06673210114240646, -0.05971674248576164, -0.05270138382911682, -0.0456860288977623, -0.03867067024111748, -0.031655311584472656, -0.024639956653118134, -0.017624597996473312, -0.010609239339828491, -0.0035938816145062447, 0.003421476110816002, 0.010436832904815674, 0.017452191561460495, 0.024467550218105316, 0.03148290514945984, 0.03849826380610466, 0.04551362246274948, 0.0525289811193943, 0.059544339776039124, 0.06655969470739365, 0.07357504963874817, 0.08059041202068329, 0.08760576695203781, 0.09462112188339233, 0.10163648426532745, 0.10865183919668198, 0.1156672015786171, 0.12268255650997162, 0.12969791889190674, 0.13671326637268066, 0.14372862875461578, 0.1507439911365509, 0.15775933861732483, 0.16477470099925995, 0.17179004848003387, 0.178805410861969, 0.1858207732439041, 0.19283613562583923, 0.19985148310661316, 0.20686684548854828, 0.2138822078704834]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 10.0, 14.0, 18.0, 36.0, 40.0, 84.0, 151.0, 270.0, 466.0, 923.0, 1872.0, 3942.0, 8810.0, 21948.0, 58105.0, 160947.0, 339843.0, 274669.0, 109174.0, 39879.0, 15327.0, 6338.0, 2831.0, 1307.0, 655.0, 389.0, 195.0, 116.0, 75.0, 38.0, 26.0, 17.0, 8.0, 7.0, 6.0, 6.0, 3.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.16463470458984375, -0.1584930419921875, -0.15235137939453125, -0.146209716796875, -0.14006805419921875, -0.1339263916015625, -0.12778472900390625, -0.12164306640625, -0.11550140380859375, -0.1093597412109375, -0.10321807861328125, -0.097076416015625, -0.09093475341796875, -0.0847930908203125, -0.07865142822265625, -0.072509765625, -0.06636810302734375, -0.0602264404296875, -0.05408477783203125, -0.047943115234375, -0.04180145263671875, -0.0356597900390625, -0.02951812744140625, -0.02337646484375, -0.01723480224609375, -0.0110931396484375, -0.00495147705078125, 0.001190185546875, 0.00733184814453125, 0.0134735107421875, 0.01961517333984375, 0.0257568359375, 0.03189849853515625, 0.0380401611328125, 0.04418182373046875, 0.050323486328125, 0.05646514892578125, 0.0626068115234375, 0.06874847412109375, 0.07489013671875, 0.08103179931640625, 0.0871734619140625, 0.09331512451171875, 0.099456787109375, 0.10559844970703125, 0.1117401123046875, 0.11788177490234375, 0.1240234375, 0.13016510009765625, 0.1363067626953125, 0.14244842529296875, 0.148590087890625, 0.15473175048828125, 0.1608734130859375, 0.16701507568359375, 0.17315673828125, 0.17929840087890625, 0.1854400634765625, 0.19158172607421875, 0.197723388671875, 0.20386505126953125, 0.2100067138671875, 0.21614837646484375, 0.2222900390625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 7.0, 17.0, 16.0, 18.0, 21.0, 30.0, 37.0, 52.0, 57.0, 46.0, 41.0, 56.0, 48.0, 71.0, 65.0, 56.0, 57.0, 49.0, 45.0, 25.0, 33.0, 26.0, 28.0, 19.0, 20.0, 11.0, 4.0, 7.0, 5.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0731201171875, -0.07024288177490234, -0.06736564636230469, -0.06448841094970703, -0.061611175537109375, -0.05873394012451172, -0.05585670471191406, -0.052979469299316406, -0.05010223388671875, -0.047224998474121094, -0.04434776306152344, -0.04147052764892578, -0.038593292236328125, -0.03571605682373047, -0.03283882141113281, -0.029961585998535156, -0.0270843505859375, -0.024207115173339844, -0.021329879760742188, -0.01845264434814453, -0.015575408935546875, -0.012698173522949219, -0.009820938110351562, -0.006943702697753906, -0.00406646728515625, -0.0011892318725585938, 0.0016880035400390625, 0.004565238952636719, 0.007442474365234375, 0.010319709777832031, 0.013196945190429688, 0.016074180603027344, 0.018951416015625, 0.021828651428222656, 0.024705886840820312, 0.02758312225341797, 0.030460357666015625, 0.03333759307861328, 0.03621482849121094, 0.039092063903808594, 0.04196929931640625, 0.044846534729003906, 0.04772377014160156, 0.05060100555419922, 0.053478240966796875, 0.05635547637939453, 0.05923271179199219, 0.062109947204589844, 0.0649871826171875, 0.06786441802978516, 0.07074165344238281, 0.07361888885498047, 0.07649612426757812, 0.07937335968017578, 0.08225059509277344, 0.0851278305053711, 0.08800506591796875, 0.0908823013305664, 0.09375953674316406, 0.09663677215576172, 0.09951400756835938, 0.10239124298095703, 0.10526847839355469, 0.10814571380615234, 0.11102294921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 8.0, 13.0, 19.0, 28.0, 47.0, 53.0, 73.0, 103.0, 149.0, 230.0, 323.0, 552.0, 995.0, 1876.0, 4399.0, 15306.0, 82925.0, 547758.0, 330516.0, 46266.0, 10027.0, 3204.0, 1391.0, 787.0, 485.0, 318.0, 230.0, 127.0, 85.0, 67.0, 66.0, 31.0, 28.0, 24.0, 10.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39794921875, -0.38652801513671875, -0.3751068115234375, -0.36368560791015625, -0.352264404296875, -0.34084320068359375, -0.3294219970703125, -0.31800079345703125, -0.30657958984375, -0.29515838623046875, -0.2837371826171875, -0.27231597900390625, -0.260894775390625, -0.24947357177734375, -0.2380523681640625, -0.22663116455078125, -0.2152099609375, -0.20378875732421875, -0.1923675537109375, -0.18094635009765625, -0.169525146484375, -0.15810394287109375, -0.1466827392578125, -0.13526153564453125, -0.12384033203125, -0.11241912841796875, -0.1009979248046875, -0.08957672119140625, -0.078155517578125, -0.06673431396484375, -0.0553131103515625, -0.04389190673828125, -0.032470703125, -0.02104949951171875, -0.0096282958984375, 0.00179290771484375, 0.013214111328125, 0.02463531494140625, 0.0360565185546875, 0.04747772216796875, 0.05889892578125, 0.07032012939453125, 0.0817413330078125, 0.09316253662109375, 0.104583740234375, 0.11600494384765625, 0.1274261474609375, 0.13884735107421875, 0.1502685546875, 0.16168975830078125, 0.1731109619140625, 0.18453216552734375, 0.195953369140625, 0.20737457275390625, 0.2187957763671875, 0.23021697998046875, 0.24163818359375, 0.25305938720703125, 0.2644805908203125, 0.27590179443359375, 0.287322998046875, 0.29874420166015625, 0.3101654052734375, 0.32158660888671875, 0.3330078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 6.0, 5.0, 6.0, 4.0, 6.0, 14.0, 20.0, 14.0, 12.0, 15.0, 24.0, 37.0, 28.0, 43.0, 36.0, 37.0, 56.0, 36.0, 46.0, 53.0, 42.0, 38.0, 35.0, 44.0, 32.0, 39.0, 47.0, 29.0, 36.0, 32.0, 27.0, 12.0, 17.0, 14.0, 10.0, 15.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3729896545410156, -0.36048126220703125, -0.3479728698730469, -0.3354644775390625, -0.3229560852050781, -0.31044769287109375, -0.2979393005371094, -0.285430908203125, -0.2729225158691406, -0.26041412353515625, -0.24790573120117188, -0.2353973388671875, -0.22288894653320312, -0.21038055419921875, -0.19787216186523438, -0.18536376953125, -0.17285537719726562, -0.16034698486328125, -0.14783859252929688, -0.1353302001953125, -0.12282180786132812, -0.11031341552734375, -0.09780502319335938, -0.085296630859375, -0.07278823852539062, -0.06027984619140625, -0.047771453857421875, -0.0352630615234375, -0.022754669189453125, -0.01024627685546875, 0.002262115478515625, 0.0147705078125, 0.027278900146484375, 0.03978729248046875, 0.052295684814453125, 0.0648040771484375, 0.07731246948242188, 0.08982086181640625, 0.10232925415039062, 0.114837646484375, 0.12734603881835938, 0.13985443115234375, 0.15236282348632812, 0.1648712158203125, 0.17737960815429688, 0.18988800048828125, 0.20239639282226562, 0.21490478515625, 0.22741317749023438, 0.23992156982421875, 0.2524299621582031, 0.2649383544921875, 0.2774467468261719, 0.28995513916015625, 0.3024635314941406, 0.314971923828125, 0.3274803161621094, 0.33998870849609375, 0.3524971008300781, 0.3650054931640625, 0.3775138854980469, 0.39002227783203125, 0.4025306701660156, 0.4150390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 8.0, 5.0, 10.0, 9.0, 9.0, 30.0, 55.0, 41.0, 117.0, 179.0, 349.0, 801.0, 1879.0, 6298.0, 30701.0, 294831.0, 625264.0, 71672.0, 11140.0, 2930.0, 1106.0, 506.0, 267.0, 157.0, 69.0, 46.0, 31.0, 10.0, 16.0, 6.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.18652725219726562, -0.18054962158203125, -0.17457199096679688, -0.1685943603515625, -0.16261672973632812, -0.15663909912109375, -0.15066146850585938, -0.144683837890625, -0.13870620727539062, -0.13272857666015625, -0.12675094604492188, -0.1207733154296875, -0.11479568481445312, -0.10881805419921875, -0.10284042358398438, -0.09686279296875, -0.09088516235351562, -0.08490753173828125, -0.07892990112304688, -0.0729522705078125, -0.06697463989257812, -0.06099700927734375, -0.055019378662109375, -0.049041748046875, -0.043064117431640625, -0.03708648681640625, -0.031108856201171875, -0.0251312255859375, -0.019153594970703125, -0.01317596435546875, -0.007198333740234375, -0.001220703125, 0.004756927490234375, 0.01073455810546875, 0.016712188720703125, 0.0226898193359375, 0.028667449951171875, 0.03464508056640625, 0.040622711181640625, 0.046600341796875, 0.052577972412109375, 0.05855560302734375, 0.06453323364257812, 0.0705108642578125, 0.07648849487304688, 0.08246612548828125, 0.08844375610351562, 0.09442138671875, 0.10039901733398438, 0.10637664794921875, 0.11235427856445312, 0.1183319091796875, 0.12430953979492188, 0.13028717041015625, 0.13626480102539062, 0.142242431640625, 0.14822006225585938, 0.15419769287109375, 0.16017532348632812, 0.1661529541015625, 0.17213058471679688, 0.17810821533203125, 0.18408584594726562, 0.1900634765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 4.0, 6.0, 15.0, 14.0, 11.0, 21.0, 27.0, 24.0, 44.0, 50.0, 65.0, 87.0, 86.0, 93.0, 77.0, 80.0, 64.0, 51.0, 28.0, 50.0, 25.0, 21.0, 9.0, 18.0, 8.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.963180541992188e-05, -7.7015720307827e-05, -7.439963519573212e-05, -7.178355008363724e-05, -6.916746497154236e-05, -6.655137985944748e-05, -6.39352947473526e-05, -6.131920963525772e-05, -5.870312452316284e-05, -5.608703941106796e-05, -5.3470954298973083e-05, -5.0854869186878204e-05, -4.8238784074783325e-05, -4.5622698962688446e-05, -4.300661385059357e-05, -4.039052873849869e-05, -3.777444362640381e-05, -3.515835851430893e-05, -3.254227340221405e-05, -2.992618829011917e-05, -2.7310103178024292e-05, -2.4694018065929413e-05, -2.2077932953834534e-05, -1.9461847841739655e-05, -1.6845762729644775e-05, -1.4229677617549896e-05, -1.1613592505455017e-05, -8.997507393360138e-06, -6.381422281265259e-06, -3.7653371691703796e-06, -1.1492520570755005e-06, 1.4668330550193787e-06, 4.082918167114258e-06, 6.699003279209137e-06, 9.315088391304016e-06, 1.1931173503398895e-05, 1.4547258615493774e-05, 1.7163343727588654e-05, 1.9779428839683533e-05, 2.2395513951778412e-05, 2.501159906387329e-05, 2.762768417596817e-05, 3.024376928806305e-05, 3.285985440015793e-05, 3.547593951225281e-05, 3.809202462434769e-05, 4.0708109736442566e-05, 4.3324194848537445e-05, 4.5940279960632324e-05, 4.85563650727272e-05, 5.117245018482208e-05, 5.378853529691696e-05, 5.640462040901184e-05, 5.902070552110672e-05, 6.16367906332016e-05, 6.425287574529648e-05, 6.686896085739136e-05, 6.948504596948624e-05, 7.210113108158112e-05, 7.4717216193676e-05, 7.733330130577087e-05, 7.994938641786575e-05, 8.256547152996063e-05, 8.518155664205551e-05, 8.779764175415039e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 13.0, 12.0, 17.0, 27.0, 31.0, 45.0, 70.0, 119.0, 213.0, 386.0, 732.0, 1622.0, 4280.0, 15315.0, 102866.0, 648904.0, 234788.0, 28199.0, 6454.0, 2255.0, 978.0, 480.0, 276.0, 147.0, 93.0, 51.0, 52.0, 21.0, 17.0, 21.0, 14.0, 16.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1903076171875, -0.18482017517089844, -0.17933273315429688, -0.1738452911376953, -0.16835784912109375, -0.1628704071044922, -0.15738296508789062, -0.15189552307128906, -0.1464080810546875, -0.14092063903808594, -0.13543319702148438, -0.1299457550048828, -0.12445831298828125, -0.11897087097167969, -0.11348342895507812, -0.10799598693847656, -0.102508544921875, -0.09702110290527344, -0.09153366088867188, -0.08604621887207031, -0.08055877685546875, -0.07507133483886719, -0.06958389282226562, -0.06409645080566406, -0.0586090087890625, -0.05312156677246094, -0.047634124755859375, -0.04214668273925781, -0.03665924072265625, -0.031171798706054688, -0.025684356689453125, -0.020196914672851562, -0.01470947265625, -0.009222030639648438, -0.003734588623046875, 0.0017528533935546875, 0.00724029541015625, 0.012727737426757812, 0.018215179443359375, 0.023702621459960938, 0.0291900634765625, 0.03467750549316406, 0.040164947509765625, 0.04565238952636719, 0.05113983154296875, 0.05662727355957031, 0.062114715576171875, 0.06760215759277344, 0.073089599609375, 0.07857704162597656, 0.08406448364257812, 0.08955192565917969, 0.09503936767578125, 0.10052680969238281, 0.10601425170898438, 0.11150169372558594, 0.1169891357421875, 0.12247657775878906, 0.12796401977539062, 0.1334514617919922, 0.13893890380859375, 0.1444263458251953, 0.14991378784179688, 0.15540122985839844, 0.160888671875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 4.0, 7.0, 14.0, 25.0, 41.0, 52.0, 66.0, 84.0, 100.0, 113.0, 95.0, 82.0, 86.0, 82.0, 45.0, 29.0, 16.0, 14.0, 9.0, 5.0, 6.0, 7.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18310546875, -0.17737388610839844, -0.17164230346679688, -0.1659107208251953, -0.16017913818359375, -0.1544475555419922, -0.14871597290039062, -0.14298439025878906, -0.1372528076171875, -0.13152122497558594, -0.12578964233398438, -0.12005805969238281, -0.11432647705078125, -0.10859489440917969, -0.10286331176757812, -0.09713172912597656, -0.091400146484375, -0.08566856384277344, -0.07993698120117188, -0.07420539855957031, -0.06847381591796875, -0.06274223327636719, -0.057010650634765625, -0.05127906799316406, -0.0455474853515625, -0.03981590270996094, -0.034084320068359375, -0.028352737426757812, -0.02262115478515625, -0.016889572143554688, -0.011157989501953125, -0.0054264068603515625, 0.00030517578125, 0.0060367584228515625, 0.011768341064453125, 0.017499923706054688, 0.02323150634765625, 0.028963088989257812, 0.034694671630859375, 0.04042625427246094, 0.0461578369140625, 0.05188941955566406, 0.057621002197265625, 0.06335258483886719, 0.06908416748046875, 0.07481575012207031, 0.08054733276367188, 0.08627891540527344, 0.092010498046875, 0.09774208068847656, 0.10347366333007812, 0.10920524597167969, 0.11493682861328125, 0.12066841125488281, 0.12639999389648438, 0.13213157653808594, 0.1378631591796875, 0.14359474182128906, 0.14932632446289062, 0.1550579071044922, 0.16078948974609375, 0.1665210723876953, 0.17225265502929688, 0.17798423767089844, 0.1837158203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 12.0, 16.0, 20.0, 46.0, 63.0, 103.0, 134.0, 160.0, 136.0, 112.0, 85.0, 40.0, 34.0, 19.0, 9.0, 7.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.426270008087158, -2.3378474712371826, -2.249425172805786, -2.1610026359558105, -2.072580099105835, -1.9841578006744385, -1.895735263824463, -1.8073128461837769, -1.7188904285430908, -1.6304680109024048, -1.5420454740524292, -1.4536230564117432, -1.3652006387710571, -1.276778221130371, -1.1883556842803955, -1.0999332666397095, -1.0115107297897339, -0.9230882525444031, -0.834665834903717, -0.7462433576583862, -0.6578209400177002, -0.5693984627723694, -0.4809759855270386, -0.39255356788635254, -0.30413109064102173, -0.2157086431980133, -0.1272861808538437, -0.03886371850967407, 0.04955872893333435, 0.13798117637634277, 0.22640365362167358, 0.3148260712623596, 0.40324854850769043, 0.49167099595069885, 0.5800934433937073, 0.6685159206390381, 0.7569383382797241, 0.8453608155250549, 0.9337832927703857, 1.0222057104110718, 1.1106281280517578, 1.1990505456924438, 1.2874730825424194, 1.3758955001831055, 1.4643179178237915, 1.5527403354644775, 1.6411628723144531, 1.7295852899551392, 1.8180078268051147, 1.9064302444458008, 1.9948527812957764, 2.083275318145752, 2.1716976165771484, 2.260120153427124, 2.3485426902770996, 2.436964988708496, 2.5253875255584717, 2.6138100624084473, 2.7022323608398438, 2.7906548976898193, 2.879077434539795, 2.9674997329711914, 3.055922269821167, 3.1443448066711426, 3.232767105102539]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 11.0, 6.0, 7.0, 10.0, 15.0, 12.0, 16.0, 24.0, 15.0, 26.0, 32.0, 29.0, 35.0, 33.0, 41.0, 37.0, 45.0, 34.0, 46.0, 49.0, 43.0, 39.0, 42.0, 40.0, 37.0, 39.0, 36.0, 20.0, 31.0, 29.0, 13.0, 12.0, 14.0, 20.0, 12.0, 5.0, 6.0, 9.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.09592866897583, -2.039032459259033, -1.9821360111236572, -1.9252396821975708, -1.8683433532714844, -1.811447024345398, -1.7545506954193115, -1.697654366493225, -1.6407580375671387, -1.5838617086410522, -1.5269653797149658, -1.4700690507888794, -1.413172721862793, -1.3562763929367065, -1.2993800640106201, -1.2424837350845337, -1.1855874061584473, -1.1286910772323608, -1.0717947483062744, -1.014898419380188, -0.9580020904541016, -0.9011057615280151, -0.8442094326019287, -0.7873131036758423, -0.7304167747497559, -0.6735204458236694, -0.616624116897583, -0.5597277879714966, -0.5028314590454102, -0.44593513011932373, -0.3890388011932373, -0.3321424722671509, -0.275246262550354, -0.21834993362426758, -0.16145360469818115, -0.10455727577209473, -0.0476609468460083, 0.009235382080078125, 0.06613171100616455, 0.12302803993225098, 0.1799243688583374, 0.23682069778442383, 0.29371702671051025, 0.3506133556365967, 0.4075096845626831, 0.46440601348876953, 0.521302342414856, 0.5781986713409424, 0.6350950002670288, 0.6919913291931152, 0.7488876581192017, 0.8057839870452881, 0.8626803159713745, 0.9195766448974609, 0.9764729738235474, 1.0333693027496338, 1.0902656316757202, 1.1471619606018066, 1.204058289527893, 1.2609546184539795, 1.317850947380066, 1.3747472763061523, 1.4316436052322388, 1.4885399341583252, 1.5454362630844116]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 6.0, 7.0, 3.0, 9.0, 8.0, 6.0, 6.0, 8.0, 11.0, 18.0, 30.0, 26.0, 28.0, 57.0, 82.0, 99.0, 149.0, 237.0, 407.0, 577.0, 995.0, 1745.0, 3421.0, 7680.0, 21867.0, 171046.0, 3922996.0, 41231.0, 11226.0, 4707.0, 2221.0, 1248.0, 748.0, 412.0, 301.0, 184.0, 134.0, 90.0, 54.0, 45.0, 46.0, 24.0, 17.0, 17.0, 21.0, 12.0, 9.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.280517578125, -0.2718086242675781, -0.26309967041015625, -0.2543907165527344, -0.2456817626953125, -0.23697280883789062, -0.22826385498046875, -0.21955490112304688, -0.210845947265625, -0.20213699340820312, -0.19342803955078125, -0.18471908569335938, -0.1760101318359375, -0.16730117797851562, -0.15859222412109375, -0.14988327026367188, -0.14117431640625, -0.13246536254882812, -0.12375640869140625, -0.11504745483398438, -0.1063385009765625, -0.09762954711914062, -0.08892059326171875, -0.08021163940429688, -0.071502685546875, -0.06279373168945312, -0.05408477783203125, -0.045375823974609375, -0.0366668701171875, -0.027957916259765625, -0.01924896240234375, -0.010540008544921875, -0.0018310546875, 0.006877899169921875, 0.01558685302734375, 0.024295806884765625, 0.0330047607421875, 0.041713714599609375, 0.05042266845703125, 0.059131622314453125, 0.067840576171875, 0.07654953002929688, 0.08525848388671875, 0.09396743774414062, 0.1026763916015625, 0.11138534545898438, 0.12009429931640625, 0.12880325317382812, 0.13751220703125, 0.14622116088867188, 0.15493011474609375, 0.16363906860351562, 0.1723480224609375, 0.18105697631835938, 0.18976593017578125, 0.19847488403320312, 0.207183837890625, 0.21589279174804688, 0.22460174560546875, 0.23331069946289062, 0.2420196533203125, 0.2507286071777344, 0.25943756103515625, 0.2681465148925781, 0.27685546875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 11.0, 9.0, 18.0, 24.0, 26.0, 42.0, 44.0, 40.0, 46.0, 35.0, 54.0, 48.0, 45.0, 66.0, 45.0, 60.0, 52.0, 48.0, 50.0, 38.0, 39.0, 26.0, 24.0, 19.0, 18.0, 6.0, 11.0, 13.0, 9.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08465576171875, -0.08185863494873047, -0.07906150817871094, -0.0762643814086914, -0.07346725463867188, -0.07067012786865234, -0.06787300109863281, -0.06507587432861328, -0.06227874755859375, -0.05948162078857422, -0.05668449401855469, -0.053887367248535156, -0.051090240478515625, -0.048293113708496094, -0.04549598693847656, -0.04269886016845703, -0.0399017333984375, -0.03710460662841797, -0.03430747985839844, -0.031510353088378906, -0.028713226318359375, -0.025916099548339844, -0.023118972778320312, -0.02032184600830078, -0.01752471923828125, -0.014727592468261719, -0.011930465698242188, -0.009133338928222656, -0.006336212158203125, -0.0035390853881835938, -0.0007419586181640625, 0.0020551681518554688, 0.004852294921875, 0.007649421691894531, 0.010446548461914062, 0.013243675231933594, 0.016040802001953125, 0.018837928771972656, 0.021635055541992188, 0.02443218231201172, 0.02722930908203125, 0.03002643585205078, 0.03282356262207031, 0.035620689392089844, 0.038417816162109375, 0.041214942932128906, 0.04401206970214844, 0.04680919647216797, 0.0496063232421875, 0.05240345001220703, 0.05520057678222656, 0.057997703552246094, 0.060794830322265625, 0.06359195709228516, 0.06638908386230469, 0.06918621063232422, 0.07198333740234375, 0.07478046417236328, 0.07757759094238281, 0.08037471771240234, 0.08317184448242188, 0.0859689712524414, 0.08876609802246094, 0.09156322479248047, 0.0943603515625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 13.0, 9.0, 17.0, 11.0, 22.0, 29.0, 51.0, 66.0, 100.0, 141.0, 183.0, 306.0, 544.0, 889.0, 1731.0, 3225.0, 7229.0, 18783.0, 76370.0, 3873687.0, 164115.0, 27943.0, 9549.0, 4170.0, 2088.0, 1170.0, 671.0, 390.0, 253.0, 163.0, 108.0, 77.0, 44.0, 29.0, 21.0, 16.0, 15.0, 13.0, 4.0, 6.0, 9.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.27783203125, -0.2690582275390625, -0.260284423828125, -0.2515106201171875, -0.24273681640625, -0.2339630126953125, -0.225189208984375, -0.2164154052734375, -0.2076416015625, -0.1988677978515625, -0.190093994140625, -0.1813201904296875, -0.17254638671875, -0.1637725830078125, -0.154998779296875, -0.1462249755859375, -0.137451171875, -0.1286773681640625, -0.119903564453125, -0.1111297607421875, -0.10235595703125, -0.0935821533203125, -0.084808349609375, -0.0760345458984375, -0.0672607421875, -0.0584869384765625, -0.049713134765625, -0.0409393310546875, -0.03216552734375, -0.0233917236328125, -0.014617919921875, -0.0058441162109375, 0.0029296875, 0.0117034912109375, 0.020477294921875, 0.0292510986328125, 0.03802490234375, 0.0467987060546875, 0.055572509765625, 0.0643463134765625, 0.0731201171875, 0.0818939208984375, 0.090667724609375, 0.0994415283203125, 0.10821533203125, 0.1169891357421875, 0.125762939453125, 0.1345367431640625, 0.143310546875, 0.1520843505859375, 0.160858154296875, 0.1696319580078125, 0.17840576171875, 0.1871795654296875, 0.195953369140625, 0.2047271728515625, 0.2135009765625, 0.2222747802734375, 0.231048583984375, 0.2398223876953125, 0.24859619140625, 0.2573699951171875, 0.266143798828125, 0.2749176025390625, 0.28369140625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 3.0, 4.0, 10.0, 8.0, 12.0, 9.0, 12.0, 26.0, 52.0, 101.0, 411.0, 3115.0, 153.0, 57.0, 40.0, 15.0, 16.0, 12.0, 8.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09197998046875, -0.08929157257080078, -0.08660316467285156, -0.08391475677490234, -0.08122634887695312, -0.0785379409790039, -0.07584953308105469, -0.07316112518310547, -0.07047271728515625, -0.06778430938720703, -0.06509590148925781, -0.062407493591308594, -0.059719085693359375, -0.057030677795410156, -0.05434226989746094, -0.05165386199951172, -0.0489654541015625, -0.04627704620361328, -0.04358863830566406, -0.040900230407714844, -0.038211822509765625, -0.035523414611816406, -0.03283500671386719, -0.03014659881591797, -0.02745819091796875, -0.02476978302001953, -0.022081375122070312, -0.019392967224121094, -0.016704559326171875, -0.014016151428222656, -0.011327743530273438, -0.008639335632324219, -0.005950927734375, -0.0032625198364257812, -0.0005741119384765625, 0.0021142959594726562, 0.004802703857421875, 0.007491111755371094, 0.010179519653320312, 0.012867927551269531, 0.01555633544921875, 0.01824474334716797, 0.020933151245117188, 0.023621559143066406, 0.026309967041015625, 0.028998374938964844, 0.03168678283691406, 0.03437519073486328, 0.0370635986328125, 0.03975200653076172, 0.04244041442871094, 0.045128822326660156, 0.047817230224609375, 0.050505638122558594, 0.05319404602050781, 0.05588245391845703, 0.05857086181640625, 0.06125926971435547, 0.06394767761230469, 0.0666360855102539, 0.06932449340820312, 0.07201290130615234, 0.07470130920410156, 0.07738971710205078, 0.080078125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 7.0, 11.0, 19.0, 19.0, 41.0, 43.0, 70.0, 88.0, 104.0, 88.0, 117.0, 95.0, 89.0, 61.0, 51.0, 25.0, 24.0, 16.0, 12.0, 3.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2323429137468338, -0.22346237301826477, -0.21458184719085693, -0.2057013064622879, -0.19682076573371887, -0.18794023990631104, -0.179059699177742, -0.17017915844917297, -0.16129863262176514, -0.1524180918931961, -0.14353756606578827, -0.13465702533721924, -0.1257764995098114, -0.11689595878124237, -0.10801541805267334, -0.0991348847746849, -0.09025435149669647, -0.08137381821870804, -0.0724932849407196, -0.06361274421215057, -0.05473221093416214, -0.045851677656173706, -0.036971140652894974, -0.02809060364961624, -0.019210070371627808, -0.010329535230994225, -0.0014490000903606415, 0.007431535050272942, 0.016312070190906525, 0.02519260346889496, 0.03407314047217369, 0.04295367747545242, 0.05183419585227966, 0.0607147291302681, 0.06959526240825653, 0.07847580313682556, 0.087356336414814, 0.09623686969280243, 0.10511741042137146, 0.1139979436993599, 0.12287847697734833, 0.13175901770591736, 0.1406395435333252, 0.14952008426189423, 0.15840062499046326, 0.1672811508178711, 0.17616169154644012, 0.18504223227500916, 0.193922758102417, 0.20280329883098602, 0.21168382465839386, 0.2205643653869629, 0.22944489121437073, 0.23832543194293976, 0.2472059726715088, 0.2560864984989166, 0.26496702432632446, 0.2738475501537323, 0.2827281057834625, 0.29160863161087036, 0.3004891574382782, 0.30936968326568604, 0.31825023889541626, 0.3271307647228241, 0.3360113203525543]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 8.0, 6.0, 7.0, 9.0, 15.0, 9.0, 24.0, 24.0, 19.0, 25.0, 33.0, 32.0, 33.0, 34.0, 41.0, 47.0, 45.0, 42.0, 49.0, 47.0, 44.0, 50.0, 35.0, 35.0, 33.0, 32.0, 33.0, 35.0, 17.0, 18.0, 19.0, 16.0, 18.0, 11.0, 12.0, 11.0, 11.0, 1.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.14557647705078125, -0.1409279853105545, -0.13627947866916656, -0.13163098692893982, -0.12698249518871307, -0.12233399599790573, -0.11768549680709839, -0.11303700506687164, -0.1083885058760643, -0.10374000668525696, -0.09909151494503021, -0.09444301575422287, -0.08979451656341553, -0.08514602482318878, -0.08049752563238144, -0.0758490264415741, -0.07120053470134735, -0.06655203551054001, -0.06190354377031326, -0.05725504457950592, -0.052606549113988876, -0.04795805364847183, -0.04330955445766449, -0.038661058992147446, -0.0340125635266304, -0.029364068061113358, -0.024715570732951164, -0.02006707340478897, -0.015418577939271927, -0.010770082473754883, -0.0061215851455926895, -0.0014730878174304962, 0.003175407648086548, 0.007823904044926167, 0.012472400441765785, 0.01712089776992798, 0.021769393235445023, 0.026417888700962067, 0.03106638602912426, 0.03571488335728645, 0.0403633788228035, 0.04501187428832054, 0.049660369753837585, 0.05430886894464493, 0.05895736441016197, 0.06360585987567902, 0.06825435906648636, 0.0729028582572937, 0.07755134999752045, 0.08219984918832779, 0.08684834092855453, 0.09149684011936188, 0.09614533185958862, 0.10079383105039597, 0.10544233024120331, 0.11009082198143005, 0.1147393211722374, 0.11938782036304474, 0.12403631210327148, 0.12868480384349823, 0.13333331048488617, 0.13798180222511292, 0.14263029396533966, 0.1472788006067276, 0.15192729234695435]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 12.0, 17.0, 20.0, 37.0, 45.0, 73.0, 173.0, 324.0, 699.0, 1730.0, 4334.0, 12297.0, 39245.0, 136782.0, 372370.0, 324671.0, 108466.0, 31119.0, 9955.0, 3513.0, 1390.0, 602.0, 297.0, 155.0, 97.0, 44.0, 25.0, 15.0, 14.0, 11.0, 6.0, 4.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2242431640625, -0.21742820739746094, -0.21061325073242188, -0.2037982940673828, -0.19698333740234375, -0.1901683807373047, -0.18335342407226562, -0.17653846740722656, -0.1697235107421875, -0.16290855407714844, -0.15609359741210938, -0.1492786407470703, -0.14246368408203125, -0.1356487274169922, -0.12883377075195312, -0.12201881408691406, -0.115203857421875, -0.10838890075683594, -0.10157394409179688, -0.09475898742675781, -0.08794403076171875, -0.08112907409667969, -0.07431411743164062, -0.06749916076660156, -0.0606842041015625, -0.05386924743652344, -0.047054290771484375, -0.04023933410644531, -0.03342437744140625, -0.026609420776367188, -0.019794464111328125, -0.012979507446289062, -0.00616455078125, 0.0006504058837890625, 0.007465362548828125, 0.014280319213867188, 0.02109527587890625, 0.027910232543945312, 0.034725189208984375, 0.04154014587402344, 0.0483551025390625, 0.05517005920410156, 0.061985015869140625, 0.06879997253417969, 0.07561492919921875, 0.08242988586425781, 0.08924484252929688, 0.09605979919433594, 0.102874755859375, 0.10968971252441406, 0.11650466918945312, 0.12331962585449219, 0.13013458251953125, 0.1369495391845703, 0.14376449584960938, 0.15057945251464844, 0.1573944091796875, 0.16420936584472656, 0.17102432250976562, 0.1778392791748047, 0.18465423583984375, 0.1914691925048828, 0.19828414916992188, 0.20509910583496094, 0.2119140625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 5.0, 9.0, 4.0, 15.0, 12.0, 16.0, 26.0, 42.0, 35.0, 35.0, 48.0, 60.0, 56.0, 54.0, 58.0, 75.0, 79.0, 57.0, 48.0, 44.0, 39.0, 39.0, 29.0, 20.0, 21.0, 31.0, 8.0, 10.0, 7.0, 7.0, 0.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10498046875, -0.10171318054199219, -0.09844589233398438, -0.09517860412597656, -0.09191131591796875, -0.08864402770996094, -0.08537673950195312, -0.08210945129394531, -0.0788421630859375, -0.07557487487792969, -0.07230758666992188, -0.06904029846191406, -0.06577301025390625, -0.06250572204589844, -0.059238433837890625, -0.05597114562988281, -0.052703857421875, -0.04943656921386719, -0.046169281005859375, -0.04290199279785156, -0.03963470458984375, -0.03636741638183594, -0.033100128173828125, -0.029832839965820312, -0.0265655517578125, -0.023298263549804688, -0.020030975341796875, -0.016763687133789062, -0.01349639892578125, -0.010229110717773438, -0.006961822509765625, -0.0036945343017578125, -0.00042724609375, 0.0028400421142578125, 0.006107330322265625, 0.009374618530273438, 0.01264190673828125, 0.015909194946289062, 0.019176483154296875, 0.022443771362304688, 0.0257110595703125, 0.028978347778320312, 0.032245635986328125, 0.03551292419433594, 0.03878021240234375, 0.04204750061035156, 0.045314788818359375, 0.04858207702636719, 0.051849365234375, 0.05511665344238281, 0.058383941650390625, 0.06165122985839844, 0.06491851806640625, 0.06818580627441406, 0.07145309448242188, 0.07472038269042969, 0.0779876708984375, 0.08125495910644531, 0.08452224731445312, 0.08778953552246094, 0.09105682373046875, 0.09432411193847656, 0.09759140014648438, 0.10085868835449219, 0.1041259765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 10.0, 11.0, 15.0, 14.0, 25.0, 37.0, 53.0, 81.0, 101.0, 150.0, 207.0, 382.0, 571.0, 1005.0, 2069.0, 5466.0, 23520.0, 205141.0, 675304.0, 111104.0, 15331.0, 3889.0, 1677.0, 883.0, 513.0, 268.0, 220.0, 172.0, 111.0, 57.0, 45.0, 26.0, 21.0, 23.0, 14.0, 7.0, 8.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341064453125, -0.33052825927734375, -0.3199920654296875, -0.30945587158203125, -0.298919677734375, -0.28838348388671875, -0.2778472900390625, -0.26731109619140625, -0.25677490234375, -0.24623870849609375, -0.2357025146484375, -0.22516632080078125, -0.214630126953125, -0.20409393310546875, -0.1935577392578125, -0.18302154541015625, -0.1724853515625, -0.16194915771484375, -0.1514129638671875, -0.14087677001953125, -0.130340576171875, -0.11980438232421875, -0.1092681884765625, -0.09873199462890625, -0.08819580078125, -0.07765960693359375, -0.0671234130859375, -0.05658721923828125, -0.046051025390625, -0.03551483154296875, -0.0249786376953125, -0.01444244384765625, -0.00390625, 0.00662994384765625, 0.0171661376953125, 0.02770233154296875, 0.038238525390625, 0.04877471923828125, 0.0593109130859375, 0.06984710693359375, 0.08038330078125, 0.09091949462890625, 0.1014556884765625, 0.11199188232421875, 0.122528076171875, 0.13306427001953125, 0.1436004638671875, 0.15413665771484375, 0.1646728515625, 0.17520904541015625, 0.1857452392578125, 0.19628143310546875, 0.206817626953125, 0.21735382080078125, 0.2278900146484375, 0.23842620849609375, 0.24896240234375, 0.25949859619140625, 0.2700347900390625, 0.28057098388671875, 0.291107177734375, 0.30164337158203125, 0.3121795654296875, 0.32271575927734375, 0.333251953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 7.0, 13.0, 14.0, 10.0, 14.0, 13.0, 25.0, 24.0, 26.0, 29.0, 34.0, 42.0, 42.0, 43.0, 33.0, 53.0, 58.0, 47.0, 48.0, 36.0, 46.0, 30.0, 34.0, 51.0, 42.0, 25.0, 29.0, 19.0, 16.0, 20.0, 14.0, 12.0, 6.0, 7.0, 4.0, 7.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4091796875, -0.3976097106933594, -0.38603973388671875, -0.3744697570800781, -0.3628997802734375, -0.3513298034667969, -0.33975982666015625, -0.3281898498535156, -0.316619873046875, -0.3050498962402344, -0.29347991943359375, -0.2819099426269531, -0.2703399658203125, -0.2587699890136719, -0.24720001220703125, -0.23563003540039062, -0.22406005859375, -0.21249008178710938, -0.20092010498046875, -0.18935012817382812, -0.1777801513671875, -0.16621017456054688, -0.15464019775390625, -0.14307022094726562, -0.131500244140625, -0.11993026733398438, -0.10836029052734375, -0.09679031372070312, -0.0852203369140625, -0.07365036010742188, -0.06208038330078125, -0.050510406494140625, -0.0389404296875, -0.027370452880859375, -0.01580047607421875, -0.004230499267578125, 0.0073394775390625, 0.018909454345703125, 0.03047943115234375, 0.042049407958984375, 0.053619384765625, 0.06518936157226562, 0.07675933837890625, 0.08832931518554688, 0.0998992919921875, 0.11146926879882812, 0.12303924560546875, 0.13460922241210938, 0.14617919921875, 0.15774917602539062, 0.16931915283203125, 0.18088912963867188, 0.1924591064453125, 0.20402908325195312, 0.21559906005859375, 0.22716903686523438, 0.238739013671875, 0.2503089904785156, 0.26187896728515625, 0.2734489440917969, 0.2850189208984375, 0.2965888977050781, 0.30815887451171875, 0.3197288513183594, 0.331298828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 4.0, 8.0, 4.0, 10.0, 13.0, 14.0, 22.0, 29.0, 54.0, 66.0, 127.0, 219.0, 377.0, 695.0, 1652.0, 4552.0, 19441.0, 170961.0, 708703.0, 119778.0, 15041.0, 3798.0, 1461.0, 652.0, 319.0, 202.0, 119.0, 69.0, 57.0, 33.0, 22.0, 13.0, 13.0, 8.0, 5.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1885986328125, -0.1832752227783203, -0.17795181274414062, -0.17262840270996094, -0.16730499267578125, -0.16198158264160156, -0.15665817260742188, -0.1513347625732422, -0.1460113525390625, -0.1406879425048828, -0.13536453247070312, -0.13004112243652344, -0.12471771240234375, -0.11939430236816406, -0.11407089233398438, -0.10874748229980469, -0.103424072265625, -0.09810066223144531, -0.09277725219726562, -0.08745384216308594, -0.08213043212890625, -0.07680702209472656, -0.07148361206054688, -0.06616020202636719, -0.0608367919921875, -0.05551338195800781, -0.050189971923828125, -0.04486656188964844, -0.03954315185546875, -0.03421974182128906, -0.028896331787109375, -0.023572921752929688, -0.01824951171875, -0.012926101684570312, -0.007602691650390625, -0.0022792816162109375, 0.00304412841796875, 0.008367538452148438, 0.013690948486328125, 0.019014358520507812, 0.0243377685546875, 0.029661178588867188, 0.034984588623046875, 0.04030799865722656, 0.04563140869140625, 0.05095481872558594, 0.056278228759765625, 0.06160163879394531, 0.066925048828125, 0.07224845886230469, 0.07757186889648438, 0.08289527893066406, 0.08821868896484375, 0.09354209899902344, 0.09886550903320312, 0.10418891906738281, 0.1095123291015625, 0.11483573913574219, 0.12015914916992188, 0.12548255920410156, 0.13080596923828125, 0.13612937927246094, 0.14145278930664062, 0.1467761993408203, 0.152099609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 12.0, 15.0, 19.0, 22.0, 32.0, 54.0, 70.0, 74.0, 76.0, 96.0, 100.0, 102.0, 89.0, 68.0, 53.0, 31.0, 27.0, 20.0, 17.0, 6.0, 10.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.502866744995117e-05, -6.263144314289093e-05, -6.023421883583069e-05, -5.783699452877045e-05, -5.5439770221710205e-05, -5.304254591464996e-05, -5.064532160758972e-05, -4.824809730052948e-05, -4.585087299346924e-05, -4.3453648686408997e-05, -4.1056424379348755e-05, -3.865920007228851e-05, -3.626197576522827e-05, -3.386475145816803e-05, -3.146752715110779e-05, -2.9070302844047546e-05, -2.6673078536987305e-05, -2.4275854229927063e-05, -2.187862992286682e-05, -1.948140561580658e-05, -1.7084181308746338e-05, -1.4686957001686096e-05, -1.2289732694625854e-05, -9.892508387565613e-06, -7.495284080505371e-06, -5.098059773445129e-06, -2.7008354663848877e-06, -3.03611159324646e-07, 2.0936131477355957e-06, 4.490837454795837e-06, 6.888061761856079e-06, 9.28528606891632e-06, 1.1682510375976562e-05, 1.4079734683036804e-05, 1.6476958990097046e-05, 1.8874183297157288e-05, 2.127140760421753e-05, 2.366863191127777e-05, 2.6065856218338013e-05, 2.8463080525398254e-05, 3.0860304832458496e-05, 3.325752913951874e-05, 3.565475344657898e-05, 3.805197775363922e-05, 4.044920206069946e-05, 4.2846426367759705e-05, 4.5243650674819946e-05, 4.764087498188019e-05, 5.003809928894043e-05, 5.243532359600067e-05, 5.483254790306091e-05, 5.7229772210121155e-05, 5.9626996517181396e-05, 6.202422082424164e-05, 6.442144513130188e-05, 6.681866943836212e-05, 6.921589374542236e-05, 7.16131180524826e-05, 7.401034235954285e-05, 7.640756666660309e-05, 7.880479097366333e-05, 8.120201528072357e-05, 8.359923958778381e-05, 8.599646389484406e-05, 8.83936882019043e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 7.0, 9.0, 6.0, 13.0, 12.0, 19.0, 28.0, 39.0, 71.0, 116.0, 189.0, 388.0, 809.0, 1871.0, 4813.0, 21423.0, 221104.0, 690238.0, 89631.0, 11719.0, 3353.0, 1298.0, 627.0, 308.0, 179.0, 104.0, 55.0, 39.0, 25.0, 17.0, 16.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1558837890625, -0.15056800842285156, -0.14525222778320312, -0.1399364471435547, -0.13462066650390625, -0.1293048858642578, -0.12398910522460938, -0.11867332458496094, -0.1133575439453125, -0.10804176330566406, -0.10272598266601562, -0.09741020202636719, -0.09209442138671875, -0.08677864074707031, -0.08146286010742188, -0.07614707946777344, -0.070831298828125, -0.06551551818847656, -0.060199737548828125, -0.05488395690917969, -0.04956817626953125, -0.04425239562988281, -0.038936614990234375, -0.03362083435058594, -0.0283050537109375, -0.022989273071289062, -0.017673492431640625, -0.012357711791992188, -0.00704193115234375, -0.0017261505126953125, 0.003589630126953125, 0.008905410766601562, 0.01422119140625, 0.019536972045898438, 0.024852752685546875, 0.030168533325195312, 0.03548431396484375, 0.04080009460449219, 0.046115875244140625, 0.05143165588378906, 0.0567474365234375, 0.06206321716308594, 0.06737899780273438, 0.07269477844238281, 0.07801055908203125, 0.08332633972167969, 0.08864212036132812, 0.09395790100097656, 0.099273681640625, 0.10458946228027344, 0.10990524291992188, 0.11522102355957031, 0.12053680419921875, 0.1258525848388672, 0.13116836547851562, 0.13648414611816406, 0.1417999267578125, 0.14711570739746094, 0.15243148803710938, 0.1577472686767578, 0.16306304931640625, 0.1683788299560547, 0.17369461059570312, 0.17901039123535156, 0.184326171875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 9.0, 9.0, 12.0, 19.0, 25.0, 26.0, 51.0, 50.0, 78.0, 96.0, 90.0, 111.0, 103.0, 72.0, 73.0, 63.0, 40.0, 23.0, 22.0, 10.0, 9.0, 6.0, 1.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.14794921875, -0.1432323455810547, -0.13851547241210938, -0.13379859924316406, -0.12908172607421875, -0.12436485290527344, -0.11964797973632812, -0.11493110656738281, -0.1102142333984375, -0.10549736022949219, -0.10078048706054688, -0.09606361389160156, -0.09134674072265625, -0.08662986755371094, -0.08191299438476562, -0.07719612121582031, -0.072479248046875, -0.06776237487792969, -0.06304550170898438, -0.05832862854003906, -0.05361175537109375, -0.04889488220214844, -0.044178009033203125, -0.03946113586425781, -0.0347442626953125, -0.030027389526367188, -0.025310516357421875, -0.020593643188476562, -0.01587677001953125, -0.011159896850585938, -0.006443023681640625, -0.0017261505126953125, 0.00299072265625, 0.0077075958251953125, 0.012424468994140625, 0.017141342163085938, 0.02185821533203125, 0.026575088500976562, 0.031291961669921875, 0.03600883483886719, 0.0407257080078125, 0.04544258117675781, 0.050159454345703125, 0.05487632751464844, 0.05959320068359375, 0.06431007385253906, 0.06902694702148438, 0.07374382019042969, 0.078460693359375, 0.08317756652832031, 0.08789443969726562, 0.09261131286621094, 0.09732818603515625, 0.10204505920410156, 0.10676193237304688, 0.11147880554199219, 0.1161956787109375, 0.12091255187988281, 0.12562942504882812, 0.13034629821777344, 0.13506317138671875, 0.13978004455566406, 0.14449691772460938, 0.1492137908935547, 0.1539306640625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 8.0, 30.0, 50.0, 108.0, 181.0, 197.0, 191.0, 132.0, 61.0, 26.0, 10.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.165902137756348, -5.057231903076172, -4.948562145233154, -4.8398919105529785, -4.731222152709961, -4.622551918029785, -4.513881683349609, -4.405211925506592, -4.296541690826416, -4.18787145614624, -4.079201698303223, -3.970531463623047, -3.86186146736145, -3.7531914710998535, -3.644521474838257, -3.53585147857666, -3.4271814823150635, -3.318511486053467, -3.20984148979187, -3.1011714935302734, -2.9925012588500977, -2.883831262588501, -2.7751612663269043, -2.6664912700653076, -2.557821273803711, -2.4491512775421143, -2.3404812812805176, -2.231811046600342, -2.123141050338745, -2.0144710540771484, -1.9058010578155518, -1.797131061553955, -1.6884608268737793, -1.5797908306121826, -1.4711207151412964, -1.3624507188796997, -1.2537806034088135, -1.1451106071472168, -1.0364406108856201, -0.9277705550193787, -0.8191004991531372, -0.7104304432868958, -0.6017603874206543, -0.4930903911590576, -0.38442033529281616, -0.2757502794265747, -0.16708028316497803, -0.05841022729873657, 0.05025982856750488, 0.15892986953258514, 0.2675999104976654, 0.3762699365615845, 0.4849399924278259, 0.5936100482940674, 0.7022800445556641, 0.8109501004219055, 0.919620156288147, 1.0282901525497437, 1.1369602680206299, 1.2456302642822266, 1.3543002605438232, 1.4629703760147095, 1.5716403722763062, 1.6803104877471924, 1.788980484008789]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 8.0, 4.0, 9.0, 6.0, 8.0, 23.0, 18.0, 16.0, 24.0, 19.0, 27.0, 31.0, 41.0, 47.0, 41.0, 43.0, 47.0, 40.0, 53.0, 53.0, 56.0, 49.0, 45.0, 37.0, 36.0, 46.0, 23.0, 20.0, 23.0, 23.0, 20.0, 14.0, 12.0, 7.0, 12.0, 7.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8363511562347412, -1.783287525177002, -1.7302238941192627, -1.6771602630615234, -1.6240966320037842, -1.571033000946045, -1.5179694890975952, -1.464905858039856, -1.4118422269821167, -1.3587785959243774, -1.3057149648666382, -1.252651333808899, -1.1995878219604492, -1.14652419090271, -1.0934605598449707, -1.0403969287872314, -0.9873332977294922, -0.9342696666717529, -0.8812060356140137, -0.8281424641609192, -0.7750788331031799, -0.7220152020454407, -0.6689516305923462, -0.6158879995346069, -0.5628243684768677, -0.5097607374191284, -0.45669713616371155, -0.4036335349082947, -0.3505699038505554, -0.29750627279281616, -0.2444426715373993, -0.19137907028198242, -0.13831555843353271, -0.08525194227695465, -0.03218832612037659, 0.020875290036201477, 0.07393890619277954, 0.1270025372505188, 0.18006613850593567, 0.23312973976135254, 0.2861933708190918, 0.33925700187683105, 0.3923206031322479, 0.4453842043876648, 0.49844783544540405, 0.5515114665031433, 0.6045750379562378, 0.657638669013977, 0.7107023000717163, 0.7637659311294556, 0.8168295621871948, 0.8698931336402893, 0.9229567646980286, 0.9760203957557678, 1.0290839672088623, 1.0821475982666016, 1.1352112293243408, 1.18827486038208, 1.2413384914398193, 1.2944021224975586, 1.3474657535552979, 1.400529384613037, 1.4535928964614868, 1.506656527519226, 1.5597201585769653]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 17.0, 19.0, 11.0, 28.0, 37.0, 46.0, 65.0, 101.0, 126.0, 202.0, 289.0, 384.0, 644.0, 1035.0, 1840.0, 4080.0, 13111.0, 154518.0, 3988309.0, 18822.0, 5056.0, 2223.0, 1173.0, 670.0, 436.0, 287.0, 228.0, 146.0, 105.0, 86.0, 49.0, 43.0, 25.0, 21.0, 11.0, 11.0, 8.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.384033203125, -0.3716888427734375, -0.359344482421875, -0.3470001220703125, -0.33465576171875, -0.3223114013671875, -0.309967041015625, -0.2976226806640625, -0.2852783203125, -0.2729339599609375, -0.260589599609375, -0.2482452392578125, -0.23590087890625, -0.2235565185546875, -0.211212158203125, -0.1988677978515625, -0.1865234375, -0.1741790771484375, -0.161834716796875, -0.1494903564453125, -0.13714599609375, -0.1248016357421875, -0.112457275390625, -0.1001129150390625, -0.0877685546875, -0.0754241943359375, -0.063079833984375, -0.0507354736328125, -0.03839111328125, -0.0260467529296875, -0.013702392578125, -0.0013580322265625, 0.010986328125, 0.0233306884765625, 0.035675048828125, 0.0480194091796875, 0.06036376953125, 0.0727081298828125, 0.085052490234375, 0.0973968505859375, 0.1097412109375, 0.1220855712890625, 0.134429931640625, 0.1467742919921875, 0.15911865234375, 0.1714630126953125, 0.183807373046875, 0.1961517333984375, 0.20849609375, 0.2208404541015625, 0.233184814453125, 0.2455291748046875, 0.25787353515625, 0.2702178955078125, 0.282562255859375, 0.2949066162109375, 0.3072509765625, 0.3195953369140625, 0.331939697265625, 0.3442840576171875, 0.35662841796875, 0.3689727783203125, 0.381317138671875, 0.3936614990234375, 0.406005859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 11.0, 24.0, 16.0, 17.0, 29.0, 36.0, 45.0, 53.0, 58.0, 46.0, 57.0, 63.0, 52.0, 65.0, 66.0, 51.0, 68.0, 39.0, 36.0, 41.0, 29.0, 25.0, 12.0, 15.0, 11.0, 3.0, 1.0, 4.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1016845703125, -0.0985565185546875, -0.095428466796875, -0.0923004150390625, -0.08917236328125, -0.0860443115234375, -0.082916259765625, -0.0797882080078125, -0.07666015625, -0.0735321044921875, -0.070404052734375, -0.0672760009765625, -0.06414794921875, -0.0610198974609375, -0.057891845703125, -0.0547637939453125, -0.0516357421875, -0.0485076904296875, -0.045379638671875, -0.0422515869140625, -0.03912353515625, -0.0359954833984375, -0.032867431640625, -0.0297393798828125, -0.026611328125, -0.0234832763671875, -0.020355224609375, -0.0172271728515625, -0.01409912109375, -0.0109710693359375, -0.007843017578125, -0.0047149658203125, -0.0015869140625, 0.0015411376953125, 0.004669189453125, 0.0077972412109375, 0.01092529296875, 0.0140533447265625, 0.017181396484375, 0.0203094482421875, 0.0234375, 0.0265655517578125, 0.029693603515625, 0.0328216552734375, 0.03594970703125, 0.0390777587890625, 0.042205810546875, 0.0453338623046875, 0.0484619140625, 0.0515899658203125, 0.054718017578125, 0.0578460693359375, 0.06097412109375, 0.0641021728515625, 0.067230224609375, 0.0703582763671875, 0.073486328125, 0.0766143798828125, 0.079742431640625, 0.0828704833984375, 0.08599853515625, 0.0891265869140625, 0.092254638671875, 0.0953826904296875, 0.0985107421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 9.0, 10.0, 17.0, 20.0, 15.0, 28.0, 38.0, 40.0, 46.0, 68.0, 118.0, 129.0, 144.0, 218.0, 363.0, 690.0, 1434.0, 3860.0, 16417.0, 3855322.0, 295062.0, 13539.0, 3531.0, 1327.0, 585.0, 365.0, 215.0, 135.0, 106.0, 98.0, 71.0, 49.0, 47.0, 28.0, 33.0, 21.0, 22.0, 9.0, 11.0, 4.0, 4.0, 4.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0], "bins": [-0.5791015625, -0.5615234375, -0.5439453125, -0.5263671875, -0.5087890625, -0.4912109375, -0.4736328125, -0.4560546875, -0.4384765625, -0.4208984375, -0.4033203125, -0.3857421875, -0.3681640625, -0.3505859375, -0.3330078125, -0.3154296875, -0.2978515625, -0.2802734375, -0.2626953125, -0.2451171875, -0.2275390625, -0.2099609375, -0.1923828125, -0.1748046875, -0.1572265625, -0.1396484375, -0.1220703125, -0.1044921875, -0.0869140625, -0.0693359375, -0.0517578125, -0.0341796875, -0.0166015625, 0.0009765625, 0.0185546875, 0.0361328125, 0.0537109375, 0.0712890625, 0.0888671875, 0.1064453125, 0.1240234375, 0.1416015625, 0.1591796875, 0.1767578125, 0.1943359375, 0.2119140625, 0.2294921875, 0.2470703125, 0.2646484375, 0.2822265625, 0.2998046875, 0.3173828125, 0.3349609375, 0.3525390625, 0.3701171875, 0.3876953125, 0.4052734375, 0.4228515625, 0.4404296875, 0.4580078125, 0.4755859375, 0.4931640625, 0.5107421875, 0.5283203125, 0.5458984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 17.0, 18.0, 62.0, 3543.0, 335.0, 50.0, 19.0, 12.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17626953125, -0.17073440551757812, -0.16519927978515625, -0.15966415405273438, -0.1541290283203125, -0.14859390258789062, -0.14305877685546875, -0.13752365112304688, -0.131988525390625, -0.12645339965820312, -0.12091827392578125, -0.11538314819335938, -0.1098480224609375, -0.10431289672851562, -0.09877777099609375, -0.09324264526367188, -0.08770751953125, -0.08217239379882812, -0.07663726806640625, -0.07110214233398438, -0.0655670166015625, -0.060031890869140625, -0.05449676513671875, -0.048961639404296875, -0.043426513671875, -0.037891387939453125, -0.03235626220703125, -0.026821136474609375, -0.0212860107421875, -0.015750885009765625, -0.01021575927734375, -0.004680633544921875, 0.0008544921875, 0.006389617919921875, 0.01192474365234375, 0.017459869384765625, 0.0229949951171875, 0.028530120849609375, 0.03406524658203125, 0.039600372314453125, 0.045135498046875, 0.050670623779296875, 0.05620574951171875, 0.061740875244140625, 0.0672760009765625, 0.07281112670898438, 0.07834625244140625, 0.08388137817382812, 0.08941650390625, 0.09495162963867188, 0.10048675537109375, 0.10602188110351562, 0.1115570068359375, 0.11709213256835938, 0.12262725830078125, 0.12816238403320312, 0.133697509765625, 0.13923263549804688, 0.14476776123046875, 0.15030288696289062, 0.1558380126953125, 0.16137313842773438, 0.16690826416015625, 0.17244338989257812, 0.177978515625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 12.0, 13.0, 14.0, 26.0, 36.0, 60.0, 102.0, 106.0, 147.0, 152.0, 117.0, 87.0, 57.0, 28.0, 12.0, 10.0, 4.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3946044445037842, -0.3813950717449188, -0.36818569898605347, -0.3549763262271881, -0.34176695346832275, -0.3285575807094574, -0.31534820795059204, -0.3021388351917267, -0.28892946243286133, -0.27572008967399597, -0.2625107169151306, -0.24930134415626526, -0.2360919713973999, -0.22288259863853455, -0.2096732258796692, -0.19646385312080383, -0.18325448036193848, -0.17004510760307312, -0.15683573484420776, -0.1436263620853424, -0.13041698932647705, -0.1172076165676117, -0.10399824380874634, -0.09078887104988098, -0.07757949829101562, -0.06437012553215027, -0.05116075277328491, -0.037951380014419556, -0.0247420072555542, -0.011532634496688843, 0.0016767382621765137, 0.01488611102104187, 0.028095483779907227, 0.04130485653877258, 0.05451422929763794, 0.0677236020565033, 0.08093297481536865, 0.09414234757423401, 0.10735172033309937, 0.12056109309196472, 0.13377046585083008, 0.14697983860969543, 0.1601892113685608, 0.17339858412742615, 0.1866079568862915, 0.19981732964515686, 0.21302670240402222, 0.22623607516288757, 0.23944544792175293, 0.2526548206806183, 0.26586419343948364, 0.279073566198349, 0.29228293895721436, 0.3054923117160797, 0.31870168447494507, 0.3319110572338104, 0.3451204299926758, 0.35832980275154114, 0.3715391755104065, 0.38474854826927185, 0.3979579210281372, 0.41116729378700256, 0.4243766665458679, 0.4375860393047333, 0.45079541206359863]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 9.0, 9.0, 8.0, 8.0, 10.0, 9.0, 21.0, 19.0, 22.0, 24.0, 26.0, 22.0, 31.0, 46.0, 38.0, 42.0, 31.0, 45.0, 36.0, 50.0, 43.0, 40.0, 43.0, 34.0, 47.0, 32.0, 30.0, 34.0, 18.0, 22.0, 24.0, 21.0, 11.0, 8.0, 22.0, 9.0, 17.0, 9.0, 4.0, 7.0, 3.0, 5.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1824837327003479, -0.1767328530550003, -0.1709819883108139, -0.1652311086654663, -0.1594802290201187, -0.15372934937477112, -0.14797848463058472, -0.14222760498523712, -0.13647672533988953, -0.13072584569454193, -0.12497497349977493, -0.11922410130500793, -0.11347322165966034, -0.10772234946489334, -0.10197147727012634, -0.09622059762477875, -0.09046973288059235, -0.08471886068582535, -0.07896798104047775, -0.07321710884571075, -0.06746622920036316, -0.06171535700559616, -0.05596448481082916, -0.050213608890771866, -0.04446273297071457, -0.03871185705065727, -0.032960981130599976, -0.027210108935832977, -0.02145923301577568, -0.015708357095718384, -0.009957484900951385, -0.004206608980894089, 0.001544266939163208, 0.00729514192789793, 0.013046016916632652, 0.0187968909740448, 0.024547766894102097, 0.030298642814159393, 0.03604951500892639, 0.04180039092898369, 0.047551266849040985, 0.05330214276909828, 0.05905301868915558, 0.06480389088392258, 0.07055476307868958, 0.07630564272403717, 0.08205651491880417, 0.08780738711357117, 0.09355826675891876, 0.09930913895368576, 0.10506001859903336, 0.11081089079380035, 0.11656177043914795, 0.12231264263391495, 0.12806351482868195, 0.13381439447402954, 0.13956525921821594, 0.14531613886356354, 0.15106700360774994, 0.15681788325309753, 0.16256876289844513, 0.16831964254379272, 0.17407050728797913, 0.17982138693332672, 0.18557226657867432]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 7.0, 7.0, 14.0, 25.0, 24.0, 29.0, 73.0, 110.0, 132.0, 189.0, 251.0, 459.0, 698.0, 968.0, 1586.0, 2520.0, 4209.0, 7127.0, 12994.0, 24228.0, 48509.0, 98425.0, 193527.0, 270957.0, 186598.0, 94829.0, 45966.0, 23528.0, 12326.0, 7157.0, 4180.0, 2456.0, 1528.0, 1024.0, 601.0, 431.0, 271.0, 189.0, 142.0, 93.0, 62.0, 32.0, 16.0, 20.0, 18.0, 13.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1278076171875, -0.12398910522460938, -0.12017059326171875, -0.11635208129882812, -0.1125335693359375, -0.10871505737304688, -0.10489654541015625, -0.10107803344726562, -0.097259521484375, -0.09344100952148438, -0.08962249755859375, -0.08580398559570312, -0.0819854736328125, -0.07816696166992188, -0.07434844970703125, -0.07052993774414062, -0.06671142578125, -0.06289291381835938, -0.05907440185546875, -0.055255889892578125, -0.0514373779296875, -0.047618865966796875, -0.04380035400390625, -0.039981842041015625, -0.036163330078125, -0.032344818115234375, -0.02852630615234375, -0.024707794189453125, -0.0208892822265625, -0.017070770263671875, -0.01325225830078125, -0.009433746337890625, -0.005615234375, -0.001796722412109375, 0.00202178955078125, 0.005840301513671875, 0.0096588134765625, 0.013477325439453125, 0.01729583740234375, 0.021114349365234375, 0.024932861328125, 0.028751373291015625, 0.03256988525390625, 0.036388397216796875, 0.0402069091796875, 0.044025421142578125, 0.04784393310546875, 0.051662445068359375, 0.05548095703125, 0.059299468994140625, 0.06311798095703125, 0.06693649291992188, 0.0707550048828125, 0.07457351684570312, 0.07839202880859375, 0.08221054077148438, 0.086029052734375, 0.08984756469726562, 0.09366607666015625, 0.09748458862304688, 0.1013031005859375, 0.10512161254882812, 0.10894012451171875, 0.11275863647460938, 0.1165771484375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 11.0, 17.0, 17.0, 22.0, 20.0, 25.0, 43.0, 44.0, 43.0, 41.0, 64.0, 53.0, 55.0, 68.0, 64.0, 60.0, 63.0, 39.0, 47.0, 50.0, 30.0, 21.0, 19.0, 18.0, 13.0, 16.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10687255859375, -0.10356807708740234, -0.10026359558105469, -0.09695911407470703, -0.09365463256835938, -0.09035015106201172, -0.08704566955566406, -0.0837411880493164, -0.08043670654296875, -0.0771322250366211, -0.07382774353027344, -0.07052326202392578, -0.06721878051757812, -0.06391429901123047, -0.06060981750488281, -0.057305335998535156, -0.0540008544921875, -0.050696372985839844, -0.04739189147949219, -0.04408740997314453, -0.040782928466796875, -0.03747844696044922, -0.03417396545410156, -0.030869483947753906, -0.02756500244140625, -0.024260520935058594, -0.020956039428710938, -0.01765155792236328, -0.014347076416015625, -0.011042594909667969, -0.0077381134033203125, -0.004433631896972656, -0.001129150390625, 0.0021753311157226562, 0.0054798126220703125, 0.008784294128417969, 0.012088775634765625, 0.015393257141113281, 0.018697738647460938, 0.022002220153808594, 0.02530670166015625, 0.028611183166503906, 0.03191566467285156, 0.03522014617919922, 0.038524627685546875, 0.04182910919189453, 0.04513359069824219, 0.048438072204589844, 0.0517425537109375, 0.055047035217285156, 0.05835151672363281, 0.06165599822998047, 0.06496047973632812, 0.06826496124267578, 0.07156944274902344, 0.0748739242553711, 0.07817840576171875, 0.0814828872680664, 0.08478736877441406, 0.08809185028076172, 0.09139633178710938, 0.09470081329345703, 0.09800529479980469, 0.10130977630615234, 0.1046142578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 10.0, 3.0, 13.0, 19.0, 19.0, 23.0, 33.0, 36.0, 71.0, 88.0, 106.0, 131.0, 224.0, 306.0, 476.0, 751.0, 1377.0, 3245.0, 11958.0, 86766.0, 711866.0, 200903.0, 21058.0, 4689.0, 1701.0, 921.0, 537.0, 370.0, 243.0, 162.0, 116.0, 87.0, 53.0, 55.0, 36.0, 24.0, 22.0, 10.0, 15.0, 12.0, 8.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30859375, -0.29853057861328125, -0.2884674072265625, -0.27840423583984375, -0.268341064453125, -0.25827789306640625, -0.2482147216796875, -0.23815155029296875, -0.22808837890625, -0.21802520751953125, -0.2079620361328125, -0.19789886474609375, -0.187835693359375, -0.17777252197265625, -0.1677093505859375, -0.15764617919921875, -0.1475830078125, -0.13751983642578125, -0.1274566650390625, -0.11739349365234375, -0.107330322265625, -0.09726715087890625, -0.0872039794921875, -0.07714080810546875, -0.06707763671875, -0.05701446533203125, -0.0469512939453125, -0.03688812255859375, -0.026824951171875, -0.01676177978515625, -0.0066986083984375, 0.00336456298828125, 0.013427734375, 0.02349090576171875, 0.0335540771484375, 0.04361724853515625, 0.053680419921875, 0.06374359130859375, 0.0738067626953125, 0.08386993408203125, 0.09393310546875, 0.10399627685546875, 0.1140594482421875, 0.12412261962890625, 0.134185791015625, 0.14424896240234375, 0.1543121337890625, 0.16437530517578125, 0.1744384765625, 0.18450164794921875, 0.1945648193359375, 0.20462799072265625, 0.214691162109375, 0.22475433349609375, 0.2348175048828125, 0.24488067626953125, 0.25494384765625, 0.26500701904296875, 0.2750701904296875, 0.28513336181640625, 0.295196533203125, 0.30525970458984375, 0.3153228759765625, 0.32538604736328125, 0.33544921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 6.0, 5.0, 7.0, 4.0, 14.0, 9.0, 14.0, 6.0, 21.0, 24.0, 24.0, 21.0, 28.0, 35.0, 21.0, 40.0, 34.0, 52.0, 37.0, 41.0, 35.0, 46.0, 40.0, 30.0, 38.0, 37.0, 43.0, 32.0, 34.0, 26.0, 25.0, 27.0, 20.0, 26.0, 19.0, 16.0, 13.0, 14.0, 7.0, 6.0, 4.0, 2.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.316650390625, -0.3068962097167969, -0.29714202880859375, -0.2873878479003906, -0.2776336669921875, -0.2678794860839844, -0.25812530517578125, -0.24837112426757812, -0.238616943359375, -0.22886276245117188, -0.21910858154296875, -0.20935440063476562, -0.1996002197265625, -0.18984603881835938, -0.18009185791015625, -0.17033767700195312, -0.16058349609375, -0.15082931518554688, -0.14107513427734375, -0.13132095336914062, -0.1215667724609375, -0.11181259155273438, -0.10205841064453125, -0.09230422973632812, -0.082550048828125, -0.07279586791992188, -0.06304168701171875, -0.053287506103515625, -0.0435333251953125, -0.033779144287109375, -0.02402496337890625, -0.014270782470703125, -0.0045166015625, 0.005237579345703125, 0.01499176025390625, 0.024745941162109375, 0.0345001220703125, 0.044254302978515625, 0.05400848388671875, 0.06376266479492188, 0.073516845703125, 0.08327102661132812, 0.09302520751953125, 0.10277938842773438, 0.1125335693359375, 0.12228775024414062, 0.13204193115234375, 0.14179611206054688, 0.15155029296875, 0.16130447387695312, 0.17105865478515625, 0.18081283569335938, 0.1905670166015625, 0.20032119750976562, 0.21007537841796875, 0.21982955932617188, 0.229583740234375, 0.23933792114257812, 0.24909210205078125, 0.2588462829589844, 0.2686004638671875, 0.2783546447753906, 0.28810882568359375, 0.2978630065917969, 0.3076171875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 4.0, 6.0, 4.0, 11.0, 11.0, 18.0, 28.0, 50.0, 64.0, 89.0, 126.0, 237.0, 448.0, 918.0, 2360.0, 9903.0, 112263.0, 795056.0, 112545.0, 10006.0, 2347.0, 939.0, 423.0, 252.0, 151.0, 85.0, 67.0, 38.0, 28.0, 25.0, 13.0, 5.0, 11.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1826171875, -0.17699813842773438, -0.17137908935546875, -0.16576004028320312, -0.1601409912109375, -0.15452194213867188, -0.14890289306640625, -0.14328384399414062, -0.137664794921875, -0.13204574584960938, -0.12642669677734375, -0.12080764770507812, -0.1151885986328125, -0.10956954956054688, -0.10395050048828125, -0.09833145141601562, -0.09271240234375, -0.08709335327148438, -0.08147430419921875, -0.07585525512695312, -0.0702362060546875, -0.06461715698242188, -0.05899810791015625, -0.053379058837890625, -0.047760009765625, -0.042140960693359375, -0.03652191162109375, -0.030902862548828125, -0.0252838134765625, -0.019664764404296875, -0.01404571533203125, -0.008426666259765625, -0.0028076171875, 0.002811431884765625, 0.00843048095703125, 0.014049530029296875, 0.0196685791015625, 0.025287628173828125, 0.03090667724609375, 0.036525726318359375, 0.042144775390625, 0.047763824462890625, 0.05338287353515625, 0.059001922607421875, 0.0646209716796875, 0.07024002075195312, 0.07585906982421875, 0.08147811889648438, 0.08709716796875, 0.09271621704101562, 0.09833526611328125, 0.10395431518554688, 0.1095733642578125, 0.11519241333007812, 0.12081146240234375, 0.12643051147460938, 0.132049560546875, 0.13766860961914062, 0.14328765869140625, 0.14890670776367188, 0.1545257568359375, 0.16014480590820312, 0.16576385498046875, 0.17138290405273438, 0.177001953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 8.0, 11.0, 9.0, 16.0, 9.0, 25.0, 18.0, 32.0, 37.0, 40.0, 76.0, 75.0, 58.0, 65.0, 73.0, 69.0, 70.0, 61.0, 49.0, 44.0, 29.0, 17.0, 17.0, 11.0, 5.0, 7.0, 7.0, 14.0, 6.0, 7.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.143880844116211e-05, -4.9768947064876556e-05, -4.8099085688591003e-05, -4.642922431230545e-05, -4.47593629360199e-05, -4.3089501559734344e-05, -4.141964018344879e-05, -3.974977880716324e-05, -3.8079917430877686e-05, -3.641005605459213e-05, -3.474019467830658e-05, -3.3070333302021027e-05, -3.1400471925735474e-05, -2.973061054944992e-05, -2.8060749173164368e-05, -2.6390887796878815e-05, -2.4721026420593262e-05, -2.305116504430771e-05, -2.1381303668022156e-05, -1.9711442291736603e-05, -1.804158091545105e-05, -1.6371719539165497e-05, -1.4701858162879944e-05, -1.3031996786594391e-05, -1.1362135410308838e-05, -9.692274034023285e-06, -8.022412657737732e-06, -6.352551281452179e-06, -4.682689905166626e-06, -3.012828528881073e-06, -1.34296715259552e-06, 3.2689422369003296e-07, 1.996755599975586e-06, 3.666616976261139e-06, 5.336478352546692e-06, 7.006339728832245e-06, 8.676201105117798e-06, 1.034606248140335e-05, 1.2015923857688904e-05, 1.3685785233974457e-05, 1.535564661026001e-05, 1.7025507986545563e-05, 1.8695369362831116e-05, 2.036523073911667e-05, 2.203509211540222e-05, 2.3704953491687775e-05, 2.5374814867973328e-05, 2.704467624425888e-05, 2.8714537620544434e-05, 3.0384398996829987e-05, 3.205426037311554e-05, 3.372412174940109e-05, 3.5393983125686646e-05, 3.70638445019722e-05, 3.873370587825775e-05, 4.0403567254543304e-05, 4.207342863082886e-05, 4.374329000711441e-05, 4.541315138339996e-05, 4.7083012759685516e-05, 4.875287413597107e-05, 5.042273551225662e-05, 5.2092596888542175e-05, 5.376245826482773e-05, 5.543231964111328e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 8.0, 13.0, 18.0, 17.0, 37.0, 45.0, 81.0, 157.0, 258.0, 535.0, 1013.0, 2572.0, 9416.0, 74085.0, 724089.0, 210847.0, 18355.0, 4121.0, 1449.0, 621.0, 343.0, 171.0, 129.0, 68.0, 39.0, 23.0, 11.0, 6.0, 2.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.2293701171875, -0.22386837005615234, -0.2183666229248047, -0.21286487579345703, -0.20736312866210938, -0.20186138153076172, -0.19635963439941406, -0.1908578872680664, -0.18535614013671875, -0.1798543930053711, -0.17435264587402344, -0.16885089874267578, -0.16334915161132812, -0.15784740447998047, -0.1523456573486328, -0.14684391021728516, -0.1413421630859375, -0.13584041595458984, -0.1303386688232422, -0.12483692169189453, -0.11933517456054688, -0.11383342742919922, -0.10833168029785156, -0.1028299331665039, -0.09732818603515625, -0.0918264389038086, -0.08632469177246094, -0.08082294464111328, -0.07532119750976562, -0.06981945037841797, -0.06431770324707031, -0.058815956115722656, -0.053314208984375, -0.047812461853027344, -0.04231071472167969, -0.03680896759033203, -0.031307220458984375, -0.02580547332763672, -0.020303726196289062, -0.014801979064941406, -0.00930023193359375, -0.0037984848022460938, 0.0017032623291015625, 0.007205009460449219, 0.012706756591796875, 0.01820850372314453, 0.023710250854492188, 0.029211997985839844, 0.0347137451171875, 0.040215492248535156, 0.04571723937988281, 0.05121898651123047, 0.056720733642578125, 0.06222248077392578, 0.06772422790527344, 0.0732259750366211, 0.07872772216796875, 0.0842294692993164, 0.08973121643066406, 0.09523296356201172, 0.10073471069335938, 0.10623645782470703, 0.11173820495605469, 0.11723995208740234, 0.12274169921875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 10.0, 5.0, 7.0, 11.0, 13.0, 20.0, 34.0, 42.0, 48.0, 69.0, 100.0, 103.0, 109.0, 96.0, 80.0, 68.0, 47.0, 44.0, 33.0, 18.0, 15.0, 9.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.19873046875, -0.19403457641601562, -0.18933868408203125, -0.18464279174804688, -0.1799468994140625, -0.17525100708007812, -0.17055511474609375, -0.16585922241210938, -0.161163330078125, -0.15646743774414062, -0.15177154541015625, -0.14707565307617188, -0.1423797607421875, -0.13768386840820312, -0.13298797607421875, -0.12829208374023438, -0.12359619140625, -0.11890029907226562, -0.11420440673828125, -0.10950851440429688, -0.1048126220703125, -0.10011672973632812, -0.09542083740234375, -0.09072494506835938, -0.086029052734375, -0.08133316040039062, -0.07663726806640625, -0.07194137573242188, -0.0672454833984375, -0.06254959106445312, -0.05785369873046875, -0.053157806396484375, -0.0484619140625, -0.043766021728515625, -0.03907012939453125, -0.034374237060546875, -0.0296783447265625, -0.024982452392578125, -0.02028656005859375, -0.015590667724609375, -0.010894775390625, -0.006198883056640625, -0.00150299072265625, 0.003192901611328125, 0.0078887939453125, 0.012584686279296875, 0.01728057861328125, 0.021976470947265625, 0.02667236328125, 0.031368255615234375, 0.03606414794921875, 0.040760040283203125, 0.0454559326171875, 0.050151824951171875, 0.05484771728515625, 0.059543609619140625, 0.064239501953125, 0.06893539428710938, 0.07363128662109375, 0.07832717895507812, 0.0830230712890625, 0.08771896362304688, 0.09241485595703125, 0.09711074829101562, 0.101806640625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 10.0, 10.0, 54.0, 172.0, 254.0, 255.0, 174.0, 55.0, 12.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75568962097168, -4.62678337097168, -4.49787712097168, -4.368971347808838, -4.240065097808838, -4.111158847808838, -3.982252836227417, -3.853346824645996, -3.724440574645996, -3.595534324645996, -3.466628313064575, -3.3377223014831543, -3.2088160514831543, -3.0799098014831543, -2.9510037899017334, -2.8220977783203125, -2.6931915283203125, -2.5642852783203125, -2.4353792667388916, -2.3064732551574707, -2.1775670051574707, -2.0486607551574707, -1.9197547435760498, -1.7908486127853394, -1.661942481994629, -1.5330363512039185, -1.404130220413208, -1.2752240896224976, -1.146317958831787, -1.0174118280410767, -0.8885056972503662, -0.7595995664596558, -0.6306934356689453, -0.5017873048782349, -0.3728811740875244, -0.24397504329681396, -0.11506891250610352, 0.013837218284606934, 0.14274334907531738, 0.27164947986602783, 0.4005556106567383, 0.5294617414474487, 0.6583678722381592, 0.7872740030288696, 0.9161801338195801, 1.0450862646102905, 1.173992395401001, 1.3028985261917114, 1.4318046569824219, 1.5607107877731323, 1.6896169185638428, 1.8185230493545532, 1.9474291801452637, 2.0763354301452637, 2.2052414417266846, 2.3341474533081055, 2.4630537033081055, 2.5919599533081055, 2.7208659648895264, 2.8497719764709473, 2.9786782264709473, 3.1075844764709473, 3.236490488052368, 3.365396499633789, 3.494302749633789]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 2.0, 6.0, 6.0, 10.0, 6.0, 6.0, 11.0, 12.0, 10.0, 12.0, 22.0, 22.0, 23.0, 33.0, 31.0, 39.0, 30.0, 41.0, 42.0, 36.0, 50.0, 57.0, 56.0, 38.0, 42.0, 44.0, 44.0, 37.0, 41.0, 31.0, 32.0, 22.0, 21.0, 11.0, 16.0, 11.0, 10.0, 10.0, 3.0, 7.0, 3.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6720733642578125, -1.6205507516860962, -1.5690281391143799, -1.517505407333374, -1.4659827947616577, -1.4144601821899414, -1.3629374504089355, -1.3114148378372192, -1.259892225265503, -1.2083696126937866, -1.1568470001220703, -1.1053242683410645, -1.0538016557693481, -1.0022790431976318, -0.9507563710212708, -0.8992336988449097, -0.8477110862731934, -0.796188473701477, -0.744665801525116, -0.6931431293487549, -0.6416205167770386, -0.5900979042053223, -0.5385752320289612, -0.4870525896549225, -0.4355299472808838, -0.3840073049068451, -0.3324846625328064, -0.2809620201587677, -0.229439377784729, -0.1779167354106903, -0.1263940930366516, -0.07487145066261292, -0.02334892749786377, 0.028173714876174927, 0.07969635725021362, 0.13121899962425232, 0.18274164199829102, 0.2342642843723297, 0.2857869267463684, 0.3373095691204071, 0.3888322114944458, 0.4403548538684845, 0.4918774962425232, 0.5434001684188843, 0.5949227809906006, 0.6464453935623169, 0.697968065738678, 0.7494907379150391, 0.8010133504867554, 0.8525359630584717, 0.9040586352348328, 0.9555813074111938, 1.0071039199829102, 1.0586265325546265, 1.1101491451263428, 1.1616718769073486, 1.213194489479065, 1.2647171020507812, 1.316239833831787, 1.3677624464035034, 1.4192850589752197, 1.470807671546936, 1.5223302841186523, 1.5738530158996582, 1.6253756284713745]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 9.0, 6.0, 11.0, 21.0, 30.0, 48.0, 59.0, 100.0, 121.0, 204.0, 298.0, 508.0, 873.0, 1554.0, 3152.0, 7601.0, 21446.0, 113341.0, 3930628.0, 82936.0, 18202.0, 6651.0, 2937.0, 1349.0, 810.0, 476.0, 292.0, 194.0, 145.0, 84.0, 57.0, 35.0, 28.0, 21.0, 17.0, 10.0, 7.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.2470703125, -0.23945236206054688, -0.23183441162109375, -0.22421646118164062, -0.2165985107421875, -0.20898056030273438, -0.20136260986328125, -0.19374465942382812, -0.186126708984375, -0.17850875854492188, -0.17089080810546875, -0.16327285766601562, -0.1556549072265625, -0.14803695678710938, -0.14041900634765625, -0.13280105590820312, -0.12518310546875, -0.11756515502929688, -0.10994720458984375, -0.10232925415039062, -0.0947113037109375, -0.08709335327148438, -0.07947540283203125, -0.07185745239257812, -0.064239501953125, -0.056621551513671875, -0.04900360107421875, -0.041385650634765625, -0.0337677001953125, -0.026149749755859375, -0.01853179931640625, -0.010913848876953125, -0.0032958984375, 0.004322052001953125, 0.01194000244140625, 0.019557952880859375, 0.0271759033203125, 0.034793853759765625, 0.04241180419921875, 0.050029754638671875, 0.057647705078125, 0.06526565551757812, 0.07288360595703125, 0.08050155639648438, 0.0881195068359375, 0.09573745727539062, 0.10335540771484375, 0.11097335815429688, 0.11859130859375, 0.12620925903320312, 0.13382720947265625, 0.14144515991210938, 0.1490631103515625, 0.15668106079101562, 0.16429901123046875, 0.17191696166992188, 0.179534912109375, 0.18715286254882812, 0.19477081298828125, 0.20238876342773438, 0.2100067138671875, 0.21762466430664062, 0.22524261474609375, 0.23286056518554688, 0.240478515625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 12.0, 11.0, 16.0, 26.0, 33.0, 43.0, 38.0, 45.0, 77.0, 60.0, 72.0, 101.0, 87.0, 76.0, 66.0, 49.0, 54.0, 39.0, 26.0, 20.0, 20.0, 13.0, 11.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11700439453125, -0.11278057098388672, -0.10855674743652344, -0.10433292388916016, -0.10010910034179688, -0.0958852767944336, -0.09166145324707031, -0.08743762969970703, -0.08321380615234375, -0.07898998260498047, -0.07476615905761719, -0.0705423355102539, -0.06631851196289062, -0.062094688415527344, -0.05787086486816406, -0.05364704132080078, -0.0494232177734375, -0.04519939422607422, -0.04097557067871094, -0.036751747131347656, -0.032527923583984375, -0.028304100036621094, -0.024080276489257812, -0.01985645294189453, -0.01563262939453125, -0.011408805847167969, -0.0071849822998046875, -0.0029611587524414062, 0.001262664794921875, 0.005486488342285156, 0.009710311889648438, 0.013934135437011719, 0.018157958984375, 0.02238178253173828, 0.026605606079101562, 0.030829429626464844, 0.035053253173828125, 0.039277076721191406, 0.04350090026855469, 0.04772472381591797, 0.05194854736328125, 0.05617237091064453, 0.06039619445800781, 0.0646200180053711, 0.06884384155273438, 0.07306766510009766, 0.07729148864746094, 0.08151531219482422, 0.0857391357421875, 0.08996295928955078, 0.09418678283691406, 0.09841060638427734, 0.10263442993164062, 0.1068582534790039, 0.11108207702636719, 0.11530590057373047, 0.11952972412109375, 0.12375354766845703, 0.1279773712158203, 0.1322011947631836, 0.13642501831054688, 0.14064884185791016, 0.14487266540527344, 0.14909648895263672, 0.1533203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 12.0, 10.0, 19.0, 32.0, 54.0, 69.0, 99.0, 191.0, 389.0, 815.0, 2070.0, 6190.0, 28363.0, 3180482.0, 939863.0, 26162.0, 5828.0, 1954.0, 751.0, 369.0, 184.0, 112.0, 81.0, 56.0, 36.0, 21.0, 9.0, 7.0, 8.0, 7.0, 8.0, 2.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.387451171875, -0.3745269775390625, -0.361602783203125, -0.3486785888671875, -0.33575439453125, -0.3228302001953125, -0.309906005859375, -0.2969818115234375, -0.2840576171875, -0.2711334228515625, -0.258209228515625, -0.2452850341796875, -0.23236083984375, -0.2194366455078125, -0.206512451171875, -0.1935882568359375, -0.1806640625, -0.1677398681640625, -0.154815673828125, -0.1418914794921875, -0.12896728515625, -0.1160430908203125, -0.103118896484375, -0.0901947021484375, -0.0772705078125, -0.0643463134765625, -0.051422119140625, -0.0384979248046875, -0.02557373046875, -0.0126495361328125, 0.000274658203125, 0.0131988525390625, 0.026123046875, 0.0390472412109375, 0.051971435546875, 0.0648956298828125, 0.07781982421875, 0.0907440185546875, 0.103668212890625, 0.1165924072265625, 0.1295166015625, 0.1424407958984375, 0.155364990234375, 0.1682891845703125, 0.18121337890625, 0.1941375732421875, 0.207061767578125, 0.2199859619140625, 0.23291015625, 0.2458343505859375, 0.258758544921875, 0.2716827392578125, 0.28460693359375, 0.2975311279296875, 0.310455322265625, 0.3233795166015625, 0.3363037109375, 0.3492279052734375, 0.362152099609375, 0.3750762939453125, 0.38800048828125, 0.4009246826171875, 0.413848876953125, 0.4267730712890625, 0.439697265625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 11.0, 11.0, 36.0, 47.0, 96.0, 340.0, 3104.0, 230.0, 86.0, 38.0, 23.0, 14.0, 7.0, 10.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13720703125, -0.13134384155273438, -0.12548065185546875, -0.11961746215820312, -0.1137542724609375, -0.10789108276367188, -0.10202789306640625, -0.09616470336914062, -0.090301513671875, -0.08443832397460938, -0.07857513427734375, -0.07271194458007812, -0.0668487548828125, -0.060985565185546875, -0.05512237548828125, -0.049259185791015625, -0.04339599609375, -0.037532806396484375, -0.03166961669921875, -0.025806427001953125, -0.0199432373046875, -0.014080047607421875, -0.00821685791015625, -0.002353668212890625, 0.003509521484375, 0.009372711181640625, 0.01523590087890625, 0.021099090576171875, 0.0269622802734375, 0.032825469970703125, 0.03868865966796875, 0.044551849365234375, 0.0504150390625, 0.056278228759765625, 0.06214141845703125, 0.06800460815429688, 0.0738677978515625, 0.07973098754882812, 0.08559417724609375, 0.09145736694335938, 0.097320556640625, 0.10318374633789062, 0.10904693603515625, 0.11491012573242188, 0.1207733154296875, 0.12663650512695312, 0.13249969482421875, 0.13836288452148438, 0.14422607421875, 0.15008926391601562, 0.15595245361328125, 0.16181564331054688, 0.1676788330078125, 0.17354202270507812, 0.17940521240234375, 0.18526840209960938, 0.191131591796875, 0.19699478149414062, 0.20285797119140625, 0.20872116088867188, 0.2145843505859375, 0.22044754028320312, 0.22631072998046875, 0.23217391967773438, 0.238037109375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 8.0, 15.0, 27.0, 29.0, 56.0, 87.0, 111.0, 128.0, 118.0, 108.0, 106.0, 73.0, 50.0, 23.0, 20.0, 11.0, 9.0, 0.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50335693359375, -0.4859715402126312, -0.46858614683151245, -0.4512007236480713, -0.4338153302669525, -0.41642993688583374, -0.3990445137023926, -0.3816591203212738, -0.36427372694015503, -0.34688833355903625, -0.3295029401779175, -0.3121175169944763, -0.29473212361335754, -0.27734673023223877, -0.2599613070487976, -0.24257591366767883, -0.22519052028656006, -0.20780512690544128, -0.19041971862316132, -0.17303431034088135, -0.15564891695976257, -0.1382635235786438, -0.12087811529636383, -0.10349271446466446, -0.08610731363296509, -0.06872191280126572, -0.051336511969566345, -0.033951111137866974, -0.016565710306167603, 0.0008196905255317688, 0.01820509135723114, 0.03559049218893051, 0.05297589302062988, 0.07036129385232925, 0.08774669468402863, 0.105132095515728, 0.12251749634742737, 0.13990288972854614, 0.1572882980108261, 0.17467370629310608, 0.19205909967422485, 0.20944449305534363, 0.2268299013376236, 0.24421530961990356, 0.26160070300102234, 0.2789860963821411, 0.2963715195655823, 0.31375691294670105, 0.3311423063278198, 0.3485276997089386, 0.3659130930900574, 0.38329851627349854, 0.4006839096546173, 0.4180693030357361, 0.43545472621917725, 0.452840119600296, 0.4702255129814148, 0.48761090636253357, 0.5049962997436523, 0.5223817229270935, 0.5397671461105347, 0.557152509689331, 0.5745379328727722, 0.5919232964515686, 0.6093087196350098]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 6.0, 9.0, 17.0, 11.0, 13.0, 23.0, 19.0, 26.0, 21.0, 26.0, 25.0, 35.0, 23.0, 38.0, 46.0, 45.0, 51.0, 54.0, 47.0, 38.0, 33.0, 35.0, 46.0, 51.0, 24.0, 34.0, 27.0, 33.0, 25.0, 17.0, 22.0, 9.0, 12.0, 12.0, 6.0, 4.0, 2.0, 4.0, 8.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.3324315547943115, -0.3221175968647003, -0.3118036091327667, -0.3014896512031555, -0.2911756634712219, -0.2808617055416107, -0.2705477476119995, -0.2602337598800659, -0.2499198019504547, -0.2396058291196823, -0.2292918562889099, -0.2189778983592987, -0.2086639255285263, -0.1983499526977539, -0.1880359947681427, -0.1777220219373703, -0.1674080491065979, -0.1570940762758255, -0.1467801034450531, -0.1364661455154419, -0.1261521726846695, -0.1158381998538971, -0.10552423447370529, -0.09521026909351349, -0.08489629626274109, -0.07458232343196869, -0.06426835805177689, -0.053954388946294785, -0.04364041984081268, -0.03332645073533058, -0.02301248162984848, -0.012698516249656677, -0.0023845434188842773, 0.007929425686597824, 0.018243394792079926, 0.028557363897562027, 0.03887133300304413, 0.04918530210852623, 0.05949927121400833, 0.06981323659420013, 0.08012720942497253, 0.09044118225574493, 0.10075514763593674, 0.11106911301612854, 0.12138308584690094, 0.13169705867767334, 0.14201101660728455, 0.15232498943805695, 0.16263896226882935, 0.17295293509960175, 0.18326690793037415, 0.19358086585998535, 0.20389483869075775, 0.21420881152153015, 0.22452276945114136, 0.23483674228191376, 0.24515071511268616, 0.25546467304229736, 0.26577866077423096, 0.27609261870384216, 0.28640657663345337, 0.29672056436538696, 0.30703452229499817, 0.3173484802246094, 0.32766246795654297]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 3.0, 10.0, 12.0, 23.0, 46.0, 79.0, 157.0, 326.0, 625.0, 1426.0, 3095.0, 7590.0, 18833.0, 50797.0, 143126.0, 394424.0, 276435.0, 94565.0, 34399.0, 13123.0, 5187.0, 2244.0, 1022.0, 529.0, 226.0, 124.0, 48.0, 29.0, 15.0, 15.0, 10.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.263671875, -0.25720977783203125, -0.2507476806640625, -0.24428558349609375, -0.237823486328125, -0.23136138916015625, -0.2248992919921875, -0.21843719482421875, -0.21197509765625, -0.20551300048828125, -0.1990509033203125, -0.19258880615234375, -0.186126708984375, -0.17966461181640625, -0.1732025146484375, -0.16674041748046875, -0.1602783203125, -0.15381622314453125, -0.1473541259765625, -0.14089202880859375, -0.134429931640625, -0.12796783447265625, -0.1215057373046875, -0.11504364013671875, -0.10858154296875, -0.10211944580078125, -0.0956573486328125, -0.08919525146484375, -0.082733154296875, -0.07627105712890625, -0.0698089599609375, -0.06334686279296875, -0.056884765625, -0.05042266845703125, -0.0439605712890625, -0.03749847412109375, -0.031036376953125, -0.02457427978515625, -0.0181121826171875, -0.01165008544921875, -0.00518798828125, 0.00127410888671875, 0.0077362060546875, 0.01419830322265625, 0.020660400390625, 0.02712249755859375, 0.0335845947265625, 0.04004669189453125, 0.0465087890625, 0.05297088623046875, 0.0594329833984375, 0.06589508056640625, 0.072357177734375, 0.07881927490234375, 0.0852813720703125, 0.09174346923828125, 0.09820556640625, 0.10466766357421875, 0.1111297607421875, 0.11759185791015625, 0.124053955078125, 0.13051605224609375, 0.1369781494140625, 0.14344024658203125, 0.14990234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 11.0, 14.0, 19.0, 18.0, 26.0, 34.0, 39.0, 53.0, 50.0, 64.0, 72.0, 83.0, 71.0, 61.0, 80.0, 60.0, 54.0, 45.0, 35.0, 27.0, 24.0, 19.0, 10.0, 15.0, 9.0, 3.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12396621704101562, -0.11988067626953125, -0.11579513549804688, -0.1117095947265625, -0.10762405395507812, -0.10353851318359375, -0.09945297241210938, -0.095367431640625, -0.09128189086914062, -0.08719635009765625, -0.08311080932617188, -0.0790252685546875, -0.07493972778320312, -0.07085418701171875, -0.06676864624023438, -0.06268310546875, -0.058597564697265625, -0.05451202392578125, -0.050426483154296875, -0.0463409423828125, -0.042255401611328125, -0.03816986083984375, -0.034084320068359375, -0.029998779296875, -0.025913238525390625, -0.02182769775390625, -0.017742156982421875, -0.0136566162109375, -0.009571075439453125, -0.00548553466796875, -0.001399993896484375, 0.002685546875, 0.006771087646484375, 0.01085662841796875, 0.014942169189453125, 0.0190277099609375, 0.023113250732421875, 0.02719879150390625, 0.031284332275390625, 0.035369873046875, 0.039455413818359375, 0.04354095458984375, 0.047626495361328125, 0.0517120361328125, 0.055797576904296875, 0.05988311767578125, 0.06396865844726562, 0.06805419921875, 0.07213973999023438, 0.07622528076171875, 0.08031082153320312, 0.0843963623046875, 0.08848190307617188, 0.09256744384765625, 0.09665298461914062, 0.100738525390625, 0.10482406616210938, 0.10890960693359375, 0.11299514770507812, 0.1170806884765625, 0.12116622924804688, 0.12525177001953125, 0.12933731079101562, 0.1334228515625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 10.0, 9.0, 19.0, 11.0, 16.0, 37.0, 57.0, 62.0, 105.0, 137.0, 211.0, 305.0, 480.0, 859.0, 1539.0, 3911.0, 18709.0, 204055.0, 728413.0, 74223.0, 9607.0, 2685.0, 1181.0, 643.0, 412.0, 277.0, 167.0, 118.0, 101.0, 59.0, 43.0, 27.0, 24.0, 14.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.427978515625, -0.41550445556640625, -0.4030303955078125, -0.39055633544921875, -0.378082275390625, -0.36560821533203125, -0.3531341552734375, -0.34066009521484375, -0.32818603515625, -0.31571197509765625, -0.3032379150390625, -0.29076385498046875, -0.278289794921875, -0.26581573486328125, -0.2533416748046875, -0.24086761474609375, -0.2283935546875, -0.21591949462890625, -0.2034454345703125, -0.19097137451171875, -0.178497314453125, -0.16602325439453125, -0.1535491943359375, -0.14107513427734375, -0.12860107421875, -0.11612701416015625, -0.1036529541015625, -0.09117889404296875, -0.078704833984375, -0.06623077392578125, -0.0537567138671875, -0.04128265380859375, -0.02880859375, -0.01633453369140625, -0.0038604736328125, 0.00861358642578125, 0.021087646484375, 0.03356170654296875, 0.0460357666015625, 0.05850982666015625, 0.07098388671875, 0.08345794677734375, 0.0959320068359375, 0.10840606689453125, 0.120880126953125, 0.13335418701171875, 0.1458282470703125, 0.15830230712890625, 0.1707763671875, 0.18325042724609375, 0.1957244873046875, 0.20819854736328125, 0.220672607421875, 0.23314666748046875, 0.2456207275390625, 0.25809478759765625, 0.27056884765625, 0.28304290771484375, 0.2955169677734375, 0.30799102783203125, 0.320465087890625, 0.33293914794921875, 0.3454132080078125, 0.35788726806640625, 0.370361328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 9.0, 10.0, 15.0, 7.0, 13.0, 22.0, 21.0, 16.0, 24.0, 32.0, 24.0, 33.0, 35.0, 28.0, 29.0, 50.0, 48.0, 48.0, 39.0, 39.0, 39.0, 39.0, 49.0, 42.0, 31.0, 40.0, 29.0, 30.0, 32.0, 18.0, 22.0, 17.0, 16.0, 18.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35888671875, -0.347564697265625, -0.33624267578125, -0.324920654296875, -0.3135986328125, -0.302276611328125, -0.29095458984375, -0.279632568359375, -0.268310546875, -0.256988525390625, -0.24566650390625, -0.234344482421875, -0.2230224609375, -0.211700439453125, -0.20037841796875, -0.189056396484375, -0.177734375, -0.166412353515625, -0.15509033203125, -0.143768310546875, -0.1324462890625, -0.121124267578125, -0.10980224609375, -0.098480224609375, -0.087158203125, -0.075836181640625, -0.06451416015625, -0.053192138671875, -0.0418701171875, -0.030548095703125, -0.01922607421875, -0.007904052734375, 0.00341796875, 0.014739990234375, 0.02606201171875, 0.037384033203125, 0.0487060546875, 0.060028076171875, 0.07135009765625, 0.082672119140625, 0.093994140625, 0.105316162109375, 0.11663818359375, 0.127960205078125, 0.1392822265625, 0.150604248046875, 0.16192626953125, 0.173248291015625, 0.1845703125, 0.195892333984375, 0.20721435546875, 0.218536376953125, 0.2298583984375, 0.241180419921875, 0.25250244140625, 0.263824462890625, 0.275146484375, 0.286468505859375, 0.29779052734375, 0.309112548828125, 0.3204345703125, 0.331756591796875, 0.34307861328125, 0.354400634765625, 0.36572265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 9.0, 15.0, 18.0, 29.0, 34.0, 52.0, 108.0, 235.0, 635.0, 2560.0, 25808.0, 916543.0, 96042.0, 4869.0, 937.0, 329.0, 118.0, 76.0, 46.0, 25.0, 17.0, 14.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3466796875, -0.3363838195800781, -0.32608795166015625, -0.3157920837402344, -0.3054962158203125, -0.2952003479003906, -0.28490447998046875, -0.2746086120605469, -0.264312744140625, -0.2540168762207031, -0.24372100830078125, -0.23342514038085938, -0.2231292724609375, -0.21283340454101562, -0.20253753662109375, -0.19224166870117188, -0.18194580078125, -0.17164993286132812, -0.16135406494140625, -0.15105819702148438, -0.1407623291015625, -0.13046646118164062, -0.12017059326171875, -0.10987472534179688, -0.099578857421875, -0.08928298950195312, -0.07898712158203125, -0.06869125366210938, -0.0583953857421875, -0.048099517822265625, -0.03780364990234375, -0.027507781982421875, -0.0172119140625, -0.006916046142578125, 0.00337982177734375, 0.013675689697265625, 0.0239715576171875, 0.034267425537109375, 0.04456329345703125, 0.054859161376953125, 0.065155029296875, 0.07545089721679688, 0.08574676513671875, 0.09604263305664062, 0.1063385009765625, 0.11663436889648438, 0.12693023681640625, 0.13722610473632812, 0.14752197265625, 0.15781784057617188, 0.16811370849609375, 0.17840957641601562, 0.1887054443359375, 0.19900131225585938, 0.20929718017578125, 0.21959304809570312, 0.229888916015625, 0.24018478393554688, 0.25048065185546875, 0.2607765197753906, 0.2710723876953125, 0.2813682556152344, 0.29166412353515625, 0.3019599914550781, 0.312255859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 11.0, 6.0, 11.0, 11.0, 10.0, 30.0, 32.0, 45.0, 70.0, 80.0, 98.0, 148.0, 117.0, 81.0, 49.0, 61.0, 43.0, 37.0, 19.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.771087646484375e-05, -6.49699941277504e-05, -6.222911179065704e-05, -5.948822945356369e-05, -5.674734711647034e-05, -5.4006464779376984e-05, -5.126558244228363e-05, -4.852470010519028e-05, -4.5783817768096924e-05, -4.304293543100357e-05, -4.030205309391022e-05, -3.7561170756816864e-05, -3.482028841972351e-05, -3.207940608263016e-05, -2.9338523745536804e-05, -2.659764140844345e-05, -2.3856759071350098e-05, -2.1115876734256744e-05, -1.837499439716339e-05, -1.5634112060070038e-05, -1.2893229722976685e-05, -1.0152347385883331e-05, -7.411465048789978e-06, -4.670582711696625e-06, -1.9297003746032715e-06, 8.111819624900818e-07, 3.552064299583435e-06, 6.292946636676788e-06, 9.033828973770142e-06, 1.1774711310863495e-05, 1.4515593647956848e-05, 1.72564759850502e-05, 1.9997358322143555e-05, 2.2738240659236908e-05, 2.547912299633026e-05, 2.8220005333423615e-05, 3.096088767051697e-05, 3.370177000761032e-05, 3.6442652344703674e-05, 3.918353468179703e-05, 4.192441701889038e-05, 4.4665299355983734e-05, 4.740618169307709e-05, 5.014706403017044e-05, 5.2887946367263794e-05, 5.562882870435715e-05, 5.83697110414505e-05, 6.111059337854385e-05, 6.385147571563721e-05, 6.659235805273056e-05, 6.933324038982391e-05, 7.207412272691727e-05, 7.481500506401062e-05, 7.755588740110397e-05, 8.029676973819733e-05, 8.303765207529068e-05, 8.577853441238403e-05, 8.851941674947739e-05, 9.126029908657074e-05, 9.400118142366409e-05, 9.674206376075745e-05, 9.94829460978508e-05, 0.00010222382843494415, 0.0001049647107720375, 0.00010770559310913086]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 12.0, 21.0, 20.0, 24.0, 34.0, 70.0, 120.0, 204.0, 481.0, 1207.0, 3602.0, 22854.0, 941406.0, 70124.0, 5499.0, 1584.0, 607.0, 250.0, 153.0, 101.0, 62.0, 36.0, 18.0, 15.0, 12.0, 6.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.352783203125, -0.3408851623535156, -0.32898712158203125, -0.3170890808105469, -0.3051910400390625, -0.2932929992675781, -0.28139495849609375, -0.2694969177246094, -0.257598876953125, -0.24570083618164062, -0.23380279541015625, -0.22190475463867188, -0.2100067138671875, -0.19810867309570312, -0.18621063232421875, -0.17431259155273438, -0.16241455078125, -0.15051651000976562, -0.13861846923828125, -0.12672042846679688, -0.1148223876953125, -0.10292434692382812, -0.09102630615234375, -0.07912826538085938, -0.067230224609375, -0.055332183837890625, -0.04343414306640625, -0.031536102294921875, -0.0196380615234375, -0.007740020751953125, 0.00415802001953125, 0.016056060791015625, 0.0279541015625, 0.039852142333984375, 0.05175018310546875, 0.06364822387695312, 0.0755462646484375, 0.08744430541992188, 0.09934234619140625, 0.11124038696289062, 0.123138427734375, 0.13503646850585938, 0.14693450927734375, 0.15883255004882812, 0.1707305908203125, 0.18262863159179688, 0.19452667236328125, 0.20642471313476562, 0.21832275390625, 0.23022079467773438, 0.24211883544921875, 0.2540168762207031, 0.2659149169921875, 0.2778129577636719, 0.28971099853515625, 0.3016090393066406, 0.313507080078125, 0.3254051208496094, 0.33730316162109375, 0.3492012023925781, 0.3610992431640625, 0.3729972839355469, 0.38489532470703125, 0.3967933654785156, 0.40869140625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 17.0, 26.0, 21.0, 53.0, 65.0, 110.0, 155.0, 134.0, 135.0, 77.0, 53.0, 35.0, 32.0, 24.0, 11.0, 9.0, 2.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.232421875, -0.22618865966796875, -0.2199554443359375, -0.21372222900390625, -0.207489013671875, -0.20125579833984375, -0.1950225830078125, -0.18878936767578125, -0.18255615234375, -0.17632293701171875, -0.1700897216796875, -0.16385650634765625, -0.157623291015625, -0.15139007568359375, -0.1451568603515625, -0.13892364501953125, -0.1326904296875, -0.12645721435546875, -0.1202239990234375, -0.11399078369140625, -0.107757568359375, -0.10152435302734375, -0.0952911376953125, -0.08905792236328125, -0.08282470703125, -0.07659149169921875, -0.0703582763671875, -0.06412506103515625, -0.057891845703125, -0.05165863037109375, -0.0454254150390625, -0.03919219970703125, -0.032958984375, -0.02672576904296875, -0.0204925537109375, -0.01425933837890625, -0.008026123046875, -0.00179290771484375, 0.0044403076171875, 0.01067352294921875, 0.01690673828125, 0.02313995361328125, 0.0293731689453125, 0.03560638427734375, 0.041839599609375, 0.04807281494140625, 0.0543060302734375, 0.06053924560546875, 0.0667724609375, 0.07300567626953125, 0.0792388916015625, 0.08547210693359375, 0.091705322265625, 0.09793853759765625, 0.1041717529296875, 0.11040496826171875, 0.11663818359375, 0.12287139892578125, 0.1291046142578125, 0.13533782958984375, 0.141571044921875, 0.14780426025390625, 0.1540374755859375, 0.16027069091796875, 0.16650390625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 16.0, 55.0, 129.0, 248.0, 291.0, 156.0, 55.0, 28.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.76110315322876, -4.603743553161621, -4.446383953094482, -4.289024353027344, -4.131664276123047, -3.9743049144744873, -3.8169450759887695, -3.659585475921631, -3.502225875854492, -3.3448662757873535, -3.187506675720215, -3.030146837234497, -2.8727872371673584, -2.7154276371002197, -2.558067798614502, -2.4007081985473633, -2.2433485984802246, -2.085988998413086, -1.9286292791366577, -1.7712695598602295, -1.6139099597930908, -1.4565503597259521, -1.299190640449524, -1.1418309211730957, -0.984471321105957, -0.8271116614341736, -0.6697520017623901, -0.5123923420906067, -0.35503268241882324, -0.1976730227470398, -0.04031336307525635, 0.11704635620117188, 0.27440643310546875, 0.4317660927772522, 0.5891257524490356, 0.7464854121208191, 0.9038450717926025, 1.0612046718597412, 1.2185643911361694, 1.3759241104125977, 1.5332837104797363, 1.690643310546875, 1.8480030298233032, 2.0053627490997314, 2.16272234916687, 2.320081949234009, 2.4774417877197266, 2.6348013877868652, 2.792160987854004, 2.9495205879211426, 3.1068801879882812, 3.264240026473999, 3.4215996265411377, 3.5789592266082764, 3.736319065093994, 3.893678665161133, 4.0510382652282715, 4.20839786529541, 4.365757465362549, 4.5231170654296875, 4.680477142333984, 4.837836742401123, 4.995196342468262, 5.1525559425354, 5.309915542602539]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 8.0, 10.0, 20.0, 29.0, 29.0, 34.0, 42.0, 49.0, 53.0, 78.0, 74.0, 73.0, 77.0, 71.0, 68.0, 53.0, 54.0, 40.0, 29.0, 36.0, 16.0, 16.0, 15.0, 6.0, 8.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.288053035736084, -3.205904245376587, -3.12375545501709, -3.041606903076172, -2.959458112716675, -2.8773093223571777, -2.7951605319976807, -2.7130117416381836, -2.6308631896972656, -2.5487143993377686, -2.4665656089782715, -2.3844170570373535, -2.3022682666778564, -2.2201194763183594, -2.1379706859588623, -2.0558218955993652, -1.9736732244491577, -1.8915244340896606, -1.8093757629394531, -1.727226972579956, -1.6450783014297485, -1.5629295110702515, -1.480780839920044, -1.3986320495605469, -1.3164832592010498, -1.2343344688415527, -1.1521857976913452, -1.0700370073318481, -0.9878883361816406, -0.9057395458221436, -0.8235908150672913, -0.741442084312439, -0.659293532371521, -0.5771448016166687, -0.4949960708618164, -0.4128473103046417, -0.33069857954978943, -0.24854984879493713, -0.16640108823776245, -0.08425235748291016, -0.0021036267280578613, 0.08004511147737503, 0.16219384968280792, 0.2443425953388214, 0.3264913260936737, 0.408640056848526, 0.4907888174057007, 0.572937548160553, 0.6550862789154053, 0.7372350096702576, 0.8193837404251099, 0.9015325307846069, 0.9836812019348145, 1.0658299922943115, 1.1479787826538086, 1.2301274538040161, 1.3122761249542236, 1.3944249153137207, 1.4765735864639282, 1.5587223768234253, 1.6408710479736328, 1.7230198383331299, 1.805168628692627, 1.8873172998428345, 1.9694660902023315]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 9.0, 12.0, 21.0, 24.0, 30.0, 62.0, 78.0, 156.0, 245.0, 487.0, 973.0, 2496.0, 6884.0, 25389.0, 185405.0, 3384620.0, 525793.0, 45478.0, 10579.0, 3216.0, 1193.0, 544.0, 249.0, 122.0, 81.0, 51.0, 30.0, 19.0, 4.0, 15.0, 6.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.3515625, -0.3431243896484375, -0.334686279296875, -0.3262481689453125, -0.31781005859375, -0.3093719482421875, -0.300933837890625, -0.2924957275390625, -0.2840576171875, -0.2756195068359375, -0.267181396484375, -0.2587432861328125, -0.25030517578125, -0.2418670654296875, -0.233428955078125, -0.2249908447265625, -0.216552734375, -0.2081146240234375, -0.199676513671875, -0.1912384033203125, -0.18280029296875, -0.1743621826171875, -0.165924072265625, -0.1574859619140625, -0.1490478515625, -0.1406097412109375, -0.132171630859375, -0.1237335205078125, -0.11529541015625, -0.1068572998046875, -0.098419189453125, -0.0899810791015625, -0.08154296875, -0.0731048583984375, -0.064666748046875, -0.0562286376953125, -0.04779052734375, -0.0393524169921875, -0.030914306640625, -0.0224761962890625, -0.0140380859375, -0.0055999755859375, 0.002838134765625, 0.0112762451171875, 0.01971435546875, 0.0281524658203125, 0.036590576171875, 0.0450286865234375, 0.053466796875, 0.0619049072265625, 0.070343017578125, 0.0787811279296875, 0.08721923828125, 0.0956573486328125, 0.104095458984375, 0.1125335693359375, 0.1209716796875, 0.1294097900390625, 0.137847900390625, 0.1462860107421875, 0.15472412109375, 0.1631622314453125, 0.171600341796875, 0.1800384521484375, 0.1884765625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 8.0, 8.0, 10.0, 17.0, 22.0, 17.0, 19.0, 38.0, 46.0, 43.0, 51.0, 60.0, 68.0, 65.0, 79.0, 62.0, 79.0, 65.0, 51.0, 42.0, 35.0, 25.0, 28.0, 19.0, 10.0, 15.0, 7.0, 7.0, 4.0, 1.0, 1.0, 4.0, 1.0, 4.0], "bins": [-0.162109375, -0.15844154357910156, -0.15477371215820312, -0.1511058807373047, -0.14743804931640625, -0.1437702178955078, -0.14010238647460938, -0.13643455505371094, -0.1327667236328125, -0.12909889221191406, -0.12543106079101562, -0.12176322937011719, -0.11809539794921875, -0.11442756652832031, -0.11075973510742188, -0.10709190368652344, -0.103424072265625, -0.09975624084472656, -0.09608840942382812, -0.09242057800292969, -0.08875274658203125, -0.08508491516113281, -0.08141708374023438, -0.07774925231933594, -0.0740814208984375, -0.07041358947753906, -0.06674575805664062, -0.06307792663574219, -0.05941009521484375, -0.05574226379394531, -0.052074432373046875, -0.04840660095214844, -0.04473876953125, -0.04107093811035156, -0.037403106689453125, -0.03373527526855469, -0.03006744384765625, -0.026399612426757812, -0.022731781005859375, -0.019063949584960938, -0.0153961181640625, -0.011728286743164062, -0.008060455322265625, -0.0043926239013671875, -0.00072479248046875, 0.0029430389404296875, 0.006610870361328125, 0.010278701782226562, 0.013946533203125, 0.017614364624023438, 0.021282196044921875, 0.024950027465820312, 0.02861785888671875, 0.03228569030761719, 0.035953521728515625, 0.03962135314941406, 0.0432891845703125, 0.04695701599121094, 0.050624847412109375, 0.05429267883300781, 0.05796051025390625, 0.06162834167480469, 0.06529617309570312, 0.06896400451660156, 0.0726318359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 22.0, 31.0, 56.0, 122.0, 254.0, 708.0, 2532.0, 23748.0, 3616216.0, 537595.0, 10454.0, 1635.0, 491.0, 191.0, 93.0, 47.0, 20.0, 15.0, 11.0, 11.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6298828125, -0.609466552734375, -0.58905029296875, -0.568634033203125, -0.5482177734375, -0.527801513671875, -0.50738525390625, -0.486968994140625, -0.466552734375, -0.446136474609375, -0.42572021484375, -0.405303955078125, -0.3848876953125, -0.364471435546875, -0.34405517578125, -0.323638916015625, -0.30322265625, -0.282806396484375, -0.26239013671875, -0.241973876953125, -0.2215576171875, -0.201141357421875, -0.18072509765625, -0.160308837890625, -0.139892578125, -0.119476318359375, -0.09906005859375, -0.078643798828125, -0.0582275390625, -0.037811279296875, -0.01739501953125, 0.003021240234375, 0.0234375, 0.043853759765625, 0.06427001953125, 0.084686279296875, 0.1051025390625, 0.125518798828125, 0.14593505859375, 0.166351318359375, 0.186767578125, 0.207183837890625, 0.22760009765625, 0.248016357421875, 0.2684326171875, 0.288848876953125, 0.30926513671875, 0.329681396484375, 0.35009765625, 0.370513916015625, 0.39093017578125, 0.411346435546875, 0.4317626953125, 0.452178955078125, 0.47259521484375, 0.493011474609375, 0.513427734375, 0.533843994140625, 0.55426025390625, 0.574676513671875, 0.5950927734375, 0.615509033203125, 0.63592529296875, 0.656341552734375, 0.6767578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 10.0, 10.0, 10.0, 13.0, 29.0, 64.0, 87.0, 185.0, 456.0, 1229.0, 1124.0, 405.0, 197.0, 108.0, 49.0, 27.0, 21.0, 14.0, 11.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43115234375, -0.4180755615234375, -0.404998779296875, -0.3919219970703125, -0.37884521484375, -0.3657684326171875, -0.352691650390625, -0.3396148681640625, -0.3265380859375, -0.3134613037109375, -0.300384521484375, -0.2873077392578125, -0.27423095703125, -0.2611541748046875, -0.248077392578125, -0.2350006103515625, -0.221923828125, -0.2088470458984375, -0.195770263671875, -0.1826934814453125, -0.16961669921875, -0.1565399169921875, -0.143463134765625, -0.1303863525390625, -0.1173095703125, -0.1042327880859375, -0.091156005859375, -0.0780792236328125, -0.06500244140625, -0.0519256591796875, -0.038848876953125, -0.0257720947265625, -0.0126953125, 0.0003814697265625, 0.013458251953125, 0.0265350341796875, 0.03961181640625, 0.0526885986328125, 0.065765380859375, 0.0788421630859375, 0.0919189453125, 0.1049957275390625, 0.118072509765625, 0.1311492919921875, 0.14422607421875, 0.1573028564453125, 0.170379638671875, 0.1834564208984375, 0.196533203125, 0.2096099853515625, 0.222686767578125, 0.2357635498046875, 0.24884033203125, 0.2619171142578125, 0.274993896484375, 0.2880706787109375, 0.3011474609375, 0.3142242431640625, 0.327301025390625, 0.3403778076171875, 0.35345458984375, 0.3665313720703125, 0.379608154296875, 0.3926849365234375, 0.40576171875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 8.0, 8.0, 8.0, 15.0, 40.0, 83.0, 185.0, 225.0, 202.0, 118.0, 54.0, 24.0, 10.0, 10.0, 3.0, 3.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4501988887786865, -3.3506782054901123, -3.251157522201538, -3.151636838912964, -3.0521161556243896, -2.9525954723358154, -2.853074789047241, -2.753554105758667, -2.6540334224700928, -2.5545127391815186, -2.4549920558929443, -2.35547137260437, -2.255950689315796, -2.1564300060272217, -2.0569093227386475, -1.9573886394500732, -1.857867956161499, -1.7583472728729248, -1.6588265895843506, -1.5593059062957764, -1.4597852230072021, -1.360264539718628, -1.2607438564300537, -1.1612231731414795, -1.0617024898529053, -0.962181806564331, -0.8626611232757568, -0.7631404399871826, -0.6636197566986084, -0.5640990734100342, -0.46457839012145996, -0.36505770683288574, -0.2655370235443115, -0.1660163402557373, -0.06649565696716309, 0.03302502632141113, 0.13254570960998535, 0.23206639289855957, 0.3315870761871338, 0.431107759475708, 0.5306284427642822, 0.6301491260528564, 0.7296698093414307, 0.8291904926300049, 0.9287111759185791, 1.0282318592071533, 1.1277525424957275, 1.2272732257843018, 1.326793909072876, 1.4263145923614502, 1.5258352756500244, 1.6253559589385986, 1.7248766422271729, 1.824397325515747, 1.9239180088043213, 2.0234386920928955, 2.1229593753814697, 2.222480058670044, 2.322000741958618, 2.4215214252471924, 2.5210421085357666, 2.620562791824341, 2.720083475112915, 2.8196041584014893, 2.9191248416900635]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 9.0, 10.0, 7.0, 7.0, 9.0, 15.0, 17.0, 36.0, 32.0, 34.0, 31.0, 41.0, 57.0, 56.0, 63.0, 67.0, 71.0, 61.0, 61.0, 55.0, 49.0, 36.0, 32.0, 29.0, 33.0, 28.0, 13.0, 13.0, 10.0, 7.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9883368015289307, -1.9346591234207153, -1.8809813261032104, -1.8273036479949951, -1.7736259698867798, -1.719948172569275, -1.6662704944610596, -1.6125926971435547, -1.5589150190353394, -1.505237340927124, -1.4515595436096191, -1.3978818655014038, -1.3442041873931885, -1.2905263900756836, -1.2368487119674683, -1.183171033859253, -1.129493236541748, -1.0758155584335327, -1.0221377611160278, -0.9684600830078125, -0.9147823452949524, -0.8611046075820923, -0.807426929473877, -0.7537491917610168, -0.7000715732574463, -0.6463938355445862, -0.5927161574363708, -0.5390384197235107, -0.48536068201065063, -0.4316829741001129, -0.3780052661895752, -0.3243275284767151, -0.270649790763855, -0.21697206795215607, -0.16329434514045715, -0.10961663722991943, -0.05593891441822052, -0.0022611916065216064, 0.05141651630401611, 0.10509425401687622, 0.15877196192741394, 0.21244968473911285, 0.26612740755081177, 0.3198051154613495, 0.3734828233718872, 0.4271605610847473, 0.48083826899528503, 0.5345159769058228, 0.5881937146186829, 0.641871452331543, 0.6955491304397583, 0.7492268681526184, 0.8029046058654785, 0.8565822839736938, 0.910260021686554, 0.9639377593994141, 1.0176154375076294, 1.0712931156158447, 1.1249709129333496, 1.178648591041565, 1.2323262691497803, 1.2860040664672852, 1.3396817445755005, 1.3933594226837158, 1.4470372200012207]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 9.0, 6.0, 12.0, 27.0, 30.0, 54.0, 70.0, 114.0, 178.0, 338.0, 580.0, 989.0, 1851.0, 3574.0, 7085.0, 15543.0, 36808.0, 101928.0, 397620.0, 334409.0, 87309.0, 32631.0, 13888.0, 6356.0, 3198.0, 1658.0, 968.0, 514.0, 318.0, 192.0, 122.0, 59.0, 37.0, 19.0, 15.0, 10.0, 8.0, 9.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.227783203125, -0.22041893005371094, -0.21305465698242188, -0.2056903839111328, -0.19832611083984375, -0.1909618377685547, -0.18359756469726562, -0.17623329162597656, -0.1688690185546875, -0.16150474548339844, -0.15414047241210938, -0.1467761993408203, -0.13941192626953125, -0.1320476531982422, -0.12468338012695312, -0.11731910705566406, -0.109954833984375, -0.10259056091308594, -0.09522628784179688, -0.08786201477050781, -0.08049774169921875, -0.07313346862792969, -0.06576919555664062, -0.05840492248535156, -0.0510406494140625, -0.04367637634277344, -0.036312103271484375, -0.028947830200195312, -0.02158355712890625, -0.014219284057617188, -0.006855010986328125, 0.0005092620849609375, 0.00787353515625, 0.015237808227539062, 0.022602081298828125, 0.029966354370117188, 0.03733062744140625, 0.04469490051269531, 0.052059173583984375, 0.05942344665527344, 0.0667877197265625, 0.07415199279785156, 0.08151626586914062, 0.08888053894042969, 0.09624481201171875, 0.10360908508300781, 0.11097335815429688, 0.11833763122558594, 0.125701904296875, 0.13306617736816406, 0.14043045043945312, 0.1477947235107422, 0.15515899658203125, 0.1625232696533203, 0.16988754272460938, 0.17725181579589844, 0.1846160888671875, 0.19198036193847656, 0.19934463500976562, 0.2067089080810547, 0.21407318115234375, 0.2214374542236328, 0.22880172729492188, 0.23616600036621094, 0.2435302734375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 8.0, 5.0, 7.0, 5.0, 11.0, 18.0, 17.0, 23.0, 26.0, 43.0, 37.0, 40.0, 47.0, 37.0, 51.0, 65.0, 65.0, 62.0, 71.0, 67.0, 49.0, 48.0, 47.0, 28.0, 27.0, 22.0, 19.0, 17.0, 16.0, 9.0, 5.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.1446533203125, -0.1411733627319336, -0.1376934051513672, -0.13421344757080078, -0.13073348999023438, -0.12725353240966797, -0.12377357482910156, -0.12029361724853516, -0.11681365966796875, -0.11333370208740234, -0.10985374450683594, -0.10637378692626953, -0.10289382934570312, -0.09941387176513672, -0.09593391418457031, -0.0924539566040039, -0.0889739990234375, -0.0854940414428711, -0.08201408386230469, -0.07853412628173828, -0.07505416870117188, -0.07157421112060547, -0.06809425354003906, -0.06461429595947266, -0.06113433837890625, -0.057654380798339844, -0.05417442321777344, -0.05069446563720703, -0.047214508056640625, -0.04373455047607422, -0.04025459289550781, -0.036774635314941406, -0.033294677734375, -0.029814720153808594, -0.026334762573242188, -0.02285480499267578, -0.019374847412109375, -0.01589488983154297, -0.012414932250976562, -0.008934974670410156, -0.00545501708984375, -0.0019750595092773438, 0.0015048980712890625, 0.004984855651855469, 0.008464813232421875, 0.011944770812988281, 0.015424728393554688, 0.018904685974121094, 0.0223846435546875, 0.025864601135253906, 0.029344558715820312, 0.03282451629638672, 0.036304473876953125, 0.03978443145751953, 0.04326438903808594, 0.046744346618652344, 0.05022430419921875, 0.053704261779785156, 0.05718421936035156, 0.06066417694091797, 0.06414413452148438, 0.06762409210205078, 0.07110404968261719, 0.0745840072631836, 0.07806396484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 10.0, 16.0, 27.0, 23.0, 42.0, 53.0, 78.0, 122.0, 192.0, 265.0, 481.0, 988.0, 2365.0, 8311.0, 63952.0, 867022.0, 89190.0, 10160.0, 2722.0, 1050.0, 522.0, 307.0, 182.0, 113.0, 113.0, 62.0, 39.0, 22.0, 32.0, 21.0, 16.0, 9.0, 13.0, 0.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.75439453125, -0.7325668334960938, -0.7107391357421875, -0.6889114379882812, -0.667083740234375, -0.6452560424804688, -0.6234283447265625, -0.6016006469726562, -0.57977294921875, -0.5579452514648438, -0.5361175537109375, -0.5142898559570312, -0.492462158203125, -0.47063446044921875, -0.4488067626953125, -0.42697906494140625, -0.4051513671875, -0.38332366943359375, -0.3614959716796875, -0.33966827392578125, -0.317840576171875, -0.29601287841796875, -0.2741851806640625, -0.25235748291015625, -0.23052978515625, -0.20870208740234375, -0.1868743896484375, -0.16504669189453125, -0.143218994140625, -0.12139129638671875, -0.0995635986328125, -0.07773590087890625, -0.055908203125, -0.03408050537109375, -0.0122528076171875, 0.00957489013671875, 0.031402587890625, 0.05323028564453125, 0.0750579833984375, 0.09688568115234375, 0.11871337890625, 0.14054107666015625, 0.1623687744140625, 0.18419647216796875, 0.206024169921875, 0.22785186767578125, 0.2496795654296875, 0.27150726318359375, 0.2933349609375, 0.31516265869140625, 0.3369903564453125, 0.35881805419921875, 0.380645751953125, 0.40247344970703125, 0.4243011474609375, 0.44612884521484375, 0.46795654296875, 0.48978424072265625, 0.5116119384765625, 0.5334396362304688, 0.555267333984375, 0.5770950317382812, 0.5989227294921875, 0.6207504272460938, 0.642578125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 6.0, 7.0, 12.0, 9.0, 7.0, 19.0, 21.0, 21.0, 20.0, 33.0, 39.0, 37.0, 46.0, 60.0, 52.0, 66.0, 59.0, 46.0, 54.0, 51.0, 54.0, 42.0, 41.0, 39.0, 16.0, 26.0, 20.0, 11.0, 16.0, 8.0, 12.0, 7.0, 8.0, 2.0, 7.0, 4.0, 5.0, 0.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.486083984375, -0.4698143005371094, -0.45354461669921875, -0.4372749328613281, -0.4210052490234375, -0.4047355651855469, -0.38846588134765625, -0.3721961975097656, -0.355926513671875, -0.3396568298339844, -0.32338714599609375, -0.3071174621582031, -0.2908477783203125, -0.2745780944824219, -0.25830841064453125, -0.24203872680664062, -0.22576904296875, -0.20949935913085938, -0.19322967529296875, -0.17695999145507812, -0.1606903076171875, -0.14442062377929688, -0.12815093994140625, -0.11188125610351562, -0.095611572265625, -0.07934188842773438, -0.06307220458984375, -0.046802520751953125, -0.0305328369140625, -0.014263153076171875, 0.00200653076171875, 0.018276214599609375, 0.0345458984375, 0.050815582275390625, 0.06708526611328125, 0.08335494995117188, 0.0996246337890625, 0.11589431762695312, 0.13216400146484375, 0.14843368530273438, 0.164703369140625, 0.18097305297851562, 0.19724273681640625, 0.21351242065429688, 0.2297821044921875, 0.24605178833007812, 0.26232147216796875, 0.2785911560058594, 0.29486083984375, 0.3111305236816406, 0.32740020751953125, 0.3436698913574219, 0.3599395751953125, 0.3762092590332031, 0.39247894287109375, 0.4087486267089844, 0.425018310546875, 0.4412879943847656, 0.45755767822265625, 0.4738273620605469, 0.4900970458984375, 0.5063667297363281, 0.5226364135742188, 0.5389060974121094, 0.55517578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 7.0, 8.0, 3.0, 6.0, 15.0, 22.0, 37.0, 70.0, 109.0, 212.0, 482.0, 1287.0, 5543.0, 50610.0, 911467.0, 69415.0, 6762.0, 1494.0, 514.0, 213.0, 117.0, 62.0, 36.0, 17.0, 9.0, 12.0, 6.0, 4.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.350830078125, -0.338958740234375, -0.32708740234375, -0.315216064453125, -0.3033447265625, -0.291473388671875, -0.27960205078125, -0.267730712890625, -0.255859375, -0.243988037109375, -0.23211669921875, -0.220245361328125, -0.2083740234375, -0.196502685546875, -0.18463134765625, -0.172760009765625, -0.160888671875, -0.149017333984375, -0.13714599609375, -0.125274658203125, -0.1134033203125, -0.101531982421875, -0.08966064453125, -0.077789306640625, -0.06591796875, -0.054046630859375, -0.04217529296875, -0.030303955078125, -0.0184326171875, -0.006561279296875, 0.00531005859375, 0.017181396484375, 0.029052734375, 0.040924072265625, 0.05279541015625, 0.064666748046875, 0.0765380859375, 0.088409423828125, 0.10028076171875, 0.112152099609375, 0.1240234375, 0.135894775390625, 0.14776611328125, 0.159637451171875, 0.1715087890625, 0.183380126953125, 0.19525146484375, 0.207122802734375, 0.218994140625, 0.230865478515625, 0.24273681640625, 0.254608154296875, 0.2664794921875, 0.278350830078125, 0.29022216796875, 0.302093505859375, 0.31396484375, 0.325836181640625, 0.33770751953125, 0.349578857421875, 0.3614501953125, 0.373321533203125, 0.38519287109375, 0.397064208984375, 0.408935546875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 7.0, 10.0, 10.0, 16.0, 18.0, 22.0, 34.0, 42.0, 55.0, 77.0, 101.0, 114.0, 128.0, 87.0, 60.0, 42.0, 32.0, 31.0, 24.0, 12.0, 8.0, 12.0, 8.0, 4.0, 6.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.334087371826172e-05, -9.079650044441223e-05, -8.825212717056274e-05, -8.570775389671326e-05, -8.316338062286377e-05, -8.061900734901428e-05, -7.80746340751648e-05, -7.553026080131531e-05, -7.298588752746582e-05, -7.044151425361633e-05, -6.789714097976685e-05, -6.535276770591736e-05, -6.280839443206787e-05, -6.0264021158218384e-05, -5.7719647884368896e-05, -5.517527461051941e-05, -5.263090133666992e-05, -5.0086528062820435e-05, -4.754215478897095e-05, -4.499778151512146e-05, -4.245340824127197e-05, -3.9909034967422485e-05, -3.7364661693573e-05, -3.482028841972351e-05, -3.2275915145874023e-05, -2.9731541872024536e-05, -2.718716859817505e-05, -2.464279532432556e-05, -2.2098422050476074e-05, -1.9554048776626587e-05, -1.70096755027771e-05, -1.4465302228927612e-05, -1.1920928955078125e-05, -9.376555681228638e-06, -6.83218240737915e-06, -4.287809133529663e-06, -1.7434358596801758e-06, 8.009374141693115e-07, 3.345310688018799e-06, 5.889683961868286e-06, 8.434057235717773e-06, 1.097843050956726e-05, 1.3522803783416748e-05, 1.6067177057266235e-05, 1.8611550331115723e-05, 2.115592360496521e-05, 2.3700296878814697e-05, 2.6244670152664185e-05, 2.8789043426513672e-05, 3.133341670036316e-05, 3.3877789974212646e-05, 3.6422163248062134e-05, 3.896653652191162e-05, 4.151090979576111e-05, 4.4055283069610596e-05, 4.659965634346008e-05, 4.914402961730957e-05, 5.168840289115906e-05, 5.4232776165008545e-05, 5.677714943885803e-05, 5.932152271270752e-05, 6.186589598655701e-05, 6.44102692604065e-05, 6.695464253425598e-05, 6.949901580810547e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 7.0, 9.0, 16.0, 18.0, 22.0, 33.0, 44.0, 77.0, 99.0, 173.0, 250.0, 514.0, 1147.0, 3562.0, 14949.0, 262739.0, 734162.0, 23158.0, 4579.0, 1487.0, 675.0, 305.0, 166.0, 104.0, 69.0, 46.0, 34.0, 16.0, 21.0, 12.0, 9.0, 10.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305419921875, -0.2945556640625, -0.28369140625, -0.2728271484375, -0.261962890625, -0.2510986328125, -0.240234375, -0.2293701171875, -0.218505859375, -0.2076416015625, -0.19677734375, -0.1859130859375, -0.175048828125, -0.1641845703125, -0.1533203125, -0.1424560546875, -0.131591796875, -0.1207275390625, -0.10986328125, -0.0989990234375, -0.088134765625, -0.0772705078125, -0.06640625, -0.0555419921875, -0.044677734375, -0.0338134765625, -0.02294921875, -0.0120849609375, -0.001220703125, 0.0096435546875, 0.0205078125, 0.0313720703125, 0.042236328125, 0.0531005859375, 0.06396484375, 0.0748291015625, 0.085693359375, 0.0965576171875, 0.107421875, 0.1182861328125, 0.129150390625, 0.1400146484375, 0.15087890625, 0.1617431640625, 0.172607421875, 0.1834716796875, 0.1943359375, 0.2052001953125, 0.216064453125, 0.2269287109375, 0.23779296875, 0.2486572265625, 0.259521484375, 0.2703857421875, 0.28125, 0.2921142578125, 0.302978515625, 0.3138427734375, 0.32470703125, 0.3355712890625, 0.346435546875, 0.3572998046875, 0.3681640625, 0.3790283203125, 0.389892578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 8.0, 7.0, 9.0, 12.0, 12.0, 18.0, 31.0, 57.0, 74.0, 111.0, 152.0, 170.0, 114.0, 64.0, 43.0, 38.0, 13.0, 11.0, 20.0, 9.0, 2.0, 10.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2027587890625, -0.1943035125732422, -0.18584823608398438, -0.17739295959472656, -0.16893768310546875, -0.16048240661621094, -0.15202713012695312, -0.1435718536376953, -0.1351165771484375, -0.1266613006591797, -0.11820602416992188, -0.10975074768066406, -0.10129547119140625, -0.09284019470214844, -0.08438491821289062, -0.07592964172363281, -0.067474365234375, -0.05901908874511719, -0.050563812255859375, -0.04210853576660156, -0.03365325927734375, -0.025197982788085938, -0.016742706298828125, -0.008287429809570312, 0.0001678466796875, 0.008623123168945312, 0.017078399658203125, 0.025533676147460938, 0.03398895263671875, 0.04244422912597656, 0.050899505615234375, 0.05935478210449219, 0.06781005859375, 0.07626533508300781, 0.08472061157226562, 0.09317588806152344, 0.10163116455078125, 0.11008644104003906, 0.11854171752929688, 0.1269969940185547, 0.1354522705078125, 0.1439075469970703, 0.15236282348632812, 0.16081809997558594, 0.16927337646484375, 0.17772865295410156, 0.18618392944335938, 0.1946392059326172, 0.203094482421875, 0.2115497589111328, 0.22000503540039062, 0.22846031188964844, 0.23691558837890625, 0.24537086486816406, 0.2538261413574219, 0.2622814178466797, 0.2707366943359375, 0.2791919708251953, 0.2876472473144531, 0.29610252380371094, 0.30455780029296875, 0.31301307678222656, 0.3214683532714844, 0.3299236297607422, 0.33837890625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 13.0, 32.0, 59.0, 125.0, 202.0, 244.0, 147.0, 94.0, 45.0, 12.0, 7.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.706342697143555, -4.560476779937744, -4.414610385894775, -4.268744468688965, -4.122878074645996, -3.9770121574401855, -3.831146001815796, -3.6852798461914062, -3.5394136905670166, -3.393547534942627, -3.2476813793182373, -3.1018152236938477, -2.955949306488037, -2.8100829124450684, -2.664216995239258, -2.518350839614868, -2.3724846839904785, -2.226618528366089, -2.080752372741699, -1.9348863363265991, -1.7890201807022095, -1.6431540250778198, -1.4972879886627197, -1.35142183303833, -1.2055556774139404, -1.0596895217895508, -0.9138234257698059, -0.767957329750061, -0.6220911741256714, -0.47622501850128174, -0.33035892248153687, -0.184492826461792, -0.038626670837402344, 0.10723945498466492, 0.2531055808067322, 0.39897170662879944, 0.5448378324508667, 0.6907039880752563, 0.8365700840950012, 0.9824361801147461, 1.1283023357391357, 1.2741684913635254, 1.420034646987915, 1.5659006834030151, 1.7117668390274048, 1.8576329946517944, 2.0034990310668945, 2.149365186691284, 2.295231342315674, 2.4410974979400635, 2.586963653564453, 2.7328298091888428, 2.8786959648132324, 3.024561882019043, 3.1704280376434326, 3.3162941932678223, 3.462160348892212, 3.6080265045166016, 3.753892660140991, 3.899758815765381, 4.045624732971191, 4.19149112701416, 4.337357044219971, 4.483222961425781, 4.62908935546875]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 7.0, 5.0, 4.0, 7.0, 8.0, 11.0, 14.0, 13.0, 17.0, 21.0, 20.0, 24.0, 32.0, 31.0, 34.0, 38.0, 48.0, 52.0, 49.0, 35.0, 52.0, 47.0, 44.0, 48.0, 45.0, 28.0, 33.0, 26.0, 36.0, 27.0, 26.0, 21.0, 14.0, 19.0, 13.0, 15.0, 6.0, 3.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6672248840332031, -1.6136741638183594, -1.5601234436035156, -1.5065727233886719, -1.4530220031738281, -1.3994712829589844, -1.3459205627441406, -1.2923698425292969, -1.2388191223144531, -1.1852684020996094, -1.1317176818847656, -1.0781669616699219, -1.0246162414550781, -0.9710655212402344, -0.9175148606300354, -0.8639641404151917, -0.8104134798049927, -0.7568627595901489, -0.7033120393753052, -0.6497613191604614, -0.5962105989456177, -0.5426598787307739, -0.48910921812057495, -0.4355584979057312, -0.38200777769088745, -0.3284570574760437, -0.27490633726119995, -0.2213556468486786, -0.16780492663383484, -0.11425420641899109, -0.06070351600646973, -0.0071527957916259766, 0.04639780521392822, 0.09994851797819138, 0.15349923074245453, 0.20704993605613708, 0.26060065627098083, 0.3141513764858246, 0.36770206689834595, 0.4212527871131897, 0.47480350732803345, 0.5283542275428772, 0.581904947757721, 0.6354556083679199, 0.6890063285827637, 0.7425570487976074, 0.7961077690124512, 0.8496584892272949, 0.9032092094421387, 0.9567599296569824, 1.0103106498718262, 1.06386137008667, 1.1174120903015137, 1.1709628105163574, 1.2245135307312012, 1.278064250946045, 1.3316149711608887, 1.3851656913757324, 1.4387164115905762, 1.49226713180542, 1.5458178520202637, 1.5993685722351074, 1.6529192924499512, 1.706470012664795, 1.7600206136703491]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0, 10.0, 12.0, 17.0, 16.0, 22.0, 33.0, 49.0, 69.0, 115.0, 194.0, 457.0, 1161.0, 4445.0, 33887.0, 3319803.0, 809586.0, 19641.0, 3189.0, 866.0, 303.0, 147.0, 91.0, 50.0, 28.0, 24.0, 21.0, 12.0, 2.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.489013671875, -0.474578857421875, -0.46014404296875, -0.445709228515625, -0.4312744140625, -0.416839599609375, -0.40240478515625, -0.387969970703125, -0.37353515625, -0.359100341796875, -0.34466552734375, -0.330230712890625, -0.3157958984375, -0.301361083984375, -0.28692626953125, -0.272491455078125, -0.258056640625, -0.243621826171875, -0.22918701171875, -0.214752197265625, -0.2003173828125, -0.185882568359375, -0.17144775390625, -0.157012939453125, -0.142578125, -0.128143310546875, -0.11370849609375, -0.099273681640625, -0.0848388671875, -0.070404052734375, -0.05596923828125, -0.041534423828125, -0.027099609375, -0.012664794921875, 0.00177001953125, 0.016204833984375, 0.0306396484375, 0.045074462890625, 0.05950927734375, 0.073944091796875, 0.08837890625, 0.102813720703125, 0.11724853515625, 0.131683349609375, 0.1461181640625, 0.160552978515625, 0.17498779296875, 0.189422607421875, 0.203857421875, 0.218292236328125, 0.23272705078125, 0.247161865234375, 0.2615966796875, 0.276031494140625, 0.29046630859375, 0.304901123046875, 0.3193359375, 0.333770751953125, 0.34820556640625, 0.362640380859375, 0.3770751953125, 0.391510009765625, 0.40594482421875, 0.420379638671875, 0.434814453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 6.0, 5.0, 12.0, 20.0, 26.0, 26.0, 32.0, 50.0, 50.0, 63.0, 72.0, 95.0, 89.0, 76.0, 83.0, 74.0, 58.0, 56.0, 31.0, 30.0, 15.0, 12.0, 5.0, 9.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18896484375, -0.18426895141601562, -0.17957305908203125, -0.17487716674804688, -0.1701812744140625, -0.16548538208007812, -0.16078948974609375, -0.15609359741210938, -0.151397705078125, -0.14670181274414062, -0.14200592041015625, -0.13731002807617188, -0.1326141357421875, -0.12791824340820312, -0.12322235107421875, -0.11852645874023438, -0.11383056640625, -0.10913467407226562, -0.10443878173828125, -0.09974288940429688, -0.0950469970703125, -0.09035110473632812, -0.08565521240234375, -0.08095932006835938, -0.076263427734375, -0.07156753540039062, -0.06687164306640625, -0.062175750732421875, -0.0574798583984375, -0.052783966064453125, -0.04808807373046875, -0.043392181396484375, -0.0386962890625, -0.034000396728515625, -0.02930450439453125, -0.024608612060546875, -0.0199127197265625, -0.015216827392578125, -0.01052093505859375, -0.005825042724609375, -0.001129150390625, 0.003566741943359375, 0.00826263427734375, 0.012958526611328125, 0.0176544189453125, 0.022350311279296875, 0.02704620361328125, 0.031742095947265625, 0.03643798828125, 0.041133880615234375, 0.04582977294921875, 0.050525665283203125, 0.0552215576171875, 0.059917449951171875, 0.06461334228515625, 0.06930923461914062, 0.074005126953125, 0.07870101928710938, 0.08339691162109375, 0.08809280395507812, 0.0927886962890625, 0.09748458862304688, 0.10218048095703125, 0.10687637329101562, 0.111572265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 13.0, 10.0, 10.0, 20.0, 29.0, 51.0, 112.0, 246.0, 659.0, 2251.0, 10031.0, 94493.0, 3811725.0, 252411.0, 17442.0, 3155.0, 917.0, 299.0, 163.0, 91.0, 56.0, 31.0, 14.0, 19.0, 14.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.39678955078125, -0.3800048828125, -0.36322021484375, -0.346435546875, -0.32965087890625, -0.3128662109375, -0.29608154296875, -0.279296875, -0.26251220703125, -0.2457275390625, -0.22894287109375, -0.212158203125, -0.19537353515625, -0.1785888671875, -0.16180419921875, -0.14501953125, -0.12823486328125, -0.1114501953125, -0.09466552734375, -0.077880859375, -0.06109619140625, -0.0443115234375, -0.02752685546875, -0.0107421875, 0.00604248046875, 0.0228271484375, 0.03961181640625, 0.056396484375, 0.07318115234375, 0.0899658203125, 0.10675048828125, 0.12353515625, 0.14031982421875, 0.1571044921875, 0.17388916015625, 0.190673828125, 0.20745849609375, 0.2242431640625, 0.24102783203125, 0.2578125, 0.27459716796875, 0.2913818359375, 0.30816650390625, 0.324951171875, 0.34173583984375, 0.3585205078125, 0.37530517578125, 0.39208984375, 0.40887451171875, 0.4256591796875, 0.44244384765625, 0.459228515625, 0.47601318359375, 0.4927978515625, 0.50958251953125, 0.5263671875, 0.54315185546875, 0.5599365234375, 0.57672119140625, 0.593505859375, 0.61029052734375, 0.6270751953125, 0.64385986328125, 0.66064453125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 3.0, 4.0, 2.0, 5.0, 20.0, 30.0, 47.0, 72.0, 137.0, 266.0, 722.0, 1398.0, 758.0, 278.0, 142.0, 58.0, 40.0, 30.0, 20.0, 11.0, 11.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27294921875, -0.25962066650390625, -0.2462921142578125, -0.23296356201171875, -0.219635009765625, -0.20630645751953125, -0.1929779052734375, -0.17964935302734375, -0.16632080078125, -0.15299224853515625, -0.1396636962890625, -0.12633514404296875, -0.113006591796875, -0.09967803955078125, -0.0863494873046875, -0.07302093505859375, -0.0596923828125, -0.04636383056640625, -0.0330352783203125, -0.01970672607421875, -0.006378173828125, 0.00695037841796875, 0.0202789306640625, 0.03360748291015625, 0.04693603515625, 0.06026458740234375, 0.0735931396484375, 0.08692169189453125, 0.100250244140625, 0.11357879638671875, 0.1269073486328125, 0.14023590087890625, 0.153564453125, 0.16689300537109375, 0.1802215576171875, 0.19355010986328125, 0.206878662109375, 0.22020721435546875, 0.2335357666015625, 0.24686431884765625, 0.26019287109375, 0.27352142333984375, 0.2868499755859375, 0.30017852783203125, 0.313507080078125, 0.32683563232421875, 0.3401641845703125, 0.35349273681640625, 0.3668212890625, 0.38014984130859375, 0.3934783935546875, 0.40680694580078125, 0.420135498046875, 0.43346405029296875, 0.4467926025390625, 0.46012115478515625, 0.47344970703125, 0.48677825927734375, 0.5001068115234375, 0.5134353637695312, 0.526763916015625, 0.5400924682617188, 0.5534210205078125, 0.5667495727539062, 0.580078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 12.0, 20.0, 44.0, 81.0, 211.0, 242.0, 203.0, 101.0, 36.0, 20.0, 10.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7889578342437744, -2.683520793914795, -2.5780837535858154, -2.472646713256836, -2.3672094345092773, -2.261772394180298, -2.1563353538513184, -2.050898313522339, -1.9454611539840698, -1.8400241136550903, -1.7345869541168213, -1.6291499137878418, -1.5237128734588623, -1.4182757139205933, -1.3128386735916138, -1.2074015140533447, -1.1019644737243652, -0.996527373790741, -0.8910902738571167, -0.7856532335281372, -0.6802161335945129, -0.5747790336608887, -0.4693419933319092, -0.3639048933982849, -0.25846779346466064, -0.15303070843219757, -0.0475936233997345, 0.05784344673156738, 0.16328054666519165, 0.2687176465988159, 0.3741546869277954, 0.4795917868614197, 0.585029125213623, 0.6904662251472473, 0.7959033250808716, 0.9013403654098511, 1.0067775249481201, 1.1122145652770996, 1.217651605606079, 1.3230886459350586, 1.4285258054733276, 1.5339628458023071, 1.6394000053405762, 1.7448370456695557, 1.8502740859985352, 1.9557112455368042, 2.061148166656494, 2.1665854454040527, 2.2720224857330322, 2.3774595260620117, 2.482896566390991, 2.5883336067199707, 2.6937708854675293, 2.799207925796509, 2.9046449661254883, 3.0100820064544678, 3.1155190467834473, 3.2209560871124268, 3.3263931274414062, 3.431830406188965, 3.5372674465179443, 3.642704486846924, 3.7481415271759033, 3.853578567504883, 3.9590158462524414]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 9.0, 6.0, 15.0, 20.0, 23.0, 19.0, 32.0, 33.0, 36.0, 42.0, 61.0, 54.0, 69.0, 60.0, 65.0, 46.0, 60.0, 55.0, 34.0, 50.0, 31.0, 42.0, 30.0, 22.0, 17.0, 13.0, 11.0, 14.0, 4.0, 10.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.397870659828186, -1.3496992588043213, -1.301527976989746, -1.2533565759658813, -1.2051851749420166, -1.1570138931274414, -1.1088424921035767, -1.060671091079712, -1.0124998092651367, -0.9643284678459167, -0.9161571264266968, -0.867985725402832, -0.8198143839836121, -0.7716430425643921, -0.7234716415405273, -0.6753003001213074, -0.6271289587020874, -0.5789576172828674, -0.5307862758636475, -0.4826148748397827, -0.43444353342056274, -0.3862721920013428, -0.3381008207798004, -0.28992944955825806, -0.24175810813903809, -0.19358675181865692, -0.14541539549827576, -0.09724403917789459, -0.04907268285751343, -0.0009013265371322632, 0.0472700297832489, 0.09544140100479126, 0.14361262321472168, 0.19178397953510284, 0.239955335855484, 0.28812670707702637, 0.33629804849624634, 0.3844693899154663, 0.43264076113700867, 0.480812132358551, 0.528983473777771, 0.577154815196991, 0.6253261566162109, 0.6734975576400757, 0.7216688990592957, 0.7698402404785156, 0.8180116415023804, 0.8661829829216003, 0.9143543243408203, 0.9625256657600403, 1.0106970071792603, 1.058868408203125, 1.1070396900177002, 1.155211091041565, 1.2033824920654297, 1.2515537738800049, 1.2997251749038696, 1.3478965759277344, 1.3960678577423096, 1.4442392587661743, 1.492410659790039, 1.5405819416046143, 1.588753342628479, 1.6369247436523438, 1.685096025466919]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 7.0, 3.0, 4.0, 10.0, 16.0, 26.0, 50.0, 68.0, 189.0, 445.0, 1338.0, 5944.0, 38976.0, 683795.0, 290247.0, 22022.0, 3852.0, 928.0, 335.0, 137.0, 84.0, 41.0, 20.0, 8.0, 4.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5431900024414062, -0.5243682861328125, -0.5055465698242188, -0.486724853515625, -0.46790313720703125, -0.4490814208984375, -0.43025970458984375, -0.41143798828125, -0.39261627197265625, -0.3737945556640625, -0.35497283935546875, -0.336151123046875, -0.31732940673828125, -0.2985076904296875, -0.27968597412109375, -0.2608642578125, -0.24204254150390625, -0.2232208251953125, -0.20439910888671875, -0.185577392578125, -0.16675567626953125, -0.1479339599609375, -0.12911224365234375, -0.11029052734375, -0.09146881103515625, -0.0726470947265625, -0.05382537841796875, -0.035003662109375, -0.01618194580078125, 0.0026397705078125, 0.02146148681640625, 0.040283203125, 0.05910491943359375, 0.0779266357421875, 0.09674835205078125, 0.115570068359375, 0.13439178466796875, 0.1532135009765625, 0.17203521728515625, 0.19085693359375, 0.20967864990234375, 0.2285003662109375, 0.24732208251953125, 0.266143798828125, 0.28496551513671875, 0.3037872314453125, 0.32260894775390625, 0.3414306640625, 0.36025238037109375, 0.3790740966796875, 0.39789581298828125, 0.416717529296875, 0.43553924560546875, 0.4543609619140625, 0.47318267822265625, 0.49200439453125, 0.5108261108398438, 0.5296478271484375, 0.5484695434570312, 0.567291259765625, 0.5861129760742188, 0.6049346923828125, 0.6237564086914062, 0.642578125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 13.0, 15.0, 13.0, 13.0, 31.0, 38.0, 38.0, 57.0, 45.0, 64.0, 56.0, 96.0, 99.0, 82.0, 73.0, 57.0, 61.0, 41.0, 36.0, 30.0, 19.0, 10.0, 10.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.2420654296875, -0.23701190948486328, -0.23195838928222656, -0.22690486907958984, -0.22185134887695312, -0.2167978286743164, -0.2117443084716797, -0.20669078826904297, -0.20163726806640625, -0.19658374786376953, -0.1915302276611328, -0.1864767074584961, -0.18142318725585938, -0.17636966705322266, -0.17131614685058594, -0.16626262664794922, -0.1612091064453125, -0.15615558624267578, -0.15110206604003906, -0.14604854583740234, -0.14099502563476562, -0.1359415054321289, -0.1308879852294922, -0.12583446502685547, -0.12078094482421875, -0.11572742462158203, -0.11067390441894531, -0.1056203842163086, -0.10056686401367188, -0.09551334381103516, -0.09045982360839844, -0.08540630340576172, -0.080352783203125, -0.07529926300048828, -0.07024574279785156, -0.06519222259521484, -0.060138702392578125, -0.055085182189941406, -0.05003166198730469, -0.04497814178466797, -0.03992462158203125, -0.03487110137939453, -0.029817581176757812, -0.024764060974121094, -0.019710540771484375, -0.014657020568847656, -0.009603500366210938, -0.004549980163574219, 0.0005035400390625, 0.005557060241699219, 0.010610580444335938, 0.015664100646972656, 0.020717620849609375, 0.025771141052246094, 0.030824661254882812, 0.03587818145751953, 0.04093170166015625, 0.04598522186279297, 0.05103874206542969, 0.056092262268066406, 0.061145782470703125, 0.06619930267333984, 0.07125282287597656, 0.07630634307861328, 0.08135986328125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 15.0, 24.0, 13.0, 25.0, 39.0, 59.0, 101.0, 159.0, 308.0, 553.0, 1271.0, 3667.0, 15097.0, 147380.0, 820578.0, 47169.0, 7856.0, 2274.0, 901.0, 429.0, 247.0, 120.0, 96.0, 55.0, 33.0, 17.0, 21.0, 8.0, 4.0, 8.0, 3.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6357421875, -0.6154251098632812, -0.5951080322265625, -0.5747909545898438, -0.554473876953125, -0.5341567993164062, -0.5138397216796875, -0.49352264404296875, -0.47320556640625, -0.45288848876953125, -0.4325714111328125, -0.41225433349609375, -0.391937255859375, -0.37162017822265625, -0.3513031005859375, -0.33098602294921875, -0.3106689453125, -0.29035186767578125, -0.2700347900390625, -0.24971771240234375, -0.229400634765625, -0.20908355712890625, -0.1887664794921875, -0.16844940185546875, -0.14813232421875, -0.12781524658203125, -0.1074981689453125, -0.08718109130859375, -0.066864013671875, -0.04654693603515625, -0.0262298583984375, -0.00591278076171875, 0.014404296875, 0.03472137451171875, 0.0550384521484375, 0.07535552978515625, 0.095672607421875, 0.11598968505859375, 0.1363067626953125, 0.15662384033203125, 0.17694091796875, 0.19725799560546875, 0.2175750732421875, 0.23789215087890625, 0.258209228515625, 0.27852630615234375, 0.2988433837890625, 0.31916046142578125, 0.3394775390625, 0.35979461669921875, 0.3801116943359375, 0.40042877197265625, 0.420745849609375, 0.44106292724609375, 0.4613800048828125, 0.48169708251953125, 0.50201416015625, 0.5223312377929688, 0.5426483154296875, 0.5629653930664062, 0.583282470703125, 0.6035995483398438, 0.6239166259765625, 0.6442337036132812, 0.66455078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 14.0, 12.0, 23.0, 20.0, 28.0, 23.0, 45.0, 33.0, 59.0, 55.0, 57.0, 59.0, 64.0, 63.0, 65.0, 62.0, 52.0, 48.0, 35.0, 29.0, 31.0, 14.0, 18.0, 15.0, 15.0, 6.0, 8.0, 7.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.466552734375, -0.4490242004394531, -0.43149566650390625, -0.4139671325683594, -0.3964385986328125, -0.3789100646972656, -0.36138153076171875, -0.3438529968261719, -0.326324462890625, -0.3087959289550781, -0.29126739501953125, -0.2737388610839844, -0.2562103271484375, -0.23868179321289062, -0.22115325927734375, -0.20362472534179688, -0.18609619140625, -0.16856765747070312, -0.15103912353515625, -0.13351058959960938, -0.1159820556640625, -0.09845352172851562, -0.08092498779296875, -0.06339645385742188, -0.045867919921875, -0.028339385986328125, -0.01081085205078125, 0.006717681884765625, 0.0242462158203125, 0.041774749755859375, 0.05930328369140625, 0.07683181762695312, 0.0943603515625, 0.11188888549804688, 0.12941741943359375, 0.14694595336914062, 0.1644744873046875, 0.18200302124023438, 0.19953155517578125, 0.21706008911132812, 0.234588623046875, 0.2521171569824219, 0.26964569091796875, 0.2871742248535156, 0.3047027587890625, 0.3222312927246094, 0.33975982666015625, 0.3572883605957031, 0.37481689453125, 0.3923454284667969, 0.40987396240234375, 0.4274024963378906, 0.4449310302734375, 0.4624595642089844, 0.47998809814453125, 0.4975166320800781, 0.515045166015625, 0.5325736999511719, 0.5501022338867188, 0.5676307678222656, 0.5851593017578125, 0.6026878356933594, 0.6202163696289062, 0.6377449035644531, 0.6552734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 5.0, 6.0, 12.0, 13.0, 18.0, 20.0, 46.0, 57.0, 112.0, 190.0, 484.0, 1429.0, 7016.0, 140946.0, 875849.0, 18396.0, 2542.0, 713.0, 313.0, 139.0, 81.0, 43.0, 25.0, 27.0, 19.0, 11.0, 12.0, 3.0, 6.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.490478515625, -0.475250244140625, -0.46002197265625, -0.444793701171875, -0.4295654296875, -0.414337158203125, -0.39910888671875, -0.383880615234375, -0.36865234375, -0.353424072265625, -0.33819580078125, -0.322967529296875, -0.3077392578125, -0.292510986328125, -0.27728271484375, -0.262054443359375, -0.246826171875, -0.231597900390625, -0.21636962890625, -0.201141357421875, -0.1859130859375, -0.170684814453125, -0.15545654296875, -0.140228271484375, -0.125, -0.109771728515625, -0.09454345703125, -0.079315185546875, -0.0640869140625, -0.048858642578125, -0.03363037109375, -0.018402099609375, -0.003173828125, 0.012054443359375, 0.02728271484375, 0.042510986328125, 0.0577392578125, 0.072967529296875, 0.08819580078125, 0.103424072265625, 0.11865234375, 0.133880615234375, 0.14910888671875, 0.164337158203125, 0.1795654296875, 0.194793701171875, 0.21002197265625, 0.225250244140625, 0.240478515625, 0.255706787109375, 0.27093505859375, 0.286163330078125, 0.3013916015625, 0.316619873046875, 0.33184814453125, 0.347076416015625, 0.3623046875, 0.377532958984375, 0.39276123046875, 0.407989501953125, 0.4232177734375, 0.438446044921875, 0.45367431640625, 0.468902587890625, 0.484130859375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 7.0, 6.0, 7.0, 10.0, 7.0, 23.0, 18.0, 27.0, 30.0, 54.0, 59.0, 85.0, 117.0, 107.0, 112.0, 78.0, 73.0, 57.0, 26.0, 32.0, 20.0, 11.0, 8.0, 10.0, 5.0, 8.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010055303573608398, -9.813159704208374e-05, -9.57101583480835e-05, -9.328871965408325e-05, -9.086728096008301e-05, -8.844584226608276e-05, -8.602440357208252e-05, -8.360296487808228e-05, -8.118152618408203e-05, -7.876008749008179e-05, -7.633864879608154e-05, -7.39172101020813e-05, -7.149577140808105e-05, -6.907433271408081e-05, -6.665289402008057e-05, -6.423145532608032e-05, -6.181001663208008e-05, -5.9388577938079834e-05, -5.696713924407959e-05, -5.4545700550079346e-05, -5.21242618560791e-05, -4.970282316207886e-05, -4.728138446807861e-05, -4.485994577407837e-05, -4.2438507080078125e-05, -4.001706838607788e-05, -3.759562969207764e-05, -3.517419099807739e-05, -3.275275230407715e-05, -3.0331313610076904e-05, -2.790987491607666e-05, -2.5488436222076416e-05, -2.3066997528076172e-05, -2.0645558834075928e-05, -1.8224120140075684e-05, -1.580268144607544e-05, -1.3381242752075195e-05, -1.0959804058074951e-05, -8.538365364074707e-06, -6.116926670074463e-06, -3.6954879760742188e-06, -1.2740492820739746e-06, 1.1473894119262695e-06, 3.5688281059265137e-06, 5.990266799926758e-06, 8.411705493927002e-06, 1.0833144187927246e-05, 1.325458288192749e-05, 1.5676021575927734e-05, 1.809746026992798e-05, 2.0518898963928223e-05, 2.2940337657928467e-05, 2.536177635192871e-05, 2.7783215045928955e-05, 3.02046537399292e-05, 3.262609243392944e-05, 3.504753112792969e-05, 3.746896982192993e-05, 3.9890408515930176e-05, 4.231184720993042e-05, 4.4733285903930664e-05, 4.715472459793091e-05, 4.957616329193115e-05, 5.1997601985931396e-05, 5.441904067993164e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 9.0, 8.0, 12.0, 26.0, 24.0, 44.0, 60.0, 93.0, 173.0, 335.0, 657.0, 1795.0, 5687.0, 29843.0, 608149.0, 369954.0, 23832.0, 4991.0, 1578.0, 629.0, 294.0, 143.0, 86.0, 38.0, 27.0, 17.0, 15.0, 14.0, 7.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298095703125, -0.2890472412109375, -0.279998779296875, -0.2709503173828125, -0.26190185546875, -0.2528533935546875, -0.243804931640625, -0.2347564697265625, -0.2257080078125, -0.2166595458984375, -0.207611083984375, -0.1985626220703125, -0.18951416015625, -0.1804656982421875, -0.171417236328125, -0.1623687744140625, -0.1533203125, -0.1442718505859375, -0.135223388671875, -0.1261749267578125, -0.11712646484375, -0.1080780029296875, -0.099029541015625, -0.0899810791015625, -0.0809326171875, -0.0718841552734375, -0.062835693359375, -0.0537872314453125, -0.04473876953125, -0.0356903076171875, -0.026641845703125, -0.0175933837890625, -0.008544921875, 0.0005035400390625, 0.009552001953125, 0.0186004638671875, 0.02764892578125, 0.0366973876953125, 0.045745849609375, 0.0547943115234375, 0.0638427734375, 0.0728912353515625, 0.081939697265625, 0.0909881591796875, 0.10003662109375, 0.1090850830078125, 0.118133544921875, 0.1271820068359375, 0.13623046875, 0.1452789306640625, 0.154327392578125, 0.1633758544921875, 0.17242431640625, 0.1814727783203125, 0.190521240234375, 0.1995697021484375, 0.2086181640625, 0.2176666259765625, 0.226715087890625, 0.2357635498046875, 0.24481201171875, 0.2538604736328125, 0.262908935546875, 0.2719573974609375, 0.281005859375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 2.0, 6.0, 3.0, 6.0, 17.0, 23.0, 37.0, 55.0, 68.0, 91.0, 138.0, 161.0, 113.0, 90.0, 57.0, 37.0, 25.0, 11.0, 19.0, 11.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.28125, -0.2735271453857422, -0.2658042907714844, -0.25808143615722656, -0.25035858154296875, -0.24263572692871094, -0.23491287231445312, -0.2271900177001953, -0.2194671630859375, -0.2117443084716797, -0.20402145385742188, -0.19629859924316406, -0.18857574462890625, -0.18085289001464844, -0.17313003540039062, -0.1654071807861328, -0.157684326171875, -0.1499614715576172, -0.14223861694335938, -0.13451576232910156, -0.12679290771484375, -0.11907005310058594, -0.11134719848632812, -0.10362434387207031, -0.0959014892578125, -0.08817863464355469, -0.08045578002929688, -0.07273292541503906, -0.06501007080078125, -0.05728721618652344, -0.049564361572265625, -0.04184150695800781, -0.03411865234375, -0.026395797729492188, -0.018672943115234375, -0.010950088500976562, -0.00322723388671875, 0.0044956207275390625, 0.012218475341796875, 0.019941329956054688, 0.0276641845703125, 0.03538703918457031, 0.043109893798828125, 0.05083274841308594, 0.05855560302734375, 0.06627845764160156, 0.07400131225585938, 0.08172416687011719, 0.089447021484375, 0.09716987609863281, 0.10489273071289062, 0.11261558532714844, 0.12033843994140625, 0.12806129455566406, 0.13578414916992188, 0.1435070037841797, 0.1512298583984375, 0.1589527130126953, 0.16667556762695312, 0.17439842224121094, 0.18212127685546875, 0.18984413146972656, 0.19756698608398438, 0.2052898406982422, 0.2130126953125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 9.0, 24.0, 48.0, 151.0, 287.0, 240.0, 136.0, 51.0, 16.0, 12.0, 9.0, 1.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.172328472137451, -5.010281085968018, -4.848234176635742, -4.686186790466309, -4.524139404296875, -4.362092018127441, -4.200045108795166, -4.037997722625732, -3.875950574874878, -3.7139034271240234, -3.55185604095459, -3.3898088932037354, -3.227761745452881, -3.0657143592834473, -2.9036672115325928, -2.7416200637817383, -2.5795726776123047, -2.41752552986145, -2.2554781436920166, -2.093430995941162, -1.931383728981018, -1.769336462020874, -1.6072893142700195, -1.4452420473098755, -1.2831947803497314, -1.1211475133895874, -0.9591003060340881, -0.7970530986785889, -0.6350058317184448, -0.4729585647583008, -0.3109113574028015, -0.14886415004730225, 0.013182640075683594, 0.17522987723350525, 0.3372771143913269, 0.49932435154914856, 0.6613715887069702, 0.8234188556671143, 0.9854660630226135, 1.1475132703781128, 1.3095605373382568, 1.4716078042984009, 1.633655071258545, 1.7957022190093994, 1.9577494859695435, 2.1197967529296875, 2.281843900680542, 2.4438910484313965, 2.60593843460083, 2.7679855823516846, 2.930032968521118, 3.0920801162719727, 3.2541275024414062, 3.4161746501922607, 3.5782217979431152, 3.740269184112549, 3.9023163318634033, 4.064363479614258, 4.226410865783691, 4.388458251953125, 4.5505051612854, 4.712552547454834, 4.874599933624268, 5.036646842956543, 5.198694229125977]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 9.0, 9.0, 12.0, 20.0, 8.0, 13.0, 18.0, 18.0, 23.0, 29.0, 26.0, 25.0, 21.0, 35.0, 36.0, 34.0, 53.0, 42.0, 53.0, 55.0, 46.0, 46.0, 41.0, 26.0, 38.0, 42.0, 25.0, 33.0, 13.0, 24.0, 17.0, 21.0, 14.0, 12.0, 14.0, 10.0, 6.0, 2.0, 6.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.5909292697906494, -1.5423047542572021, -1.4936801195144653, -1.445055603981018, -1.3964309692382812, -1.347806453704834, -1.2991818189620972, -1.25055730342865, -1.201932668685913, -1.1533081531524658, -1.104683518409729, -1.0560590028762817, -1.007434368133545, -0.9588097929954529, -0.9101852178573608, -0.8615607023239136, -0.8129361271858215, -0.7643115520477295, -0.7156869769096375, -0.6670624017715454, -0.6184378266334534, -0.5698132514953613, -0.5211887359619141, -0.47256413102149963, -0.4239395558834076, -0.37531498074531555, -0.3266904056072235, -0.27806586027145386, -0.22944127023220062, -0.18081669509410858, -0.13219213485717773, -0.0835675597190857, -0.03494298458099365, 0.01368158683180809, 0.06230615824460983, 0.11093072593212128, 0.15955530107021332, 0.20817987620830536, 0.2568044364452362, 0.30542901158332825, 0.3540535867214203, 0.40267816185951233, 0.45130273699760437, 0.499927282333374, 0.5485518574714661, 0.5971764326095581, 0.6458010077476501, 0.6944255828857422, 0.7430501580238342, 0.7916747331619263, 0.8402993083000183, 0.8889238834381104, 0.9375484585762024, 0.9861730337142944, 1.0347975492477417, 1.0834221839904785, 1.1320466995239258, 1.180671215057373, 1.2292958498001099, 1.2779203653335571, 1.326545000076294, 1.3751695156097412, 1.423794150352478, 1.4724186658859253, 1.521043300628662]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 1.0, 2.0, 3.0, 12.0, 11.0, 11.0, 25.0, 21.0, 56.0, 71.0, 146.0, 250.0, 524.0, 1215.0, 3315.0, 11125.0, 53526.0, 662907.0, 3181732.0, 237213.0, 30792.0, 7338.0, 2371.0, 879.0, 358.0, 193.0, 80.0, 44.0, 21.0, 13.0, 6.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.392333984375, -0.3828411102294922, -0.3733482360839844, -0.36385536193847656, -0.35436248779296875, -0.34486961364746094, -0.3353767395019531, -0.3258838653564453, -0.3163909912109375, -0.3068981170654297, -0.2974052429199219, -0.28791236877441406, -0.27841949462890625, -0.26892662048339844, -0.2594337463378906, -0.2499408721923828, -0.240447998046875, -0.2309551239013672, -0.22146224975585938, -0.21196937561035156, -0.20247650146484375, -0.19298362731933594, -0.18349075317382812, -0.1739978790283203, -0.1645050048828125, -0.1550121307373047, -0.14551925659179688, -0.13602638244628906, -0.12653350830078125, -0.11704063415527344, -0.10754776000976562, -0.09805488586425781, -0.08856201171875, -0.07906913757324219, -0.06957626342773438, -0.06008338928222656, -0.05059051513671875, -0.04109764099121094, -0.031604766845703125, -0.022111892700195312, -0.0126190185546875, -0.0031261444091796875, 0.006366729736328125, 0.015859603881835938, 0.02535247802734375, 0.03484535217285156, 0.044338226318359375, 0.05383110046386719, 0.063323974609375, 0.07281684875488281, 0.08230972290039062, 0.09180259704589844, 0.10129547119140625, 0.11078834533691406, 0.12028121948242188, 0.1297740936279297, 0.1392669677734375, 0.1487598419189453, 0.15825271606445312, 0.16774559020996094, 0.17723846435546875, 0.18673133850097656, 0.19622421264648438, 0.2057170867919922, 0.2152099609375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 12.0, 9.0, 18.0, 17.0, 10.0, 24.0, 31.0, 33.0, 55.0, 42.0, 44.0, 55.0, 49.0, 60.0, 51.0, 54.0, 46.0, 51.0, 50.0, 35.0, 41.0, 41.0, 31.0, 28.0, 27.0, 15.0, 11.0, 9.0, 11.0, 7.0, 6.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.12548828125, -0.12221431732177734, -0.11894035339355469, -0.11566638946533203, -0.11239242553710938, -0.10911846160888672, -0.10584449768066406, -0.1025705337524414, -0.09929656982421875, -0.0960226058959961, -0.09274864196777344, -0.08947467803955078, -0.08620071411132812, -0.08292675018310547, -0.07965278625488281, -0.07637882232666016, -0.0731048583984375, -0.06983089447021484, -0.06655693054199219, -0.06328296661376953, -0.060009002685546875, -0.05673503875732422, -0.05346107482910156, -0.050187110900878906, -0.04691314697265625, -0.043639183044433594, -0.04036521911621094, -0.03709125518798828, -0.033817291259765625, -0.03054332733154297, -0.027269363403320312, -0.023995399475097656, -0.020721435546875, -0.017447471618652344, -0.014173507690429688, -0.010899543762207031, -0.007625579833984375, -0.004351615905761719, -0.0010776519775390625, 0.0021963119506835938, 0.00547027587890625, 0.008744239807128906, 0.012018203735351562, 0.015292167663574219, 0.018566131591796875, 0.02184009552001953, 0.025114059448242188, 0.028388023376464844, 0.0316619873046875, 0.034935951232910156, 0.03820991516113281, 0.04148387908935547, 0.044757843017578125, 0.04803180694580078, 0.05130577087402344, 0.054579734802246094, 0.05785369873046875, 0.061127662658691406, 0.06440162658691406, 0.06767559051513672, 0.07094955444335938, 0.07422351837158203, 0.07749748229980469, 0.08077144622802734, 0.08404541015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 2.0, 6.0, 7.0, 10.0, 23.0, 34.0, 36.0, 58.0, 107.0, 232.0, 599.0, 1925.0, 7515.0, 60736.0, 3198758.0, 888896.0, 29157.0, 4190.0, 1154.0, 395.0, 212.0, 98.0, 50.0, 21.0, 17.0, 12.0, 6.0, 4.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6494140625, -0.6302337646484375, -0.611053466796875, -0.5918731689453125, -0.57269287109375, -0.5535125732421875, -0.534332275390625, -0.5151519775390625, -0.4959716796875, -0.4767913818359375, -0.457611083984375, -0.4384307861328125, -0.41925048828125, -0.4000701904296875, -0.380889892578125, -0.3617095947265625, -0.342529296875, -0.3233489990234375, -0.304168701171875, -0.2849884033203125, -0.26580810546875, -0.2466278076171875, -0.227447509765625, -0.2082672119140625, -0.1890869140625, -0.1699066162109375, -0.150726318359375, -0.1315460205078125, -0.11236572265625, -0.0931854248046875, -0.074005126953125, -0.0548248291015625, -0.03564453125, -0.0164642333984375, 0.002716064453125, 0.0218963623046875, 0.04107666015625, 0.0602569580078125, 0.079437255859375, 0.0986175537109375, 0.1177978515625, 0.1369781494140625, 0.156158447265625, 0.1753387451171875, 0.19451904296875, 0.2136993408203125, 0.232879638671875, 0.2520599365234375, 0.271240234375, 0.2904205322265625, 0.309600830078125, 0.3287811279296875, 0.34796142578125, 0.3671417236328125, 0.386322021484375, 0.4055023193359375, 0.4246826171875, 0.4438629150390625, 0.463043212890625, 0.4822235107421875, 0.50140380859375, 0.5205841064453125, 0.539764404296875, 0.5589447021484375, 0.578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 13.0, 10.0, 14.0, 21.0, 20.0, 34.0, 44.0, 72.0, 136.0, 227.0, 414.0, 740.0, 945.0, 565.0, 328.0, 175.0, 113.0, 66.0, 36.0, 29.0, 24.0, 10.0, 11.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5107421875, -0.4962615966796875, -0.481781005859375, -0.4673004150390625, -0.45281982421875, -0.4383392333984375, -0.423858642578125, -0.4093780517578125, -0.3948974609375, -0.3804168701171875, -0.365936279296875, -0.3514556884765625, -0.33697509765625, -0.3224945068359375, -0.308013916015625, -0.2935333251953125, -0.279052734375, -0.2645721435546875, -0.250091552734375, -0.2356109619140625, -0.22113037109375, -0.2066497802734375, -0.192169189453125, -0.1776885986328125, -0.1632080078125, -0.1487274169921875, -0.134246826171875, -0.1197662353515625, -0.10528564453125, -0.0908050537109375, -0.076324462890625, -0.0618438720703125, -0.04736328125, -0.0328826904296875, -0.018402099609375, -0.0039215087890625, 0.01055908203125, 0.0250396728515625, 0.039520263671875, 0.0540008544921875, 0.0684814453125, 0.0829620361328125, 0.097442626953125, 0.1119232177734375, 0.12640380859375, 0.1408843994140625, 0.155364990234375, 0.1698455810546875, 0.184326171875, 0.1988067626953125, 0.213287353515625, 0.2277679443359375, 0.24224853515625, 0.2567291259765625, 0.271209716796875, 0.2856903076171875, 0.3001708984375, 0.3146514892578125, 0.329132080078125, 0.3436126708984375, 0.35809326171875, 0.3725738525390625, 0.387054443359375, 0.4015350341796875, 0.416015625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 13.0, 37.0, 107.0, 232.0, 289.0, 176.0, 70.0, 30.0, 10.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.058704376220703, -7.8810529708862305, -7.703401565551758, -7.525750160217285, -7.348099231719971, -7.170447826385498, -6.992796421051025, -6.815145015716553, -6.63749361038208, -6.459842205047607, -6.282190799713135, -6.10453987121582, -5.926888465881348, -5.749237060546875, -5.571585655212402, -5.39393424987793, -5.216282844543457, -5.038631439208984, -4.860980033874512, -4.683328628540039, -4.505677700042725, -4.328026294708252, -4.150374889373779, -3.9727234840393066, -3.795072555541992, -3.6174211502075195, -3.439769983291626, -3.2621185779571533, -3.0844671726226807, -2.906816005706787, -2.7291646003723145, -2.551513195037842, -2.37386155128479, -2.1962101459503174, -2.018558979034424, -1.8409075736999512, -1.6632561683654785, -1.4856048822402954, -1.3079535961151123, -1.1303021907806396, -0.9526509046554565, -0.7749995589256287, -0.5973482131958008, -0.4196969270706177, -0.2420455813407898, -0.06439423561096191, 0.11325705051422119, 0.29090845584869385, 0.46855974197387695, 0.6462110877037048, 0.8238624334335327, 1.0015137195587158, 1.1791651248931885, 1.3568164110183716, 1.5344676971435547, 1.7121191024780273, 1.8897703886032104, 2.0674216747283936, 2.245073080062866, 2.4227242469787598, 2.6003756523132324, 2.778027057647705, 2.9556784629821777, 3.1333298683166504, 3.310981035232544]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 5.0, 6.0, 7.0, 10.0, 12.0, 24.0, 20.0, 24.0, 30.0, 35.0, 45.0, 33.0, 46.0, 56.0, 46.0, 60.0, 53.0, 45.0, 48.0, 48.0, 46.0, 46.0, 27.0, 35.0, 35.0, 23.0, 24.0, 22.0, 15.0, 11.0, 8.0, 7.0, 7.0, 8.0, 8.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5826128721237183, -1.526394009590149, -1.4701752662658691, -1.4139564037322998, -1.3577375411987305, -1.3015186786651611, -1.2452998161315918, -1.189081072807312, -1.1328622102737427, -1.0766433477401733, -1.0204246044158936, -0.9642057418823242, -0.9079868793487549, -0.8517680168151855, -0.795549213886261, -0.7393304109573364, -0.6831115484237671, -0.6268926858901978, -0.5706738829612732, -0.5144550800323486, -0.4582362174987793, -0.40201738476753235, -0.3457985520362854, -0.28957971930503845, -0.2333608865737915, -0.17714205384254456, -0.12092322111129761, -0.06470438838005066, -0.008485555648803711, 0.04773327708244324, 0.10395210981369019, 0.16017094254493713, 0.21638989448547363, 0.2726087272167206, 0.32882755994796753, 0.3850463926792145, 0.4412652254104614, 0.4974840581417084, 0.5537028908729553, 0.6099216938018799, 0.6661405563354492, 0.7223594188690186, 0.7785782217979431, 0.8347970247268677, 0.891015887260437, 0.9472347497940063, 1.0034534931182861, 1.0596723556518555, 1.1158912181854248, 1.1721100807189941, 1.2283289432525635, 1.2845476865768433, 1.3407665491104126, 1.396985411643982, 1.4532041549682617, 1.509423017501831, 1.5656418800354004, 1.6218607425689697, 1.678079605102539, 1.7342983484268188, 1.7905172109603882, 1.8467360734939575, 1.9029548168182373, 1.9591736793518066, 2.015392541885376]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 6.0, 9.0, 22.0, 24.0, 42.0, 60.0, 89.0, 149.0, 276.0, 527.0, 1095.0, 2432.0, 6101.0, 18156.0, 62252.0, 275952.0, 524386.0, 110204.0, 30323.0, 9815.0, 3525.0, 1483.0, 716.0, 382.0, 201.0, 105.0, 65.0, 46.0, 31.0, 14.0, 23.0, 13.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.410888671875, -0.3985176086425781, -0.38614654541015625, -0.3737754821777344, -0.3614044189453125, -0.3490333557128906, -0.33666229248046875, -0.3242912292480469, -0.311920166015625, -0.2995491027832031, -0.28717803955078125, -0.2748069763183594, -0.2624359130859375, -0.2500648498535156, -0.23769378662109375, -0.22532272338867188, -0.21295166015625, -0.20058059692382812, -0.18820953369140625, -0.17583847045898438, -0.1634674072265625, -0.15109634399414062, -0.13872528076171875, -0.12635421752929688, -0.113983154296875, -0.10161209106445312, -0.08924102783203125, -0.07686996459960938, -0.0644989013671875, -0.052127838134765625, -0.03975677490234375, -0.027385711669921875, -0.0150146484375, -0.002643585205078125, 0.00972747802734375, 0.022098541259765625, 0.0344696044921875, 0.046840667724609375, 0.05921173095703125, 0.07158279418945312, 0.083953857421875, 0.09632492065429688, 0.10869598388671875, 0.12106704711914062, 0.1334381103515625, 0.14580917358398438, 0.15818023681640625, 0.17055130004882812, 0.18292236328125, 0.19529342651367188, 0.20766448974609375, 0.22003555297851562, 0.2324066162109375, 0.24477767944335938, 0.25714874267578125, 0.2695198059082031, 0.281890869140625, 0.2942619323730469, 0.30663299560546875, 0.3190040588378906, 0.3313751220703125, 0.3437461853027344, 0.35611724853515625, 0.3684883117675781, 0.380859375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 5.0, 13.0, 16.0, 25.0, 29.0, 24.0, 43.0, 45.0, 61.0, 66.0, 61.0, 65.0, 78.0, 72.0, 71.0, 66.0, 64.0, 40.0, 43.0, 30.0, 24.0, 15.0, 11.0, 15.0, 9.0, 4.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.220458984375, -0.21550464630126953, -0.21055030822753906, -0.2055959701538086, -0.20064163208007812, -0.19568729400634766, -0.1907329559326172, -0.18577861785888672, -0.18082427978515625, -0.17586994171142578, -0.1709156036376953, -0.16596126556396484, -0.16100692749023438, -0.1560525894165039, -0.15109825134277344, -0.14614391326904297, -0.1411895751953125, -0.13623523712158203, -0.13128089904785156, -0.1263265609741211, -0.12137222290039062, -0.11641788482666016, -0.11146354675292969, -0.10650920867919922, -0.10155487060546875, -0.09660053253173828, -0.09164619445800781, -0.08669185638427734, -0.08173751831054688, -0.0767831802368164, -0.07182884216308594, -0.06687450408935547, -0.061920166015625, -0.05696582794189453, -0.05201148986816406, -0.047057151794433594, -0.042102813720703125, -0.037148475646972656, -0.03219413757324219, -0.02723979949951172, -0.02228546142578125, -0.01733112335205078, -0.012376785278320312, -0.007422447204589844, -0.002468109130859375, 0.0024862289428710938, 0.0074405670166015625, 0.012394905090332031, 0.0173492431640625, 0.02230358123779297, 0.027257919311523438, 0.032212257385253906, 0.037166595458984375, 0.042120933532714844, 0.04707527160644531, 0.05202960968017578, 0.05698394775390625, 0.06193828582763672, 0.06689262390136719, 0.07184696197509766, 0.07680130004882812, 0.0817556381225586, 0.08670997619628906, 0.09166431427001953, 0.09661865234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 9.0, 16.0, 13.0, 25.0, 32.0, 48.0, 67.0, 118.0, 161.0, 242.0, 507.0, 808.0, 1895.0, 4916.0, 20416.0, 257622.0, 716152.0, 34111.0, 6485.0, 2352.0, 1053.0, 571.0, 298.0, 216.0, 126.0, 74.0, 48.0, 40.0, 30.0, 27.0, 19.0, 8.0, 8.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79541015625, -0.7681045532226562, -0.7407989501953125, -0.7134933471679688, -0.686187744140625, -0.6588821411132812, -0.6315765380859375, -0.6042709350585938, -0.57696533203125, -0.5496597290039062, -0.5223541259765625, -0.49504852294921875, -0.467742919921875, -0.44043731689453125, -0.4131317138671875, -0.38582611083984375, -0.3585205078125, -0.33121490478515625, -0.3039093017578125, -0.27660369873046875, -0.249298095703125, -0.22199249267578125, -0.1946868896484375, -0.16738128662109375, -0.14007568359375, -0.11277008056640625, -0.0854644775390625, -0.05815887451171875, -0.030853271484375, -0.00354766845703125, 0.0237579345703125, 0.05106353759765625, 0.078369140625, 0.10567474365234375, 0.1329803466796875, 0.16028594970703125, 0.187591552734375, 0.21489715576171875, 0.2422027587890625, 0.26950836181640625, 0.29681396484375, 0.32411956787109375, 0.3514251708984375, 0.37873077392578125, 0.406036376953125, 0.43334197998046875, 0.4606475830078125, 0.48795318603515625, 0.5152587890625, 0.5425643920898438, 0.5698699951171875, 0.5971755981445312, 0.624481201171875, 0.6517868041992188, 0.6790924072265625, 0.7063980102539062, 0.73370361328125, 0.7610092163085938, 0.7883148193359375, 0.8156204223632812, 0.842926025390625, 0.8702316284179688, 0.8975372314453125, 0.9248428344726562, 0.9521484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 0.0, 1.0, 5.0, 5.0, 12.0, 12.0, 13.0, 13.0, 16.0, 24.0, 24.0, 41.0, 45.0, 54.0, 49.0, 52.0, 59.0, 51.0, 64.0, 61.0, 52.0, 59.0, 52.0, 33.0, 42.0, 24.0, 22.0, 23.0, 24.0, 15.0, 14.0, 10.0, 10.0, 8.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59521484375, -0.5738677978515625, -0.552520751953125, -0.5311737060546875, -0.50982666015625, -0.4884796142578125, -0.467132568359375, -0.4457855224609375, -0.4244384765625, -0.4030914306640625, -0.381744384765625, -0.3603973388671875, -0.33905029296875, -0.3177032470703125, -0.296356201171875, -0.2750091552734375, -0.253662109375, -0.2323150634765625, -0.210968017578125, -0.1896209716796875, -0.16827392578125, -0.1469268798828125, -0.125579833984375, -0.1042327880859375, -0.0828857421875, -0.0615386962890625, -0.040191650390625, -0.0188446044921875, 0.00250244140625, 0.0238494873046875, 0.045196533203125, 0.0665435791015625, 0.087890625, 0.1092376708984375, 0.130584716796875, 0.1519317626953125, 0.17327880859375, 0.1946258544921875, 0.215972900390625, 0.2373199462890625, 0.2586669921875, 0.2800140380859375, 0.301361083984375, 0.3227081298828125, 0.34405517578125, 0.3654022216796875, 0.386749267578125, 0.4080963134765625, 0.429443359375, 0.4507904052734375, 0.472137451171875, 0.4934844970703125, 0.51483154296875, 0.5361785888671875, 0.557525634765625, 0.5788726806640625, 0.6002197265625, 0.6215667724609375, 0.642913818359375, 0.6642608642578125, 0.68560791015625, 0.7069549560546875, 0.728302001953125, 0.7496490478515625, 0.77099609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 9.0, 6.0, 9.0, 13.0, 27.0, 26.0, 52.0, 93.0, 165.0, 362.0, 761.0, 2161.0, 8187.0, 56754.0, 822912.0, 137607.0, 14139.0, 3206.0, 1117.0, 416.0, 224.0, 105.0, 80.0, 30.0, 22.0, 14.0, 18.0, 5.0, 5.0, 9.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.33935546875, -0.3286399841308594, -0.31792449951171875, -0.3072090148925781, -0.2964935302734375, -0.2857780456542969, -0.27506256103515625, -0.2643470764160156, -0.253631591796875, -0.24291610717773438, -0.23220062255859375, -0.22148513793945312, -0.2107696533203125, -0.20005416870117188, -0.18933868408203125, -0.17862319946289062, -0.16790771484375, -0.15719223022460938, -0.14647674560546875, -0.13576126098632812, -0.1250457763671875, -0.11433029174804688, -0.10361480712890625, -0.09289932250976562, -0.082183837890625, -0.07146835327148438, -0.06075286865234375, -0.050037384033203125, -0.0393218994140625, -0.028606414794921875, -0.01789093017578125, -0.007175445556640625, 0.0035400390625, 0.014255523681640625, 0.02497100830078125, 0.035686492919921875, 0.0464019775390625, 0.057117462158203125, 0.06783294677734375, 0.07854843139648438, 0.089263916015625, 0.09997940063476562, 0.11069488525390625, 0.12141036987304688, 0.1321258544921875, 0.14284133911132812, 0.15355682373046875, 0.16427230834960938, 0.17498779296875, 0.18570327758789062, 0.19641876220703125, 0.20713424682617188, 0.2178497314453125, 0.22856521606445312, 0.23928070068359375, 0.24999618530273438, 0.260711669921875, 0.2714271545410156, 0.28214263916015625, 0.2928581237792969, 0.3035736083984375, 0.3142890930175781, 0.32500457763671875, 0.3357200622558594, 0.346435546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 7.0, 8.0, 4.0, 14.0, 15.0, 11.0, 18.0, 13.0, 26.0, 37.0, 31.0, 55.0, 69.0, 78.0, 83.0, 86.0, 71.0, 52.0, 50.0, 49.0, 41.0, 16.0, 22.0, 15.0, 22.0, 13.0, 15.0, 7.0, 13.0, 5.0, 3.0, 8.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.918741226196289e-05, -5.7208351790905e-05, -5.522929131984711e-05, -5.3250230848789215e-05, -5.127117037773132e-05, -4.929210990667343e-05, -4.731304943561554e-05, -4.533398896455765e-05, -4.3354928493499756e-05, -4.1375868022441864e-05, -3.939680755138397e-05, -3.741774708032608e-05, -3.543868660926819e-05, -3.34596261382103e-05, -3.1480565667152405e-05, -2.9501505196094513e-05, -2.752244472503662e-05, -2.554338425397873e-05, -2.3564323782920837e-05, -2.1585263311862946e-05, -1.9606202840805054e-05, -1.7627142369747162e-05, -1.564808189868927e-05, -1.3669021427631378e-05, -1.1689960956573486e-05, -9.710900485515594e-06, -7.731840014457703e-06, -5.752779543399811e-06, -3.773719072341919e-06, -1.794658601284027e-06, 1.8440186977386475e-07, 2.1634623408317566e-06, 4.1425228118896484e-06, 6.12158328294754e-06, 8.100643754005432e-06, 1.0079704225063324e-05, 1.2058764696121216e-05, 1.4037825167179108e-05, 1.6016885638237e-05, 1.799594610929489e-05, 1.9975006580352783e-05, 2.1954067051410675e-05, 2.3933127522468567e-05, 2.591218799352646e-05, 2.789124846458435e-05, 2.9870308935642242e-05, 3.1849369406700134e-05, 3.3828429877758026e-05, 3.580749034881592e-05, 3.778655081987381e-05, 3.97656112909317e-05, 4.1744671761989594e-05, 4.3723732233047485e-05, 4.570279270410538e-05, 4.768185317516327e-05, 4.966091364622116e-05, 5.163997411727905e-05, 5.3619034588336945e-05, 5.5598095059394836e-05, 5.757715553045273e-05, 5.955621600151062e-05, 6.153527647256851e-05, 6.35143369436264e-05, 6.54933974146843e-05, 6.747245788574219e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 3.0, 6.0, 12.0, 11.0, 15.0, 20.0, 21.0, 30.0, 46.0, 70.0, 64.0, 113.0, 199.0, 290.0, 476.0, 923.0, 1918.0, 4949.0, 17082.0, 119538.0, 802694.0, 78714.0, 13373.0, 4128.0, 1720.0, 842.0, 461.0, 279.0, 172.0, 104.0, 80.0, 45.0, 43.0, 29.0, 23.0, 15.0, 19.0, 7.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.297119140625, -0.2882270812988281, -0.27933502197265625, -0.2704429626464844, -0.2615509033203125, -0.2526588439941406, -0.24376678466796875, -0.23487472534179688, -0.225982666015625, -0.21709060668945312, -0.20819854736328125, -0.19930648803710938, -0.1904144287109375, -0.18152236938476562, -0.17263031005859375, -0.16373825073242188, -0.15484619140625, -0.14595413208007812, -0.13706207275390625, -0.12817001342773438, -0.1192779541015625, -0.11038589477539062, -0.10149383544921875, -0.09260177612304688, -0.083709716796875, -0.07481765747070312, -0.06592559814453125, -0.057033538818359375, -0.0481414794921875, -0.039249420166015625, -0.03035736083984375, -0.021465301513671875, -0.0125732421875, -0.003681182861328125, 0.00521087646484375, 0.014102935791015625, 0.0229949951171875, 0.031887054443359375, 0.04077911376953125, 0.049671173095703125, 0.058563232421875, 0.06745529174804688, 0.07634735107421875, 0.08523941040039062, 0.0941314697265625, 0.10302352905273438, 0.11191558837890625, 0.12080764770507812, 0.12969970703125, 0.13859176635742188, 0.14748382568359375, 0.15637588500976562, 0.1652679443359375, 0.17416000366210938, 0.18305206298828125, 0.19194412231445312, 0.200836181640625, 0.20972824096679688, 0.21862030029296875, 0.22751235961914062, 0.2364044189453125, 0.24529647827148438, 0.25418853759765625, 0.2630805969238281, 0.27197265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 9.0, 12.0, 6.0, 24.0, 15.0, 32.0, 34.0, 36.0, 61.0, 88.0, 110.0, 132.0, 103.0, 78.0, 63.0, 32.0, 35.0, 18.0, 22.0, 13.0, 14.0, 8.0, 9.0, 8.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.31298828125, -0.30504417419433594, -0.2971000671386719, -0.2891559600830078, -0.28121185302734375, -0.2732677459716797, -0.2653236389160156, -0.25737953186035156, -0.2494354248046875, -0.24149131774902344, -0.23354721069335938, -0.2256031036376953, -0.21765899658203125, -0.2097148895263672, -0.20177078247070312, -0.19382667541503906, -0.185882568359375, -0.17793846130371094, -0.16999435424804688, -0.1620502471923828, -0.15410614013671875, -0.1461620330810547, -0.13821792602539062, -0.13027381896972656, -0.1223297119140625, -0.11438560485839844, -0.10644149780273438, -0.09849739074707031, -0.09055328369140625, -0.08260917663574219, -0.07466506958007812, -0.06672096252441406, -0.05877685546875, -0.05083274841308594, -0.042888641357421875, -0.03494453430175781, -0.02700042724609375, -0.019056320190429688, -0.011112213134765625, -0.0031681060791015625, 0.0047760009765625, 0.012720108032226562, 0.020664215087890625, 0.028608322143554688, 0.03655242919921875, 0.04449653625488281, 0.052440643310546875, 0.06038475036621094, 0.068328857421875, 0.07627296447753906, 0.08421707153320312, 0.09216117858886719, 0.10010528564453125, 0.10804939270019531, 0.11599349975585938, 0.12393760681152344, 0.1318817138671875, 0.13982582092285156, 0.14776992797851562, 0.1557140350341797, 0.16365814208984375, 0.1716022491455078, 0.17954635620117188, 0.18749046325683594, 0.1954345703125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 7.0, 10.0, 20.0, 40.0, 94.0, 118.0, 265.0, 219.0, 113.0, 51.0, 22.0, 12.0, 9.0, 8.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.828040599822998, -7.657020092010498, -7.485999584197998, -7.31497859954834, -7.14395809173584, -6.97293758392334, -6.80191707611084, -6.63089656829834, -6.459875583648682, -6.288855075836182, -6.117834568023682, -5.946813583374023, -5.775793075561523, -5.604772567749023, -5.433752059936523, -5.262731552124023, -5.091711044311523, -4.920690536499023, -4.749670028686523, -4.578649044036865, -4.407628536224365, -4.236608028411865, -4.065587520599365, -3.894566774368286, -3.723546028137207, -3.552525520324707, -3.381504774093628, -3.210484266281128, -3.039463520050049, -2.868443012237549, -2.697422504425049, -2.5264017581939697, -2.3553812503814697, -2.1843607425689697, -2.0133399963378906, -1.8423194885253906, -1.6712987422943115, -1.5002782344818115, -1.329257607460022, -1.1582369804382324, -0.9872163534164429, -0.8161957263946533, -0.6451750993728638, -0.474154531955719, -0.30313390493392944, -0.1321132779121399, 0.03890728950500488, 0.20992791652679443, 0.380948543548584, 0.5519691705703735, 0.7229897975921631, 0.8940103650093079, 1.0650310516357422, 1.2360515594482422, 1.4070721864700317, 1.5780928134918213, 1.7491134405136108, 1.9201340675354004, 2.0911545753479004, 2.2621753215789795, 2.4331958293914795, 2.6042165756225586, 2.7752370834350586, 2.9462575912475586, 3.1172783374786377]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 9.0, 11.0, 4.0, 17.0, 20.0, 18.0, 22.0, 30.0, 14.0, 29.0, 27.0, 39.0, 49.0, 38.0, 55.0, 56.0, 63.0, 63.0, 47.0, 39.0, 31.0, 43.0, 38.0, 35.0, 30.0, 21.0, 10.0, 22.0, 19.0, 14.0, 17.0, 12.0, 8.0, 6.0, 9.0, 6.0, 8.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9805541038513184, -1.9171664714813232, -1.8537788391113281, -1.790391206741333, -1.727003574371338, -1.6636159420013428, -1.6002283096313477, -1.5368406772613525, -1.4734530448913574, -1.4100654125213623, -1.3466777801513672, -1.283290147781372, -1.219902515411377, -1.1565148830413818, -1.0931272506713867, -1.0297396183013916, -0.9663518667221069, -0.9029642343521118, -0.8395766019821167, -0.7761889696121216, -0.7128013372421265, -0.6494137048721313, -0.5860260128974915, -0.5226383805274963, -0.4592507481575012, -0.3958631157875061, -0.332475483417511, -0.2690878212451935, -0.20570018887519836, -0.14231255650520325, -0.07892489433288574, -0.015537261962890625, 0.04785037040710449, 0.1112380102276802, 0.17462565004825592, 0.23801329731941223, 0.30140092968940735, 0.36478856205940247, 0.42817622423171997, 0.4915638566017151, 0.5549514889717102, 0.6183391213417053, 0.6817267537117004, 0.7451144456863403, 0.8085020780563354, 0.8718897104263306, 0.9352773427963257, 0.9986649751663208, 1.062052607536316, 1.125440239906311, 1.1888278722763062, 1.2522155046463013, 1.3156031370162964, 1.3789907693862915, 1.4423785209655762, 1.5057661533355713, 1.5691537857055664, 1.6325414180755615, 1.6959290504455566, 1.7593166828155518, 1.8227043151855469, 1.886091947555542, 1.949479579925537, 2.0128672122955322, 2.0762548446655273]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 15.0, 10.0, 19.0, 36.0, 42.0, 75.0, 120.0, 198.0, 392.0, 959.0, 2637.0, 9493.0, 60729.0, 1850641.0, 2187278.0, 66735.0, 10159.0, 2824.0, 953.0, 413.0, 227.0, 128.0, 55.0, 43.0, 31.0, 27.0, 11.0, 10.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.4873046875, -0.47542572021484375, -0.4635467529296875, -0.45166778564453125, -0.439788818359375, -0.42790985107421875, -0.4160308837890625, -0.40415191650390625, -0.39227294921875, -0.38039398193359375, -0.3685150146484375, -0.35663604736328125, -0.344757080078125, -0.33287811279296875, -0.3209991455078125, -0.30912017822265625, -0.2972412109375, -0.28536224365234375, -0.2734832763671875, -0.26160430908203125, -0.249725341796875, -0.23784637451171875, -0.2259674072265625, -0.21408843994140625, -0.20220947265625, -0.19033050537109375, -0.1784515380859375, -0.16657257080078125, -0.154693603515625, -0.14281463623046875, -0.1309356689453125, -0.11905670166015625, -0.107177734375, -0.09529876708984375, -0.0834197998046875, -0.07154083251953125, -0.059661865234375, -0.04778289794921875, -0.0359039306640625, -0.02402496337890625, -0.01214599609375, -0.00026702880859375, 0.0116119384765625, 0.02349090576171875, 0.035369873046875, 0.04724884033203125, 0.0591278076171875, 0.07100677490234375, 0.0828857421875, 0.09476470947265625, 0.1066436767578125, 0.11852264404296875, 0.130401611328125, 0.14228057861328125, 0.1541595458984375, 0.16603851318359375, 0.17791748046875, 0.18979644775390625, 0.2016754150390625, 0.21355438232421875, 0.225433349609375, 0.23731231689453125, 0.2491912841796875, 0.26107025146484375, 0.27294921875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 9.0, 12.0, 17.0, 30.0, 52.0, 77.0, 97.0, 112.0, 109.0, 116.0, 117.0, 87.0, 58.0, 45.0, 24.0, 28.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1944580078125, -0.18630409240722656, -0.17815017700195312, -0.1699962615966797, -0.16184234619140625, -0.1536884307861328, -0.14553451538085938, -0.13738059997558594, -0.1292266845703125, -0.12107276916503906, -0.11291885375976562, -0.10476493835449219, -0.09661102294921875, -0.08845710754394531, -0.08030319213867188, -0.07214927673339844, -0.063995361328125, -0.05584144592285156, -0.047687530517578125, -0.03953361511230469, -0.03137969970703125, -0.023225784301757812, -0.015071868896484375, -0.0069179534912109375, 0.0012359619140625, 0.009389877319335938, 0.017543792724609375, 0.025697708129882812, 0.03385162353515625, 0.04200553894042969, 0.050159454345703125, 0.05831336975097656, 0.06646728515625, 0.07462120056152344, 0.08277511596679688, 0.09092903137207031, 0.09908294677734375, 0.10723686218261719, 0.11539077758789062, 0.12354469299316406, 0.1316986083984375, 0.13985252380371094, 0.14800643920898438, 0.1561603546142578, 0.16431427001953125, 0.1724681854248047, 0.18062210083007812, 0.18877601623535156, 0.196929931640625, 0.20508384704589844, 0.21323776245117188, 0.2213916778564453, 0.22954559326171875, 0.2376995086669922, 0.24585342407226562, 0.25400733947753906, 0.2621612548828125, 0.27031517028808594, 0.2784690856933594, 0.2866230010986328, 0.29477691650390625, 0.3029308319091797, 0.3110847473144531, 0.31923866271972656, 0.327392578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 19.0, 29.0, 46.0, 87.0, 194.0, 438.0, 1286.0, 4665.0, 29877.0, 559283.0, 3473291.0, 107445.0, 12673.0, 2973.0, 1062.0, 425.0, 232.0, 106.0, 55.0, 34.0, 19.0, 10.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482666015625, -0.4642829895019531, -0.44589996337890625, -0.4275169372558594, -0.4091339111328125, -0.3907508850097656, -0.37236785888671875, -0.3539848327636719, -0.335601806640625, -0.3172187805175781, -0.29883575439453125, -0.2804527282714844, -0.2620697021484375, -0.24368667602539062, -0.22530364990234375, -0.20692062377929688, -0.18853759765625, -0.17015457153320312, -0.15177154541015625, -0.13338851928710938, -0.1150054931640625, -0.09662246704101562, -0.07823944091796875, -0.059856414794921875, -0.041473388671875, -0.023090362548828125, -0.00470733642578125, 0.013675689697265625, 0.0320587158203125, 0.050441741943359375, 0.06882476806640625, 0.08720779418945312, 0.1055908203125, 0.12397384643554688, 0.14235687255859375, 0.16073989868164062, 0.1791229248046875, 0.19750595092773438, 0.21588897705078125, 0.23427200317382812, 0.252655029296875, 0.2710380554199219, 0.28942108154296875, 0.3078041076660156, 0.3261871337890625, 0.3445701599121094, 0.36295318603515625, 0.3813362121582031, 0.39971923828125, 0.4181022644042969, 0.43648529052734375, 0.4548683166503906, 0.4732513427734375, 0.4916343688964844, 0.5100173950195312, 0.5284004211425781, 0.546783447265625, 0.5651664733886719, 0.5835494995117188, 0.6019325256347656, 0.6203155517578125, 0.6386985778808594, 0.6570816040039062, 0.6754646301269531, 0.69384765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 8.0, 11.0, 24.0, 27.0, 38.0, 70.0, 97.0, 167.0, 278.0, 527.0, 805.0, 792.0, 506.0, 265.0, 141.0, 83.0, 65.0, 47.0, 33.0, 16.0, 21.0, 16.0, 10.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302734375, -0.288330078125, -0.27392578125, -0.259521484375, -0.2451171875, -0.230712890625, -0.21630859375, -0.201904296875, -0.1875, -0.173095703125, -0.15869140625, -0.144287109375, -0.1298828125, -0.115478515625, -0.10107421875, -0.086669921875, -0.072265625, -0.057861328125, -0.04345703125, -0.029052734375, -0.0146484375, -0.000244140625, 0.01416015625, 0.028564453125, 0.04296875, 0.057373046875, 0.07177734375, 0.086181640625, 0.1005859375, 0.114990234375, 0.12939453125, 0.143798828125, 0.158203125, 0.172607421875, 0.18701171875, 0.201416015625, 0.2158203125, 0.230224609375, 0.24462890625, 0.259033203125, 0.2734375, 0.287841796875, 0.30224609375, 0.316650390625, 0.3310546875, 0.345458984375, 0.35986328125, 0.374267578125, 0.388671875, 0.403076171875, 0.41748046875, 0.431884765625, 0.4462890625, 0.460693359375, 0.47509765625, 0.489501953125, 0.50390625, 0.518310546875, 0.53271484375, 0.547119140625, 0.5615234375, 0.575927734375, 0.59033203125, 0.604736328125, 0.619140625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 11.0, 34.0, 91.0, 202.0, 301.0, 219.0, 92.0, 27.0, 14.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.331094741821289, -3.1280770301818848, -2.9250595569610596, -2.7220420837402344, -2.51902437210083, -2.316006660461426, -2.1129891872406006, -1.9099715948104858, -1.706954002380371, -1.5039364099502563, -1.3009188175201416, -1.0979012250900269, -0.8948836326599121, -0.6918660402297974, -0.4888484477996826, -0.28583085536956787, -0.08281326293945312, 0.12020432949066162, 0.32322192192077637, 0.5262395143508911, 0.7292571067810059, 0.9322746992111206, 1.1352922916412354, 1.33830988407135, 1.5413274765014648, 1.7443450689315796, 1.9473626613616943, 2.1503801345825195, 2.353397846221924, 2.556415557861328, 2.7594330310821533, 2.9624505043029785, 3.165468215942383, 3.368485927581787, 3.5715034008026123, 3.7745208740234375, 3.977538585662842, 4.180556297302246, 4.383573532104492, 4.5865912437438965, 4.789608955383301, 4.992626667022705, 5.195644378662109, 5.3986616134643555, 5.60167932510376, 5.804697036743164, 6.00771427154541, 6.2107319831848145, 6.413749694824219, 6.616767406463623, 6.819785118103027, 7.022802352905273, 7.225820064544678, 7.428837776184082, 7.631855010986328, 7.834872722625732, 8.037890434265137, 8.240907669067383, 8.443925857543945, 8.646943092346191, 8.849960327148438, 9.052978515625, 9.255995750427246, 9.459013938903809, 9.662031173706055]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 5.0, 9.0, 9.0, 9.0, 16.0, 16.0, 26.0, 22.0, 29.0, 36.0, 36.0, 41.0, 43.0, 50.0, 40.0, 54.0, 49.0, 58.0, 50.0, 33.0, 51.0, 57.0, 39.0, 38.0, 38.0, 26.0, 24.0, 24.0, 14.0, 16.0, 9.0, 12.0, 10.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.272352457046509, -2.2094199657440186, -2.1464877128601074, -2.083555221557617, -2.020622730255127, -1.9576903581619263, -1.8947579860687256, -1.8318254947662354, -1.7688931226730347, -1.705960750579834, -1.6430282592773438, -1.580095887184143, -1.5171635150909424, -1.4542310237884521, -1.3912986516952515, -1.3283662796020508, -1.2654337882995605, -1.2025014162063599, -1.1395689249038696, -1.076636552810669, -1.0137040615081787, -0.950771689414978, -0.8878393173217773, -0.8249068856239319, -0.7619744539260864, -0.699042022228241, -0.6361095905303955, -0.5731772184371948, -0.5102447867393494, -0.4473123550415039, -0.38437995314598083, -0.32144755125045776, -0.25851523876190186, -0.1955828219652176, -0.13265040516853333, -0.06971798837184906, -0.006785571575164795, 0.056146860122680664, 0.11907926201820374, 0.1820116639137268, 0.24494409561157227, 0.3078765273094177, 0.3708089292049408, 0.43374133110046387, 0.4966737627983093, 0.5596061944961548, 0.6225385665893555, 0.6854709982872009, 0.7484034299850464, 0.8113358616828918, 0.8742682933807373, 0.937200665473938, 1.0001330375671387, 1.063065528869629, 1.1259979009628296, 1.1889302730560303, 1.2518627643585205, 1.3147951364517212, 1.3777276277542114, 1.440659999847412, 1.5035924911499023, 1.566524863243103, 1.6294572353363037, 1.692389726638794, 1.7553220987319946]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 5.0, 8.0, 9.0, 11.0, 27.0, 51.0, 78.0, 138.0, 316.0, 685.0, 1773.0, 5309.0, 20615.0, 131407.0, 732026.0, 127937.0, 20033.0, 5058.0, 1669.0, 683.0, 350.0, 169.0, 82.0, 37.0, 26.0, 11.0, 4.0, 6.0, 9.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.62451171875, -0.6082878112792969, -0.5920639038085938, -0.5758399963378906, -0.5596160888671875, -0.5433921813964844, -0.5271682739257812, -0.5109443664550781, -0.494720458984375, -0.4784965515136719, -0.46227264404296875, -0.4460487365722656, -0.4298248291015625, -0.4136009216308594, -0.39737701416015625, -0.3811531066894531, -0.36492919921875, -0.3487052917480469, -0.33248138427734375, -0.3162574768066406, -0.3000335693359375, -0.2838096618652344, -0.26758575439453125, -0.2513618469238281, -0.235137939453125, -0.21891403198242188, -0.20269012451171875, -0.18646621704101562, -0.1702423095703125, -0.15401840209960938, -0.13779449462890625, -0.12157058715820312, -0.1053466796875, -0.08912277221679688, -0.07289886474609375, -0.056674957275390625, -0.0404510498046875, -0.024227142333984375, -0.00800323486328125, 0.008220672607421875, 0.024444580078125, 0.040668487548828125, 0.05689239501953125, 0.07311630249023438, 0.0893402099609375, 0.10556411743164062, 0.12178802490234375, 0.13801193237304688, 0.15423583984375, 0.17045974731445312, 0.18668365478515625, 0.20290756225585938, 0.2191314697265625, 0.23535537719726562, 0.25157928466796875, 0.2678031921386719, 0.284027099609375, 0.3002510070800781, 0.31647491455078125, 0.3326988220214844, 0.3489227294921875, 0.3651466369628906, 0.38137054443359375, 0.3975944519042969, 0.413818359375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 12.0, 13.0, 19.0, 28.0, 31.0, 40.0, 42.0, 73.0, 67.0, 77.0, 67.0, 62.0, 73.0, 73.0, 66.0, 52.0, 46.0, 43.0, 21.0, 32.0, 25.0, 14.0, 10.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2353515625, -0.22939109802246094, -0.22343063354492188, -0.2174701690673828, -0.21150970458984375, -0.2055492401123047, -0.19958877563476562, -0.19362831115722656, -0.1876678466796875, -0.18170738220214844, -0.17574691772460938, -0.1697864532470703, -0.16382598876953125, -0.1578655242919922, -0.15190505981445312, -0.14594459533691406, -0.139984130859375, -0.13402366638183594, -0.12806320190429688, -0.12210273742675781, -0.11614227294921875, -0.11018180847167969, -0.10422134399414062, -0.09826087951660156, -0.0923004150390625, -0.08633995056152344, -0.08037948608398438, -0.07441902160644531, -0.06845855712890625, -0.06249809265136719, -0.056537628173828125, -0.05057716369628906, -0.04461669921875, -0.03865623474121094, -0.032695770263671875, -0.026735305786132812, -0.02077484130859375, -0.014814376831054688, -0.008853912353515625, -0.0028934478759765625, 0.0030670166015625, 0.009027481079101562, 0.014987945556640625, 0.020948410034179688, 0.02690887451171875, 0.03286933898925781, 0.038829803466796875, 0.04479026794433594, 0.050750732421875, 0.05671119689941406, 0.06267166137695312, 0.06863212585449219, 0.07459259033203125, 0.08055305480957031, 0.08651351928710938, 0.09247398376464844, 0.0984344482421875, 0.10439491271972656, 0.11035537719726562, 0.11631584167480469, 0.12227630615234375, 0.1282367706298828, 0.13419723510742188, 0.14015769958496094, 0.1461181640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 3.0, 5.0, 5.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 15.0, 18.0, 18.0, 32.0, 27.0, 37.0, 52.0, 64.0, 116.0, 189.0, 255.0, 379.0, 672.0, 1565.0, 3732.0, 13771.0, 87790.0, 808146.0, 108704.0, 15170.0, 4129.0, 1670.0, 731.0, 400.0, 253.0, 178.0, 113.0, 84.0, 50.0, 44.0, 28.0, 28.0, 9.0, 11.0, 11.0, 11.0, 8.0, 3.0, 3.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5927734375, -0.5727081298828125, -0.552642822265625, -0.5325775146484375, -0.51251220703125, -0.4924468994140625, -0.472381591796875, -0.4523162841796875, -0.4322509765625, -0.4121856689453125, -0.392120361328125, -0.3720550537109375, -0.35198974609375, -0.3319244384765625, -0.311859130859375, -0.2917938232421875, -0.271728515625, -0.2516632080078125, -0.231597900390625, -0.2115325927734375, -0.19146728515625, -0.1714019775390625, -0.151336669921875, -0.1312713623046875, -0.1112060546875, -0.0911407470703125, -0.071075439453125, -0.0510101318359375, -0.03094482421875, -0.0108795166015625, 0.009185791015625, 0.0292510986328125, 0.04931640625, 0.0693817138671875, 0.089447021484375, 0.1095123291015625, 0.12957763671875, 0.1496429443359375, 0.169708251953125, 0.1897735595703125, 0.2098388671875, 0.2299041748046875, 0.249969482421875, 0.2700347900390625, 0.29010009765625, 0.3101654052734375, 0.330230712890625, 0.3502960205078125, 0.370361328125, 0.3904266357421875, 0.410491943359375, 0.4305572509765625, 0.45062255859375, 0.4706878662109375, 0.490753173828125, 0.5108184814453125, 0.5308837890625, 0.5509490966796875, 0.571014404296875, 0.5910797119140625, 0.61114501953125, 0.6312103271484375, 0.651275634765625, 0.6713409423828125, 0.69140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 11.0, 5.0, 18.0, 12.0, 13.0, 25.0, 33.0, 35.0, 43.0, 48.0, 39.0, 43.0, 42.0, 68.0, 63.0, 73.0, 58.0, 61.0, 55.0, 50.0, 37.0, 33.0, 32.0, 22.0, 16.0, 16.0, 9.0, 15.0, 3.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69482421875, -0.6731796264648438, -0.6515350341796875, -0.6298904418945312, -0.608245849609375, -0.5866012573242188, -0.5649566650390625, -0.5433120727539062, -0.52166748046875, -0.5000228881835938, -0.4783782958984375, -0.45673370361328125, -0.435089111328125, -0.41344451904296875, -0.3917999267578125, -0.37015533447265625, -0.3485107421875, -0.32686614990234375, -0.3052215576171875, -0.28357696533203125, -0.261932373046875, -0.24028778076171875, -0.2186431884765625, -0.19699859619140625, -0.17535400390625, -0.15370941162109375, -0.1320648193359375, -0.11042022705078125, -0.088775634765625, -0.06713104248046875, -0.0454864501953125, -0.02384185791015625, -0.002197265625, 0.01944732666015625, 0.0410919189453125, 0.06273651123046875, 0.084381103515625, 0.10602569580078125, 0.1276702880859375, 0.14931488037109375, 0.17095947265625, 0.19260406494140625, 0.2142486572265625, 0.23589324951171875, 0.257537841796875, 0.27918243408203125, 0.3008270263671875, 0.32247161865234375, 0.3441162109375, 0.36576080322265625, 0.3874053955078125, 0.40904998779296875, 0.430694580078125, 0.45233917236328125, 0.4739837646484375, 0.49562835693359375, 0.51727294921875, 0.5389175415039062, 0.5605621337890625, 0.5822067260742188, 0.603851318359375, 0.6254959106445312, 0.6471405029296875, 0.6687850952148438, 0.6904296875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 10.0, 15.0, 21.0, 31.0, 49.0, 71.0, 109.0, 193.0, 390.0, 1061.0, 4083.0, 25770.0, 720859.0, 274718.0, 16427.0, 3082.0, 877.0, 321.0, 147.0, 92.0, 63.0, 42.0, 32.0, 18.0, 14.0, 14.0, 7.0, 10.0, 3.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.331787109375, -0.32030487060546875, -0.3088226318359375, -0.29734039306640625, -0.285858154296875, -0.27437591552734375, -0.2628936767578125, -0.25141143798828125, -0.23992919921875, -0.22844696044921875, -0.2169647216796875, -0.20548248291015625, -0.194000244140625, -0.18251800537109375, -0.1710357666015625, -0.15955352783203125, -0.1480712890625, -0.13658905029296875, -0.1251068115234375, -0.11362457275390625, -0.102142333984375, -0.09066009521484375, -0.0791778564453125, -0.06769561767578125, -0.05621337890625, -0.04473114013671875, -0.0332489013671875, -0.02176666259765625, -0.010284423828125, 0.00119781494140625, 0.0126800537109375, 0.02416229248046875, 0.03564453125, 0.04712677001953125, 0.0586090087890625, 0.07009124755859375, 0.081573486328125, 0.09305572509765625, 0.1045379638671875, 0.11602020263671875, 0.12750244140625, 0.13898468017578125, 0.1504669189453125, 0.16194915771484375, 0.173431396484375, 0.18491363525390625, 0.1963958740234375, 0.20787811279296875, 0.2193603515625, 0.23084259033203125, 0.2423248291015625, 0.25380706787109375, 0.265289306640625, 0.27677154541015625, 0.2882537841796875, 0.29973602294921875, 0.31121826171875, 0.32270050048828125, 0.3341827392578125, 0.34566497802734375, 0.357147216796875, 0.36862945556640625, 0.3801116943359375, 0.39159393310546875, 0.403076171875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 1.0, 11.0, 13.0, 18.0, 41.0, 53.0, 83.0, 126.0, 184.0, 157.0, 125.0, 61.0, 36.0, 30.0, 16.0, 7.0, 10.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001461505889892578, -0.00014247652143239975, -0.0001388024538755417, -0.00013512838631868362, -0.00013145431876182556, -0.0001277802512049675, -0.00012410618364810944, -0.00012043211609125137, -0.00011675804853439331, -0.00011308398097753525, -0.00010940991342067719, -0.00010573584586381912, -0.00010206177830696106, -9.8387710750103e-05, -9.471364319324493e-05, -9.103957563638687e-05, -8.736550807952881e-05, -8.369144052267075e-05, -8.001737296581268e-05, -7.634330540895462e-05, -7.266923785209656e-05, -6.89951702952385e-05, -6.532110273838043e-05, -6.164703518152237e-05, -5.797296762466431e-05, -5.4298900067806244e-05, -5.062483251094818e-05, -4.695076495409012e-05, -4.3276697397232056e-05, -3.960262984037399e-05, -3.592856228351593e-05, -3.225449472665787e-05, -2.8580427169799805e-05, -2.4906359612941742e-05, -2.123229205608368e-05, -1.7558224499225616e-05, -1.3884156942367554e-05, -1.0210089385509491e-05, -6.536021828651428e-06, -2.8619542717933655e-06, 8.121132850646973e-07, 4.48618084192276e-06, 8.160248398780823e-06, 1.1834315955638885e-05, 1.5508383512496948e-05, 1.918245106935501e-05, 2.2856518626213074e-05, 2.6530586183071136e-05, 3.02046537399292e-05, 3.387872129678726e-05, 3.7552788853645325e-05, 4.122685641050339e-05, 4.490092396736145e-05, 4.857499152421951e-05, 5.2249059081077576e-05, 5.592312663793564e-05, 5.95971941947937e-05, 6.327126175165176e-05, 6.694532930850983e-05, 7.061939686536789e-05, 7.429346442222595e-05, 7.796753197908401e-05, 8.164159953594208e-05, 8.531566709280014e-05, 8.89897346496582e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 6.0, 6.0, 10.0, 12.0, 14.0, 22.0, 40.0, 48.0, 63.0, 93.0, 172.0, 294.0, 636.0, 1376.0, 3566.0, 11951.0, 92515.0, 841805.0, 78749.0, 11142.0, 3340.0, 1291.0, 569.0, 294.0, 185.0, 103.0, 76.0, 50.0, 31.0, 16.0, 18.0, 12.0, 10.0, 10.0, 6.0, 2.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.330322265625, -0.32073974609375, -0.3111572265625, -0.30157470703125, -0.2919921875, -0.28240966796875, -0.2728271484375, -0.26324462890625, -0.253662109375, -0.24407958984375, -0.2344970703125, -0.22491455078125, -0.21533203125, -0.20574951171875, -0.1961669921875, -0.18658447265625, -0.177001953125, -0.16741943359375, -0.1578369140625, -0.14825439453125, -0.138671875, -0.12908935546875, -0.1195068359375, -0.10992431640625, -0.100341796875, -0.09075927734375, -0.0811767578125, -0.07159423828125, -0.06201171875, -0.05242919921875, -0.0428466796875, -0.03326416015625, -0.023681640625, -0.01409912109375, -0.0045166015625, 0.00506591796875, 0.0146484375, 0.02423095703125, 0.0338134765625, 0.04339599609375, 0.052978515625, 0.06256103515625, 0.0721435546875, 0.08172607421875, 0.09130859375, 0.10089111328125, 0.1104736328125, 0.12005615234375, 0.129638671875, 0.13922119140625, 0.1488037109375, 0.15838623046875, 0.16796875, 0.17755126953125, 0.1871337890625, 0.19671630859375, 0.206298828125, 0.21588134765625, 0.2254638671875, 0.23504638671875, 0.24462890625, 0.25421142578125, 0.2637939453125, 0.27337646484375, 0.282958984375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 11.0, 7.0, 8.0, 9.0, 21.0, 25.0, 34.0, 63.0, 100.0, 140.0, 163.0, 136.0, 93.0, 62.0, 30.0, 24.0, 21.0, 5.0, 16.0, 8.0, 5.0, 2.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26025390625, -0.2516288757324219, -0.24300384521484375, -0.23437881469726562, -0.2257537841796875, -0.21712875366210938, -0.20850372314453125, -0.19987869262695312, -0.191253662109375, -0.18262863159179688, -0.17400360107421875, -0.16537857055664062, -0.1567535400390625, -0.14812850952148438, -0.13950347900390625, -0.13087844848632812, -0.12225341796875, -0.11362838745117188, -0.10500335693359375, -0.09637832641601562, -0.0877532958984375, -0.07912826538085938, -0.07050323486328125, -0.061878204345703125, -0.053253173828125, -0.044628143310546875, -0.03600311279296875, -0.027378082275390625, -0.0187530517578125, -0.010128021240234375, -0.00150299072265625, 0.007122039794921875, 0.0157470703125, 0.024372100830078125, 0.03299713134765625, 0.041622161865234375, 0.0502471923828125, 0.058872222900390625, 0.06749725341796875, 0.07612228393554688, 0.084747314453125, 0.09337234497070312, 0.10199737548828125, 0.11062240600585938, 0.1192474365234375, 0.12787246704101562, 0.13649749755859375, 0.14512252807617188, 0.15374755859375, 0.16237258911132812, 0.17099761962890625, 0.17962265014648438, 0.1882476806640625, 0.19687271118164062, 0.20549774169921875, 0.21412277221679688, 0.222747802734375, 0.23137283325195312, 0.23999786376953125, 0.24862289428710938, 0.2572479248046875, 0.2658729553222656, 0.27449798583984375, 0.2831230163574219, 0.291748046875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 13.0, 37.0, 327.0, 487.0, 97.0, 17.0, 11.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.933162689208984, -15.588034629821777, -15.24290657043457, -14.897777557373047, -14.55264949798584, -14.207521438598633, -13.862393379211426, -13.517265319824219, -13.172136306762695, -12.827008247375488, -12.481880187988281, -12.136751174926758, -11.79162311553955, -11.446495056152344, -11.101366996765137, -10.75623893737793, -10.411109924316406, -10.0659818649292, -9.720853805541992, -9.375724792480469, -9.030596733093262, -8.685468673706055, -8.340340614318848, -7.995212078094482, -7.650084495544434, -7.304956436157227, -6.959827899932861, -6.614699840545654, -6.269571304321289, -5.924443244934082, -5.579315185546875, -5.23418664932251, -4.8890581130981445, -4.5439300537109375, -4.198801517486572, -3.8536734580993652, -3.508544921875, -3.163416862487793, -2.818288564682007, -2.4731602668762207, -2.1280319690704346, -1.7829036712646484, -1.4377753734588623, -1.0926471948623657, -0.7475188970565796, -0.40239059925079346, -0.057262420654296875, 0.28786587715148926, 0.6329941749572754, 0.9781224727630615, 1.3232507705688477, 1.6683789491653442, 2.01350736618042, 2.358635425567627, 2.703763723373413, 3.048892021179199, 3.3940203189849854, 3.7391486167907715, 4.0842766761779785, 4.429405212402344, 4.774533271789551, 5.119661808013916, 5.464789867401123, 5.809918403625488, 6.155046463012695]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 6.0, 6.0, 6.0, 4.0, 11.0, 10.0, 11.0, 10.0, 16.0, 28.0, 23.0, 22.0, 25.0, 28.0, 28.0, 37.0, 44.0, 48.0, 65.0, 63.0, 51.0, 60.0, 47.0, 45.0, 27.0, 29.0, 26.0, 23.0, 25.0, 22.0, 24.0, 24.0, 19.0, 12.0, 10.0, 11.0, 9.0, 3.0, 7.0, 3.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-2.0123491287231445, -1.9493887424468994, -1.8864283561706543, -1.8234679698944092, -1.760507583618164, -1.697547197341919, -1.6345866918563843, -1.5716263055801392, -1.508665919303894, -1.445705533027649, -1.3827451467514038, -1.3197847604751587, -1.256824254989624, -1.193863868713379, -1.1309034824371338, -1.0679430961608887, -1.0049827098846436, -0.9420223236083984, -0.8790619373321533, -0.8161014914512634, -0.7531411051750183, -0.6901807188987732, -0.6272202730178833, -0.5642598867416382, -0.5012995004653931, -0.43833911418914795, -0.37537869811058044, -0.31241828203201294, -0.24945789575576782, -0.1864975094795227, -0.1235370934009552, -0.060576677322387695, 0.0023834705352783203, 0.06534387171268463, 0.12830427289009094, 0.19126467406749725, 0.25422507524490356, 0.3171854615211487, 0.3801458775997162, 0.4431062936782837, 0.5060666799545288, 0.5690270662307739, 0.631987452507019, 0.6949478983879089, 0.757908284664154, 0.8208686709403992, 0.8838291168212891, 0.9467895030975342, 1.0097498893737793, 1.0727102756500244, 1.1356706619262695, 1.1986310482025146, 1.2615914344787598, 1.3245518207550049, 1.3875123262405396, 1.4504727125167847, 1.5134330987930298, 1.576393485069275, 1.63935387134552, 1.7023142576217651, 1.7652747631072998, 1.828235149383545, 1.89119553565979, 1.9541559219360352, 2.0171163082122803]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 9.0, 5.0, 5.0, 19.0, 24.0, 24.0, 41.0, 76.0, 142.0, 349.0, 1166.0, 4982.0, 54092.0, 3953099.0, 168894.0, 8495.0, 1853.0, 547.0, 231.0, 101.0, 42.0, 34.0, 15.0, 7.0, 2.0, 5.0, 4.0, 2.0, 0.0, 4.0], "bins": [-1.0537109375, -1.0315895080566406, -1.0094680786132812, -0.9873466491699219, -0.9652252197265625, -0.9431037902832031, -0.9209823608398438, -0.8988609313964844, -0.876739501953125, -0.8546180725097656, -0.8324966430664062, -0.8103752136230469, -0.7882537841796875, -0.7661323547363281, -0.7440109252929688, -0.7218894958496094, -0.69976806640625, -0.6776466369628906, -0.6555252075195312, -0.6334037780761719, -0.6112823486328125, -0.5891609191894531, -0.5670394897460938, -0.5449180603027344, -0.522796630859375, -0.5006752014160156, -0.47855377197265625, -0.4564323425292969, -0.4343109130859375, -0.4121894836425781, -0.39006805419921875, -0.3679466247558594, -0.3458251953125, -0.3237037658691406, -0.30158233642578125, -0.2794609069824219, -0.2573394775390625, -0.23521804809570312, -0.21309661865234375, -0.19097518920898438, -0.168853759765625, -0.14673233032226562, -0.12461090087890625, -0.10248947143554688, -0.0803680419921875, -0.058246612548828125, -0.03612518310546875, -0.014003753662109375, 0.00811767578125, 0.030239105224609375, 0.05236053466796875, 0.07448196411132812, 0.0966033935546875, 0.11872482299804688, 0.14084625244140625, 0.16296768188476562, 0.185089111328125, 0.20721054077148438, 0.22933197021484375, 0.2514533996582031, 0.2735748291015625, 0.2956962585449219, 0.31781768798828125, 0.3399391174316406, 0.362060546875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 7.0, 9.0, 11.0, 10.0, 12.0, 15.0, 23.0, 32.0, 42.0, 47.0, 51.0, 67.0, 66.0, 65.0, 64.0, 71.0, 66.0, 54.0, 49.0, 57.0, 33.0, 38.0, 27.0, 22.0, 21.0, 17.0, 8.0, 9.0, 5.0, 6.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2076416015625, -0.20241928100585938, -0.19719696044921875, -0.19197463989257812, -0.1867523193359375, -0.18152999877929688, -0.17630767822265625, -0.17108535766601562, -0.165863037109375, -0.16064071655273438, -0.15541839599609375, -0.15019607543945312, -0.1449737548828125, -0.13975143432617188, -0.13452911376953125, -0.12930679321289062, -0.12408447265625, -0.11886215209960938, -0.11363983154296875, -0.10841751098632812, -0.1031951904296875, -0.09797286987304688, -0.09275054931640625, -0.08752822875976562, -0.082305908203125, -0.07708358764648438, -0.07186126708984375, -0.06663894653320312, -0.0614166259765625, -0.056194305419921875, -0.05097198486328125, -0.045749664306640625, -0.04052734375, -0.035305023193359375, -0.03008270263671875, -0.024860382080078125, -0.0196380615234375, -0.014415740966796875, -0.00919342041015625, -0.003971099853515625, 0.001251220703125, 0.006473541259765625, 0.01169586181640625, 0.016918182373046875, 0.0221405029296875, 0.027362823486328125, 0.03258514404296875, 0.037807464599609375, 0.04302978515625, 0.048252105712890625, 0.05347442626953125, 0.058696746826171875, 0.0639190673828125, 0.06914138793945312, 0.07436370849609375, 0.07958602905273438, 0.084808349609375, 0.09003067016601562, 0.09525299072265625, 0.10047531127929688, 0.1056976318359375, 0.11091995239257812, 0.11614227294921875, 0.12136459350585938, 0.1265869140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 12.0, 9.0, 22.0, 32.0, 59.0, 109.0, 248.0, 641.0, 1883.0, 8508.0, 168904.0, 3956268.0, 50663.0, 4812.0, 1208.0, 470.0, 197.0, 116.0, 50.0, 21.0, 20.0, 12.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.97607421875, -0.9449386596679688, -0.9138031005859375, -0.8826675415039062, -0.851531982421875, -0.8203964233398438, -0.7892608642578125, -0.7581253051757812, -0.72698974609375, -0.6958541870117188, -0.6647186279296875, -0.6335830688476562, -0.602447509765625, -0.5713119506835938, -0.5401763916015625, -0.5090408325195312, -0.4779052734375, -0.44676971435546875, -0.4156341552734375, -0.38449859619140625, -0.353363037109375, -0.32222747802734375, -0.2910919189453125, -0.25995635986328125, -0.22882080078125, -0.19768524169921875, -0.1665496826171875, -0.13541412353515625, -0.104278564453125, -0.07314300537109375, -0.0420074462890625, -0.01087188720703125, 0.020263671875, 0.05139923095703125, 0.0825347900390625, 0.11367034912109375, 0.144805908203125, 0.17594146728515625, 0.2070770263671875, 0.23821258544921875, 0.26934814453125, 0.30048370361328125, 0.3316192626953125, 0.36275482177734375, 0.393890380859375, 0.42502593994140625, 0.4561614990234375, 0.48729705810546875, 0.5184326171875, 0.5495681762695312, 0.5807037353515625, 0.6118392944335938, 0.642974853515625, 0.6741104125976562, 0.7052459716796875, 0.7363815307617188, 0.76751708984375, 0.7986526489257812, 0.8297882080078125, 0.8609237670898438, 0.892059326171875, 0.9231948852539062, 0.9543304443359375, 0.9854660034179688, 1.0166015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 11.0, 8.0, 25.0, 44.0, 79.0, 151.0, 329.0, 905.0, 1413.0, 637.0, 227.0, 101.0, 47.0, 32.0, 21.0, 10.0, 10.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69140625, -0.6693191528320312, -0.6472320556640625, -0.6251449584960938, -0.603057861328125, -0.5809707641601562, -0.5588836669921875, -0.5367965698242188, -0.51470947265625, -0.49262237548828125, -0.4705352783203125, -0.44844818115234375, -0.426361083984375, -0.40427398681640625, -0.3821868896484375, -0.36009979248046875, -0.3380126953125, -0.31592559814453125, -0.2938385009765625, -0.27175140380859375, -0.249664306640625, -0.22757720947265625, -0.2054901123046875, -0.18340301513671875, -0.16131591796875, -0.13922882080078125, -0.1171417236328125, -0.09505462646484375, -0.072967529296875, -0.05088043212890625, -0.0287933349609375, -0.00670623779296875, 0.015380859375, 0.03746795654296875, 0.0595550537109375, 0.08164215087890625, 0.103729248046875, 0.12581634521484375, 0.1479034423828125, 0.16999053955078125, 0.19207763671875, 0.21416473388671875, 0.2362518310546875, 0.25833892822265625, 0.280426025390625, 0.30251312255859375, 0.3246002197265625, 0.34668731689453125, 0.3687744140625, 0.39086151123046875, 0.4129486083984375, 0.43503570556640625, 0.457122802734375, 0.47920989990234375, 0.5012969970703125, 0.5233840942382812, 0.54547119140625, 0.5675582885742188, 0.5896453857421875, 0.6117324829101562, 0.633819580078125, 0.6559066772460938, 0.6779937744140625, 0.7000808715820312, 0.72216796875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 7.0, 12.0, 19.0, 32.0, 54.0, 128.0, 195.0, 208.0, 167.0, 87.0, 48.0, 17.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.769728899002075, -3.631511688232422, -3.4932944774627686, -3.3550772666931152, -3.216860055923462, -3.0786428451538086, -2.940425395965576, -2.802208423614502, -2.6639909744262695, -2.525773763656616, -2.387556552886963, -2.2493393421173096, -2.1111221313476562, -1.972904920578003, -1.83468759059906, -1.6964703798294067, -1.558253288269043, -1.4200360774993896, -1.2818188667297363, -1.143601655960083, -1.0053844451904297, -0.8671671748161316, -0.7289499044418335, -0.5907326936721802, -0.45251548290252686, -0.31429827213287354, -0.17608103156089783, -0.03786379098892212, 0.1003534197807312, 0.23857063055038452, 0.3767879009246826, 0.5150051116943359, 0.6532225608825684, 0.7914397716522217, 0.929656982421875, 1.0678741931915283, 1.2060914039611816, 1.344308614730835, 1.4825259447097778, 1.6207431554794312, 1.7589603662490845, 1.8971775770187378, 2.0353949069976807, 2.173612117767334, 2.3118293285369873, 2.4500465393066406, 2.588263750076294, 2.7264809608459473, 2.8646981716156006, 3.002915382385254, 3.1411325931549072, 3.2793498039245605, 3.417567014694214, 3.555784225463867, 3.6940016746520996, 3.832218647003174, 3.9704360961914062, 4.108653545379639, 4.246870517730713, 4.385087966918945, 4.5233049392700195, 4.661522388458252, 4.799739360809326, 4.937956809997559, 5.076173782348633]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 9.0, 12.0, 24.0, 33.0, 44.0, 45.0, 69.0, 72.0, 74.0, 90.0, 112.0, 81.0, 80.0, 79.0, 53.0, 49.0, 26.0, 16.0, 15.0, 5.0, 11.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5023036003112793, -2.3944942951202393, -2.286684989929199, -2.178875684738159, -2.071066379547119, -1.963257074356079, -1.8554476499557495, -1.7476383447647095, -1.6398290395736694, -1.5320197343826294, -1.4242104291915894, -1.3164010047912598, -1.2085916996002197, -1.1007823944091797, -0.9929730892181396, -0.8851637840270996, -0.7773544788360596, -0.6695451736450195, -0.5617358684539795, -0.4539265036582947, -0.34611719846725464, -0.2383078932762146, -0.13049852848052979, -0.022689223289489746, 0.08512008190155029, 0.19292940199375153, 0.30073872208595276, 0.4085480570793152, 0.5163573622703552, 0.6241666674613953, 0.7319760322570801, 0.8397853374481201, 0.9475946426391602, 1.0554039478302002, 1.1632132530212402, 1.2710225582122803, 1.3788318634033203, 1.4866411685943604, 1.59445059299469, 1.70225989818573, 1.81006920337677, 1.91787850856781, 2.0256879329681396, 2.1334972381591797, 2.2413065433502197, 2.3491158485412598, 2.4569251537323, 2.56473445892334, 2.67254376411438, 2.78035306930542, 2.88816237449646, 2.9959716796875, 3.10378098487854, 3.21159029006958, 3.319399833679199, 3.42720890045166, 3.5350184440612793, 3.6428277492523193, 3.7506370544433594, 3.8584463596343994, 3.9662556648254395, 4.074065208435059, 4.1818742752075195, 4.289683818817139, 4.3974928855896]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 10.0, 11.0, 15.0, 28.0, 49.0, 80.0, 125.0, 274.0, 625.0, 1731.0, 6567.0, 46305.0, 642784.0, 321211.0, 22392.0, 4175.0, 1206.0, 459.0, 230.0, 101.0, 65.0, 26.0, 23.0, 10.0, 13.0, 5.0, 6.0, 2.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52001953125, -0.5046539306640625, -0.489288330078125, -0.4739227294921875, -0.45855712890625, -0.4431915283203125, -0.427825927734375, -0.4124603271484375, -0.3970947265625, -0.3817291259765625, -0.366363525390625, -0.3509979248046875, -0.33563232421875, -0.3202667236328125, -0.304901123046875, -0.2895355224609375, -0.274169921875, -0.2588043212890625, -0.243438720703125, -0.2280731201171875, -0.21270751953125, -0.1973419189453125, -0.181976318359375, -0.1666107177734375, -0.1512451171875, -0.1358795166015625, -0.120513916015625, -0.1051483154296875, -0.08978271484375, -0.0744171142578125, -0.059051513671875, -0.0436859130859375, -0.0283203125, -0.0129547119140625, 0.002410888671875, 0.0177764892578125, 0.03314208984375, 0.0485076904296875, 0.063873291015625, 0.0792388916015625, 0.0946044921875, 0.1099700927734375, 0.125335693359375, 0.1407012939453125, 0.15606689453125, 0.1714324951171875, 0.186798095703125, 0.2021636962890625, 0.217529296875, 0.2328948974609375, 0.248260498046875, 0.2636260986328125, 0.27899169921875, 0.2943572998046875, 0.309722900390625, 0.3250885009765625, 0.3404541015625, 0.3558197021484375, 0.371185302734375, 0.3865509033203125, 0.40191650390625, 0.4172821044921875, 0.432647705078125, 0.4480133056640625, 0.46337890625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 7.0, 15.0, 14.0, 7.0, 19.0, 26.0, 34.0, 41.0, 42.0, 65.0, 71.0, 53.0, 75.0, 51.0, 68.0, 63.0, 73.0, 47.0, 53.0, 34.0, 26.0, 28.0, 21.0, 21.0, 10.0, 12.0, 9.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.250244140625, -0.24436187744140625, -0.2384796142578125, -0.23259735107421875, -0.226715087890625, -0.22083282470703125, -0.2149505615234375, -0.20906829833984375, -0.20318603515625, -0.19730377197265625, -0.1914215087890625, -0.18553924560546875, -0.179656982421875, -0.17377471923828125, -0.1678924560546875, -0.16201019287109375, -0.1561279296875, -0.15024566650390625, -0.1443634033203125, -0.13848114013671875, -0.132598876953125, -0.12671661376953125, -0.1208343505859375, -0.11495208740234375, -0.10906982421875, -0.10318756103515625, -0.0973052978515625, -0.09142303466796875, -0.085540771484375, -0.07965850830078125, -0.0737762451171875, -0.06789398193359375, -0.06201171875, -0.05612945556640625, -0.0502471923828125, -0.04436492919921875, -0.038482666015625, -0.03260040283203125, -0.0267181396484375, -0.02083587646484375, -0.01495361328125, -0.00907135009765625, -0.0031890869140625, 0.00269317626953125, 0.008575439453125, 0.01445770263671875, 0.0203399658203125, 0.02622222900390625, 0.0321044921875, 0.03798675537109375, 0.0438690185546875, 0.04975128173828125, 0.055633544921875, 0.06151580810546875, 0.0673980712890625, 0.07328033447265625, 0.07916259765625, 0.08504486083984375, 0.0909271240234375, 0.09680938720703125, 0.102691650390625, 0.10857391357421875, 0.1144561767578125, 0.12033843994140625, 0.126220703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 7.0, 12.0, 11.0, 10.0, 19.0, 26.0, 40.0, 57.0, 93.0, 139.0, 234.0, 411.0, 745.0, 1500.0, 3714.0, 9921.0, 36167.0, 200436.0, 649176.0, 110535.0, 22863.0, 6940.0, 2729.0, 1221.0, 618.0, 328.0, 200.0, 125.0, 74.0, 64.0, 44.0, 26.0, 15.0, 19.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.3232421875, -0.31292724609375, -0.3026123046875, -0.29229736328125, -0.281982421875, -0.27166748046875, -0.2613525390625, -0.25103759765625, -0.24072265625, -0.23040771484375, -0.2200927734375, -0.20977783203125, -0.199462890625, -0.18914794921875, -0.1788330078125, -0.16851806640625, -0.158203125, -0.14788818359375, -0.1375732421875, -0.12725830078125, -0.116943359375, -0.10662841796875, -0.0963134765625, -0.08599853515625, -0.07568359375, -0.06536865234375, -0.0550537109375, -0.04473876953125, -0.034423828125, -0.02410888671875, -0.0137939453125, -0.00347900390625, 0.0068359375, 0.01715087890625, 0.0274658203125, 0.03778076171875, 0.048095703125, 0.05841064453125, 0.0687255859375, 0.07904052734375, 0.08935546875, 0.09967041015625, 0.1099853515625, 0.12030029296875, 0.130615234375, 0.14093017578125, 0.1512451171875, 0.16156005859375, 0.171875, 0.18218994140625, 0.1925048828125, 0.20281982421875, 0.213134765625, 0.22344970703125, 0.2337646484375, 0.24407958984375, 0.25439453125, 0.26470947265625, 0.2750244140625, 0.28533935546875, 0.295654296875, 0.30596923828125, 0.3162841796875, 0.32659912109375, 0.3369140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 14.0, 4.0, 5.0, 9.0, 9.0, 12.0, 18.0, 22.0, 16.0, 26.0, 26.0, 38.0, 45.0, 40.0, 44.0, 38.0, 37.0, 43.0, 37.0, 53.0, 43.0, 40.0, 55.0, 35.0, 37.0, 38.0, 31.0, 26.0, 24.0, 19.0, 23.0, 10.0, 21.0, 11.0, 10.0, 8.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.49755859375, -0.48174285888671875, -0.4659271240234375, -0.45011138916015625, -0.434295654296875, -0.41847991943359375, -0.4026641845703125, -0.38684844970703125, -0.37103271484375, -0.35521697998046875, -0.3394012451171875, -0.32358551025390625, -0.307769775390625, -0.29195404052734375, -0.2761383056640625, -0.26032257080078125, -0.2445068359375, -0.22869110107421875, -0.2128753662109375, -0.19705963134765625, -0.181243896484375, -0.16542816162109375, -0.1496124267578125, -0.13379669189453125, -0.11798095703125, -0.10216522216796875, -0.0863494873046875, -0.07053375244140625, -0.054718017578125, -0.03890228271484375, -0.0230865478515625, -0.00727081298828125, 0.008544921875, 0.02436065673828125, 0.0401763916015625, 0.05599212646484375, 0.071807861328125, 0.08762359619140625, 0.1034393310546875, 0.11925506591796875, 0.13507080078125, 0.15088653564453125, 0.1667022705078125, 0.18251800537109375, 0.198333740234375, 0.21414947509765625, 0.2299652099609375, 0.24578094482421875, 0.2615966796875, 0.27741241455078125, 0.2932281494140625, 0.30904388427734375, 0.324859619140625, 0.34067535400390625, 0.3564910888671875, 0.37230682373046875, 0.38812255859375, 0.40393829345703125, 0.4197540283203125, 0.43556976318359375, 0.451385498046875, 0.46720123291015625, 0.4830169677734375, 0.49883270263671875, 0.5146484375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 9.0, 9.0, 13.0, 25.0, 53.0, 75.0, 125.0, 281.0, 533.0, 1181.0, 3147.0, 9568.0, 35579.0, 190394.0, 668195.0, 106655.0, 22180.0, 6433.0, 2266.0, 900.0, 449.0, 182.0, 111.0, 62.0, 37.0, 25.0, 11.0, 19.0, 9.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.133544921875, -0.12914276123046875, -0.1247406005859375, -0.12033843994140625, -0.115936279296875, -0.11153411865234375, -0.1071319580078125, -0.10272979736328125, -0.09832763671875, -0.09392547607421875, -0.0895233154296875, -0.08512115478515625, -0.080718994140625, -0.07631683349609375, -0.0719146728515625, -0.06751251220703125, -0.0631103515625, -0.05870819091796875, -0.0543060302734375, -0.04990386962890625, -0.045501708984375, -0.04109954833984375, -0.0366973876953125, -0.03229522705078125, -0.02789306640625, -0.02349090576171875, -0.0190887451171875, -0.01468658447265625, -0.010284423828125, -0.00588226318359375, -0.0014801025390625, 0.00292205810546875, 0.00732421875, 0.01172637939453125, 0.0161285400390625, 0.02053070068359375, 0.024932861328125, 0.02933502197265625, 0.0337371826171875, 0.03813934326171875, 0.04254150390625, 0.04694366455078125, 0.0513458251953125, 0.05574798583984375, 0.060150146484375, 0.06455230712890625, 0.0689544677734375, 0.07335662841796875, 0.0777587890625, 0.08216094970703125, 0.0865631103515625, 0.09096527099609375, 0.095367431640625, 0.09976959228515625, 0.1041717529296875, 0.10857391357421875, 0.11297607421875, 0.11737823486328125, 0.1217803955078125, 0.12618255615234375, 0.130584716796875, 0.13498687744140625, 0.1393890380859375, 0.14379119873046875, 0.148193359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 11.0, 22.0, 24.0, 21.0, 37.0, 28.0, 57.0, 45.0, 47.0, 65.0, 72.0, 66.0, 65.0, 72.0, 61.0, 57.0, 52.0, 45.0, 26.0, 23.0, 20.0, 11.0, 14.0, 8.0, 6.0, 6.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.075599670410156e-05, -2.9577873647212982e-05, -2.8399750590324402e-05, -2.722162753343582e-05, -2.604350447654724e-05, -2.486538141965866e-05, -2.368725836277008e-05, -2.25091353058815e-05, -2.133101224899292e-05, -2.015288919210434e-05, -1.897476613521576e-05, -1.779664307832718e-05, -1.66185200214386e-05, -1.544039696455002e-05, -1.4262273907661438e-05, -1.3084150850772858e-05, -1.1906027793884277e-05, -1.0727904736995697e-05, -9.549781680107117e-06, -8.371658623218536e-06, -7.193535566329956e-06, -6.015412509441376e-06, -4.837289452552795e-06, -3.659166395664215e-06, -2.4810433387756348e-06, -1.3029202818870544e-06, -1.2479722499847412e-07, 1.0533258318901062e-06, 2.2314488887786865e-06, 3.409571945667267e-06, 4.587695002555847e-06, 5.7658180594444275e-06, 6.943941116333008e-06, 8.122064173221588e-06, 9.300187230110168e-06, 1.0478310286998749e-05, 1.1656433343887329e-05, 1.283455640077591e-05, 1.401267945766449e-05, 1.519080251455307e-05, 1.636892557144165e-05, 1.754704862833023e-05, 1.872517168521881e-05, 1.990329474210739e-05, 2.108141779899597e-05, 2.2259540855884552e-05, 2.3437663912773132e-05, 2.4615786969661713e-05, 2.5793910026550293e-05, 2.6972033083438873e-05, 2.8150156140327454e-05, 2.9328279197216034e-05, 3.0506402254104614e-05, 3.1684525310993195e-05, 3.2862648367881775e-05, 3.4040771424770355e-05, 3.5218894481658936e-05, 3.6397017538547516e-05, 3.7575140595436096e-05, 3.8753263652324677e-05, 3.993138670921326e-05, 4.110950976610184e-05, 4.228763282299042e-05, 4.3465755879879e-05, 4.464387893676758e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 15.0, 22.0, 23.0, 35.0, 51.0, 101.0, 201.0, 295.0, 566.0, 1132.0, 2802.0, 8553.0, 35899.0, 228415.0, 661480.0, 84222.0, 16610.0, 4654.0, 1680.0, 826.0, 372.0, 232.0, 127.0, 82.0, 46.0, 33.0, 22.0, 16.0, 13.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15625, -0.15124893188476562, -0.14624786376953125, -0.14124679565429688, -0.1362457275390625, -0.13124465942382812, -0.12624359130859375, -0.12124252319335938, -0.116241455078125, -0.11124038696289062, -0.10623931884765625, -0.10123825073242188, -0.0962371826171875, -0.09123611450195312, -0.08623504638671875, -0.08123397827148438, -0.07623291015625, -0.07123184204101562, -0.06623077392578125, -0.061229705810546875, -0.0562286376953125, -0.051227569580078125, -0.04622650146484375, -0.041225433349609375, -0.036224365234375, -0.031223297119140625, -0.02622222900390625, -0.021221160888671875, -0.0162200927734375, -0.011219024658203125, -0.00621795654296875, -0.001216888427734375, 0.0037841796875, 0.008785247802734375, 0.01378631591796875, 0.018787384033203125, 0.0237884521484375, 0.028789520263671875, 0.03379058837890625, 0.038791656494140625, 0.043792724609375, 0.048793792724609375, 0.05379486083984375, 0.058795928955078125, 0.0637969970703125, 0.06879806518554688, 0.07379913330078125, 0.07880020141601562, 0.08380126953125, 0.08880233764648438, 0.09380340576171875, 0.09880447387695312, 0.1038055419921875, 0.10880661010742188, 0.11380767822265625, 0.11880874633789062, 0.123809814453125, 0.12881088256835938, 0.13381195068359375, 0.13881301879882812, 0.1438140869140625, 0.14881515502929688, 0.15381622314453125, 0.15881729125976562, 0.163818359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 8.0, 15.0, 18.0, 23.0, 20.0, 34.0, 43.0, 46.0, 89.0, 84.0, 98.0, 116.0, 97.0, 100.0, 52.0, 40.0, 25.0, 22.0, 23.0, 8.0, 9.0, 6.0, 5.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12127685546875, -0.1164693832397461, -0.11166191101074219, -0.10685443878173828, -0.10204696655273438, -0.09723949432373047, -0.09243202209472656, -0.08762454986572266, -0.08281707763671875, -0.07800960540771484, -0.07320213317871094, -0.06839466094970703, -0.06358718872070312, -0.05877971649169922, -0.05397224426269531, -0.049164772033691406, -0.0443572998046875, -0.039549827575683594, -0.03474235534667969, -0.02993488311767578, -0.025127410888671875, -0.02031993865966797, -0.015512466430664062, -0.010704994201660156, -0.00589752197265625, -0.0010900497436523438, 0.0037174224853515625, 0.008524894714355469, 0.013332366943359375, 0.01813983917236328, 0.022947311401367188, 0.027754783630371094, 0.032562255859375, 0.037369728088378906, 0.04217720031738281, 0.04698467254638672, 0.051792144775390625, 0.05659961700439453, 0.06140708923339844, 0.06621456146240234, 0.07102203369140625, 0.07582950592041016, 0.08063697814941406, 0.08544445037841797, 0.09025192260742188, 0.09505939483642578, 0.09986686706542969, 0.1046743392944336, 0.1094818115234375, 0.1142892837524414, 0.11909675598144531, 0.12390422821044922, 0.12871170043945312, 0.13351917266845703, 0.13832664489746094, 0.14313411712646484, 0.14794158935546875, 0.15274906158447266, 0.15755653381347656, 0.16236400604248047, 0.16717147827148438, 0.17197895050048828, 0.1767864227294922, 0.1815938949584961, 0.1864013671875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 16.0, 42.0, 119.0, 277.0, 305.0, 143.0, 59.0, 19.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.487732887268066, -5.339611530303955, -5.191490173339844, -5.043368816375732, -4.895247459411621, -4.747125625610352, -4.599004745483398, -4.450882911682129, -4.302761554718018, -4.154640197753906, -4.006518840789795, -3.8583974838256836, -3.710275888442993, -3.562154531478882, -3.4140331745147705, -3.26591157913208, -3.117790460586548, -2.9696691036224365, -2.821547746658325, -2.6734261512756348, -2.5253047943115234, -2.377183437347412, -2.229062080383301, -2.0809407234191895, -1.9328192472457886, -1.7846978902816772, -1.6365764141082764, -1.488455057144165, -1.3403337001800537, -1.1922122240066528, -1.0440908670425415, -0.8959693908691406, -0.7478482723236084, -0.5997268557548523, -0.4516054689884186, -0.30348408222198486, -0.15536266565322876, -0.007241249084472656, 0.14088010787963867, 0.28900158405303955, 0.4371229410171509, 0.585244357585907, 0.7333657741546631, 0.8814871311187744, 1.0296084880828857, 1.1777299642562866, 1.325851321220398, 1.4739727973937988, 1.6220941543579102, 1.7702155113220215, 1.9183369874954224, 2.066458225250244, 2.2145798206329346, 2.362701177597046, 2.5108225345611572, 2.6589441299438477, 2.807065486907959, 2.9551868438720703, 3.1033082008361816, 3.251429557800293, 3.3995511531829834, 3.5476725101470947, 3.695793867111206, 3.8439154624938965, 3.9920365810394287]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 10.0, 3.0, 6.0, 15.0, 16.0, 15.0, 20.0, 22.0, 20.0, 41.0, 35.0, 39.0, 50.0, 46.0, 58.0, 74.0, 96.0, 67.0, 58.0, 45.0, 33.0, 32.0, 34.0, 25.0, 24.0, 20.0, 20.0, 13.0, 11.0, 8.0, 10.0, 7.0, 6.0, 3.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.0541341304779053, -1.9814300537109375, -1.9087260961532593, -1.836022138595581, -1.7633180618286133, -1.6906139850616455, -1.6179100275039673, -1.545206069946289, -1.4725019931793213, -1.3997979164123535, -1.3270939588546753, -1.254390001296997, -1.1816859245300293, -1.1089818477630615, -1.0362778902053833, -0.9635738730430603, -0.8908698558807373, -0.8181658387184143, -0.7454618215560913, -0.6727578043937683, -0.6000537872314453, -0.5273497700691223, -0.4546457529067993, -0.3819417357444763, -0.3092377185821533, -0.23653370141983032, -0.16382968425750732, -0.09112566709518433, -0.018421649932861328, 0.05428236722946167, 0.12698638439178467, 0.19969040155410767, 0.27239465713500977, 0.34509867429733276, 0.41780269145965576, 0.49050670862197876, 0.5632107257843018, 0.6359147429466248, 0.7086187601089478, 0.7813227772712708, 0.8540267944335938, 0.9267308115959167, 0.9994348287582397, 1.072138786315918, 1.1448428630828857, 1.2175469398498535, 1.2902508974075317, 1.36295485496521, 1.4356589317321777, 1.5083630084991455, 1.5810669660568237, 1.653770923614502, 1.7264750003814697, 1.7991790771484375, 1.8718830347061157, 1.944586992263794, 2.0172910690307617, 2.0899951457977295, 2.1626992225646973, 2.235403060913086, 2.3081071376800537, 2.3808112144470215, 2.45351505279541, 2.526219129562378, 2.5989232063293457]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 14.0, 17.0, 41.0, 75.0, 142.0, 298.0, 845.0, 9282.0, 4069879.0, 110480.0, 2348.0, 479.0, 174.0, 93.0, 47.0, 31.0, 13.0, 9.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.66796875, -1.6322784423828125, -1.596588134765625, -1.5608978271484375, -1.52520751953125, -1.4895172119140625, -1.453826904296875, -1.4181365966796875, -1.3824462890625, -1.3467559814453125, -1.311065673828125, -1.2753753662109375, -1.23968505859375, -1.2039947509765625, -1.168304443359375, -1.1326141357421875, -1.096923828125, -1.0612335205078125, -1.025543212890625, -0.9898529052734375, -0.95416259765625, -0.9184722900390625, -0.882781982421875, -0.8470916748046875, -0.8114013671875, -0.7757110595703125, -0.740020751953125, -0.7043304443359375, -0.66864013671875, -0.6329498291015625, -0.597259521484375, -0.5615692138671875, -0.52587890625, -0.4901885986328125, -0.454498291015625, -0.4188079833984375, -0.38311767578125, -0.3474273681640625, -0.311737060546875, -0.2760467529296875, -0.2403564453125, -0.2046661376953125, -0.168975830078125, -0.1332855224609375, -0.09759521484375, -0.0619049072265625, -0.026214599609375, 0.0094757080078125, 0.045166015625, 0.0808563232421875, 0.116546630859375, 0.1522369384765625, 0.18792724609375, 0.2236175537109375, 0.259307861328125, 0.2949981689453125, 0.3306884765625, 0.3663787841796875, 0.402069091796875, 0.4377593994140625, 0.47344970703125, 0.5091400146484375, 0.544830322265625, 0.5805206298828125, 0.6162109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 13.0, 10.0, 16.0, 22.0, 25.0, 31.0, 31.0, 36.0, 48.0, 68.0, 60.0, 58.0, 64.0, 59.0, 67.0, 57.0, 41.0, 48.0, 37.0, 37.0, 30.0, 24.0, 24.0, 17.0, 17.0, 18.0, 9.0, 6.0, 4.0, 1.0, 2.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.190185546875, -0.18519973754882812, -0.18021392822265625, -0.17522811889648438, -0.1702423095703125, -0.16525650024414062, -0.16027069091796875, -0.15528488159179688, -0.150299072265625, -0.14531326293945312, -0.14032745361328125, -0.13534164428710938, -0.1303558349609375, -0.12537002563476562, -0.12038421630859375, -0.11539840698242188, -0.11041259765625, -0.10542678833007812, -0.10044097900390625, -0.09545516967773438, -0.0904693603515625, -0.08548355102539062, -0.08049774169921875, -0.07551193237304688, -0.070526123046875, -0.06554031372070312, -0.06055450439453125, -0.055568695068359375, -0.0505828857421875, -0.045597076416015625, -0.04061126708984375, -0.035625457763671875, -0.0306396484375, -0.025653839111328125, -0.02066802978515625, -0.015682220458984375, -0.0106964111328125, -0.005710601806640625, -0.00072479248046875, 0.004261016845703125, 0.009246826171875, 0.014232635498046875, 0.01921844482421875, 0.024204254150390625, 0.0291900634765625, 0.034175872802734375, 0.03916168212890625, 0.044147491455078125, 0.04913330078125, 0.054119110107421875, 0.05910491943359375, 0.06409072875976562, 0.0690765380859375, 0.07406234741210938, 0.07904815673828125, 0.08403396606445312, 0.089019775390625, 0.09400558471679688, 0.09899139404296875, 0.10397720336914062, 0.1089630126953125, 0.11394882202148438, 0.11893463134765625, 0.12392044067382812, 0.12890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 7.0, 4.0, 17.0, 8.0, 27.0, 37.0, 81.0, 151.0, 473.0, 1499.0, 7927.0, 109590.0, 3974864.0, 90250.0, 7211.0, 1328.0, 427.0, 164.0, 71.0, 48.0, 24.0, 16.0, 16.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9541015625, -0.9286422729492188, -0.9031829833984375, -0.8777236938476562, -0.852264404296875, -0.8268051147460938, -0.8013458251953125, -0.7758865356445312, -0.75042724609375, -0.7249679565429688, -0.6995086669921875, -0.6740493774414062, -0.648590087890625, -0.6231307983398438, -0.5976715087890625, -0.5722122192382812, -0.5467529296875, -0.5212936401367188, -0.4958343505859375, -0.47037506103515625, -0.444915771484375, -0.41945648193359375, -0.3939971923828125, -0.36853790283203125, -0.34307861328125, -0.31761932373046875, -0.2921600341796875, -0.26670074462890625, -0.241241455078125, -0.21578216552734375, -0.1903228759765625, -0.16486358642578125, -0.139404296875, -0.11394500732421875, -0.0884857177734375, -0.06302642822265625, -0.037567138671875, -0.01210784912109375, 0.0133514404296875, 0.03881072998046875, 0.06427001953125, 0.08972930908203125, 0.1151885986328125, 0.14064788818359375, 0.166107177734375, 0.19156646728515625, 0.2170257568359375, 0.24248504638671875, 0.2679443359375, 0.29340362548828125, 0.3188629150390625, 0.34432220458984375, 0.369781494140625, 0.39524078369140625, 0.4207000732421875, 0.44615936279296875, 0.47161865234375, 0.49707794189453125, 0.5225372314453125, 0.5479965209960938, 0.573455810546875, 0.5989151000976562, 0.6243743896484375, 0.6498336791992188, 0.67529296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 5.0, 10.0, 6.0, 12.0, 21.0, 31.0, 33.0, 61.0, 102.0, 163.0, 335.0, 779.0, 1109.0, 749.0, 281.0, 134.0, 80.0, 36.0, 35.0, 29.0, 14.0, 4.0, 12.0, 9.0, 4.0, 5.0, 5.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.401611328125, -0.3863868713378906, -0.37116241455078125, -0.3559379577636719, -0.3407135009765625, -0.3254890441894531, -0.31026458740234375, -0.2950401306152344, -0.279815673828125, -0.2645912170410156, -0.24936676025390625, -0.23414230346679688, -0.2189178466796875, -0.20369338989257812, -0.18846893310546875, -0.17324447631835938, -0.15802001953125, -0.14279556274414062, -0.12757110595703125, -0.11234664916992188, -0.0971221923828125, -0.08189773559570312, -0.06667327880859375, -0.051448822021484375, -0.036224365234375, -0.020999908447265625, -0.00577545166015625, 0.009449005126953125, 0.0246734619140625, 0.039897918701171875, 0.05512237548828125, 0.07034683227539062, 0.0855712890625, 0.10079574584960938, 0.11602020263671875, 0.13124465942382812, 0.1464691162109375, 0.16169357299804688, 0.17691802978515625, 0.19214248657226562, 0.207366943359375, 0.22259140014648438, 0.23781585693359375, 0.2530403137207031, 0.2682647705078125, 0.2834892272949219, 0.29871368408203125, 0.3139381408691406, 0.32916259765625, 0.3443870544433594, 0.35961151123046875, 0.3748359680175781, 0.3900604248046875, 0.4052848815917969, 0.42050933837890625, 0.4357337951660156, 0.450958251953125, 0.4661827087402344, 0.48140716552734375, 0.4966316223144531, 0.5118560791015625, 0.5270805358886719, 0.5423049926757812, 0.5575294494628906, 0.57275390625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 7.0, 11.0, 25.0, 35.0, 68.0, 88.0, 101.0, 155.0, 148.0, 100.0, 111.0, 48.0, 32.0, 16.0, 12.0, 6.0, 8.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.008906126022339, -2.9259893894195557, -2.8430726528167725, -2.7601561546325684, -2.677239418029785, -2.594322681427002, -2.5114059448242188, -2.4284892082214355, -2.3455727100372314, -2.2626559734344482, -2.179739236831665, -2.096822738647461, -2.0139060020446777, -1.9309892654418945, -1.8480725288391113, -1.7651559114456177, -1.6822391748428345, -1.5993224382400513, -1.5164058208465576, -1.4334890842437744, -1.3505724668502808, -1.2676557302474976, -1.184739112854004, -1.1018223762512207, -1.0189056396484375, -0.9359889626502991, -0.8530722856521606, -0.7701555490493774, -0.6872389316558838, -0.6043221950531006, -0.5214055180549622, -0.43848884105682373, -0.3555722236633301, -0.27265554666519165, -0.18973885476589203, -0.10682216286659241, -0.02390548586845398, 0.05901119112968445, 0.14192789793014526, 0.2248445749282837, 0.3077612519264221, 0.39067792892456055, 0.473594605922699, 0.5565112829208374, 0.6394280195236206, 0.7223446369171143, 0.8052613735198975, 0.8881780505180359, 0.9710947275161743, 1.0540114641189575, 1.1369280815124512, 1.2198448181152344, 1.302761435508728, 1.3856781721115112, 1.4685947895050049, 1.551511526107788, 1.6344282627105713, 1.7173449993133545, 1.8002616167068481, 1.8831783533096313, 1.966094970703125, 2.049011707305908, 2.1319284439086914, 2.2148451805114746, 2.2977616786956787]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 5.0, 4.0, 9.0, 10.0, 11.0, 18.0, 21.0, 32.0, 17.0, 42.0, 39.0, 38.0, 50.0, 47.0, 48.0, 61.0, 57.0, 60.0, 54.0, 40.0, 51.0, 50.0, 39.0, 37.0, 24.0, 24.0, 16.0, 15.0, 15.0, 16.0, 12.0, 11.0, 6.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6852667331695557, -1.6285483837127686, -1.571829915046692, -1.5151115655899048, -1.4583932161331177, -1.401674747467041, -1.344956398010254, -1.2882380485534668, -1.2315196990966797, -1.1748013496398926, -1.118082880973816, -1.0613645315170288, -1.0046461820602417, -0.9479277729988098, -0.8912093639373779, -0.8344910144805908, -0.7777725458145142, -0.7210541367530823, -0.6643357872962952, -0.6076173782348633, -0.5508990287780762, -0.4941806197166443, -0.4374622106552124, -0.3807438313961029, -0.3240254521369934, -0.2673070728778839, -0.21058867871761322, -0.15387028455734253, -0.09715190529823303, -0.040433526039123535, 0.01628488302230835, 0.07300326228141785, 0.1297215223312378, 0.1864399015903473, 0.24315829575061798, 0.29987668991088867, 0.35659506916999817, 0.41331344842910767, 0.47003185749053955, 0.5267502069473267, 0.5834686160087585, 0.6401870250701904, 0.6969053745269775, 0.7536237835884094, 0.8103421926498413, 0.8670605421066284, 0.9237789511680603, 0.9804973602294922, 1.0372157096862793, 1.0939340591430664, 1.150652527809143, 1.2073708772659302, 1.2640892267227173, 1.320807695388794, 1.377526044845581, 1.4342443943023682, 1.4909627437591553, 1.5476810932159424, 1.604399561882019, 1.6611179113388062, 1.7178362607955933, 1.77455472946167, 1.831273078918457, 1.8879914283752441, 1.9447098970413208]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 11.0, 14.0, 21.0, 35.0, 76.0, 133.0, 224.0, 531.0, 1316.0, 4324.0, 21549.0, 315324.0, 652753.0, 42519.0, 6598.0, 1816.0, 633.0, 290.0, 139.0, 83.0, 50.0, 31.0, 17.0, 13.0, 7.0, 4.0, 6.0, 4.0, 8.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5156936645507812, -0.5001373291015625, -0.48458099365234375, -0.469024658203125, -0.45346832275390625, -0.4379119873046875, -0.42235565185546875, -0.40679931640625, -0.39124298095703125, -0.3756866455078125, -0.36013031005859375, -0.344573974609375, -0.32901763916015625, -0.3134613037109375, -0.29790496826171875, -0.2823486328125, -0.26679229736328125, -0.2512359619140625, -0.23567962646484375, -0.220123291015625, -0.20456695556640625, -0.1890106201171875, -0.17345428466796875, -0.15789794921875, -0.14234161376953125, -0.1267852783203125, -0.11122894287109375, -0.095672607421875, -0.08011627197265625, -0.0645599365234375, -0.04900360107421875, -0.033447265625, -0.01789093017578125, -0.0023345947265625, 0.01322174072265625, 0.028778076171875, 0.04433441162109375, 0.0598907470703125, 0.07544708251953125, 0.09100341796875, 0.10655975341796875, 0.1221160888671875, 0.13767242431640625, 0.153228759765625, 0.16878509521484375, 0.1843414306640625, 0.19989776611328125, 0.2154541015625, 0.23101043701171875, 0.2465667724609375, 0.26212310791015625, 0.277679443359375, 0.29323577880859375, 0.3087921142578125, 0.32434844970703125, 0.33990478515625, 0.35546112060546875, 0.3710174560546875, 0.38657379150390625, 0.402130126953125, 0.41768646240234375, 0.4332427978515625, 0.44879913330078125, 0.46435546875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 5.0, 3.0, 13.0, 12.0, 18.0, 18.0, 22.0, 31.0, 37.0, 34.0, 42.0, 36.0, 45.0, 45.0, 73.0, 47.0, 54.0, 53.0, 58.0, 42.0, 46.0, 43.0, 25.0, 41.0, 34.0, 32.0, 11.0, 20.0, 13.0, 15.0, 5.0, 5.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.183349609375, -0.1782855987548828, -0.17322158813476562, -0.16815757751464844, -0.16309356689453125, -0.15802955627441406, -0.15296554565429688, -0.1479015350341797, -0.1428375244140625, -0.1377735137939453, -0.13270950317382812, -0.12764549255371094, -0.12258148193359375, -0.11751747131347656, -0.11245346069335938, -0.10738945007324219, -0.102325439453125, -0.09726142883300781, -0.09219741821289062, -0.08713340759277344, -0.08206939697265625, -0.07700538635253906, -0.07194137573242188, -0.06687736511230469, -0.0618133544921875, -0.05674934387207031, -0.051685333251953125, -0.04662132263183594, -0.04155731201171875, -0.03649330139160156, -0.031429290771484375, -0.026365280151367188, -0.02130126953125, -0.016237258911132812, -0.011173248291015625, -0.0061092376708984375, -0.00104522705078125, 0.0040187835693359375, 0.009082794189453125, 0.014146804809570312, 0.0192108154296875, 0.024274826049804688, 0.029338836669921875, 0.03440284729003906, 0.03946685791015625, 0.04453086853027344, 0.049594879150390625, 0.05465888977050781, 0.059722900390625, 0.06478691101074219, 0.06985092163085938, 0.07491493225097656, 0.07997894287109375, 0.08504295349121094, 0.09010696411132812, 0.09517097473144531, 0.1002349853515625, 0.10529899597167969, 0.11036300659179688, 0.11542701721191406, 0.12049102783203125, 0.12555503845214844, 0.13061904907226562, 0.1356830596923828, 0.1407470703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 14.0, 14.0, 10.0, 22.0, 34.0, 66.0, 80.0, 151.0, 317.0, 636.0, 1737.0, 5617.0, 32652.0, 692174.0, 286468.0, 21605.0, 4326.0, 1439.0, 582.0, 250.0, 128.0, 72.0, 45.0, 40.0, 22.0, 22.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47998046875, -0.46337127685546875, -0.4467620849609375, -0.43015289306640625, -0.413543701171875, -0.39693450927734375, -0.3803253173828125, -0.36371612548828125, -0.34710693359375, -0.33049774169921875, -0.3138885498046875, -0.29727935791015625, -0.280670166015625, -0.26406097412109375, -0.2474517822265625, -0.23084259033203125, -0.2142333984375, -0.19762420654296875, -0.1810150146484375, -0.16440582275390625, -0.147796630859375, -0.13118743896484375, -0.1145782470703125, -0.09796905517578125, -0.08135986328125, -0.06475067138671875, -0.0481414794921875, -0.03153228759765625, -0.014923095703125, 0.00168609619140625, 0.0182952880859375, 0.03490447998046875, 0.051513671875, 0.06812286376953125, 0.0847320556640625, 0.10134124755859375, 0.117950439453125, 0.13455963134765625, 0.1511688232421875, 0.16777801513671875, 0.18438720703125, 0.20099639892578125, 0.2176055908203125, 0.23421478271484375, 0.250823974609375, 0.26743316650390625, 0.2840423583984375, 0.30065155029296875, 0.3172607421875, 0.33386993408203125, 0.3504791259765625, 0.36708831787109375, 0.383697509765625, 0.40030670166015625, 0.4169158935546875, 0.43352508544921875, 0.45013427734375, 0.46674346923828125, 0.4833526611328125, 0.49996185302734375, 0.516571044921875, 0.5331802368164062, 0.5497894287109375, 0.5663986206054688, 0.5830078125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 7.0, 7.0, 10.0, 14.0, 12.0, 22.0, 28.0, 20.0, 44.0, 32.0, 41.0, 44.0, 47.0, 80.0, 61.0, 80.0, 62.0, 65.0, 59.0, 47.0, 53.0, 37.0, 26.0, 24.0, 13.0, 12.0, 12.0, 9.0, 5.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.72607421875, -0.7041702270507812, -0.6822662353515625, -0.6603622436523438, -0.638458251953125, -0.6165542602539062, -0.5946502685546875, -0.5727462768554688, -0.55084228515625, -0.5289382934570312, -0.5070343017578125, -0.48513031005859375, -0.463226318359375, -0.44132232666015625, -0.4194183349609375, -0.39751434326171875, -0.3756103515625, -0.35370635986328125, -0.3318023681640625, -0.30989837646484375, -0.287994384765625, -0.26609039306640625, -0.2441864013671875, -0.22228240966796875, -0.20037841796875, -0.17847442626953125, -0.1565704345703125, -0.13466644287109375, -0.112762451171875, -0.09085845947265625, -0.0689544677734375, -0.04705047607421875, -0.025146484375, -0.00324249267578125, 0.0186614990234375, 0.04056549072265625, 0.062469482421875, 0.08437347412109375, 0.1062774658203125, 0.12818145751953125, 0.15008544921875, 0.17198944091796875, 0.1938934326171875, 0.21579742431640625, 0.237701416015625, 0.25960540771484375, 0.2815093994140625, 0.30341339111328125, 0.3253173828125, 0.34722137451171875, 0.3691253662109375, 0.39102935791015625, 0.412933349609375, 0.43483734130859375, 0.4567413330078125, 0.47864532470703125, 0.50054931640625, 0.5224533081054688, 0.5443572998046875, 0.5662612915039062, 0.588165283203125, 0.6100692749023438, 0.6319732666015625, 0.6538772583007812, 0.67578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 2.0, 1.0, 17.0, 24.0, 28.0, 36.0, 44.0, 65.0, 98.0, 181.0, 292.0, 443.0, 641.0, 1260.0, 2124.0, 3952.0, 7663.0, 17025.0, 44336.0, 149388.0, 618629.0, 130958.0, 39757.0, 15673.0, 7282.0, 3617.0, 2037.0, 1082.0, 656.0, 415.0, 259.0, 151.0, 107.0, 85.0, 63.0, 38.0, 26.0, 19.0, 16.0, 11.0, 6.0, 9.0, 9.0, 2.0, 6.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.097412109375, -0.09458446502685547, -0.09175682067871094, -0.0889291763305664, -0.08610153198242188, -0.08327388763427734, -0.08044624328613281, -0.07761859893798828, -0.07479095458984375, -0.07196331024169922, -0.06913566589355469, -0.06630802154541016, -0.06348037719726562, -0.060652732849121094, -0.05782508850097656, -0.05499744415283203, -0.0521697998046875, -0.04934215545654297, -0.04651451110839844, -0.043686866760253906, -0.040859222412109375, -0.038031578063964844, -0.03520393371582031, -0.03237628936767578, -0.02954864501953125, -0.02672100067138672, -0.023893356323242188, -0.021065711975097656, -0.018238067626953125, -0.015410423278808594, -0.012582778930664062, -0.009755134582519531, -0.006927490234375, -0.004099845886230469, -0.0012722015380859375, 0.0015554428100585938, 0.004383087158203125, 0.007210731506347656, 0.010038375854492188, 0.012866020202636719, 0.01569366455078125, 0.01852130889892578, 0.021348953247070312, 0.024176597595214844, 0.027004241943359375, 0.029831886291503906, 0.03265953063964844, 0.03548717498779297, 0.0383148193359375, 0.04114246368408203, 0.04397010803222656, 0.046797752380371094, 0.049625396728515625, 0.052453041076660156, 0.05528068542480469, 0.05810832977294922, 0.06093597412109375, 0.06376361846923828, 0.06659126281738281, 0.06941890716552734, 0.07224655151367188, 0.0750741958618164, 0.07790184020996094, 0.08072948455810547, 0.08355712890625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 9.0, 3.0, 4.0, 15.0, 9.0, 12.0, 36.0, 35.0, 32.0, 53.0, 66.0, 61.0, 82.0, 88.0, 83.0, 68.0, 66.0, 59.0, 48.0, 36.0, 23.0, 18.0, 21.0, 13.0, 13.0, 9.0, 5.0, 4.0, 4.0, 2.0, 7.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9577484130859375e-05, -3.8324855268001556e-05, -3.707222640514374e-05, -3.581959754228592e-05, -3.45669686794281e-05, -3.331433981657028e-05, -3.206171095371246e-05, -3.0809082090854645e-05, -2.9556453227996826e-05, -2.8303824365139008e-05, -2.705119550228119e-05, -2.579856663942337e-05, -2.4545937776565552e-05, -2.3293308913707733e-05, -2.2040680050849915e-05, -2.0788051187992096e-05, -1.9535422325134277e-05, -1.828279346227646e-05, -1.703016459941864e-05, -1.577753573656082e-05, -1.4524906873703003e-05, -1.3272278010845184e-05, -1.2019649147987366e-05, -1.0767020285129547e-05, -9.514391422271729e-06, -8.26176255941391e-06, -7.009133696556091e-06, -5.756504833698273e-06, -4.503875970840454e-06, -3.2512471079826355e-06, -1.998618245124817e-06, -7.459893822669983e-07, 5.066394805908203e-07, 1.759268343448639e-06, 3.0118972063064575e-06, 4.264526069164276e-06, 5.517154932022095e-06, 6.769783794879913e-06, 8.022412657737732e-06, 9.27504152059555e-06, 1.0527670383453369e-05, 1.1780299246311188e-05, 1.3032928109169006e-05, 1.4285556972026825e-05, 1.5538185834884644e-05, 1.6790814697742462e-05, 1.804344356060028e-05, 1.92960724234581e-05, 2.0548701286315918e-05, 2.1801330149173737e-05, 2.3053959012031555e-05, 2.4306587874889374e-05, 2.5559216737747192e-05, 2.681184560060501e-05, 2.806447446346283e-05, 2.9317103326320648e-05, 3.056973218917847e-05, 3.1822361052036285e-05, 3.3074989914894104e-05, 3.432761877775192e-05, 3.558024764060974e-05, 3.683287650346756e-05, 3.808550536632538e-05, 3.93381342291832e-05, 4.0590763092041016e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 6.0, 5.0, 11.0, 7.0, 13.0, 15.0, 23.0, 42.0, 50.0, 107.0, 129.0, 225.0, 413.0, 791.0, 1900.0, 5326.0, 18537.0, 95191.0, 758093.0, 133265.0, 23788.0, 6302.0, 2244.0, 979.0, 443.0, 245.0, 140.0, 79.0, 57.0, 36.0, 31.0, 25.0, 16.0, 6.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138671875, -0.1334552764892578, -0.12823867797851562, -0.12302207946777344, -0.11780548095703125, -0.11258888244628906, -0.10737228393554688, -0.10215568542480469, -0.0969390869140625, -0.09172248840332031, -0.08650588989257812, -0.08128929138183594, -0.07607269287109375, -0.07085609436035156, -0.06563949584960938, -0.06042289733886719, -0.055206298828125, -0.04998970031738281, -0.044773101806640625, -0.03955650329589844, -0.03433990478515625, -0.029123306274414062, -0.023906707763671875, -0.018690109252929688, -0.0134735107421875, -0.008256912231445312, -0.003040313720703125, 0.0021762847900390625, 0.00739288330078125, 0.012609481811523438, 0.017826080322265625, 0.023042678833007812, 0.02825927734375, 0.03347587585449219, 0.038692474365234375, 0.04390907287597656, 0.04912567138671875, 0.05434226989746094, 0.059558868408203125, 0.06477546691894531, 0.0699920654296875, 0.07520866394042969, 0.08042526245117188, 0.08564186096191406, 0.09085845947265625, 0.09607505798339844, 0.10129165649414062, 0.10650825500488281, 0.111724853515625, 0.11694145202636719, 0.12215805053710938, 0.12737464904785156, 0.13259124755859375, 0.13780784606933594, 0.14302444458007812, 0.1482410430908203, 0.1534576416015625, 0.1586742401123047, 0.16389083862304688, 0.16910743713378906, 0.17432403564453125, 0.17954063415527344, 0.18475723266601562, 0.1899738311767578, 0.1951904296875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 7.0, 4.0, 4.0, 1.0, 10.0, 9.0, 14.0, 15.0, 23.0, 36.0, 57.0, 58.0, 105.0, 136.0, 141.0, 117.0, 78.0, 52.0, 40.0, 25.0, 20.0, 12.0, 8.0, 5.0, 8.0, 8.0, 4.0, 3.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16943359375, -0.16381263732910156, -0.15819168090820312, -0.1525707244873047, -0.14694976806640625, -0.1413288116455078, -0.13570785522460938, -0.13008689880371094, -0.1244659423828125, -0.11884498596191406, -0.11322402954101562, -0.10760307312011719, -0.10198211669921875, -0.09636116027832031, -0.09074020385742188, -0.08511924743652344, -0.079498291015625, -0.07387733459472656, -0.06825637817382812, -0.06263542175292969, -0.05701446533203125, -0.05139350891113281, -0.045772552490234375, -0.04015159606933594, -0.0345306396484375, -0.028909683227539062, -0.023288726806640625, -0.017667770385742188, -0.01204681396484375, -0.0064258575439453125, -0.000804901123046875, 0.0048160552978515625, 0.01043701171875, 0.016057968139648438, 0.021678924560546875, 0.027299880981445312, 0.03292083740234375, 0.03854179382324219, 0.044162750244140625, 0.04978370666503906, 0.0554046630859375, 0.06102561950683594, 0.06664657592773438, 0.07226753234863281, 0.07788848876953125, 0.08350944519042969, 0.08913040161132812, 0.09475135803222656, 0.100372314453125, 0.10599327087402344, 0.11161422729492188, 0.11723518371582031, 0.12285614013671875, 0.1284770965576172, 0.13409805297851562, 0.13971900939941406, 0.1453399658203125, 0.15096092224121094, 0.15658187866210938, 0.1622028350830078, 0.16782379150390625, 0.1734447479248047, 0.17906570434570312, 0.18468666076660156, 0.1903076171875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 10.0, 17.0, 38.0, 85.0, 193.0, 364.0, 160.0, 72.0, 30.0, 8.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.349461555480957, -5.211082458496094, -5.072703838348389, -4.934324741363525, -4.79594612121582, -4.657567024230957, -4.519187927246094, -4.380809307098389, -4.242430210113525, -4.104051113128662, -3.965672492980957, -3.8272933959960938, -3.6889145374298096, -3.5505356788635254, -3.412156581878662, -3.273777723312378, -3.1353988647460938, -2.9970200061798096, -2.8586411476135254, -2.720262050628662, -2.581883192062378, -2.4435043334960938, -2.3051252365112305, -2.1667463779449463, -2.028367519378662, -1.889988660812378, -1.7516096830368042, -1.6132307052612305, -1.4748518466949463, -1.336472988128662, -1.1980940103530884, -1.0597150325775146, -0.9213364124298096, -0.7829574942588806, -0.6445785760879517, -0.5061996579170227, -0.36782073974609375, -0.2294418215751648, -0.09106290340423584, 0.047316014766693115, 0.18569493293762207, 0.324073851108551, 0.46245276927948, 0.6008316874504089, 0.7392106056213379, 0.8775895237922668, 1.0159684419631958, 1.1543474197387695, 1.2927262783050537, 1.431105136871338, 1.5694841146469116, 1.7078630924224854, 1.8462419509887695, 1.9846208095550537, 2.122999668121338, 2.261378765106201, 2.3997576236724854, 2.5381364822387695, 2.676515579223633, 2.814894437789917, 2.953273296356201, 3.0916521549224854, 3.2300310134887695, 3.368410110473633, 3.506788969039917]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 11.0, 13.0, 8.0, 16.0, 11.0, 20.0, 27.0, 24.0, 19.0, 24.0, 34.0, 29.0, 50.0, 61.0, 78.0, 79.0, 90.0, 55.0, 39.0, 42.0, 38.0, 34.0, 25.0, 29.0, 23.0, 15.0, 20.0, 10.0, 21.0, 14.0, 5.0, 8.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0966553688049316, -2.030437469482422, -1.9642198085784912, -1.898002028465271, -1.8317842483520508, -1.7655664682388306, -1.6993486881256104, -1.6331309080123901, -1.56691312789917, -1.5006953477859497, -1.4344775676727295, -1.3682597875595093, -1.302042007446289, -1.2358242273330688, -1.1696064472198486, -1.1033886671066284, -1.0371708869934082, -0.970953106880188, -0.9047353267669678, -0.8385175466537476, -0.7722997665405273, -0.7060819864273071, -0.6398642063140869, -0.5736464262008667, -0.5074286460876465, -0.44121086597442627, -0.37499308586120605, -0.30877530574798584, -0.24255752563476562, -0.1763397455215454, -0.1101219654083252, -0.04390418529510498, 0.022313594818115234, 0.08853137493133545, 0.15474915504455566, 0.22096693515777588, 0.2871847152709961, 0.3534024953842163, 0.4196202754974365, 0.48583805561065674, 0.552055835723877, 0.6182736158370972, 0.6844913959503174, 0.7507091760635376, 0.8169269561767578, 0.883144736289978, 0.9493625164031982, 1.0155802965164185, 1.0817980766296387, 1.1480158567428589, 1.214233636856079, 1.2804514169692993, 1.3466691970825195, 1.4128869771957397, 1.47910475730896, 1.5453225374221802, 1.6115403175354004, 1.6777580976486206, 1.7439758777618408, 1.810193657875061, 1.8764114379882812, 1.9426292181015015, 2.0088469982147217, 2.0750646591186523, 2.141282558441162]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 9.0, 5.0, 11.0, 19.0, 23.0, 45.0, 62.0, 213.0, 479.0, 1518.0, 7902.0, 136377.0, 3944172.0, 93801.0, 7283.0, 1603.0, 404.0, 173.0, 71.0, 37.0, 23.0, 13.0, 3.0, 8.0, 9.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.921875, -0.9011383056640625, -0.880401611328125, -0.8596649169921875, -0.83892822265625, -0.8181915283203125, -0.797454833984375, -0.7767181396484375, -0.7559814453125, -0.7352447509765625, -0.714508056640625, -0.6937713623046875, -0.67303466796875, -0.6522979736328125, -0.631561279296875, -0.6108245849609375, -0.590087890625, -0.5693511962890625, -0.548614501953125, -0.5278778076171875, -0.50714111328125, -0.4864044189453125, -0.465667724609375, -0.4449310302734375, -0.4241943359375, -0.4034576416015625, -0.382720947265625, -0.3619842529296875, -0.34124755859375, -0.3205108642578125, -0.299774169921875, -0.2790374755859375, -0.25830078125, -0.2375640869140625, -0.216827392578125, -0.1960906982421875, -0.17535400390625, -0.1546173095703125, -0.133880615234375, -0.1131439208984375, -0.0924072265625, -0.0716705322265625, -0.050933837890625, -0.0301971435546875, -0.00946044921875, 0.0112762451171875, 0.032012939453125, 0.0527496337890625, 0.073486328125, 0.0942230224609375, 0.114959716796875, 0.1356964111328125, 0.15643310546875, 0.1771697998046875, 0.197906494140625, 0.2186431884765625, 0.2393798828125, 0.2601165771484375, 0.280853271484375, 0.3015899658203125, 0.32232666015625, 0.3430633544921875, 0.363800048828125, 0.3845367431640625, 0.4052734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 9.0, 11.0, 11.0, 12.0, 18.0, 8.0, 18.0, 25.0, 32.0, 37.0, 46.0, 48.0, 48.0, 45.0, 53.0, 48.0, 57.0, 55.0, 45.0, 62.0, 41.0, 39.0, 36.0, 40.0, 40.0, 21.0, 21.0, 18.0, 11.0, 13.0, 11.0, 7.0, 8.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1820068359375, -0.1770172119140625, -0.172027587890625, -0.1670379638671875, -0.16204833984375, -0.1570587158203125, -0.152069091796875, -0.1470794677734375, -0.14208984375, -0.1371002197265625, -0.132110595703125, -0.1271209716796875, -0.12213134765625, -0.1171417236328125, -0.112152099609375, -0.1071624755859375, -0.1021728515625, -0.0971832275390625, -0.092193603515625, -0.0872039794921875, -0.08221435546875, -0.0772247314453125, -0.072235107421875, -0.0672454833984375, -0.062255859375, -0.0572662353515625, -0.052276611328125, -0.0472869873046875, -0.04229736328125, -0.0373077392578125, -0.032318115234375, -0.0273284912109375, -0.0223388671875, -0.0173492431640625, -0.012359619140625, -0.0073699951171875, -0.00238037109375, 0.0026092529296875, 0.007598876953125, 0.0125885009765625, 0.017578125, 0.0225677490234375, 0.027557373046875, 0.0325469970703125, 0.03753662109375, 0.0425262451171875, 0.047515869140625, 0.0525054931640625, 0.0574951171875, 0.0624847412109375, 0.067474365234375, 0.0724639892578125, 0.07745361328125, 0.0824432373046875, 0.087432861328125, 0.0924224853515625, 0.097412109375, 0.1024017333984375, 0.107391357421875, 0.1123809814453125, 0.11737060546875, 0.1223602294921875, 0.127349853515625, 0.1323394775390625, 0.1373291015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 1.0, 7.0, 8.0, 8.0, 11.0, 14.0, 28.0, 33.0, 49.0, 99.0, 223.0, 493.0, 1383.0, 4418.0, 19791.0, 206775.0, 3755449.0, 180731.0, 18127.0, 4280.0, 1320.0, 483.0, 209.0, 96.0, 74.0, 50.0, 28.0, 15.0, 13.0, 14.0, 12.0, 4.0, 5.0, 8.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.6103515625, -0.5936203002929688, -0.5768890380859375, -0.5601577758789062, -0.543426513671875, -0.5266952514648438, -0.5099639892578125, -0.49323272705078125, -0.47650146484375, -0.45977020263671875, -0.4430389404296875, -0.42630767822265625, -0.409576416015625, -0.39284515380859375, -0.3761138916015625, -0.35938262939453125, -0.3426513671875, -0.32592010498046875, -0.3091888427734375, -0.29245758056640625, -0.275726318359375, -0.25899505615234375, -0.2422637939453125, -0.22553253173828125, -0.20880126953125, -0.19207000732421875, -0.1753387451171875, -0.15860748291015625, -0.141876220703125, -0.12514495849609375, -0.1084136962890625, -0.09168243408203125, -0.074951171875, -0.05821990966796875, -0.0414886474609375, -0.02475738525390625, -0.008026123046875, 0.00870513916015625, 0.0254364013671875, 0.04216766357421875, 0.05889892578125, 0.07563018798828125, 0.0923614501953125, 0.10909271240234375, 0.125823974609375, 0.14255523681640625, 0.1592864990234375, 0.17601776123046875, 0.1927490234375, 0.20948028564453125, 0.2262115478515625, 0.24294281005859375, 0.259674072265625, 0.27640533447265625, 0.2931365966796875, 0.30986785888671875, 0.32659912109375, 0.34333038330078125, 0.3600616455078125, 0.37679290771484375, 0.393524169921875, 0.41025543212890625, 0.4269866943359375, 0.44371795654296875, 0.46044921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 14.0, 8.0, 16.0, 23.0, 27.0, 39.0, 61.0, 73.0, 98.0, 204.0, 298.0, 515.0, 738.0, 673.0, 451.0, 290.0, 159.0, 106.0, 72.0, 44.0, 34.0, 29.0, 21.0, 9.0, 9.0, 4.0, 4.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.279296875, -0.2688941955566406, -0.25849151611328125, -0.24808883666992188, -0.2376861572265625, -0.22728347778320312, -0.21688079833984375, -0.20647811889648438, -0.196075439453125, -0.18567276000976562, -0.17527008056640625, -0.16486740112304688, -0.1544647216796875, -0.14406204223632812, -0.13365936279296875, -0.12325668334960938, -0.11285400390625, -0.10245132446289062, -0.09204864501953125, -0.08164596557617188, -0.0712432861328125, -0.060840606689453125, -0.05043792724609375, -0.040035247802734375, -0.029632568359375, -0.019229888916015625, -0.00882720947265625, 0.001575469970703125, 0.0119781494140625, 0.022380828857421875, 0.03278350830078125, 0.043186187744140625, 0.0535888671875, 0.06399154663085938, 0.07439422607421875, 0.08479690551757812, 0.0951995849609375, 0.10560226440429688, 0.11600494384765625, 0.12640762329101562, 0.136810302734375, 0.14721298217773438, 0.15761566162109375, 0.16801834106445312, 0.1784210205078125, 0.18882369995117188, 0.19922637939453125, 0.20962905883789062, 0.22003173828125, 0.23043441772460938, 0.24083709716796875, 0.2512397766113281, 0.2616424560546875, 0.2720451354980469, 0.28244781494140625, 0.2928504943847656, 0.303253173828125, 0.3136558532714844, 0.32405853271484375, 0.3344612121582031, 0.3448638916015625, 0.3552665710449219, 0.36566925048828125, 0.3760719299316406, 0.386474609375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 12.0, 22.0, 50.0, 118.0, 201.0, 277.0, 181.0, 78.0, 29.0, 11.0, 12.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2776670455932617, -3.1167852878570557, -2.9559032917022705, -2.7950215339660645, -2.6341397762298584, -2.4732580184936523, -2.312376022338867, -2.151494264602661, -1.9906123876571655, -1.82973051071167, -1.6688487529754639, -1.5079668760299683, -1.3470849990844727, -1.1862032413482666, -1.025321364402771, -0.8644396066665649, -0.7035577297210693, -0.5426759123802185, -0.3817940652370453, -0.22091221809387207, -0.06003040075302124, 0.10085141658782959, 0.2617332935333252, 0.42261505126953125, 0.5834969282150269, 0.7443787455558777, 0.9052605628967285, 1.0661424398422241, 1.2270243167877197, 1.3879060745239258, 1.5487879514694214, 1.7096697092056274, 1.870551586151123, 2.031433343887329, 2.1923153400421143, 2.3531970977783203, 2.5140788555145264, 2.6749606132507324, 2.8358426094055176, 2.9967243671417236, 3.1576061248779297, 3.3184878826141357, 3.479369878768921, 3.640251636505127, 3.801133394241333, 3.962015151977539, 4.122897148132324, 4.283779144287109, 4.4446611404418945, 4.60554313659668, 4.766424655914307, 4.927306652069092, 5.088188648223877, 5.249070167541504, 5.409952163696289, 5.570834159851074, 5.731715679168701, 5.892597675323486, 6.053479194641113, 6.214361190795898, 6.375243186950684, 6.5361247062683105, 6.697006702423096, 6.857888221740723, 7.018770217895508]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 8.0, 6.0, 11.0, 11.0, 26.0, 21.0, 27.0, 41.0, 53.0, 38.0, 40.0, 65.0, 67.0, 65.0, 87.0, 67.0, 56.0, 46.0, 48.0, 31.0, 44.0, 28.0, 23.0, 19.0, 17.0, 15.0, 13.0, 5.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.068406581878662, -2.000345230102539, -1.9322841167449951, -1.8642228841781616, -1.7961616516113281, -1.728100299835205, -1.6600390672683716, -1.591977834701538, -1.5239166021347046, -1.455855369567871, -1.3877941370010376, -1.319732904434204, -1.251671552658081, -1.183610439300537, -1.115549087524414, -1.0474878549575806, -0.9794266223907471, -0.9113653898239136, -0.8433041572570801, -0.7752428650856018, -0.7071816325187683, -0.6391203999519348, -0.5710591077804565, -0.502997875213623, -0.43493664264678955, -0.36687541007995605, -0.29881414771080017, -0.23075290024280548, -0.1626916527748108, -0.0946304202079773, -0.02656915783882141, 0.04149210453033447, 0.10955333709716797, 0.17761458456516266, 0.24567583203315735, 0.31373709440231323, 0.38179832696914673, 0.4498595595359802, 0.5179208517074585, 0.585982084274292, 0.6540433168411255, 0.722104549407959, 0.7901657819747925, 0.8582270741462708, 0.9262883067131042, 0.9943495392799377, 1.062410831451416, 1.1304720640182495, 1.198533296585083, 1.2665945291519165, 1.33465576171875, 1.4027169942855835, 1.470778226852417, 1.53883957862854, 1.6069008111953735, 1.674962043762207, 1.7430232763290405, 1.811084508895874, 1.8791457414627075, 1.947206974029541, 2.015268325805664, 2.083329439163208, 2.151390790939331, 2.219451904296875, 2.287513256072998]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 16.0, 14.0, 29.0, 25.0, 56.0, 79.0, 133.0, 164.0, 280.0, 504.0, 896.0, 1819.0, 4208.0, 10501.0, 31366.0, 116795.0, 483676.0, 297584.0, 66905.0, 20148.0, 7196.0, 2978.0, 1387.0, 680.0, 404.0, 242.0, 141.0, 95.0, 70.0, 43.0, 36.0, 21.0, 17.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2425537109375, -0.2341327667236328, -0.22571182250976562, -0.21729087829589844, -0.20886993408203125, -0.20044898986816406, -0.19202804565429688, -0.1836071014404297, -0.1751861572265625, -0.1667652130126953, -0.15834426879882812, -0.14992332458496094, -0.14150238037109375, -0.13308143615722656, -0.12466049194335938, -0.11623954772949219, -0.107818603515625, -0.09939765930175781, -0.09097671508789062, -0.08255577087402344, -0.07413482666015625, -0.06571388244628906, -0.057292938232421875, -0.04887199401855469, -0.0404510498046875, -0.03203010559082031, -0.023609161376953125, -0.015188217163085938, -0.00676727294921875, 0.0016536712646484375, 0.010074615478515625, 0.018495559692382812, 0.02691650390625, 0.03533744812011719, 0.043758392333984375, 0.05217933654785156, 0.06060028076171875, 0.06902122497558594, 0.07744216918945312, 0.08586311340332031, 0.0942840576171875, 0.10270500183105469, 0.11112594604492188, 0.11954689025878906, 0.12796783447265625, 0.13638877868652344, 0.14480972290039062, 0.1532306671142578, 0.161651611328125, 0.1700725555419922, 0.17849349975585938, 0.18691444396972656, 0.19533538818359375, 0.20375633239746094, 0.21217727661132812, 0.2205982208251953, 0.2290191650390625, 0.2374401092529297, 0.24586105346679688, 0.25428199768066406, 0.26270294189453125, 0.27112388610839844, 0.2795448303222656, 0.2879657745361328, 0.29638671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 14.0, 14.0, 14.0, 27.0, 36.0, 33.0, 42.0, 53.0, 54.0, 59.0, 70.0, 79.0, 65.0, 55.0, 63.0, 51.0, 40.0, 36.0, 56.0, 34.0, 19.0, 27.0, 17.0, 9.0, 13.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1351318359375, -0.1284351348876953, -0.12173843383789062, -0.11504173278808594, -0.10834503173828125, -0.10164833068847656, -0.09495162963867188, -0.08825492858886719, -0.0815582275390625, -0.07486152648925781, -0.06816482543945312, -0.06146812438964844, -0.05477142333984375, -0.04807472229003906, -0.041378021240234375, -0.03468132019042969, -0.027984619140625, -0.021287918090820312, -0.014591217041015625, -0.007894515991210938, -0.00119781494140625, 0.0054988861083984375, 0.012195587158203125, 0.018892288208007812, 0.0255889892578125, 0.03228569030761719, 0.038982391357421875, 0.04567909240722656, 0.05237579345703125, 0.05907249450683594, 0.06576919555664062, 0.07246589660644531, 0.07916259765625, 0.08585929870605469, 0.09255599975585938, 0.09925270080566406, 0.10594940185546875, 0.11264610290527344, 0.11934280395507812, 0.1260395050048828, 0.1327362060546875, 0.1394329071044922, 0.14612960815429688, 0.15282630920410156, 0.15952301025390625, 0.16621971130371094, 0.17291641235351562, 0.1796131134033203, 0.186309814453125, 0.1930065155029297, 0.19970321655273438, 0.20639991760253906, 0.21309661865234375, 0.21979331970214844, 0.22649002075195312, 0.2331867218017578, 0.2398834228515625, 0.2465801239013672, 0.2532768249511719, 0.25997352600097656, 0.26667022705078125, 0.27336692810058594, 0.2800636291503906, 0.2867603302001953, 0.29345703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 10.0, 18.0, 24.0, 33.0, 56.0, 77.0, 122.0, 251.0, 482.0, 1176.0, 4167.0, 23935.0, 748545.0, 249386.0, 15286.0, 3045.0, 967.0, 434.0, 208.0, 120.0, 82.0, 39.0, 27.0, 17.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.88916015625, -0.8684310913085938, -0.8477020263671875, -0.8269729614257812, -0.806243896484375, -0.7855148315429688, -0.7647857666015625, -0.7440567016601562, -0.72332763671875, -0.7025985717773438, -0.6818695068359375, -0.6611404418945312, -0.640411376953125, -0.6196823120117188, -0.5989532470703125, -0.5782241821289062, -0.5574951171875, -0.5367660522460938, -0.5160369873046875, -0.49530792236328125, -0.474578857421875, -0.45384979248046875, -0.4331207275390625, -0.41239166259765625, -0.39166259765625, -0.37093353271484375, -0.3502044677734375, -0.32947540283203125, -0.308746337890625, -0.28801727294921875, -0.2672882080078125, -0.24655914306640625, -0.225830078125, -0.20510101318359375, -0.1843719482421875, -0.16364288330078125, -0.142913818359375, -0.12218475341796875, -0.1014556884765625, -0.08072662353515625, -0.05999755859375, -0.03926849365234375, -0.0185394287109375, 0.00218963623046875, 0.022918701171875, 0.04364776611328125, 0.0643768310546875, 0.08510589599609375, 0.1058349609375, 0.12656402587890625, 0.1472930908203125, 0.16802215576171875, 0.188751220703125, 0.20948028564453125, 0.2302093505859375, 0.25093841552734375, 0.27166748046875, 0.29239654541015625, 0.3131256103515625, 0.33385467529296875, 0.354583740234375, 0.37531280517578125, 0.3960418701171875, 0.41677093505859375, 0.4375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 9.0, 6.0, 7.0, 10.0, 11.0, 8.0, 17.0, 22.0, 31.0, 38.0, 59.0, 57.0, 67.0, 90.0, 88.0, 86.0, 79.0, 58.0, 53.0, 56.0, 38.0, 26.0, 22.0, 19.0, 13.0, 8.0, 3.0, 7.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.1796875, -1.150115966796875, -1.12054443359375, -1.090972900390625, -1.0614013671875, -1.031829833984375, -1.00225830078125, -0.972686767578125, -0.943115234375, -0.913543701171875, -0.88397216796875, -0.854400634765625, -0.8248291015625, -0.795257568359375, -0.76568603515625, -0.736114501953125, -0.70654296875, -0.676971435546875, -0.64739990234375, -0.617828369140625, -0.5882568359375, -0.558685302734375, -0.52911376953125, -0.499542236328125, -0.469970703125, -0.440399169921875, -0.41082763671875, -0.381256103515625, -0.3516845703125, -0.322113037109375, -0.29254150390625, -0.262969970703125, -0.2333984375, -0.203826904296875, -0.17425537109375, -0.144683837890625, -0.1151123046875, -0.085540771484375, -0.05596923828125, -0.026397705078125, 0.003173828125, 0.032745361328125, 0.06231689453125, 0.091888427734375, 0.1214599609375, 0.151031494140625, 0.18060302734375, 0.210174560546875, 0.23974609375, 0.269317626953125, 0.29888916015625, 0.328460693359375, 0.3580322265625, 0.387603759765625, 0.41717529296875, 0.446746826171875, 0.476318359375, 0.505889892578125, 0.53546142578125, 0.565032958984375, 0.5946044921875, 0.624176025390625, 0.65374755859375, 0.683319091796875, 0.712890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 10.0, 17.0, 26.0, 58.0, 275.0, 2373.0, 415102.0, 627903.0, 2364.0, 277.0, 73.0, 34.0, 10.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5927734375, -0.5753402709960938, -0.5579071044921875, -0.5404739379882812, -0.523040771484375, -0.5056076049804688, -0.4881744384765625, -0.47074127197265625, -0.45330810546875, -0.43587493896484375, -0.4184417724609375, -0.40100860595703125, -0.383575439453125, -0.36614227294921875, -0.3487091064453125, -0.33127593994140625, -0.3138427734375, -0.29640960693359375, -0.2789764404296875, -0.26154327392578125, -0.244110107421875, -0.22667694091796875, -0.2092437744140625, -0.19181060791015625, -0.17437744140625, -0.15694427490234375, -0.1395111083984375, -0.12207794189453125, -0.104644775390625, -0.08721160888671875, -0.0697784423828125, -0.05234527587890625, -0.034912109375, -0.01747894287109375, -4.57763671875e-05, 0.01738739013671875, 0.034820556640625, 0.05225372314453125, 0.0696868896484375, 0.08712005615234375, 0.10455322265625, 0.12198638916015625, 0.1394195556640625, 0.15685272216796875, 0.174285888671875, 0.19171905517578125, 0.2091522216796875, 0.22658538818359375, 0.2440185546875, 0.26145172119140625, 0.2788848876953125, 0.29631805419921875, 0.313751220703125, 0.33118438720703125, 0.3486175537109375, 0.36605072021484375, 0.38348388671875, 0.40091705322265625, 0.4183502197265625, 0.43578338623046875, 0.453216552734375, 0.47064971923828125, 0.4880828857421875, 0.5055160522460938, 0.52294921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 7.0, 5.0, 11.0, 17.0, 5.0, 16.0, 16.0, 31.0, 35.0, 46.0, 63.0, 94.0, 103.0, 109.0, 105.0, 92.0, 52.0, 50.0, 40.0, 16.0, 17.0, 20.0, 13.0, 9.0, 6.0, 6.0, 4.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.941225051879883e-05, -4.772935062646866e-05, -4.604645073413849e-05, -4.436355084180832e-05, -4.268065094947815e-05, -4.099775105714798e-05, -3.931485116481781e-05, -3.763195127248764e-05, -3.594905138015747e-05, -3.42661514878273e-05, -3.258325159549713e-05, -3.090035170316696e-05, -2.9217451810836792e-05, -2.7534551918506622e-05, -2.5851652026176453e-05, -2.4168752133846283e-05, -2.2485852241516113e-05, -2.0802952349185944e-05, -1.9120052456855774e-05, -1.7437152564525604e-05, -1.5754252672195435e-05, -1.4071352779865265e-05, -1.2388452887535095e-05, -1.0705552995204926e-05, -9.022653102874756e-06, -7.339753210544586e-06, -5.6568533182144165e-06, -3.973953425884247e-06, -2.291053533554077e-06, -6.081536412239075e-07, 1.0747462511062622e-06, 2.757646143436432e-06, 4.4405460357666016e-06, 6.123445928096771e-06, 7.806345820426941e-06, 9.48924571275711e-06, 1.117214560508728e-05, 1.285504549741745e-05, 1.453794538974762e-05, 1.622084528207779e-05, 1.790374517440796e-05, 1.958664506673813e-05, 2.12695449590683e-05, 2.2952444851398468e-05, 2.4635344743728638e-05, 2.6318244636058807e-05, 2.8001144528388977e-05, 2.9684044420719147e-05, 3.1366944313049316e-05, 3.3049844205379486e-05, 3.4732744097709656e-05, 3.6415643990039825e-05, 3.8098543882369995e-05, 3.9781443774700165e-05, 4.1464343667030334e-05, 4.3147243559360504e-05, 4.4830143451690674e-05, 4.6513043344020844e-05, 4.819594323635101e-05, 4.987884312868118e-05, 5.156174302101135e-05, 5.324464291334152e-05, 5.492754280567169e-05, 5.661044269800186e-05, 5.829334259033203e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 6.0, 6.0, 4.0, 7.0, 9.0, 16.0, 18.0, 20.0, 28.0, 48.0, 62.0, 97.0, 153.0, 279.0, 494.0, 1066.0, 2439.0, 7236.0, 28870.0, 219070.0, 719945.0, 51560.0, 10816.0, 3440.0, 1377.0, 617.0, 373.0, 182.0, 98.0, 60.0, 33.0, 20.0, 23.0, 19.0, 16.0, 11.0, 6.0, 17.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.164794921875, -0.15982627868652344, -0.15485763549804688, -0.1498889923095703, -0.14492034912109375, -0.1399517059326172, -0.13498306274414062, -0.13001441955566406, -0.1250457763671875, -0.12007713317871094, -0.11510848999023438, -0.11013984680175781, -0.10517120361328125, -0.10020256042480469, -0.09523391723632812, -0.09026527404785156, -0.085296630859375, -0.08032798767089844, -0.07535934448242188, -0.07039070129394531, -0.06542205810546875, -0.06045341491699219, -0.055484771728515625, -0.05051612854003906, -0.0455474853515625, -0.04057884216308594, -0.035610198974609375, -0.030641555786132812, -0.02567291259765625, -0.020704269409179688, -0.015735626220703125, -0.010766983032226562, -0.00579833984375, -0.0008296966552734375, 0.004138946533203125, 0.009107589721679688, 0.01407623291015625, 0.019044876098632812, 0.024013519287109375, 0.028982162475585938, 0.0339508056640625, 0.03891944885253906, 0.043888092041015625, 0.04885673522949219, 0.05382537841796875, 0.05879402160644531, 0.06376266479492188, 0.06873130798339844, 0.073699951171875, 0.07866859436035156, 0.08363723754882812, 0.08860588073730469, 0.09357452392578125, 0.09854316711425781, 0.10351181030273438, 0.10848045349121094, 0.1134490966796875, 0.11841773986816406, 0.12338638305664062, 0.1283550262451172, 0.13332366943359375, 0.1382923126220703, 0.14326095581054688, 0.14822959899902344, 0.1531982421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 10.0, 12.0, 20.0, 26.0, 27.0, 50.0, 67.0, 108.0, 124.0, 119.0, 126.0, 94.0, 65.0, 48.0, 16.0, 14.0, 19.0, 9.0, 6.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1802978515625, -0.1741485595703125, -0.167999267578125, -0.1618499755859375, -0.15570068359375, -0.1495513916015625, -0.143402099609375, -0.1372528076171875, -0.131103515625, -0.1249542236328125, -0.118804931640625, -0.1126556396484375, -0.10650634765625, -0.1003570556640625, -0.094207763671875, -0.0880584716796875, -0.0819091796875, -0.0757598876953125, -0.069610595703125, -0.0634613037109375, -0.05731201171875, -0.0511627197265625, -0.045013427734375, -0.0388641357421875, -0.03271484375, -0.0265655517578125, -0.020416259765625, -0.0142669677734375, -0.00811767578125, -0.0019683837890625, 0.004180908203125, 0.0103302001953125, 0.0164794921875, 0.0226287841796875, 0.028778076171875, 0.0349273681640625, 0.04107666015625, 0.0472259521484375, 0.053375244140625, 0.0595245361328125, 0.065673828125, 0.0718231201171875, 0.077972412109375, 0.0841217041015625, 0.09027099609375, 0.0964202880859375, 0.102569580078125, 0.1087188720703125, 0.1148681640625, 0.1210174560546875, 0.127166748046875, 0.1333160400390625, 0.13946533203125, 0.1456146240234375, 0.151763916015625, 0.1579132080078125, 0.1640625, 0.1702117919921875, 0.176361083984375, 0.1825103759765625, 0.18865966796875, 0.1948089599609375, 0.200958251953125, 0.2071075439453125, 0.2132568359375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 9.0, 74.0, 799.0, 118.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.703781127929688, -29.13824462890625, -28.57270622253418, -28.007169723510742, -27.441633224487305, -26.876094818115234, -26.310558319091797, -25.74502182006836, -25.179485321044922, -24.613948822021484, -24.048410415649414, -23.482873916625977, -22.91733741760254, -22.35179901123047, -21.78626251220703, -21.220726013183594, -20.655187606811523, -20.089651107788086, -19.524112701416016, -18.958576202392578, -18.39303970336914, -17.827503204345703, -17.261964797973633, -16.696428298950195, -16.130889892578125, -15.565352439880371, -14.999815940856934, -14.43427848815918, -13.868741989135742, -13.303204536437988, -12.737667083740234, -12.172130584716797, -11.60659408569336, -11.041056632995605, -10.475520133972168, -9.909982681274414, -9.344446182250977, -8.778908729553223, -8.213371276855469, -7.647834300994873, -7.082297325134277, -6.516760349273682, -5.951223373413086, -5.385685920715332, -4.820148944854736, -4.254611968994141, -3.689074754714966, -3.123537540435791, -2.5580005645751953, -1.99246346950531, -1.4269263744354248, -0.8613892793655396, -0.2958521842956543, 0.2696847915649414, 0.8352220058441162, 1.400759220123291, 1.9662961959838867, 2.5318331718444824, 3.0973703861236572, 3.662907600402832, 4.228444576263428, 4.793981552124023, 5.359519004821777, 5.925055980682373, 6.490592956542969]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 11.0, 12.0, 16.0, 23.0, 40.0, 41.0, 54.0, 74.0, 105.0, 194.0, 127.0, 65.0, 60.0, 43.0, 41.0, 36.0, 23.0, 14.0, 7.0, 5.0, 3.0, 6.0, 5.0, 4.0], "bins": [-7.6267619132995605, -7.473153114318848, -7.319544792175293, -7.16593599319458, -7.012327194213867, -6.858718395233154, -6.7051100730896, -6.551501274108887, -6.397892475128174, -6.244283676147461, -6.090675354003906, -5.937066555023193, -5.7834577560424805, -5.629848957061768, -5.476240634918213, -5.3226318359375, -5.169023513793945, -5.015414714813232, -4.861806392669678, -4.708197593688965, -4.554588794708252, -4.400979995727539, -4.247371673583984, -4.0937628746032715, -3.9401540756225586, -3.786545515060425, -3.632936716079712, -3.479328155517578, -3.3257193565368652, -3.1721107959747314, -3.0185022354125977, -2.8648934364318848, -2.7112843990325928, -2.557675838470459, -2.404067039489746, -2.2504584789276123, -2.0968496799468994, -1.9432411193847656, -1.7896324396133423, -1.636023759841919, -1.4824150800704956, -1.3288064002990723, -1.175197720527649, -1.0215890407562256, -0.867980420589447, -0.7143717408180237, -0.5607631206512451, -0.4071544408798218, -0.25354576110839844, -0.09993709623813629, 0.053671568632125854, 0.2072802186012268, 0.36088889837265015, 0.5144975781440735, 0.668106198310852, 0.8217148780822754, 0.9753235578536987, 1.128932237625122, 1.2825409173965454, 1.4361495971679688, 1.5897581577301025, 1.7433669567108154, 1.8969755172729492, 2.050584316253662, 2.204192876815796]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 6.0, 8.0, 20.0, 25.0, 50.0, 109.0, 260.0, 939.0, 6688.0, 494677.0, 3666748.0, 21429.0, 2633.0, 456.0, 127.0, 58.0, 20.0, 9.0, 8.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.142578125, -2.0990219116210938, -2.0554656982421875, -2.0119094848632812, -1.968353271484375, -1.9247970581054688, -1.8812408447265625, -1.8376846313476562, -1.79412841796875, -1.7505722045898438, -1.7070159912109375, -1.6634597778320312, -1.619903564453125, -1.5763473510742188, -1.5327911376953125, -1.4892349243164062, -1.4456787109375, -1.4021224975585938, -1.3585662841796875, -1.3150100708007812, -1.271453857421875, -1.2278976440429688, -1.1843414306640625, -1.1407852172851562, -1.09722900390625, -1.0536727905273438, -1.0101165771484375, -0.9665603637695312, -0.923004150390625, -0.8794479370117188, -0.8358917236328125, -0.7923355102539062, -0.748779296875, -0.7052230834960938, -0.6616668701171875, -0.6181106567382812, -0.574554443359375, -0.5309982299804688, -0.4874420166015625, -0.44388580322265625, -0.40032958984375, -0.35677337646484375, -0.3132171630859375, -0.26966094970703125, -0.226104736328125, -0.18254852294921875, -0.1389923095703125, -0.09543609619140625, -0.0518798828125, -0.00832366943359375, 0.0352325439453125, 0.07878875732421875, 0.122344970703125, 0.16590118408203125, 0.2094573974609375, 0.25301361083984375, 0.29656982421875, 0.34012603759765625, 0.3836822509765625, 0.42723846435546875, 0.470794677734375, 0.5143508911132812, 0.5579071044921875, 0.6014633178710938, 0.64501953125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 11.0, 29.0, 48.0, 56.0, 68.0, 117.0, 111.0, 118.0, 133.0, 93.0, 73.0, 59.0, 41.0, 21.0, 15.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.61328125, -0.6011180877685547, -0.5889549255371094, -0.5767917633056641, -0.5646286010742188, -0.5524654388427734, -0.5403022766113281, -0.5281391143798828, -0.5159759521484375, -0.5038127899169922, -0.4916496276855469, -0.47948646545410156, -0.46732330322265625, -0.45516014099121094, -0.4429969787597656, -0.4308338165283203, -0.418670654296875, -0.4065074920654297, -0.3943443298339844, -0.38218116760253906, -0.37001800537109375, -0.35785484313964844, -0.3456916809082031, -0.3335285186767578, -0.3213653564453125, -0.3092021942138672, -0.2970390319824219, -0.28487586975097656, -0.27271270751953125, -0.26054954528808594, -0.24838638305664062, -0.2362232208251953, -0.22406005859375, -0.2118968963623047, -0.19973373413085938, -0.18757057189941406, -0.17540740966796875, -0.16324424743652344, -0.15108108520507812, -0.1389179229736328, -0.1267547607421875, -0.11459159851074219, -0.10242843627929688, -0.09026527404785156, -0.07810211181640625, -0.06593894958496094, -0.053775787353515625, -0.04161262512207031, -0.029449462890625, -0.017286300659179688, -0.005123138427734375, 0.0070400238037109375, 0.01920318603515625, 0.03136634826660156, 0.043529510498046875, 0.05569267272949219, 0.0678558349609375, 0.08001899719238281, 0.09218215942382812, 0.10434532165527344, 0.11650848388671875, 0.12867164611816406, 0.14083480834960938, 0.1529979705810547, 0.1651611328125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 10.0, 8.0, 14.0, 18.0, 32.0, 58.0, 77.0, 146.0, 271.0, 616.0, 1827.0, 8998.0, 444939.0, 3713408.0, 19295.0, 2777.0, 920.0, 351.0, 211.0, 104.0, 55.0, 46.0, 31.0, 16.0, 11.0, 8.0, 9.0, 8.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3330078125, -1.28729248046875, -1.2415771484375, -1.19586181640625, -1.150146484375, -1.10443115234375, -1.0587158203125, -1.01300048828125, -0.96728515625, -0.92156982421875, -0.8758544921875, -0.83013916015625, -0.784423828125, -0.73870849609375, -0.6929931640625, -0.64727783203125, -0.6015625, -0.55584716796875, -0.5101318359375, -0.46441650390625, -0.418701171875, -0.37298583984375, -0.3272705078125, -0.28155517578125, -0.23583984375, -0.19012451171875, -0.1444091796875, -0.09869384765625, -0.052978515625, -0.00726318359375, 0.0384521484375, 0.08416748046875, 0.1298828125, 0.17559814453125, 0.2213134765625, 0.26702880859375, 0.312744140625, 0.35845947265625, 0.4041748046875, 0.44989013671875, 0.49560546875, 0.54132080078125, 0.5870361328125, 0.63275146484375, 0.678466796875, 0.72418212890625, 0.7698974609375, 0.81561279296875, 0.861328125, 0.90704345703125, 0.9527587890625, 0.99847412109375, 1.044189453125, 1.08990478515625, 1.1356201171875, 1.18133544921875, 1.22705078125, 1.27276611328125, 1.3184814453125, 1.36419677734375, 1.409912109375, 1.45562744140625, 1.5013427734375, 1.54705810546875, 1.5927734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 12.0, 9.0, 19.0, 19.0, 38.0, 56.0, 53.0, 88.0, 129.0, 201.0, 315.0, 439.0, 605.0, 660.0, 469.0, 298.0, 221.0, 140.0, 81.0, 75.0, 26.0, 26.0, 18.0, 13.0, 13.0, 11.0, 6.0, 2.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.476806640625, -0.4585380554199219, -0.44026947021484375, -0.4220008850097656, -0.4037322998046875, -0.3854637145996094, -0.36719512939453125, -0.3489265441894531, -0.330657958984375, -0.3123893737792969, -0.29412078857421875, -0.2758522033691406, -0.2575836181640625, -0.23931503295898438, -0.22104644775390625, -0.20277786254882812, -0.18450927734375, -0.16624069213867188, -0.14797210693359375, -0.12970352172851562, -0.1114349365234375, -0.09316635131835938, -0.07489776611328125, -0.056629180908203125, -0.038360595703125, -0.020092010498046875, -0.00182342529296875, 0.016445159912109375, 0.0347137451171875, 0.052982330322265625, 0.07125091552734375, 0.08951950073242188, 0.1077880859375, 0.12605667114257812, 0.14432525634765625, 0.16259384155273438, 0.1808624267578125, 0.19913101196289062, 0.21739959716796875, 0.23566818237304688, 0.253936767578125, 0.2722053527832031, 0.29047393798828125, 0.3087425231933594, 0.3270111083984375, 0.3452796936035156, 0.36354827880859375, 0.3818168640136719, 0.40008544921875, 0.4183540344238281, 0.43662261962890625, 0.4548912048339844, 0.4731597900390625, 0.4914283752441406, 0.5096969604492188, 0.5279655456542969, 0.546234130859375, 0.5645027160644531, 0.5827713012695312, 0.6010398864746094, 0.6193084716796875, 0.6375770568847656, 0.6558456420898438, 0.6741142272949219, 0.6923828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 11.0, 20.0, 38.0, 111.0, 264.0, 293.0, 157.0, 55.0, 32.0, 12.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.400297164916992, -11.046185493469238, -10.692072868347168, -10.337961196899414, -9.983848571777344, -9.62973690032959, -9.275625228881836, -8.921512603759766, -8.567399978637695, -8.213288307189941, -7.859175682067871, -7.505064010620117, -7.150951385498047, -6.796839714050293, -6.442727565765381, -6.088615417480469, -5.734503746032715, -5.380391597747803, -5.026279449462891, -4.672167778015137, -4.318055152893066, -3.9639432430267334, -3.6098313331604004, -3.2557191848754883, -2.901607036590576, -2.547494888305664, -2.193382740020752, -1.839270830154419, -1.4851586818695068, -1.1310465335845947, -0.7769346237182617, -0.4228224754333496, -0.0687103271484375, 0.28540176153182983, 0.6395138502120972, 0.9936258792877197, 1.3477380275726318, 1.701850175857544, 2.055962085723877, 2.410074234008789, 2.764186382293701, 3.1182985305786133, 3.4724106788635254, 3.8265225887298584, 4.180634498596191, 4.534747123718262, 4.888858795166016, 5.242970943450928, 5.59708309173584, 5.951195240020752, 6.305307388305664, 6.659419059753418, 7.013531684875488, 7.367643356323242, 7.721755504608154, 8.075867652893066, 8.42997932434082, 8.784090995788574, 9.138203620910645, 9.492315292358398, 9.846427917480469, 10.200539588928223, 10.554651260375977, 10.908763885498047, 11.262876510620117]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 13.0, 9.0, 14.0, 21.0, 17.0, 15.0, 32.0, 25.0, 43.0, 45.0, 50.0, 67.0, 67.0, 71.0, 74.0, 56.0, 72.0, 52.0, 49.0, 46.0, 29.0, 33.0, 28.0, 23.0, 8.0, 12.0, 7.0, 7.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021679401397705, -2.910008668899536, -2.798337936401367, -2.686666965484619, -2.57499623298645, -2.4633255004882812, -2.351654529571533, -2.2399837970733643, -2.1283130645751953, -2.0166423320770264, -1.9049714803695679, -1.7933006286621094, -1.6816298961639404, -1.5699591636657715, -1.458288311958313, -1.3466174602508545, -1.2349467277526855, -1.1232759952545166, -1.011605143547058, -0.8999343514442444, -0.7882635593414307, -0.6765927672386169, -0.5649219751358032, -0.4532511830329895, -0.3415803909301758, -0.22990959882736206, -0.11823880672454834, -0.006568014621734619, 0.1051027774810791, 0.21677356958389282, 0.32844436168670654, 0.44011515378952026, 0.551785945892334, 0.6634567379951477, 0.7751275300979614, 0.8867983222007751, 0.9984691143035889, 1.1101398468017578, 1.2218106985092163, 1.3334815502166748, 1.4451522827148438, 1.5568230152130127, 1.6684938669204712, 1.7801647186279297, 1.8918354511260986, 2.0035061836242676, 2.1151771545410156, 2.2268478870391846, 2.3385186195373535, 2.4501893520355225, 2.5618600845336914, 2.6735310554504395, 2.7852017879486084, 2.8968725204467773, 3.0085434913635254, 3.1202142238616943, 3.2318849563598633, 3.3435556888580322, 3.455226421356201, 3.566897392272949, 3.678568124771118, 3.790238857269287, 3.901909828186035, 4.013580322265625, 4.125251293182373]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 13.0, 11.0, 20.0, 29.0, 44.0, 86.0, 119.0, 238.0, 529.0, 1028.0, 2448.0, 7207.0, 27355.0, 158023.0, 701037.0, 118428.0, 21785.0, 6034.0, 2174.0, 913.0, 456.0, 243.0, 111.0, 75.0, 49.0, 34.0, 23.0, 14.0, 8.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363525390625, -0.3515777587890625, -0.339630126953125, -0.3276824951171875, -0.31573486328125, -0.3037872314453125, -0.291839599609375, -0.2798919677734375, -0.2679443359375, -0.2559967041015625, -0.244049072265625, -0.2321014404296875, -0.22015380859375, -0.2082061767578125, -0.196258544921875, -0.1843109130859375, -0.17236328125, -0.1604156494140625, -0.148468017578125, -0.1365203857421875, -0.12457275390625, -0.1126251220703125, -0.100677490234375, -0.0887298583984375, -0.0767822265625, -0.0648345947265625, -0.052886962890625, -0.0409393310546875, -0.02899169921875, -0.0170440673828125, -0.005096435546875, 0.0068511962890625, 0.018798828125, 0.0307464599609375, 0.042694091796875, 0.0546417236328125, 0.06658935546875, 0.0785369873046875, 0.090484619140625, 0.1024322509765625, 0.1143798828125, 0.1263275146484375, 0.138275146484375, 0.1502227783203125, 0.16217041015625, 0.1741180419921875, 0.186065673828125, 0.1980133056640625, 0.2099609375, 0.2219085693359375, 0.233856201171875, 0.2458038330078125, 0.25775146484375, 0.2696990966796875, 0.281646728515625, 0.2935943603515625, 0.3055419921875, 0.3174896240234375, 0.329437255859375, 0.3413848876953125, 0.35333251953125, 0.3652801513671875, 0.377227783203125, 0.3891754150390625, 0.401123046875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 4.0, 6.0, 5.0, 6.0, 13.0, 13.0, 27.0, 32.0, 32.0, 35.0, 47.0, 65.0, 46.0, 65.0, 69.0, 63.0, 81.0, 62.0, 64.0, 36.0, 49.0, 39.0, 28.0, 32.0, 19.0, 16.0, 16.0, 10.0, 11.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1988525390625, -0.1895732879638672, -0.18029403686523438, -0.17101478576660156, -0.16173553466796875, -0.15245628356933594, -0.14317703247070312, -0.1338977813720703, -0.1246185302734375, -0.11533927917480469, -0.10606002807617188, -0.09678077697753906, -0.08750152587890625, -0.07822227478027344, -0.06894302368164062, -0.05966377258300781, -0.050384521484375, -0.04110527038574219, -0.031826019287109375, -0.022546768188476562, -0.01326751708984375, -0.0039882659912109375, 0.005290985107421875, 0.014570236206054688, 0.0238494873046875, 0.03312873840332031, 0.042407989501953125, 0.05168724060058594, 0.06096649169921875, 0.07024574279785156, 0.07952499389648438, 0.08880424499511719, 0.09808349609375, 0.10736274719238281, 0.11664199829101562, 0.12592124938964844, 0.13520050048828125, 0.14447975158691406, 0.15375900268554688, 0.1630382537841797, 0.1723175048828125, 0.1815967559814453, 0.19087600708007812, 0.20015525817871094, 0.20943450927734375, 0.21871376037597656, 0.22799301147460938, 0.2372722625732422, 0.246551513671875, 0.2558307647705078, 0.2651100158691406, 0.27438926696777344, 0.28366851806640625, 0.29294776916503906, 0.3022270202636719, 0.3115062713623047, 0.3207855224609375, 0.3300647735595703, 0.3393440246582031, 0.34862327575683594, 0.35790252685546875, 0.36718177795410156, 0.3764610290527344, 0.3857402801513672, 0.39501953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 6.0, 8.0, 12.0, 19.0, 15.0, 28.0, 69.0, 161.0, 323.0, 919.0, 4320.0, 56664.0, 957795.0, 24241.0, 2661.0, 733.0, 284.0, 116.0, 80.0, 33.0, 28.0, 12.0, 13.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6630859375, -0.63970947265625, -0.6163330078125, -0.59295654296875, -0.569580078125, -0.54620361328125, -0.5228271484375, -0.49945068359375, -0.47607421875, -0.45269775390625, -0.4293212890625, -0.40594482421875, -0.382568359375, -0.35919189453125, -0.3358154296875, -0.31243896484375, -0.2890625, -0.26568603515625, -0.2423095703125, -0.21893310546875, -0.195556640625, -0.17218017578125, -0.1488037109375, -0.12542724609375, -0.10205078125, -0.07867431640625, -0.0552978515625, -0.03192138671875, -0.008544921875, 0.01483154296875, 0.0382080078125, 0.06158447265625, 0.0849609375, 0.10833740234375, 0.1317138671875, 0.15509033203125, 0.178466796875, 0.20184326171875, 0.2252197265625, 0.24859619140625, 0.27197265625, 0.29534912109375, 0.3187255859375, 0.34210205078125, 0.365478515625, 0.38885498046875, 0.4122314453125, 0.43560791015625, 0.458984375, 0.48236083984375, 0.5057373046875, 0.52911376953125, 0.552490234375, 0.57586669921875, 0.5992431640625, 0.62261962890625, 0.64599609375, 0.66937255859375, 0.6927490234375, 0.71612548828125, 0.739501953125, 0.76287841796875, 0.7862548828125, 0.80963134765625, 0.8330078125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 5.0, 2.0, 4.0, 10.0, 19.0, 11.0, 13.0, 9.0, 28.0, 23.0, 35.0, 40.0, 42.0, 62.0, 60.0, 72.0, 74.0, 80.0, 56.0, 64.0, 46.0, 29.0, 34.0, 25.0, 19.0, 17.0, 16.0, 21.0, 19.0, 3.0, 12.0, 10.0, 4.0, 5.0, 8.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9228515625, -0.893707275390625, -0.86456298828125, -0.835418701171875, -0.8062744140625, -0.777130126953125, -0.74798583984375, -0.718841552734375, -0.689697265625, -0.660552978515625, -0.63140869140625, -0.602264404296875, -0.5731201171875, -0.543975830078125, -0.51483154296875, -0.485687255859375, -0.45654296875, -0.427398681640625, -0.39825439453125, -0.369110107421875, -0.3399658203125, -0.310821533203125, -0.28167724609375, -0.252532958984375, -0.223388671875, -0.194244384765625, -0.16510009765625, -0.135955810546875, -0.1068115234375, -0.077667236328125, -0.04852294921875, -0.019378662109375, 0.009765625, 0.038909912109375, 0.06805419921875, 0.097198486328125, 0.1263427734375, 0.155487060546875, 0.18463134765625, 0.213775634765625, 0.242919921875, 0.272064208984375, 0.30120849609375, 0.330352783203125, 0.3594970703125, 0.388641357421875, 0.41778564453125, 0.446929931640625, 0.47607421875, 0.505218505859375, 0.53436279296875, 0.563507080078125, 0.5926513671875, 0.621795654296875, 0.65093994140625, 0.680084228515625, 0.709228515625, 0.738372802734375, 0.76751708984375, 0.796661376953125, 0.8258056640625, 0.854949951171875, 0.88409423828125, 0.913238525390625, 0.9423828125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 15.0, 39.0, 57.0, 87.0, 216.0, 420.0, 1015.0, 3544.0, 18101.0, 402606.0, 598483.0, 18597.0, 3491.0, 1013.0, 391.0, 222.0, 97.0, 61.0, 31.0, 17.0, 12.0, 8.0, 6.0, 2.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11602783203125, -0.11202716827392578, -0.10802650451660156, -0.10402584075927734, -0.10002517700195312, -0.0960245132446289, -0.09202384948730469, -0.08802318572998047, -0.08402252197265625, -0.08002185821533203, -0.07602119445800781, -0.0720205307006836, -0.06801986694335938, -0.06401920318603516, -0.06001853942871094, -0.05601787567138672, -0.0520172119140625, -0.04801654815673828, -0.04401588439941406, -0.040015220642089844, -0.036014556884765625, -0.032013893127441406, -0.028013229370117188, -0.02401256561279297, -0.02001190185546875, -0.01601123809814453, -0.012010574340820312, -0.008009910583496094, -0.004009246826171875, -8.58306884765625e-06, 0.0039920806884765625, 0.007992744445800781, 0.011993408203125, 0.01599407196044922, 0.019994735717773438, 0.023995399475097656, 0.027996063232421875, 0.031996726989746094, 0.03599739074707031, 0.03999805450439453, 0.04399871826171875, 0.04799938201904297, 0.05200004577636719, 0.056000709533691406, 0.060001373291015625, 0.06400203704833984, 0.06800270080566406, 0.07200336456298828, 0.0760040283203125, 0.08000469207763672, 0.08400535583496094, 0.08800601959228516, 0.09200668334960938, 0.0960073471069336, 0.10000801086425781, 0.10400867462158203, 0.10800933837890625, 0.11201000213623047, 0.11601066589355469, 0.1200113296508789, 0.12401199340820312, 0.12801265716552734, 0.13201332092285156, 0.13601398468017578, 0.1400146484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 4.0, 3.0, 5.0, 7.0, 10.0, 8.0, 5.0, 10.0, 8.0, 17.0, 19.0, 25.0, 40.0, 47.0, 74.0, 81.0, 105.0, 146.0, 91.0, 69.0, 66.0, 37.0, 25.0, 22.0, 12.0, 9.0, 11.0, 6.0, 8.0, 5.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.547834396362305e-05, -4.409998655319214e-05, -4.272162914276123e-05, -4.134327173233032e-05, -3.9964914321899414e-05, -3.8586556911468506e-05, -3.72081995010376e-05, -3.582984209060669e-05, -3.445148468017578e-05, -3.307312726974487e-05, -3.1694769859313965e-05, -3.0316412448883057e-05, -2.893805503845215e-05, -2.755969762802124e-05, -2.6181340217590332e-05, -2.4802982807159424e-05, -2.3424625396728516e-05, -2.2046267986297607e-05, -2.06679105758667e-05, -1.928955316543579e-05, -1.7911195755004883e-05, -1.6532838344573975e-05, -1.5154480934143066e-05, -1.3776123523712158e-05, -1.239776611328125e-05, -1.1019408702850342e-05, -9.641051292419434e-06, -8.262693881988525e-06, -6.884336471557617e-06, -5.505979061126709e-06, -4.127621650695801e-06, -2.7492642402648926e-06, -1.3709068298339844e-06, 7.450580596923828e-09, 1.385807991027832e-06, 2.7641654014587402e-06, 4.1425228118896484e-06, 5.520880222320557e-06, 6.899237632751465e-06, 8.277595043182373e-06, 9.655952453613281e-06, 1.103430986404419e-05, 1.2412667274475098e-05, 1.3791024684906006e-05, 1.5169382095336914e-05, 1.6547739505767822e-05, 1.792609691619873e-05, 1.930445432662964e-05, 2.0682811737060547e-05, 2.2061169147491455e-05, 2.3439526557922363e-05, 2.481788396835327e-05, 2.619624137878418e-05, 2.7574598789215088e-05, 2.8952956199645996e-05, 3.0331313610076904e-05, 3.170967102050781e-05, 3.308802843093872e-05, 3.446638584136963e-05, 3.584474325180054e-05, 3.7223100662231445e-05, 3.8601458072662354e-05, 3.997981548309326e-05, 4.135817289352417e-05, 4.273653030395508e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 11.0, 9.0, 19.0, 24.0, 40.0, 64.0, 119.0, 216.0, 509.0, 1246.0, 3718.0, 14754.0, 99150.0, 868042.0, 47298.0, 9065.0, 2571.0, 875.0, 384.0, 178.0, 101.0, 57.0, 25.0, 26.0, 12.0, 13.0, 11.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.146728515625, -0.14279842376708984, -0.1388683319091797, -0.13493824005126953, -0.13100814819335938, -0.12707805633544922, -0.12314796447753906, -0.1192178726196289, -0.11528778076171875, -0.1113576889038086, -0.10742759704589844, -0.10349750518798828, -0.09956741333007812, -0.09563732147216797, -0.09170722961425781, -0.08777713775634766, -0.0838470458984375, -0.07991695404052734, -0.07598686218261719, -0.07205677032470703, -0.06812667846679688, -0.06419658660888672, -0.06026649475097656, -0.056336402893066406, -0.05240631103515625, -0.048476219177246094, -0.04454612731933594, -0.04061603546142578, -0.036685943603515625, -0.03275585174560547, -0.028825759887695312, -0.024895668029785156, -0.020965576171875, -0.017035484313964844, -0.013105392456054688, -0.009175300598144531, -0.005245208740234375, -0.0013151168823242188, 0.0026149749755859375, 0.006545066833496094, 0.01047515869140625, 0.014405250549316406, 0.018335342407226562, 0.02226543426513672, 0.026195526123046875, 0.03012561798095703, 0.03405570983886719, 0.037985801696777344, 0.0419158935546875, 0.045845985412597656, 0.04977607727050781, 0.05370616912841797, 0.057636260986328125, 0.06156635284423828, 0.06549644470214844, 0.0694265365600586, 0.07335662841796875, 0.0772867202758789, 0.08121681213378906, 0.08514690399169922, 0.08907699584960938, 0.09300708770751953, 0.09693717956542969, 0.10086727142333984, 0.10479736328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 10.0, 3.0, 10.0, 6.0, 18.0, 17.0, 17.0, 25.0, 44.0, 34.0, 67.0, 75.0, 83.0, 108.0, 103.0, 79.0, 63.0, 59.0, 38.0, 35.0, 24.0, 18.0, 15.0, 12.0, 11.0, 9.0, 3.0, 2.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07501220703125, -0.07200431823730469, -0.06899642944335938, -0.06598854064941406, -0.06298065185546875, -0.05997276306152344, -0.056964874267578125, -0.05395698547363281, -0.0509490966796875, -0.04794120788574219, -0.044933319091796875, -0.04192543029785156, -0.03891754150390625, -0.03590965270996094, -0.032901763916015625, -0.029893875122070312, -0.026885986328125, -0.023878097534179688, -0.020870208740234375, -0.017862319946289062, -0.01485443115234375, -0.011846542358398438, -0.008838653564453125, -0.0058307647705078125, -0.0028228759765625, 0.0001850128173828125, 0.003192901611328125, 0.0062007904052734375, 0.00920867919921875, 0.012216567993164062, 0.015224456787109375, 0.018232345581054688, 0.021240234375, 0.024248123168945312, 0.027256011962890625, 0.030263900756835938, 0.03327178955078125, 0.03627967834472656, 0.039287567138671875, 0.04229545593261719, 0.0453033447265625, 0.04831123352050781, 0.051319122314453125, 0.05432701110839844, 0.05733489990234375, 0.06034278869628906, 0.06335067749023438, 0.06635856628417969, 0.069366455078125, 0.07237434387207031, 0.07538223266601562, 0.07839012145996094, 0.08139801025390625, 0.08440589904785156, 0.08741378784179688, 0.09042167663574219, 0.0934295654296875, 0.09643745422363281, 0.09944534301757812, 0.10245323181152344, 0.10546112060546875, 0.10846900939941406, 0.11147689819335938, 0.11448478698730469, 0.11749267578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 1.0, 4.0, 5.0, 17.0, 26.0, 48.0, 156.0, 447.0, 141.0, 68.0, 38.0, 23.0, 14.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1545372009277344, -2.014742612838745, -1.8749477863311768, -1.7351531982421875, -1.5953584909439087, -1.4555637836456299, -1.3157691955566406, -1.1759744882583618, -1.036179780960083, -0.8963850736618042, -0.7565904259681702, -0.6167957782745361, -0.4770010709762573, -0.3372063636779785, -0.19741171598434448, -0.05761706829071045, 0.08217763900756836, 0.22197231650352478, 0.3617669939994812, 0.5015616416931152, 0.641356348991394, 0.7811510562896729, 0.9209457039833069, 1.060740351676941, 1.2005350589752197, 1.3403297662734985, 1.4801244735717773, 1.6199190616607666, 1.7597137689590454, 1.8995084762573242, 2.0393030643463135, 2.1790976524353027, 2.3188929557800293, 2.4586875438690186, 2.598482370376587, 2.738276958465576, 2.8780717849731445, 3.017866373062134, 3.157660961151123, 3.2974557876586914, 3.4372503757476807, 3.57704496383667, 3.7168397903442383, 3.8566343784332275, 3.996428966522217, 4.136223793029785, 4.2760186195373535, 4.415812969207764, 4.555607795715332, 4.6954026222229, 4.8351969718933105, 4.974991798400879, 5.114786624908447, 5.254581451416016, 5.394375801086426, 5.534170627593994, 5.6739654541015625, 5.813760280609131, 5.953554630279541, 6.093349456787109, 6.233144283294678, 6.372939109802246, 6.512733459472656, 6.652528285980225, 6.792322635650635]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 6.0, 5.0, 3.0, 4.0, 9.0, 10.0, 5.0, 8.0, 17.0, 15.0, 27.0, 14.0, 30.0, 39.0, 31.0, 71.0, 109.0, 161.0, 107.0, 74.0, 41.0, 22.0, 27.0, 15.0, 17.0, 21.0, 14.0, 15.0, 13.0, 15.0, 8.0, 8.0, 9.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.4799249172210693, -2.4034242630004883, -2.3269236087799072, -2.250422954559326, -2.173922300338745, -2.097421646118164, -2.020920991897583, -1.944420337677002, -1.867919683456421, -1.7914190292358398, -1.7149183750152588, -1.6384177207946777, -1.5619170665740967, -1.4854164123535156, -1.4089157581329346, -1.3324151039123535, -1.2559144496917725, -1.1794137954711914, -1.1029131412506104, -1.0264124870300293, -0.9499118328094482, -0.8734111785888672, -0.7969105243682861, -0.7204098701477051, -0.643909215927124, -0.567408561706543, -0.4909079074859619, -0.41440725326538086, -0.3379065990447998, -0.26140594482421875, -0.1849052906036377, -0.10840463638305664, -0.031903743743896484, 0.04459691047668457, 0.12109756469726562, 0.19759821891784668, 0.27409887313842773, 0.3505995273590088, 0.42710018157958984, 0.5036008358001709, 0.580101490020752, 0.656602144241333, 0.7331027984619141, 0.8096034526824951, 0.8861041069030762, 0.9626047611236572, 1.0391054153442383, 1.1156060695648193, 1.1921067237854004, 1.2686073780059814, 1.3451080322265625, 1.4216086864471436, 1.4981093406677246, 1.5746099948883057, 1.6511106491088867, 1.7276113033294678, 1.8041119575500488, 1.8806126117706299, 1.957113265991211, 2.033613920211792, 2.110114574432373, 2.186615228652954, 2.263115882873535, 2.339616537094116, 2.4161171913146973]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 8.0, 15.0, 22.0, 24.0, 30.0, 42.0, 58.0, 50.0, 103.0, 274.0, 90.0, 78.0, 52.0, 40.0, 27.0, 23.0, 21.0, 21.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.5947265625, -0.5821952819824219, -0.5696640014648438, -0.5571327209472656, -0.5446014404296875, -0.5320701599121094, -0.5195388793945312, -0.5070075988769531, -0.494476318359375, -0.4819450378417969, -0.46941375732421875, -0.4568824768066406, -0.4443511962890625, -0.4318199157714844, -0.41928863525390625, -0.4067573547363281, -0.39422607421875, -0.3816947937011719, -0.36916351318359375, -0.3566322326660156, -0.3441009521484375, -0.3315696716308594, -0.31903839111328125, -0.3065071105957031, -0.293975830078125, -0.2814445495605469, -0.26891326904296875, -0.2563819885253906, -0.2438507080078125, -0.23131942749023438, -0.21878814697265625, -0.20625686645507812, -0.1937255859375, -0.18119430541992188, -0.16866302490234375, -0.15613174438476562, -0.1436004638671875, -0.13106918334960938, -0.11853790283203125, -0.10600662231445312, -0.093475341796875, -0.08094406127929688, -0.06841278076171875, -0.055881500244140625, -0.0433502197265625, -0.030818939208984375, -0.01828765869140625, -0.005756378173828125, 0.00677490234375, 0.019306182861328125, 0.03183746337890625, 0.044368743896484375, 0.0569000244140625, 0.06943130493164062, 0.08196258544921875, 0.09449386596679688, 0.107025146484375, 0.11955642700195312, 0.13208770751953125, 0.14461898803710938, 0.1571502685546875, 0.16968154907226562, 0.18221282958984375, 0.19474411010742188, 0.207275390625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 1.0, 3.0, 10.0, 4.0, 17.0, 17.0, 14.0, 23.0, 31.0, 35.0, 51.0, 72.0, 175.0, 363.0, 1301.0, 7462.0, 8329077.0, 45295.0, 3318.0, 723.0, 247.0, 90.0, 74.0, 41.0, 39.0, 18.0, 20.0, 14.0, 8.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0], "bins": [-2.142411947250366, -2.072843074798584, -2.003274440765381, -1.9337055683135986, -1.864136815071106, -1.7945680618286133, -1.724999189376831, -1.6554304361343384, -1.5858616828918457, -1.516292929649353, -1.4467240571975708, -1.3771553039550781, -1.3075865507125854, -1.2380177974700928, -1.1684489250183105, -1.0988801717758179, -1.0293112993240356, -0.9597424864768982, -0.8901737332344055, -0.8206049203872681, -0.7510361671447754, -0.6814673542976379, -0.6118985414505005, -0.5423297882080078, -0.47276097536087036, -0.4031921923160553, -0.33362340927124023, -0.2640545964241028, -0.19448581337928772, -0.12491703033447266, -0.055348217487335205, 0.014220565557479858, 0.08378934860229492, 0.15335813164710999, 0.22292692959308624, 0.2924957275390625, 0.36206451058387756, 0.4316332936286926, 0.5012021064758301, 0.5707708597183228, 0.6403396725654602, 0.7099084854125977, 0.7794772386550903, 0.8490460515022278, 0.9186148643493652, 0.9881836175918579, 1.0577523708343506, 1.1273212432861328, 1.1968899965286255, 1.2664587497711182, 1.3360276222229004, 1.405596375465393, 1.4751651287078857, 1.544734001159668, 1.6143027544021606, 1.6838715076446533, 1.7534403800964355, 1.8230091333389282, 1.8925780057907104, 1.9621467590332031, 2.0317156314849854, 2.1012842655181885, 2.1708531379699707, 2.240422010421753, 2.309990644454956]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8204708099365234, -2.755647897720337, -2.6908252239227295, -2.626002311706543, -2.5611793994903564, -2.496356725692749, -2.4315338134765625, -2.366710901260376, -2.3018882274627686, -2.237065315246582, -2.1722426414489746, -2.107419729232788, -2.0425968170166016, -1.9777741432189941, -1.9129512310028076, -1.8481284379959106, -1.7833055257797241, -1.7184827327728271, -1.6536598205566406, -1.5888370275497437, -1.5240142345428467, -1.4591913223266602, -1.3943685293197632, -1.3295457363128662, -1.2647228240966797, -1.1999000310897827, -1.1350771188735962, -1.0702543258666992, -1.0054315328598022, -0.9406086802482605, -0.8757858276367188, -0.8109630346298218, -0.7461402416229248, -0.6813173890113831, -0.6164945960044861, -0.5516717433929443, -0.486848920583725, -0.4220260977745056, -0.35720324516296387, -0.2923804223537445, -0.22755759954452515, -0.1627347767353058, -0.09791193902492523, -0.03308910131454468, 0.03173372149467468, 0.09655654430389404, 0.1613793969154358, 0.22620221972465515, 0.2910250425338745, 0.35584786534309387, 0.42067068815231323, 0.485493540763855, 0.550316333770752, 0.6151391863822937, 0.6799620389938354, 0.7447848320007324, 0.8096076846122742, 0.8744305372238159, 0.9392533302307129, 1.0040762424468994, 1.0688990354537964, 1.1337218284606934, 1.1985447406768799, 1.2633675336837769, 1.3281903266906738]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 2.0, 3.0, 3.0, 3.0, 14.0, 7.0, 9.0, 8.0, 11.0, 11.0, 11.0, 19.0, 19.0, 27.0, 22.0, 34.0, 29.0, 47.0, 43.0, 48.0, 49.0, 33.0, 41.0, 46.0, 46.0, 41.0, 51.0, 43.0, 43.0, 44.0, 31.0, 25.0, 27.0, 26.0, 12.0, 5.0, 14.0, 16.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.17333984375, -0.16819381713867188, -0.16304779052734375, -0.15790176391601562, -0.1527557373046875, -0.14760971069335938, -0.14246368408203125, -0.13731765747070312, -0.132171630859375, -0.12702560424804688, -0.12187957763671875, -0.11673355102539062, -0.1115875244140625, -0.10644149780273438, -0.10129547119140625, -0.09614944458007812, -0.09100341796875, -0.08585739135742188, -0.08071136474609375, -0.07556533813476562, -0.0704193115234375, -0.06527328491210938, -0.06012725830078125, -0.054981231689453125, -0.049835205078125, -0.044689178466796875, -0.03954315185546875, -0.034397125244140625, -0.0292510986328125, -0.024105072021484375, -0.01895904541015625, -0.013813018798828125, -0.0086669921875, -0.003520965576171875, 0.00162506103515625, 0.006771087646484375, 0.0119171142578125, 0.017063140869140625, 0.02220916748046875, 0.027355194091796875, 0.032501220703125, 0.037647247314453125, 0.04279327392578125, 0.047939300537109375, 0.0530853271484375, 0.058231353759765625, 0.06337738037109375, 0.06852340698242188, 0.07366943359375, 0.07881546020507812, 0.08396148681640625, 0.08910751342773438, 0.0942535400390625, 0.09939956665039062, 0.10454559326171875, 0.10969161987304688, 0.114837646484375, 0.11998367309570312, 0.12512969970703125, 0.13027572631835938, 0.1354217529296875, 0.14056777954101562, 0.14571380615234375, 0.15085983276367188, 0.156005859375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 23.0, 23.0, 27.0, 40.0, 59.0, 133.0, 182.0, 322.0, 604.0, 1205.0, 2531.0, 6373.0, 18427.0, 59167.0, 177892.0, 171597.0, 56310.0, 17681.0, 6335.0, 2636.0, 1189.0, 560.0, 324.0, 211.0, 126.0, 87.0, 57.0, 33.0, 27.0, 17.0, 16.0, 13.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0966796875, -1.0509490966796875, -1.005218505859375, -0.9594879150390625, -0.91375732421875, -0.8680267333984375, -0.822296142578125, -0.7765655517578125, -0.7308349609375, -0.6851043701171875, -0.639373779296875, -0.5936431884765625, -0.54791259765625, -0.5021820068359375, -0.456451416015625, -0.4107208251953125, -0.364990234375, -0.3192596435546875, -0.273529052734375, -0.2277984619140625, -0.18206787109375, -0.1363372802734375, -0.090606689453125, -0.0448760986328125, 0.0008544921875, 0.0465850830078125, 0.092315673828125, 0.1380462646484375, 0.18377685546875, 0.2295074462890625, 0.275238037109375, 0.3209686279296875, 0.36669921875, 0.4124298095703125, 0.458160400390625, 0.5038909912109375, 0.54962158203125, 0.5953521728515625, 0.641082763671875, 0.6868133544921875, 0.7325439453125, 0.7782745361328125, 0.824005126953125, 0.8697357177734375, 0.91546630859375, 0.9611968994140625, 1.006927490234375, 1.0526580810546875, 1.098388671875, 1.1441192626953125, 1.189849853515625, 1.2355804443359375, 1.28131103515625, 1.3270416259765625, 1.372772216796875, 1.4185028076171875, 1.4642333984375, 1.5099639892578125, 1.555694580078125, 1.6014251708984375, 1.64715576171875, 1.6928863525390625, 1.738616943359375, 1.7843475341796875, 1.830078125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 3.0, 7.0, 15.0, 24.0, 28.0, 54.0, 62.0, 70.0, 81.0, 88.0, 122.0, 90.0, 84.0, 58.0, 42.0, 54.0, 26.0, 34.0, 11.0, 10.0, 11.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.356689453125, -0.3457183837890625, -0.334747314453125, -0.3237762451171875, -0.31280517578125, -0.3018341064453125, -0.290863037109375, -0.2798919677734375, -0.2689208984375, -0.2579498291015625, -0.246978759765625, -0.2360076904296875, -0.22503662109375, -0.2140655517578125, -0.203094482421875, -0.1921234130859375, -0.18115234375, -0.1701812744140625, -0.159210205078125, -0.1482391357421875, -0.13726806640625, -0.1262969970703125, -0.115325927734375, -0.1043548583984375, -0.0933837890625, -0.0824127197265625, -0.071441650390625, -0.0604705810546875, -0.04949951171875, -0.0385284423828125, -0.027557373046875, -0.0165863037109375, -0.005615234375, 0.0053558349609375, 0.016326904296875, 0.0272979736328125, 0.03826904296875, 0.0492401123046875, 0.060211181640625, 0.0711822509765625, 0.0821533203125, 0.0931243896484375, 0.104095458984375, 0.1150665283203125, 0.12603759765625, 0.1370086669921875, 0.147979736328125, 0.1589508056640625, 0.169921875, 0.1808929443359375, 0.191864013671875, 0.2028350830078125, 0.21380615234375, 0.2247772216796875, 0.235748291015625, 0.2467193603515625, 0.2576904296875, 0.2686614990234375, 0.279632568359375, 0.2906036376953125, 0.30157470703125, 0.3125457763671875, 0.323516845703125, 0.3344879150390625, 0.345458984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 12.0, 11.0, 29.0, 52.0, 90.0, 96.0, 82.0, 38.0, 23.0, 6.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4527597427368164, -2.388012170791626, -2.3232648372650146, -2.258517265319824, -2.193769693374634, -2.1290221214294434, -2.064274787902832, -1.9995272159576416, -1.9347796440124512, -1.8700321912765503, -1.8052846193313599, -1.740537166595459, -1.6757895946502686, -1.6110421419143677, -1.5462946891784668, -1.4815471172332764, -1.4167996644973755, -1.3520522117614746, -1.2873046398162842, -1.2225571870803833, -1.1578096151351929, -1.093062162399292, -1.0283145904541016, -0.9635671377182007, -0.898819625377655, -0.8340721130371094, -0.7693246006965637, -0.7045770883560181, -0.6398296356201172, -0.5750820636749268, -0.5103346109390259, -0.4455870985984802, -0.380839467048645, -0.31609195470809937, -0.2513444423675537, -0.18659695982933044, -0.12184944748878479, -0.057101935148239136, 0.007645547389984131, 0.07239305973052979, 0.13714057207107544, 0.2018880844116211, 0.26663559675216675, 0.33138307929039, 0.39613059163093567, 0.4608781039714813, 0.5256255865097046, 0.5903730988502502, 0.6551206111907959, 0.7198681235313416, 0.7846156358718872, 0.8493630886077881, 0.9141106605529785, 0.9788581132888794, 1.0436055660247803, 1.1083531379699707, 1.1731007099151611, 1.237848162651062, 1.3025957345962524, 1.3673431873321533, 1.4320907592773438, 1.4968382120132446, 1.5615856647491455, 1.626333236694336, 1.6910806894302368]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 8.0, 8.0, 13.0, 12.0, 21.0, 34.0, 56.0, 60.0, 66.0, 63.0, 47.0, 20.0, 15.0, 7.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9985530376434326, -1.9410454034805298, -1.8835376501083374, -1.8260300159454346, -1.7685223817825317, -1.7110146284103394, -1.6535069942474365, -1.5959992408752441, -1.5384916067123413, -1.4809839725494385, -1.423476219177246, -1.3659685850143433, -1.3084609508514404, -1.250953197479248, -1.1934455633163452, -1.1359379291534424, -1.07843017578125, -1.0209225416183472, -0.9634148478507996, -0.905907154083252, -0.8483994603157043, -0.7908917665481567, -0.7333841323852539, -0.6758764386177063, -0.6183688640594482, -0.5608611702919006, -0.5033535361289978, -0.4458458423614502, -0.3883381485939026, -0.33083048462867737, -0.27332282066345215, -0.21581512689590454, -0.15830743312835693, -0.10079975426197052, -0.0432920828461647, 0.014215588569641113, 0.07172326743602753, 0.12923094630241394, 0.18673861026763916, 0.24424630403518677, 0.301753968000412, 0.3592616319656372, 0.4167693257331848, 0.47427698969841003, 0.5317846536636353, 0.5892923474311829, 0.6468000411987305, 0.7043076753616333, 0.7618153691291809, 0.8193230628967285, 0.8768306970596313, 0.934338390827179, 0.9918460845947266, 1.0493537187576294, 1.1068613529205322, 1.1643691062927246, 1.2218767404556274, 1.2793843746185303, 1.3368921279907227, 1.3943997621536255, 1.4519073963165283, 1.5094151496887207, 1.5669227838516235, 1.6244304180145264, 1.6819381713867188]}, "eval/loss": 0.35239124298095703, "eval/wer": 0.10420468068226894, "eval/runtime": 326.5742, "eval/samples_per_second": 8.09, "eval/steps_per_second": 0.508, "train/train_runtime": 25891.0003, "train/train_samples_per_second": 11.022, "train/train_steps_per_second": 0.043, "train/total_flos": 0.0, "train/train_loss": 2.1241667401347613} \ No newline at end of file