diff --git "a/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" "b/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" --- "a/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" +++ "b/wandb/run-20220505_173748-b097rk18/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 2.2063, "train/learning_rate": 5.972477064220184e-06, "train/epoch": 2.47, "train/global_step": 4000, "_runtime": 57505, "_timestamp": 1651829773, "_step": 4007, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 13.0, 44.0, 74.0, 144.0, 206.0, 198.0, 163.0, 108.0, 37.0, 18.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.9302027225494385, -1.8950679302215576, -1.8599330186843872, -1.8247982263565063, -1.789663314819336, -1.754528522491455, -1.7193936109542847, -1.6842588186264038, -1.6491239070892334, -1.6139891147613525, -1.5788542032241821, -1.5437194108963013, -1.5085844993591309, -1.47344970703125, -1.4383147954940796, -1.4031800031661987, -1.3680452108383179, -1.332910418510437, -1.2977755069732666, -1.2626407146453857, -1.2275058031082153, -1.1923710107803345, -1.157236099243164, -1.1221013069152832, -1.0869665145874023, -1.0518317222595215, -1.016696810722351, -0.9815619587898254, -0.9464271068572998, -0.911292314529419, -0.8761574625968933, -0.8410226106643677, -0.8058875799179077, -0.7707527279853821, -0.7356178760528564, -0.7004830241203308, -0.6653481721878052, -0.6302133798599243, -0.5950785279273987, -0.559943675994873, -0.5248088240623474, -0.4896739721298218, -0.45453912019729614, -0.4194042980670929, -0.38426944613456726, -0.3491345942020416, -0.3139997720718384, -0.27886492013931274, -0.2437300682067871, -0.20859521627426147, -0.17346037924289703, -0.1383255422115326, -0.10319069027900696, -0.06805583834648132, -0.03292100131511688, 0.0022138357162475586, 0.03734868764877319, 0.07248353213071823, 0.10761837661266327, 0.1427532136440277, 0.17788806557655334, 0.21302291750907898, 0.24815775454044342, 0.28329259157180786, 0.3184274435043335]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 11.0, 8.0, 10.0, 6.0, 12.0, 13.0, 10.0, 12.0, 18.0, 28.0, 16.0, 21.0, 27.0, 30.0, 28.0, 39.0, 27.0, 35.0, 45.0, 38.0, 46.0, 30.0, 29.0, 30.0, 34.0, 42.0, 37.0, 38.0, 29.0, 35.0, 31.0, 30.0, 21.0, 18.0, 26.0, 19.0, 14.0, 11.0, 5.0, 7.0, 5.0, 4.0, 6.0, 4.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.3742057681083679, -0.3616308569908142, -0.3490559458732605, -0.3364810347557068, -0.3239060938358307, -0.311331182718277, -0.29875627160072327, -0.28618136048316956, -0.27360644936561584, -0.26103153824806213, -0.24845661222934723, -0.23588170111179352, -0.2233067899942398, -0.2107318639755249, -0.1981569528579712, -0.18558204174041748, -0.17300711572170258, -0.16043220460414886, -0.14785727858543396, -0.13528236746788025, -0.12270745635032654, -0.11013253778219223, -0.09755761921405792, -0.08498270809650421, -0.0724077895283699, -0.059832874685525894, -0.047257959842681885, -0.03468304127454758, -0.022108126431703568, -0.009533211588859558, 0.0030417069792747498, 0.01561661809682846, 0.02819153666496277, 0.04076645150780678, 0.05334136635065079, 0.0659162849187851, 0.0784911960363388, 0.09106611460447311, 0.10364103317260742, 0.11621594429016113, 0.12879085540771484, 0.14136576652526855, 0.15394069254398346, 0.16651560366153717, 0.17909051477909088, 0.1916654407978058, 0.2042403519153595, 0.2168152630329132, 0.2293901890516281, 0.24196510016918182, 0.25454002618789673, 0.26711493730545044, 0.27968984842300415, 0.29226475954055786, 0.3048396706581116, 0.3174145817756653, 0.3299895226955414, 0.3425644338130951, 0.3551393449306488, 0.3677142858505249, 0.3802891969680786, 0.3928641080856323, 0.40543901920318604, 0.41801393032073975, 0.43058884143829346]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 11.0, 17.0, 15.0, 20.0, 25.0, 43.0, 52.0, 79.0, 150.0, 172.0, 317.0, 473.0, 802.0, 1399.0, 2615.0, 5560.0, 13004.0, 32638.0, 87229.0, 214239.0, 469599.0, 866516.0, 1091776.0, 749619.0, 385070.0, 165821.0, 63622.0, 23994.0, 9838.0, 4364.0, 2165.0, 1172.0, 678.0, 400.0, 300.0, 166.0, 103.0, 79.0, 43.0, 35.0, 25.0, 13.0, 7.0, 9.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.6259765625, -0.6077499389648438, -0.5895233154296875, -0.5712966918945312, -0.553070068359375, -0.5348434448242188, -0.5166168212890625, -0.49839019775390625, -0.48016357421875, -0.46193695068359375, -0.4437103271484375, -0.42548370361328125, -0.407257080078125, -0.38903045654296875, -0.3708038330078125, -0.35257720947265625, -0.3343505859375, -0.31612396240234375, -0.2978973388671875, -0.27967071533203125, -0.261444091796875, -0.24321746826171875, -0.2249908447265625, -0.20676422119140625, -0.18853759765625, -0.17031097412109375, -0.1520843505859375, -0.13385772705078125, -0.115631103515625, -0.09740447998046875, -0.0791778564453125, -0.06095123291015625, -0.042724609375, -0.02449798583984375, -0.0062713623046875, 0.01195526123046875, 0.030181884765625, 0.04840850830078125, 0.0666351318359375, 0.08486175537109375, 0.10308837890625, 0.12131500244140625, 0.1395416259765625, 0.15776824951171875, 0.175994873046875, 0.19422149658203125, 0.2124481201171875, 0.23067474365234375, 0.2489013671875, 0.26712799072265625, 0.2853546142578125, 0.30358123779296875, 0.321807861328125, 0.34003448486328125, 0.3582611083984375, 0.37648773193359375, 0.39471435546875, 0.41294097900390625, 0.4311676025390625, 0.44939422607421875, 0.467620849609375, 0.48584747314453125, 0.5040740966796875, 0.5223007202148438, 0.54052734375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 2.0, 4.0, 6.0, 7.0, 10.0, 14.0, 13.0, 18.0, 16.0, 16.0, 15.0, 21.0, 23.0, 25.0, 26.0, 37.0, 33.0, 39.0, 32.0, 30.0, 36.0, 32.0, 39.0, 36.0, 20.0, 42.0, 49.0, 31.0, 32.0, 33.0, 32.0, 32.0, 22.0, 34.0, 21.0, 19.0, 12.0, 23.0, 8.0, 8.0, 7.0, 11.0, 8.0, 8.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.63671875, -0.6169815063476562, -0.5972442626953125, -0.5775070190429688, -0.557769775390625, -0.5380325317382812, -0.5182952880859375, -0.49855804443359375, -0.47882080078125, -0.45908355712890625, -0.4393463134765625, -0.41960906982421875, -0.399871826171875, -0.38013458251953125, -0.3603973388671875, -0.34066009521484375, -0.3209228515625, -0.30118560791015625, -0.2814483642578125, -0.26171112060546875, -0.241973876953125, -0.22223663330078125, -0.2024993896484375, -0.18276214599609375, -0.16302490234375, -0.14328765869140625, -0.1235504150390625, -0.10381317138671875, -0.084075927734375, -0.06433868408203125, -0.0446014404296875, -0.02486419677734375, -0.005126953125, 0.01461029052734375, 0.0343475341796875, 0.05408477783203125, 0.073822021484375, 0.09355926513671875, 0.1132965087890625, 0.13303375244140625, 0.15277099609375, 0.17250823974609375, 0.1922454833984375, 0.21198272705078125, 0.231719970703125, 0.25145721435546875, 0.2711944580078125, 0.29093170166015625, 0.3106689453125, 0.33040618896484375, 0.3501434326171875, 0.36988067626953125, 0.389617919921875, 0.40935516357421875, 0.4290924072265625, 0.44882965087890625, 0.46856689453125, 0.48830413818359375, 0.5080413818359375, 0.5277786254882812, 0.547515869140625, 0.5672531127929688, 0.5869903564453125, 0.6067276000976562, 0.62646484375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 12.0, 12.0, 18.0, 43.0, 58.0, 102.0, 144.0, 292.0, 558.0, 3330.0, 4179908.0, 8401.0, 637.0, 295.0, 152.0, 86.0, 81.0, 46.0, 23.0, 14.0, 19.0, 6.0, 8.0, 4.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.2984619140625, -10.971923828125, -10.6453857421875, -10.31884765625, -9.9923095703125, -9.665771484375, -9.3392333984375, -9.0126953125, -8.6861572265625, -8.359619140625, -8.0330810546875, -7.70654296875, -7.3800048828125, -7.053466796875, -6.7269287109375, -6.400390625, -6.0738525390625, -5.747314453125, -5.4207763671875, -5.09423828125, -4.7677001953125, -4.441162109375, -4.1146240234375, -3.7880859375, -3.4615478515625, -3.135009765625, -2.8084716796875, -2.48193359375, -2.1553955078125, -1.828857421875, -1.5023193359375, -1.17578125, -0.8492431640625, -0.522705078125, -0.1961669921875, 0.13037109375, 0.4569091796875, 0.783447265625, 1.1099853515625, 1.4365234375, 1.7630615234375, 2.089599609375, 2.4161376953125, 2.74267578125, 3.0692138671875, 3.395751953125, 3.7222900390625, 4.048828125, 4.3753662109375, 4.701904296875, 5.0284423828125, 5.35498046875, 5.6815185546875, 6.008056640625, 6.3345947265625, 6.6611328125, 6.9876708984375, 7.314208984375, 7.6407470703125, 7.96728515625, 8.2938232421875, 8.620361328125, 8.9468994140625, 9.2734375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 12.0, 10.0, 18.0, 21.0, 41.0, 78.0, 106.0, 162.0, 272.0, 403.0, 629.0, 800.0, 555.0, 352.0, 197.0, 135.0, 89.0, 62.0, 36.0, 30.0, 17.0, 8.0, 6.0, 6.0, 7.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.494140625, -0.48091888427734375, -0.4676971435546875, -0.45447540283203125, -0.441253662109375, -0.42803192138671875, -0.4148101806640625, -0.40158843994140625, -0.38836669921875, -0.37514495849609375, -0.3619232177734375, -0.34870147705078125, -0.335479736328125, -0.32225799560546875, -0.3090362548828125, -0.29581451416015625, -0.2825927734375, -0.26937103271484375, -0.2561492919921875, -0.24292755126953125, -0.229705810546875, -0.21648406982421875, -0.2032623291015625, -0.19004058837890625, -0.17681884765625, -0.16359710693359375, -0.1503753662109375, -0.13715362548828125, -0.123931884765625, -0.11071014404296875, -0.0974884033203125, -0.08426666259765625, -0.071044921875, -0.05782318115234375, -0.0446014404296875, -0.03137969970703125, -0.018157958984375, -0.00493621826171875, 0.0082855224609375, 0.02150726318359375, 0.03472900390625, 0.04795074462890625, 0.0611724853515625, 0.07439422607421875, 0.087615966796875, 0.10083770751953125, 0.1140594482421875, 0.12728118896484375, 0.1405029296875, 0.15372467041015625, 0.1669464111328125, 0.18016815185546875, 0.193389892578125, 0.20661163330078125, 0.2198333740234375, 0.23305511474609375, 0.24627685546875, 0.25949859619140625, 0.2727203369140625, 0.28594207763671875, 0.299163818359375, 0.31238555908203125, 0.3256072998046875, 0.33882904052734375, 0.35205078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 15.0, 13.0, 21.0, 18.0, 27.0, 39.0, 36.0, 63.0, 62.0, 80.0, 80.0, 108.0, 79.0, 71.0, 80.0, 66.0, 41.0, 24.0, 29.0, 15.0, 14.0, 11.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1213198900222778, -1.0827076435089111, -1.0440953969955444, -1.0054831504821777, -0.9668708443641663, -0.9282585978507996, -0.8896462917327881, -0.8510340452194214, -0.8124217987060547, -0.773809552192688, -0.7351973056793213, -0.6965849995613098, -0.6579727530479431, -0.6193605065345764, -0.5807482004165649, -0.5421359539031982, -0.5035237073898315, -0.46491146087646484, -0.42629918456077576, -0.38768690824508667, -0.34907466173171997, -0.31046241521835327, -0.2718501389026642, -0.2332378625869751, -0.1946256160736084, -0.1560133546590805, -0.11740109324455261, -0.07878883183002472, -0.040176570415496826, -0.001564309000968933, 0.03704795241355896, 0.07566022872924805, 0.11427247524261475, 0.15288473665714264, 0.19149699807167053, 0.23010925948619843, 0.2687215209007263, 0.307333767414093, 0.3459460437297821, 0.3845583200454712, 0.4231705665588379, 0.4617828130722046, 0.5003950595855713, 0.5390073657035828, 0.5776196122169495, 0.6162318587303162, 0.6548441648483276, 0.6934564113616943, 0.732068657875061, 0.7706809043884277, 0.8092931509017944, 0.8479054570198059, 0.8865177035331726, 0.9251299500465393, 0.9637422561645508, 1.0023545026779175, 1.0409667491912842, 1.0795789957046509, 1.1181912422180176, 1.1568034887313843, 1.195415735244751, 1.2340281009674072, 1.272640347480774, 1.3112525939941406, 1.3498648405075073]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 8.0, 1.0, 5.0, 8.0, 6.0, 6.0, 14.0, 8.0, 13.0, 16.0, 21.0, 16.0, 28.0, 18.0, 34.0, 24.0, 28.0, 18.0, 41.0, 33.0, 39.0, 41.0, 43.0, 44.0, 32.0, 52.0, 40.0, 40.0, 38.0, 31.0, 26.0, 34.0, 25.0, 25.0, 19.0, 20.0, 23.0, 14.0, 13.0, 17.0, 11.0, 4.0, 4.0, 5.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.6490494012832642, -0.6292263269424438, -0.6094032526016235, -0.589580237865448, -0.5697571635246277, -0.5499340891838074, -0.5301110148429871, -0.5102879405021667, -0.4904648959636688, -0.4706418216228485, -0.4508187770843506, -0.4309957027435303, -0.41117262840270996, -0.39134958386421204, -0.3715265095233917, -0.3517034649848938, -0.3318803906440735, -0.3120573163032532, -0.29223427176475525, -0.27241119742393494, -0.252588152885437, -0.2327650785446167, -0.2129420042037964, -0.19311894476413727, -0.17329588532447815, -0.15347282588481903, -0.1336497664451599, -0.1138266921043396, -0.09400363266468048, -0.07418057322502136, -0.05435750633478165, -0.03453443944454193, -0.014711320400238037, 0.00511174276471138, 0.024934805929660797, 0.044757869094610214, 0.06458093225955963, 0.08440399169921875, 0.10422705858945847, 0.12405012547969818, 0.1438731849193573, 0.16369624435901642, 0.18351930379867554, 0.20334237813949585, 0.22316543757915497, 0.2429884970188141, 0.2628115713596344, 0.2826346158981323, 0.30245769023895264, 0.32228076457977295, 0.3421038091182709, 0.3619268834590912, 0.3817499279975891, 0.4015730023384094, 0.42139607667922974, 0.44121915102005005, 0.461042195558548, 0.4808652698993683, 0.5006883144378662, 0.5205113887786865, 0.5403344631195068, 0.5601575374603271, 0.5799805521965027, 0.599803626537323, 0.6196267008781433]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 9.0, 5.0, 6.0, 16.0, 17.0, 34.0, 56.0, 82.0, 109.0, 150.0, 230.0, 293.0, 429.0, 725.0, 1071.0, 1588.0, 2515.0, 4005.0, 6923.0, 12096.0, 21245.0, 39414.0, 74440.0, 136281.0, 217572.0, 218907.0, 139765.0, 76786.0, 40679.0, 22281.0, 12192.0, 7081.0, 4086.0, 2526.0, 1606.0, 1116.0, 753.0, 460.0, 318.0, 236.0, 140.0, 100.0, 87.0, 41.0, 21.0, 16.0, 17.0, 13.0, 4.0, 10.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1796875, -0.17407608032226562, -0.16846466064453125, -0.16285324096679688, -0.1572418212890625, -0.15163040161132812, -0.14601898193359375, -0.14040756225585938, -0.134796142578125, -0.12918472290039062, -0.12357330322265625, -0.11796188354492188, -0.1123504638671875, -0.10673904418945312, -0.10112762451171875, -0.09551620483398438, -0.08990478515625, -0.08429336547851562, -0.07868194580078125, -0.07307052612304688, -0.0674591064453125, -0.061847686767578125, -0.05623626708984375, -0.050624847412109375, -0.045013427734375, -0.039402008056640625, -0.03379058837890625, -0.028179168701171875, -0.0225677490234375, -0.016956329345703125, -0.01134490966796875, -0.005733489990234375, -0.0001220703125, 0.005489349365234375, 0.01110076904296875, 0.016712188720703125, 0.0223236083984375, 0.027935028076171875, 0.03354644775390625, 0.039157867431640625, 0.044769287109375, 0.050380706787109375, 0.05599212646484375, 0.061603546142578125, 0.0672149658203125, 0.07282638549804688, 0.07843780517578125, 0.08404922485351562, 0.08966064453125, 0.09527206420898438, 0.10088348388671875, 0.10649490356445312, 0.1121063232421875, 0.11771774291992188, 0.12332916259765625, 0.12894058227539062, 0.134552001953125, 0.14016342163085938, 0.14577484130859375, 0.15138626098632812, 0.1569976806640625, 0.16260910034179688, 0.16822052001953125, 0.17383193969726562, 0.179443359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 7.0, 3.0, 14.0, 8.0, 10.0, 8.0, 21.0, 16.0, 22.0, 25.0, 35.0, 24.0, 33.0, 26.0, 42.0, 41.0, 39.0, 41.0, 55.0, 54.0, 43.0, 42.0, 43.0, 35.0, 40.0, 33.0, 41.0, 30.0, 28.0, 25.0, 12.0, 20.0, 11.0, 21.0, 10.0, 9.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.59765625, -0.5807571411132812, -0.5638580322265625, -0.5469589233398438, -0.530059814453125, -0.5131607055664062, -0.4962615966796875, -0.47936248779296875, -0.46246337890625, -0.44556427001953125, -0.4286651611328125, -0.41176605224609375, -0.394866943359375, -0.37796783447265625, -0.3610687255859375, -0.34416961669921875, -0.3272705078125, -0.31037139892578125, -0.2934722900390625, -0.27657318115234375, -0.259674072265625, -0.24277496337890625, -0.2258758544921875, -0.20897674560546875, -0.19207763671875, -0.17517852783203125, -0.1582794189453125, -0.14138031005859375, -0.124481201171875, -0.10758209228515625, -0.0906829833984375, -0.07378387451171875, -0.056884765625, -0.03998565673828125, -0.0230865478515625, -0.00618743896484375, 0.010711669921875, 0.02761077880859375, 0.0445098876953125, 0.06140899658203125, 0.07830810546875, 0.09520721435546875, 0.1121063232421875, 0.12900543212890625, 0.145904541015625, 0.16280364990234375, 0.1797027587890625, 0.19660186767578125, 0.2135009765625, 0.23040008544921875, 0.2472991943359375, 0.26419830322265625, 0.281097412109375, 0.29799652099609375, 0.3148956298828125, 0.33179473876953125, 0.34869384765625, 0.36559295654296875, 0.3824920654296875, 0.39939117431640625, 0.416290283203125, 0.43318939208984375, 0.4500885009765625, 0.46698760986328125, 0.48388671875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 4.0, 12.0, 7.0, 15.0, 27.0, 38.0, 60.0, 87.0, 148.0, 239.0, 406.0, 745.0, 1670.0, 4030.0, 11500.0, 39524.0, 177753.0, 507956.0, 231393.0, 50222.0, 14057.0, 4735.0, 1959.0, 860.0, 462.0, 215.0, 154.0, 90.0, 45.0, 41.0, 32.0, 26.0, 10.0, 9.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.50634765625, -0.49170684814453125, -0.4770660400390625, -0.46242523193359375, -0.447784423828125, -0.43314361572265625, -0.4185028076171875, -0.40386199951171875, -0.38922119140625, -0.37458038330078125, -0.3599395751953125, -0.34529876708984375, -0.330657958984375, -0.31601715087890625, -0.3013763427734375, -0.28673553466796875, -0.2720947265625, -0.25745391845703125, -0.2428131103515625, -0.22817230224609375, -0.213531494140625, -0.19889068603515625, -0.1842498779296875, -0.16960906982421875, -0.15496826171875, -0.14032745361328125, -0.1256866455078125, -0.11104583740234375, -0.096405029296875, -0.08176422119140625, -0.0671234130859375, -0.05248260498046875, -0.037841796875, -0.02320098876953125, -0.0085601806640625, 0.00608062744140625, 0.020721435546875, 0.03536224365234375, 0.0500030517578125, 0.06464385986328125, 0.07928466796875, 0.09392547607421875, 0.1085662841796875, 0.12320709228515625, 0.137847900390625, 0.15248870849609375, 0.1671295166015625, 0.18177032470703125, 0.1964111328125, 0.21105194091796875, 0.2256927490234375, 0.24033355712890625, 0.254974365234375, 0.26961517333984375, 0.2842559814453125, 0.29889678955078125, 0.31353759765625, 0.32817840576171875, 0.3428192138671875, 0.35746002197265625, 0.372100830078125, 0.38674163818359375, 0.4013824462890625, 0.41602325439453125, 0.4306640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 10.0, 14.0, 13.0, 19.0, 23.0, 29.0, 22.0, 26.0, 29.0, 28.0, 40.0, 43.0, 38.0, 45.0, 51.0, 43.0, 37.0, 43.0, 41.0, 40.0, 46.0, 31.0, 28.0, 49.0, 39.0, 23.0, 21.0, 17.0, 17.0, 12.0, 15.0, 15.0, 9.0, 7.0, 8.0, 2.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.09613037109375, -1.0614013671875, -1.02667236328125, -0.991943359375, -0.95721435546875, -0.9224853515625, -0.88775634765625, -0.85302734375, -0.81829833984375, -0.7835693359375, -0.74884033203125, -0.714111328125, -0.67938232421875, -0.6446533203125, -0.60992431640625, -0.5751953125, -0.54046630859375, -0.5057373046875, -0.47100830078125, -0.436279296875, -0.40155029296875, -0.3668212890625, -0.33209228515625, -0.29736328125, -0.26263427734375, -0.2279052734375, -0.19317626953125, -0.158447265625, -0.12371826171875, -0.0889892578125, -0.05426025390625, -0.01953125, 0.01519775390625, 0.0499267578125, 0.08465576171875, 0.119384765625, 0.15411376953125, 0.1888427734375, 0.22357177734375, 0.25830078125, 0.29302978515625, 0.3277587890625, 0.36248779296875, 0.397216796875, 0.43194580078125, 0.4666748046875, 0.50140380859375, 0.5361328125, 0.57086181640625, 0.6055908203125, 0.64031982421875, 0.675048828125, 0.70977783203125, 0.7445068359375, 0.77923583984375, 0.81396484375, 0.84869384765625, 0.8834228515625, 0.91815185546875, 0.952880859375, 0.98760986328125, 1.0223388671875, 1.05706787109375, 1.091796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 7.0, 6.0, 13.0, 13.0, 38.0, 59.0, 62.0, 89.0, 143.0, 276.0, 435.0, 895.0, 1504.0, 3869.0, 11100.0, 54077.0, 558284.0, 367872.0, 35222.0, 8386.0, 3085.0, 1400.0, 705.0, 383.0, 237.0, 140.0, 88.0, 45.0, 34.0, 21.0, 21.0, 11.0, 11.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.237060546875, -0.2285614013671875, -0.220062255859375, -0.2115631103515625, -0.20306396484375, -0.1945648193359375, -0.186065673828125, -0.1775665283203125, -0.1690673828125, -0.1605682373046875, -0.152069091796875, -0.1435699462890625, -0.13507080078125, -0.1265716552734375, -0.118072509765625, -0.1095733642578125, -0.10107421875, -0.0925750732421875, -0.084075927734375, -0.0755767822265625, -0.06707763671875, -0.0585784912109375, -0.050079345703125, -0.0415802001953125, -0.0330810546875, -0.0245819091796875, -0.016082763671875, -0.0075836181640625, 0.00091552734375, 0.0094146728515625, 0.017913818359375, 0.0264129638671875, 0.034912109375, 0.0434112548828125, 0.051910400390625, 0.0604095458984375, 0.06890869140625, 0.0774078369140625, 0.085906982421875, 0.0944061279296875, 0.1029052734375, 0.1114044189453125, 0.119903564453125, 0.1284027099609375, 0.13690185546875, 0.1454010009765625, 0.153900146484375, 0.1623992919921875, 0.1708984375, 0.1793975830078125, 0.187896728515625, 0.1963958740234375, 0.20489501953125, 0.2133941650390625, 0.221893310546875, 0.2303924560546875, 0.2388916015625, 0.2473907470703125, 0.255889892578125, 0.2643890380859375, 0.27288818359375, 0.2813873291015625, 0.289886474609375, 0.2983856201171875, 0.306884765625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 6.0, 6.0, 11.0, 16.0, 37.0, 50.0, 75.0, 143.0, 187.0, 163.0, 105.0, 72.0, 45.0, 36.0, 19.0, 13.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001310110092163086, -0.0001268964260816574, -0.00012278184294700623, -0.00011866725981235504, -0.00011455267667770386, -0.00011043809354305267, -0.00010632351040840149, -0.0001022089272737503, -9.809434413909912e-05, -9.397976100444794e-05, -8.986517786979675e-05, -8.575059473514557e-05, -8.163601160049438e-05, -7.75214284658432e-05, -7.340684533119202e-05, -6.929226219654083e-05, -6.517767906188965e-05, -6.106309592723846e-05, -5.694851279258728e-05, -5.2833929657936096e-05, -4.871934652328491e-05, -4.460476338863373e-05, -4.0490180253982544e-05, -3.637559711933136e-05, -3.2261013984680176e-05, -2.8146430850028992e-05, -2.4031847715377808e-05, -1.9917264580726624e-05, -1.580268144607544e-05, -1.1688098311424255e-05, -7.573515176773071e-06, -3.458932042121887e-06, 6.556510925292969e-07, 4.770234227180481e-06, 8.884817361831665e-06, 1.2999400496482849e-05, 1.7113983631134033e-05, 2.1228566765785217e-05, 2.53431499004364e-05, 2.9457733035087585e-05, 3.357231616973877e-05, 3.7686899304389954e-05, 4.180148243904114e-05, 4.591606557369232e-05, 5.0030648708343506e-05, 5.414523184299469e-05, 5.8259814977645874e-05, 6.237439811229706e-05, 6.648898124694824e-05, 7.060356438159943e-05, 7.471814751625061e-05, 7.88327306509018e-05, 8.294731378555298e-05, 8.706189692020416e-05, 9.117648005485535e-05, 9.529106318950653e-05, 9.940564632415771e-05, 0.0001035202294588089, 0.00010763481259346008, 0.00011174939572811127, 0.00011586397886276245, 0.00011997856199741364, 0.00012409314513206482, 0.000128207728266716, 0.0001323223114013672]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 8.0, 2.0, 7.0, 5.0, 4.0, 18.0, 4.0, 16.0, 31.0, 48.0, 80.0, 134.0, 466.0, 2553.0, 29771.0, 938810.0, 71471.0, 3977.0, 693.0, 220.0, 96.0, 35.0, 30.0, 21.0, 12.0, 15.0, 6.0, 3.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.68603515625, -0.6667709350585938, -0.6475067138671875, -0.6282424926757812, -0.608978271484375, -0.5897140502929688, -0.5704498291015625, -0.5511856079101562, -0.53192138671875, -0.5126571655273438, -0.4933929443359375, -0.47412872314453125, -0.454864501953125, -0.43560028076171875, -0.4163360595703125, -0.39707183837890625, -0.3778076171875, -0.35854339599609375, -0.3392791748046875, -0.32001495361328125, -0.300750732421875, -0.28148651123046875, -0.2622222900390625, -0.24295806884765625, -0.22369384765625, -0.20442962646484375, -0.1851654052734375, -0.16590118408203125, -0.146636962890625, -0.12737274169921875, -0.1081085205078125, -0.08884429931640625, -0.069580078125, -0.05031585693359375, -0.0310516357421875, -0.01178741455078125, 0.007476806640625, 0.02674102783203125, 0.0460052490234375, 0.06526947021484375, 0.08453369140625, 0.10379791259765625, 0.1230621337890625, 0.14232635498046875, 0.161590576171875, 0.18085479736328125, 0.2001190185546875, 0.21938323974609375, 0.2386474609375, 0.25791168212890625, 0.2771759033203125, 0.29644012451171875, 0.315704345703125, 0.33496856689453125, 0.3542327880859375, 0.37349700927734375, 0.39276123046875, 0.41202545166015625, 0.4312896728515625, 0.45055389404296875, 0.469818115234375, 0.48908233642578125, 0.5083465576171875, 0.5276107788085938, 0.546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 8.0, 10.0, 15.0, 28.0, 42.0, 55.0, 99.0, 122.0, 132.0, 151.0, 103.0, 74.0, 47.0, 35.0, 17.0, 17.0, 5.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0882568359375, -0.08563899993896484, -0.08302116394042969, -0.08040332794189453, -0.07778549194335938, -0.07516765594482422, -0.07254981994628906, -0.0699319839477539, -0.06731414794921875, -0.0646963119506836, -0.06207847595214844, -0.05946063995361328, -0.056842803955078125, -0.05422496795654297, -0.05160713195800781, -0.048989295959472656, -0.0463714599609375, -0.043753623962402344, -0.04113578796386719, -0.03851795196533203, -0.035900115966796875, -0.03328227996826172, -0.030664443969726562, -0.028046607971191406, -0.02542877197265625, -0.022810935974121094, -0.020193099975585938, -0.01757526397705078, -0.014957427978515625, -0.012339591979980469, -0.009721755981445312, -0.007103919982910156, -0.004486083984375, -0.0018682479858398438, 0.0007495880126953125, 0.0033674240112304688, 0.005985260009765625, 0.008603096008300781, 0.011220932006835938, 0.013838768005371094, 0.01645660400390625, 0.019074440002441406, 0.021692276000976562, 0.02431011199951172, 0.026927947998046875, 0.02954578399658203, 0.03216361999511719, 0.034781455993652344, 0.0373992919921875, 0.040017127990722656, 0.04263496398925781, 0.04525279998779297, 0.047870635986328125, 0.05048847198486328, 0.05310630798339844, 0.055724143981933594, 0.05834197998046875, 0.060959815979003906, 0.06357765197753906, 0.06619548797607422, 0.06881332397460938, 0.07143115997314453, 0.07404899597167969, 0.07666683197021484, 0.07928466796875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 13.0, 23.0, 37.0, 55.0, 68.0, 113.0, 131.0, 131.0, 138.0, 94.0, 69.0, 52.0, 33.0, 15.0, 6.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1161253452301025, -2.0722553730010986, -2.028385639190674, -1.9845157861709595, -1.9406459331512451, -1.8967760801315308, -1.8529062271118164, -1.809036374092102, -1.7651665210723877, -1.7212966680526733, -1.677426815032959, -1.6335569620132446, -1.5896871089935303, -1.545817255973816, -1.5019474029541016, -1.4580775499343872, -1.4142076969146729, -1.3703378438949585, -1.3264679908752441, -1.2825981378555298, -1.2387282848358154, -1.194858431816101, -1.1509885787963867, -1.1071187257766724, -1.0632487535476685, -1.019378900527954, -0.9755090475082397, -0.9316391944885254, -0.887769341468811, -0.8438994884490967, -0.8000296354293823, -0.756159782409668, -0.7122898697853088, -0.6684200167655945, -0.6245501637458801, -0.5806803107261658, -0.5368104577064514, -0.49294060468673706, -0.4490707218647003, -0.40520086884498596, -0.3613310158252716, -0.31746116280555725, -0.2735913097858429, -0.22972144186496735, -0.185851588845253, -0.14198173582553864, -0.09811186790466309, -0.05424201488494873, -0.010372161865234375, 0.03349769487977028, 0.07736755162477493, 0.12123741209506989, 0.16510726511478424, 0.2089771181344986, 0.25284698605537415, 0.2967168390750885, 0.34058669209480286, 0.3844565451145172, 0.42832639813423157, 0.4721962809562683, 0.5160661339759827, 0.559935986995697, 0.6038058400154114, 0.6476756930351257, 0.6915455460548401]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 1.0, 7.0, 5.0, 11.0, 10.0, 13.0, 14.0, 22.0, 19.0, 22.0, 22.0, 31.0, 23.0, 29.0, 28.0, 38.0, 36.0, 42.0, 42.0, 44.0, 35.0, 43.0, 46.0, 41.0, 37.0, 36.0, 37.0, 46.0, 27.0, 19.0, 26.0, 26.0, 18.0, 21.0, 16.0, 12.0, 7.0, 17.0, 6.0, 5.0, 3.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5063486099243164, -0.4902411103248596, -0.47413361072540283, -0.45802611112594604, -0.44191861152648926, -0.42581111192703247, -0.4097035825252533, -0.3935960829257965, -0.3774885833263397, -0.36138108372688293, -0.34527358412742615, -0.32916608452796936, -0.3130585551261902, -0.2969510555267334, -0.2808435559272766, -0.2647360563278198, -0.24862855672836304, -0.23252105712890625, -0.21641355752944946, -0.20030604302883148, -0.1841985434293747, -0.1680910438299179, -0.15198352932929993, -0.13587602972984314, -0.11976853013038635, -0.10366103053092957, -0.08755352348089218, -0.0714460164308548, -0.05533851683139801, -0.03923101723194122, -0.02312351018190384, -0.007016003131866455, 0.009091496467590332, 0.025198999792337418, 0.0413065031170845, 0.05741400644183159, 0.07352150976657867, 0.08962900936603546, 0.10573651641607285, 0.12184402346611023, 0.13795152306556702, 0.1540590226650238, 0.1701665222644806, 0.18627403676509857, 0.20238153636455536, 0.21848903596401215, 0.23459655046463013, 0.2507040500640869, 0.2668115496635437, 0.2829190492630005, 0.2990265488624573, 0.31513404846191406, 0.33124154806137085, 0.34734904766082764, 0.3634565770626068, 0.3795640766620636, 0.3956715762615204, 0.4117790758609772, 0.42788657546043396, 0.44399407505989075, 0.4601016044616699, 0.4762091040611267, 0.4923166036605835, 0.5084241032600403, 0.5245316028594971]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 12.0, 17.0, 23.0, 34.0, 69.0, 96.0, 123.0, 242.0, 424.0, 755.0, 1404.0, 2570.0, 5296.0, 11480.0, 26396.0, 62826.0, 140445.0, 248867.0, 262852.0, 156903.0, 71702.0, 30284.0, 13180.0, 6096.0, 2974.0, 1542.0, 788.0, 445.0, 258.0, 155.0, 109.0, 59.0, 46.0, 21.0, 15.0, 10.0, 12.0, 7.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2737083435058594, -0.26543426513671875, -0.2571601867675781, -0.2488861083984375, -0.24061203002929688, -0.23233795166015625, -0.22406387329101562, -0.215789794921875, -0.20751571655273438, -0.19924163818359375, -0.19096755981445312, -0.1826934814453125, -0.17441940307617188, -0.16614532470703125, -0.15787124633789062, -0.14959716796875, -0.14132308959960938, -0.13304901123046875, -0.12477493286132812, -0.1165008544921875, -0.10822677612304688, -0.09995269775390625, -0.09167861938476562, -0.083404541015625, -0.07513046264648438, -0.06685638427734375, -0.058582305908203125, -0.0503082275390625, -0.042034149169921875, -0.03376007080078125, -0.025485992431640625, -0.0172119140625, -0.008937835693359375, -0.00066375732421875, 0.007610321044921875, 0.0158843994140625, 0.024158477783203125, 0.03243255615234375, 0.040706634521484375, 0.048980712890625, 0.057254791259765625, 0.06552886962890625, 0.07380294799804688, 0.0820770263671875, 0.09035110473632812, 0.09862518310546875, 0.10689926147460938, 0.11517333984375, 0.12344741821289062, 0.13172149658203125, 0.13999557495117188, 0.1482696533203125, 0.15654373168945312, 0.16481781005859375, 0.17309188842773438, 0.181365966796875, 0.18964004516601562, 0.19791412353515625, 0.20618820190429688, 0.2144622802734375, 0.22273635864257812, 0.23101043701171875, 0.23928451538085938, 0.24755859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 9.0, 7.0, 13.0, 10.0, 13.0, 13.0, 13.0, 15.0, 12.0, 18.0, 20.0, 25.0, 23.0, 23.0, 36.0, 34.0, 38.0, 33.0, 55.0, 45.0, 39.0, 44.0, 40.0, 33.0, 39.0, 49.0, 32.0, 38.0, 28.0, 21.0, 32.0, 22.0, 16.0, 22.0, 22.0, 18.0, 9.0, 12.0, 5.0, 3.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.619140625, -2.524749755859375, -2.43035888671875, -2.335968017578125, -2.2415771484375, -2.147186279296875, -2.05279541015625, -1.958404541015625, -1.864013671875, -1.769622802734375, -1.67523193359375, -1.580841064453125, -1.4864501953125, -1.392059326171875, -1.29766845703125, -1.203277587890625, -1.10888671875, -1.014495849609375, -0.92010498046875, -0.825714111328125, -0.7313232421875, -0.636932373046875, -0.54254150390625, -0.448150634765625, -0.353759765625, -0.259368896484375, -0.16497802734375, -0.070587158203125, 0.0238037109375, 0.118194580078125, 0.21258544921875, 0.306976318359375, 0.4013671875, 0.495758056640625, 0.59014892578125, 0.684539794921875, 0.7789306640625, 0.873321533203125, 0.96771240234375, 1.062103271484375, 1.156494140625, 1.250885009765625, 1.34527587890625, 1.439666748046875, 1.5340576171875, 1.628448486328125, 1.72283935546875, 1.817230224609375, 1.91162109375, 2.006011962890625, 2.10040283203125, 2.194793701171875, 2.2891845703125, 2.383575439453125, 2.47796630859375, 2.572357177734375, 2.666748046875, 2.761138916015625, 2.85552978515625, 2.949920654296875, 3.0443115234375, 3.138702392578125, 3.23309326171875, 3.327484130859375, 3.421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 4.0, 5.0, 11.0, 12.0, 19.0, 20.0, 31.0, 46.0, 52.0, 63.0, 73.0, 106.0, 159.0, 231.0, 355.0, 637.0, 2038.0, 42602.0, 887529.0, 109221.0, 3220.0, 783.0, 408.0, 236.0, 162.0, 114.0, 108.0, 66.0, 48.0, 45.0, 48.0, 18.0, 25.0, 18.0, 13.0, 9.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4697265625, -1.425994873046875, -1.38226318359375, -1.338531494140625, -1.2947998046875, -1.251068115234375, -1.20733642578125, -1.163604736328125, -1.119873046875, -1.076141357421875, -1.03240966796875, -0.988677978515625, -0.9449462890625, -0.901214599609375, -0.85748291015625, -0.813751220703125, -0.77001953125, -0.726287841796875, -0.68255615234375, -0.638824462890625, -0.5950927734375, -0.551361083984375, -0.50762939453125, -0.463897705078125, -0.420166015625, -0.376434326171875, -0.33270263671875, -0.288970947265625, -0.2452392578125, -0.201507568359375, -0.15777587890625, -0.114044189453125, -0.0703125, -0.026580810546875, 0.01715087890625, 0.060882568359375, 0.1046142578125, 0.148345947265625, 0.19207763671875, 0.235809326171875, 0.279541015625, 0.323272705078125, 0.36700439453125, 0.410736083984375, 0.4544677734375, 0.498199462890625, 0.54193115234375, 0.585662841796875, 0.62939453125, 0.673126220703125, 0.71685791015625, 0.760589599609375, 0.8043212890625, 0.848052978515625, 0.89178466796875, 0.935516357421875, 0.979248046875, 1.022979736328125, 1.06671142578125, 1.110443115234375, 1.1541748046875, 1.197906494140625, 1.24163818359375, 1.285369873046875, 1.3291015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 9.0, 8.0, 8.0, 18.0, 23.0, 22.0, 21.0, 21.0, 31.0, 39.0, 32.0, 49.0, 53.0, 51.0, 76.0, 48.0, 40.0, 66.0, 61.0, 53.0, 48.0, 33.0, 36.0, 33.0, 23.0, 15.0, 20.0, 19.0, 6.0, 8.0, 10.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.923828125, -3.8067626953125, -3.689697265625, -3.5726318359375, -3.45556640625, -3.3385009765625, -3.221435546875, -3.1043701171875, -2.9873046875, -2.8702392578125, -2.753173828125, -2.6361083984375, -2.51904296875, -2.4019775390625, -2.284912109375, -2.1678466796875, -2.05078125, -1.9337158203125, -1.816650390625, -1.6995849609375, -1.58251953125, -1.4654541015625, -1.348388671875, -1.2313232421875, -1.1142578125, -0.9971923828125, -0.880126953125, -0.7630615234375, -0.64599609375, -0.5289306640625, -0.411865234375, -0.2947998046875, -0.177734375, -0.0606689453125, 0.056396484375, 0.1734619140625, 0.29052734375, 0.4075927734375, 0.524658203125, 0.6417236328125, 0.7587890625, 0.8758544921875, 0.992919921875, 1.1099853515625, 1.22705078125, 1.3441162109375, 1.461181640625, 1.5782470703125, 1.6953125, 1.8123779296875, 1.929443359375, 2.0465087890625, 2.16357421875, 2.2806396484375, 2.397705078125, 2.5147705078125, 2.6318359375, 2.7489013671875, 2.865966796875, 2.9830322265625, 3.10009765625, 3.2171630859375, 3.334228515625, 3.4512939453125, 3.568359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 7.0, 17.0, 39.0, 58.0, 189.0, 876.0, 22212.0, 1019943.0, 4556.0, 410.0, 117.0, 58.0, 27.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0], "bins": [-1.23828125, -1.2115440368652344, -1.1848068237304688, -1.1580696105957031, -1.1313323974609375, -1.1045951843261719, -1.0778579711914062, -1.0511207580566406, -1.024383544921875, -0.9976463317871094, -0.9709091186523438, -0.9441719055175781, -0.9174346923828125, -0.8906974792480469, -0.8639602661132812, -0.8372230529785156, -0.81048583984375, -0.7837486267089844, -0.7570114135742188, -0.7302742004394531, -0.7035369873046875, -0.6767997741699219, -0.6500625610351562, -0.6233253479003906, -0.596588134765625, -0.5698509216308594, -0.5431137084960938, -0.5163764953613281, -0.4896392822265625, -0.4629020690917969, -0.43616485595703125, -0.4094276428222656, -0.3826904296875, -0.3559532165527344, -0.32921600341796875, -0.3024787902832031, -0.2757415771484375, -0.24900436401367188, -0.22226715087890625, -0.19552993774414062, -0.168792724609375, -0.14205551147460938, -0.11531829833984375, -0.08858108520507812, -0.0618438720703125, -0.035106658935546875, -0.00836944580078125, 0.018367767333984375, 0.04510498046875, 0.07184219360351562, 0.09857940673828125, 0.12531661987304688, 0.1520538330078125, 0.17879104614257812, 0.20552825927734375, 0.23226547241210938, 0.259002685546875, 0.2857398986816406, 0.31247711181640625, 0.3392143249511719, 0.3659515380859375, 0.3926887512207031, 0.41942596435546875, 0.4461631774902344, 0.472900390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 14.0, 13.0, 24.0, 28.0, 71.0, 127.0, 204.0, 171.0, 135.0, 87.0, 38.0, 29.0, 14.0, 12.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11732292175293e-05, -3.002304583787918e-05, -2.8872862458229065e-05, -2.772267907857895e-05, -2.6572495698928833e-05, -2.5422312319278717e-05, -2.42721289396286e-05, -2.3121945559978485e-05, -2.197176218032837e-05, -2.0821578800678253e-05, -1.9671395421028137e-05, -1.852121204137802e-05, -1.7371028661727905e-05, -1.622084528207779e-05, -1.5070661902427673e-05, -1.3920478522777557e-05, -1.2770295143127441e-05, -1.1620111763477325e-05, -1.046992838382721e-05, -9.319745004177094e-06, -8.169561624526978e-06, -7.0193782448768616e-06, -5.869194865226746e-06, -4.71901148557663e-06, -3.5688281059265137e-06, -2.4186447262763977e-06, -1.2684613466262817e-06, -1.1827796697616577e-07, 1.0319054126739502e-06, 2.182088792324066e-06, 3.332272171974182e-06, 4.482455551624298e-06, 5.632638931274414e-06, 6.78282231092453e-06, 7.933005690574646e-06, 9.083189070224762e-06, 1.0233372449874878e-05, 1.1383555829524994e-05, 1.253373920917511e-05, 1.3683922588825226e-05, 1.4834105968475342e-05, 1.5984289348125458e-05, 1.7134472727775574e-05, 1.828465610742569e-05, 1.9434839487075806e-05, 2.058502286672592e-05, 2.1735206246376038e-05, 2.2885389626026154e-05, 2.403557300567627e-05, 2.5185756385326385e-05, 2.63359397649765e-05, 2.7486123144626617e-05, 2.8636306524276733e-05, 2.978648990392685e-05, 3.0936673283576965e-05, 3.208685666322708e-05, 3.32370400428772e-05, 3.438722342252731e-05, 3.553740680217743e-05, 3.6687590181827545e-05, 3.783777356147766e-05, 3.898795694112778e-05, 4.013814032077789e-05, 4.128832370042801e-05, 4.2438507080078125e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 10.0, 24.0, 47.0, 89.0, 209.0, 579.0, 2250.0, 27613.0, 930038.0, 82672.0, 3665.0, 813.0, 282.0, 141.0, 58.0, 31.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276611328125, -0.2666015625, -0.256591796875, -0.24658203125, -0.236572265625, -0.2265625, -0.216552734375, -0.20654296875, -0.196533203125, -0.1865234375, -0.176513671875, -0.16650390625, -0.156494140625, -0.146484375, -0.136474609375, -0.12646484375, -0.116455078125, -0.1064453125, -0.096435546875, -0.08642578125, -0.076416015625, -0.06640625, -0.056396484375, -0.04638671875, -0.036376953125, -0.0263671875, -0.016357421875, -0.00634765625, 0.003662109375, 0.013671875, 0.023681640625, 0.03369140625, 0.043701171875, 0.0537109375, 0.063720703125, 0.07373046875, 0.083740234375, 0.09375, 0.103759765625, 0.11376953125, 0.123779296875, 0.1337890625, 0.143798828125, 0.15380859375, 0.163818359375, 0.173828125, 0.183837890625, 0.19384765625, 0.203857421875, 0.2138671875, 0.223876953125, 0.23388671875, 0.243896484375, 0.25390625, 0.263916015625, 0.27392578125, 0.283935546875, 0.2939453125, 0.303955078125, 0.31396484375, 0.323974609375, 0.333984375, 0.343994140625, 0.35400390625, 0.364013671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 9.0, 10.0, 17.0, 27.0, 41.0, 69.0, 92.0, 161.0, 162.0, 129.0, 90.0, 60.0, 47.0, 33.0, 19.0, 12.0, 10.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06884765625, -0.06624126434326172, -0.06363487243652344, -0.061028480529785156, -0.058422088623046875, -0.055815696716308594, -0.05320930480957031, -0.05060291290283203, -0.04799652099609375, -0.04539012908935547, -0.04278373718261719, -0.040177345275878906, -0.037570953369140625, -0.034964561462402344, -0.03235816955566406, -0.02975177764892578, -0.0271453857421875, -0.02453899383544922, -0.021932601928710938, -0.019326210021972656, -0.016719818115234375, -0.014113426208496094, -0.011507034301757812, -0.008900642395019531, -0.00629425048828125, -0.0036878585815429688, -0.0010814666748046875, 0.0015249252319335938, 0.004131317138671875, 0.006737709045410156, 0.009344100952148438, 0.011950492858886719, 0.014556884765625, 0.01716327667236328, 0.019769668579101562, 0.022376060485839844, 0.024982452392578125, 0.027588844299316406, 0.030195236206054688, 0.03280162811279297, 0.03540802001953125, 0.03801441192626953, 0.04062080383300781, 0.043227195739746094, 0.045833587646484375, 0.048439979553222656, 0.05104637145996094, 0.05365276336669922, 0.0562591552734375, 0.05886554718017578, 0.06147193908691406, 0.06407833099365234, 0.06668472290039062, 0.0692911148071289, 0.07189750671386719, 0.07450389862060547, 0.07711029052734375, 0.07971668243408203, 0.08232307434082031, 0.0849294662475586, 0.08753585815429688, 0.09014225006103516, 0.09274864196777344, 0.09535503387451172, 0.09796142578125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 66.0, 346.0, 456.0, 130.0, 15.0], "bins": [-17.658966064453125, -17.370206832885742, -17.08144760131836, -16.792688369750977, -16.503929138183594, -16.21516990661621, -15.926409721374512, -15.637650489807129, -15.348891258239746, -15.060132026672363, -14.77137279510498, -14.482613563537598, -14.193853378295898, -13.905094146728516, -13.616334915161133, -13.32757568359375, -13.038816452026367, -12.750057220458984, -12.461297988891602, -12.172538757324219, -11.883779525756836, -11.595019340515137, -11.306260108947754, -11.017500877380371, -10.728741645812988, -10.439982414245605, -10.151223182678223, -9.86246395111084, -9.57370376586914, -9.284944534301758, -8.996185302734375, -8.707426071166992, -8.41866683959961, -8.129907608032227, -7.841148376464844, -7.552388668060303, -7.26362943649292, -6.974870204925537, -6.686110496520996, -6.397351264953613, -6.1085920333862305, -5.819832801818848, -5.531073570251465, -5.242313861846924, -4.953554630279541, -4.664795398712158, -4.376035690307617, -4.087276458740234, -3.7985169887542725, -3.5097575187683105, -3.2209982872009277, -2.932239055633545, -2.643479585647583, -2.354720115661621, -2.0659608840942383, -1.7772014141082764, -1.4884421825408936, -1.1996828317642212, -0.9109234809875488, -0.6221641302108765, -0.3334047794342041, -0.04464542865753174, 0.24411392211914062, 0.5328733921051025, 0.8216326236724854]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 5.0, 6.0, 6.0, 6.0, 15.0, 14.0, 12.0, 17.0, 22.0, 20.0, 23.0, 19.0, 34.0, 28.0, 33.0, 47.0, 38.0, 39.0, 36.0, 48.0, 39.0, 38.0, 34.0, 58.0, 37.0, 42.0, 42.0, 34.0, 26.0, 26.0, 20.0, 24.0, 19.0, 9.0, 12.0, 14.0, 11.0, 6.0, 10.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.449974060058594, -4.299516201019287, -4.149057865142822, -3.9986000061035156, -3.84814190864563, -3.697683811187744, -3.5472257137298584, -3.3967676162719727, -3.246309757232666, -3.0958516597747803, -2.9453935623168945, -2.794935703277588, -2.644477605819702, -2.4940195083618164, -2.3435614109039307, -2.193103313446045, -2.042645215988159, -1.8921871185302734, -1.7417291402816772, -1.5912710428237915, -1.4408130645751953, -1.2903549671173096, -1.1398968696594238, -0.9894388914108276, -0.8389807939529419, -0.6885227560997009, -0.53806471824646, -0.3876066207885742, -0.23714858293533325, -0.08669054508209229, 0.06376755237579346, 0.21422553062438965, 0.3646836280822754, 0.5151416659355164, 0.6655997037887573, 0.8160578012466431, 0.966515839099884, 1.116973876953125, 1.2674319744110107, 1.417889952659607, 1.5683480501174927, 1.7188061475753784, 1.8692641258239746, 2.0197222232818604, 2.170180320739746, 2.3206381797790527, 2.4710965156555176, 2.621554374694824, 2.77201247215271, 2.9224705696105957, 3.0729286670684814, 3.223386764526367, 3.373844623565674, 3.5243027210235596, 3.6747608184814453, 3.825218677520752, 3.975677013397217, 4.126134872436523, 4.276593208312988, 4.427051067352295, 4.57750940322876, 4.727967262268066, 4.878425598144531, 5.028883457183838, 5.1793413162231445]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 7.0, 6.0, 6.0, 15.0, 16.0, 18.0, 29.0, 25.0, 40.0, 40.0, 70.0, 91.0, 247.0, 596.0, 2475.0, 14879.0, 148877.0, 1357820.0, 2232344.0, 393235.0, 35922.0, 5223.0, 1340.0, 440.0, 177.0, 94.0, 65.0, 42.0, 28.0, 22.0, 24.0, 9.0, 9.0, 9.0, 12.0, 6.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.0587310791015625, -1.019805908203125, -0.9808807373046875, -0.94195556640625, -0.9030303955078125, -0.864105224609375, -0.8251800537109375, -0.7862548828125, -0.7473297119140625, -0.708404541015625, -0.6694793701171875, -0.63055419921875, -0.5916290283203125, -0.552703857421875, -0.5137786865234375, -0.474853515625, -0.4359283447265625, -0.397003173828125, -0.3580780029296875, -0.31915283203125, -0.2802276611328125, -0.241302490234375, -0.2023773193359375, -0.1634521484375, -0.1245269775390625, -0.085601806640625, -0.0466766357421875, -0.00775146484375, 0.0311737060546875, 0.070098876953125, 0.1090240478515625, 0.14794921875, 0.1868743896484375, 0.225799560546875, 0.2647247314453125, 0.30364990234375, 0.3425750732421875, 0.381500244140625, 0.4204254150390625, 0.4593505859375, 0.4982757568359375, 0.537200927734375, 0.5761260986328125, 0.61505126953125, 0.6539764404296875, 0.692901611328125, 0.7318267822265625, 0.770751953125, 0.8096771240234375, 0.848602294921875, 0.8875274658203125, 0.92645263671875, 0.9653778076171875, 1.004302978515625, 1.0432281494140625, 1.0821533203125, 1.1210784912109375, 1.160003662109375, 1.1989288330078125, 1.23785400390625, 1.2767791748046875, 1.315704345703125, 1.3546295166015625, 1.3935546875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 8.0, 3.0, 3.0, 11.0, 10.0, 16.0, 20.0, 25.0, 19.0, 28.0, 25.0, 38.0, 44.0, 45.0, 31.0, 57.0, 49.0, 52.0, 55.0, 50.0, 45.0, 51.0, 40.0, 45.0, 32.0, 25.0, 25.0, 29.0, 22.0, 19.0, 15.0, 10.0, 4.0, 18.0, 7.0, 2.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7939453125, -0.7706146240234375, -0.747283935546875, -0.7239532470703125, -0.70062255859375, -0.6772918701171875, -0.653961181640625, -0.6306304931640625, -0.6072998046875, -0.5839691162109375, -0.560638427734375, -0.5373077392578125, -0.51397705078125, -0.4906463623046875, -0.467315673828125, -0.4439849853515625, -0.420654296875, -0.3973236083984375, -0.373992919921875, -0.3506622314453125, -0.32733154296875, -0.3040008544921875, -0.280670166015625, -0.2573394775390625, -0.2340087890625, -0.2106781005859375, -0.187347412109375, -0.1640167236328125, -0.14068603515625, -0.1173553466796875, -0.094024658203125, -0.0706939697265625, -0.04736328125, -0.0240325927734375, -0.000701904296875, 0.0226287841796875, 0.04595947265625, 0.0692901611328125, 0.092620849609375, 0.1159515380859375, 0.1392822265625, 0.1626129150390625, 0.185943603515625, 0.2092742919921875, 0.23260498046875, 0.2559356689453125, 0.279266357421875, 0.3025970458984375, 0.325927734375, 0.3492584228515625, 0.372589111328125, 0.3959197998046875, 0.41925048828125, 0.4425811767578125, 0.465911865234375, 0.4892425537109375, 0.5125732421875, 0.5359039306640625, 0.559234619140625, 0.5825653076171875, 0.60589599609375, 0.6292266845703125, 0.652557373046875, 0.6758880615234375, 0.69921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 9.0, 5.0, 9.0, 9.0, 11.0, 20.0, 39.0, 114.0, 361.0, 1321101.0, 2871961.0, 385.0, 89.0, 40.0, 26.0, 19.0, 15.0, 7.0, 9.0, 4.0, 5.0, 5.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.59375, -14.1231689453125, -13.652587890625, -13.1820068359375, -12.71142578125, -12.2408447265625, -11.770263671875, -11.2996826171875, -10.8291015625, -10.3585205078125, -9.887939453125, -9.4173583984375, -8.94677734375, -8.4761962890625, -8.005615234375, -7.5350341796875, -7.064453125, -6.5938720703125, -6.123291015625, -5.6527099609375, -5.18212890625, -4.7115478515625, -4.240966796875, -3.7703857421875, -3.2998046875, -2.8292236328125, -2.358642578125, -1.8880615234375, -1.41748046875, -0.9468994140625, -0.476318359375, -0.0057373046875, 0.46484375, 0.9354248046875, 1.406005859375, 1.8765869140625, 2.34716796875, 2.8177490234375, 3.288330078125, 3.7589111328125, 4.2294921875, 4.7000732421875, 5.170654296875, 5.6412353515625, 6.11181640625, 6.5823974609375, 7.052978515625, 7.5235595703125, 7.994140625, 8.4647216796875, 8.935302734375, 9.4058837890625, 9.87646484375, 10.3470458984375, 10.817626953125, 11.2882080078125, 11.7587890625, 12.2293701171875, 12.699951171875, 13.1705322265625, 13.64111328125, 14.1116943359375, 14.582275390625, 15.0528564453125, 15.5234375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 10.0, 16.0, 16.0, 19.0, 33.0, 55.0, 89.0, 114.0, 164.0, 265.0, 390.0, 535.0, 607.0, 531.0, 405.0, 281.0, 178.0, 128.0, 71.0, 61.0, 29.0, 21.0, 14.0, 14.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.413330078125, -0.4025993347167969, -0.39186859130859375, -0.3811378479003906, -0.3704071044921875, -0.3596763610839844, -0.34894561767578125, -0.3382148742675781, -0.327484130859375, -0.3167533874511719, -0.30602264404296875, -0.2952919006347656, -0.2845611572265625, -0.2738304138183594, -0.26309967041015625, -0.2523689270019531, -0.24163818359375, -0.23090744018554688, -0.22017669677734375, -0.20944595336914062, -0.1987152099609375, -0.18798446655273438, -0.17725372314453125, -0.16652297973632812, -0.155792236328125, -0.14506149291992188, -0.13433074951171875, -0.12360000610351562, -0.1128692626953125, -0.10213851928710938, -0.09140777587890625, -0.08067703247070312, -0.0699462890625, -0.059215545654296875, -0.04848480224609375, -0.037754058837890625, -0.0270233154296875, -0.016292572021484375, -0.00556182861328125, 0.005168914794921875, 0.015899658203125, 0.026630401611328125, 0.03736114501953125, 0.048091888427734375, 0.0588226318359375, 0.06955337524414062, 0.08028411865234375, 0.09101486206054688, 0.10174560546875, 0.11247634887695312, 0.12320709228515625, 0.13393783569335938, 0.1446685791015625, 0.15539932250976562, 0.16613006591796875, 0.17686080932617188, 0.187591552734375, 0.19832229614257812, 0.20905303955078125, 0.21978378295898438, 0.2305145263671875, 0.24124526977539062, 0.25197601318359375, 0.2627067565917969, 0.2734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 6.0, 11.0, 9.0, 12.0, 19.0, 19.0, 19.0, 28.0, 45.0, 56.0, 63.0, 63.0, 88.0, 78.0, 99.0, 63.0, 73.0, 66.0, 52.0, 39.0, 27.0, 21.0, 13.0, 7.0, 14.0, 5.0, 5.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0], "bins": [-1.4711329936981201, -1.438071370124817, -1.4050097465515137, -1.3719481229782104, -1.3388864994049072, -1.3058249950408936, -1.2727633714675903, -1.239701747894287, -1.2066401243209839, -1.1735785007476807, -1.1405168771743774, -1.1074552536010742, -1.0743937492370605, -1.0413321256637573, -1.008270502090454, -0.9752088785171509, -0.9421472549438477, -0.9090856313705444, -0.8760240077972412, -0.8429624438285828, -0.8099008202552795, -0.7768391966819763, -0.7437776327133179, -0.7107160091400146, -0.6776543855667114, -0.6445927619934082, -0.611531138420105, -0.5784695744514465, -0.5454079508781433, -0.5123463273048401, -0.47928473353385925, -0.4462231397628784, -0.41316157579421997, -0.38009995222091675, -0.3470383584499359, -0.3139767646789551, -0.28091514110565186, -0.24785353243350983, -0.2147919237613678, -0.18173031508922577, -0.14866870641708374, -0.11560709774494171, -0.08254548907279968, -0.049483880400657654, -0.016422271728515625, 0.016639336943626404, 0.04970094561576843, 0.08276255428791046, 0.11582416296005249, 0.14888577163219452, 0.18194738030433655, 0.21500898897647858, 0.2480705976486206, 0.28113222122192383, 0.31419381499290466, 0.3472554087638855, 0.3803170323371887, 0.41337865591049194, 0.4464402496814728, 0.4795018434524536, 0.5125634670257568, 0.5456250905990601, 0.5786867141723633, 0.6117482781410217, 0.644809901714325]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 4.0, 10.0, 6.0, 11.0, 13.0, 24.0, 29.0, 46.0, 32.0, 38.0, 25.0, 32.0, 37.0, 39.0, 42.0, 47.0, 46.0, 34.0, 52.0, 42.0, 36.0, 36.0, 45.0, 30.0, 29.0, 26.0, 22.0, 28.0, 22.0, 11.0, 9.0, 12.0, 11.0, 11.0, 15.0, 10.0, 3.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6389943957328796, -0.6174085736274719, -0.595822811126709, -0.5742369890213013, -0.5526511669158936, -0.5310653448104858, -0.5094795823097229, -0.4878937602043152, -0.46630796790122986, -0.44472217559814453, -0.4231363534927368, -0.4015505611896515, -0.37996476888656616, -0.35837894678115845, -0.3367931544780731, -0.3152073621749878, -0.2936215400695801, -0.27203574776649475, -0.25044992566108704, -0.2288641333580017, -0.2072783261537552, -0.18569251894950867, -0.16410672664642334, -0.14252091944217682, -0.1209351122379303, -0.09934930503368378, -0.07776350528001785, -0.05617770552635193, -0.03459189832210541, -0.013006091117858887, 0.00857970118522644, 0.03016550838947296, 0.05175137519836426, 0.07333718240261078, 0.0949229821562767, 0.11650878190994263, 0.13809458911418915, 0.15968039631843567, 0.181266188621521, 0.20285199582576752, 0.22443780303001404, 0.24602361023426056, 0.2676094174385071, 0.2891952097415924, 0.31078100204467773, 0.33236682415008545, 0.3539526164531708, 0.3755384087562561, 0.3971242308616638, 0.41871002316474915, 0.44029584527015686, 0.4618816375732422, 0.4834674596786499, 0.5050532817840576, 0.5266390442848206, 0.5482248663902283, 0.5698106288909912, 0.5913964509963989, 0.6129822134971619, 0.6345680356025696, 0.6561538577079773, 0.6777396202087402, 0.699325442314148, 0.7209112644195557, 0.7424970865249634]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 12.0, 17.0, 30.0, 39.0, 64.0, 100.0, 136.0, 239.0, 307.0, 505.0, 878.0, 1387.0, 2150.0, 3117.0, 5291.0, 10089.0, 22455.0, 60271.0, 164604.0, 326735.0, 265481.0, 110207.0, 39574.0, 15703.0, 7578.0, 4214.0, 2555.0, 1719.0, 1047.0, 726.0, 467.0, 288.0, 190.0, 150.0, 77.0, 63.0, 28.0, 23.0, 15.0, 9.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.267822265625, -0.26033973693847656, -0.2528572082519531, -0.2453746795654297, -0.23789215087890625, -0.2304096221923828, -0.22292709350585938, -0.21544456481933594, -0.2079620361328125, -0.20047950744628906, -0.19299697875976562, -0.1855144500732422, -0.17803192138671875, -0.1705493927001953, -0.16306686401367188, -0.15558433532714844, -0.148101806640625, -0.14061927795410156, -0.13313674926757812, -0.1256542205810547, -0.11817169189453125, -0.11068916320800781, -0.10320663452148438, -0.09572410583496094, -0.0882415771484375, -0.08075904846191406, -0.07327651977539062, -0.06579399108886719, -0.05831146240234375, -0.05082893371582031, -0.043346405029296875, -0.03586387634277344, -0.02838134765625, -0.020898818969726562, -0.013416290283203125, -0.0059337615966796875, 0.00154876708984375, 0.009031295776367188, 0.016513824462890625, 0.023996353149414062, 0.0314788818359375, 0.03896141052246094, 0.046443939208984375, 0.05392646789550781, 0.06140899658203125, 0.06889152526855469, 0.07637405395507812, 0.08385658264160156, 0.091339111328125, 0.09882164001464844, 0.10630416870117188, 0.11378669738769531, 0.12126922607421875, 0.1287517547607422, 0.13623428344726562, 0.14371681213378906, 0.1511993408203125, 0.15868186950683594, 0.16616439819335938, 0.1736469268798828, 0.18112945556640625, 0.1886119842529297, 0.19609451293945312, 0.20357704162597656, 0.2110595703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 8.0, 7.0, 13.0, 20.0, 14.0, 35.0, 35.0, 35.0, 42.0, 43.0, 39.0, 48.0, 52.0, 53.0, 52.0, 50.0, 49.0, 46.0, 45.0, 43.0, 40.0, 42.0, 34.0, 19.0, 22.0, 17.0, 15.0, 9.0, 15.0, 14.0, 14.0, 6.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5244140625, -0.507568359375, -0.49072265625, -0.473876953125, -0.45703125, -0.440185546875, -0.42333984375, -0.406494140625, -0.3896484375, -0.372802734375, -0.35595703125, -0.339111328125, -0.322265625, -0.305419921875, -0.28857421875, -0.271728515625, -0.2548828125, -0.238037109375, -0.22119140625, -0.204345703125, -0.1875, -0.170654296875, -0.15380859375, -0.136962890625, -0.1201171875, -0.103271484375, -0.08642578125, -0.069580078125, -0.052734375, -0.035888671875, -0.01904296875, -0.002197265625, 0.0146484375, 0.031494140625, 0.04833984375, 0.065185546875, 0.08203125, 0.098876953125, 0.11572265625, 0.132568359375, 0.1494140625, 0.166259765625, 0.18310546875, 0.199951171875, 0.216796875, 0.233642578125, 0.25048828125, 0.267333984375, 0.2841796875, 0.301025390625, 0.31787109375, 0.334716796875, 0.3515625, 0.368408203125, 0.38525390625, 0.402099609375, 0.4189453125, 0.435791015625, 0.45263671875, 0.469482421875, 0.486328125, 0.503173828125, 0.52001953125, 0.536865234375, 0.5537109375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 10.0, 7.0, 10.0, 10.0, 27.0, 30.0, 49.0, 111.0, 145.0, 255.0, 470.0, 848.0, 1604.0, 3347.0, 8876.0, 35969.0, 189382.0, 527467.0, 220371.0, 42243.0, 10050.0, 3637.0, 1695.0, 869.0, 423.0, 247.0, 140.0, 86.0, 46.0, 40.0, 24.0, 20.0, 8.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.451934814453125, -0.43804931640625, -0.424163818359375, -0.4102783203125, -0.396392822265625, -0.38250732421875, -0.368621826171875, -0.354736328125, -0.340850830078125, -0.32696533203125, -0.313079833984375, -0.2991943359375, -0.285308837890625, -0.27142333984375, -0.257537841796875, -0.24365234375, -0.229766845703125, -0.21588134765625, -0.201995849609375, -0.1881103515625, -0.174224853515625, -0.16033935546875, -0.146453857421875, -0.132568359375, -0.118682861328125, -0.10479736328125, -0.090911865234375, -0.0770263671875, -0.063140869140625, -0.04925537109375, -0.035369873046875, -0.021484375, -0.007598876953125, 0.00628662109375, 0.020172119140625, 0.0340576171875, 0.047943115234375, 0.06182861328125, 0.075714111328125, 0.089599609375, 0.103485107421875, 0.11737060546875, 0.131256103515625, 0.1451416015625, 0.159027099609375, 0.17291259765625, 0.186798095703125, 0.20068359375, 0.214569091796875, 0.22845458984375, 0.242340087890625, 0.2562255859375, 0.270111083984375, 0.28399658203125, 0.297882080078125, 0.311767578125, 0.325653076171875, 0.33953857421875, 0.353424072265625, 0.3673095703125, 0.381195068359375, 0.39508056640625, 0.408966064453125, 0.4228515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 9.0, 7.0, 11.0, 14.0, 12.0, 19.0, 20.0, 18.0, 26.0, 23.0, 39.0, 36.0, 33.0, 36.0, 49.0, 41.0, 47.0, 34.0, 58.0, 44.0, 43.0, 45.0, 25.0, 50.0, 28.0, 35.0, 29.0, 29.0, 19.0, 15.0, 14.0, 18.0, 13.0, 7.0, 6.0, 4.0, 12.0, 5.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.86865234375, -0.8400039672851562, -0.8113555908203125, -0.7827072143554688, -0.754058837890625, -0.7254104614257812, -0.6967620849609375, -0.6681137084960938, -0.63946533203125, -0.6108169555664062, -0.5821685791015625, -0.5535202026367188, -0.524871826171875, -0.49622344970703125, -0.4675750732421875, -0.43892669677734375, -0.4102783203125, -0.38162994384765625, -0.3529815673828125, -0.32433319091796875, -0.295684814453125, -0.26703643798828125, -0.2383880615234375, -0.20973968505859375, -0.18109130859375, -0.15244293212890625, -0.1237945556640625, -0.09514617919921875, -0.066497802734375, -0.03784942626953125, -0.0092010498046875, 0.01944732666015625, 0.048095703125, 0.07674407958984375, 0.1053924560546875, 0.13404083251953125, 0.162689208984375, 0.19133758544921875, 0.2199859619140625, 0.24863433837890625, 0.27728271484375, 0.30593109130859375, 0.3345794677734375, 0.36322784423828125, 0.391876220703125, 0.42052459716796875, 0.4491729736328125, 0.47782135009765625, 0.5064697265625, 0.5351181030273438, 0.5637664794921875, 0.5924148559570312, 0.621063232421875, 0.6497116088867188, 0.6783599853515625, 0.7070083618164062, 0.73565673828125, 0.7643051147460938, 0.7929534912109375, 0.8216018676757812, 0.850250244140625, 0.8788986206054688, 0.9075469970703125, 0.9361953735351562, 0.96484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 12.0, 6.0, 17.0, 26.0, 51.0, 88.0, 149.0, 318.0, 713.0, 1737.0, 4993.0, 18363.0, 180838.0, 748316.0, 75269.0, 11696.0, 3567.0, 1350.0, 533.0, 220.0, 111.0, 75.0, 42.0, 20.0, 17.0, 9.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.221923828125, -0.21564483642578125, -0.2093658447265625, -0.20308685302734375, -0.196807861328125, -0.19052886962890625, -0.1842498779296875, -0.17797088623046875, -0.17169189453125, -0.16541290283203125, -0.1591339111328125, -0.15285491943359375, -0.146575927734375, -0.14029693603515625, -0.1340179443359375, -0.12773895263671875, -0.1214599609375, -0.11518096923828125, -0.1089019775390625, -0.10262298583984375, -0.096343994140625, -0.09006500244140625, -0.0837860107421875, -0.07750701904296875, -0.07122802734375, -0.06494903564453125, -0.0586700439453125, -0.05239105224609375, -0.046112060546875, -0.03983306884765625, -0.0335540771484375, -0.02727508544921875, -0.02099609375, -0.01471710205078125, -0.0084381103515625, -0.00215911865234375, 0.004119873046875, 0.01039886474609375, 0.0166778564453125, 0.02295684814453125, 0.02923583984375, 0.03551483154296875, 0.0417938232421875, 0.04807281494140625, 0.054351806640625, 0.06063079833984375, 0.0669097900390625, 0.07318878173828125, 0.0794677734375, 0.08574676513671875, 0.0920257568359375, 0.09830474853515625, 0.104583740234375, 0.11086273193359375, 0.1171417236328125, 0.12342071533203125, 0.12969970703125, 0.13597869873046875, 0.1422576904296875, 0.14853668212890625, 0.154815673828125, 0.16109466552734375, 0.1673736572265625, 0.17365264892578125, 0.179931640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 13.0, 24.0, 62.0, 122.0, 216.0, 232.0, 155.0, 74.0, 37.0, 21.0, 11.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.101629257202148e-05, -8.740182965993881e-05, -8.378736674785614e-05, -8.017290383577347e-05, -7.65584409236908e-05, -7.294397801160812e-05, -6.932951509952545e-05, -6.571505218744278e-05, -6.210058927536011e-05, -5.8486126363277435e-05, -5.487166345119476e-05, -5.125720053911209e-05, -4.764273762702942e-05, -4.402827471494675e-05, -4.0413811802864075e-05, -3.67993488907814e-05, -3.318488597869873e-05, -2.957042306661606e-05, -2.5955960154533386e-05, -2.2341497242450714e-05, -1.8727034330368042e-05, -1.511257141828537e-05, -1.1498108506202698e-05, -7.883645594120026e-06, -4.2691826820373535e-06, -6.547197699546814e-07, 2.9597431421279907e-06, 6.574206054210663e-06, 1.0188668966293335e-05, 1.3803131878376007e-05, 1.741759479045868e-05, 2.103205770254135e-05, 2.4646520614624023e-05, 2.8260983526706696e-05, 3.187544643878937e-05, 3.548990935087204e-05, 3.910437226295471e-05, 4.2718835175037384e-05, 4.6333298087120056e-05, 4.994776099920273e-05, 5.35622239112854e-05, 5.717668682336807e-05, 6.0791149735450745e-05, 6.440561264753342e-05, 6.802007555961609e-05, 7.163453847169876e-05, 7.524900138378143e-05, 7.88634642958641e-05, 8.247792720794678e-05, 8.609239012002945e-05, 8.970685303211212e-05, 9.33213159441948e-05, 9.693577885627747e-05, 0.00010055024176836014, 0.00010416470468044281, 0.00010777916759252548, 0.00011139363050460815, 0.00011500809341669083, 0.0001186225563287735, 0.00012223701924085617, 0.00012585148215293884, 0.00012946594506502151, 0.0001330804079771042, 0.00013669487088918686, 0.00014030933380126953]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 3.0, 9.0, 10.0, 23.0, 22.0, 61.0, 117.0, 249.0, 1065.0, 9830.0, 817388.0, 213748.0, 5044.0, 583.0, 156.0, 73.0, 42.0, 29.0, 18.0, 14.0, 14.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35205078125, -0.3366546630859375, -0.321258544921875, -0.3058624267578125, -0.29046630859375, -0.2750701904296875, -0.259674072265625, -0.2442779541015625, -0.2288818359375, -0.2134857177734375, -0.198089599609375, -0.1826934814453125, -0.16729736328125, -0.1519012451171875, -0.136505126953125, -0.1211090087890625, -0.105712890625, -0.0903167724609375, -0.074920654296875, -0.0595245361328125, -0.04412841796875, -0.0287322998046875, -0.013336181640625, 0.0020599365234375, 0.0174560546875, 0.0328521728515625, 0.048248291015625, 0.0636444091796875, 0.07904052734375, 0.0944366455078125, 0.109832763671875, 0.1252288818359375, 0.140625, 0.1560211181640625, 0.171417236328125, 0.1868133544921875, 0.20220947265625, 0.2176055908203125, 0.233001708984375, 0.2483978271484375, 0.2637939453125, 0.2791900634765625, 0.294586181640625, 0.3099822998046875, 0.32537841796875, 0.3407745361328125, 0.356170654296875, 0.3715667724609375, 0.386962890625, 0.4023590087890625, 0.417755126953125, 0.4331512451171875, 0.44854736328125, 0.4639434814453125, 0.479339599609375, 0.4947357177734375, 0.5101318359375, 0.5255279541015625, 0.540924072265625, 0.5563201904296875, 0.57171630859375, 0.5871124267578125, 0.602508544921875, 0.6179046630859375, 0.63330078125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 9.0, 14.0, 29.0, 42.0, 76.0, 129.0, 151.0, 177.0, 132.0, 72.0, 69.0, 23.0, 14.0, 13.0, 6.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05145263671875, -0.049628257751464844, -0.04780387878417969, -0.04597949981689453, -0.044155120849609375, -0.04233074188232422, -0.04050636291503906, -0.038681983947753906, -0.03685760498046875, -0.035033226013183594, -0.03320884704589844, -0.03138446807861328, -0.029560089111328125, -0.02773571014404297, -0.025911331176757812, -0.024086952209472656, -0.0222625732421875, -0.020438194274902344, -0.018613815307617188, -0.01678943634033203, -0.014965057373046875, -0.013140678405761719, -0.011316299438476562, -0.009491920471191406, -0.00766754150390625, -0.005843162536621094, -0.0040187835693359375, -0.0021944046020507812, -0.000370025634765625, 0.0014543533325195312, 0.0032787322998046875, 0.005103111267089844, 0.006927490234375, 0.008751869201660156, 0.010576248168945312, 0.012400627136230469, 0.014225006103515625, 0.01604938507080078, 0.017873764038085938, 0.019698143005371094, 0.02152252197265625, 0.023346900939941406, 0.025171279907226562, 0.02699565887451172, 0.028820037841796875, 0.03064441680908203, 0.03246879577636719, 0.034293174743652344, 0.0361175537109375, 0.037941932678222656, 0.03976631164550781, 0.04159069061279297, 0.043415069580078125, 0.04523944854736328, 0.04706382751464844, 0.048888206481933594, 0.05071258544921875, 0.052536964416503906, 0.05436134338378906, 0.05618572235107422, 0.058010101318359375, 0.05983448028564453, 0.06165885925292969, 0.06348323822021484, 0.0653076171875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 5.0, 6.0, 14.0, 16.0, 35.0, 40.0, 41.0, 53.0, 81.0, 80.0, 100.0, 111.0, 63.0, 95.0, 78.0, 58.0, 41.0, 16.0, 22.0, 15.0, 8.0, 5.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.025408387184143, -1.0015565156936646, -0.977704644203186, -0.9538527727127075, -0.930000901222229, -0.9061490297317505, -0.882297158241272, -0.8584452867507935, -0.8345934152603149, -0.8107415437698364, -0.7868896722793579, -0.7630378007888794, -0.7391859292984009, -0.7153340578079224, -0.6914821863174438, -0.6676303148269653, -0.643778383731842, -0.6199265122413635, -0.596074640750885, -0.5722227692604065, -0.548370897769928, -0.5245190262794495, -0.5006670951843262, -0.47681525349617004, -0.45296338200569153, -0.429111510515213, -0.4052596390247345, -0.3814077377319336, -0.3575558662414551, -0.33370399475097656, -0.30985212326049805, -0.28600025177001953, -0.2621484398841858, -0.23829656839370728, -0.21444469690322876, -0.19059281051158905, -0.16674093902111053, -0.14288906753063202, -0.11903718113899231, -0.0951853096485138, -0.07133343815803528, -0.047481562942266464, -0.02362968772649765, 0.0002221912145614624, 0.024074062705039978, 0.047925934195518494, 0.0717778205871582, 0.09562969207763672, 0.11948156356811523, 0.14333343505859375, 0.16718530654907227, 0.19103719294071198, 0.2148890644311905, 0.238740935921669, 0.2625928223133087, 0.28644469380378723, 0.31029656529426575, 0.33414843678474426, 0.3580003082752228, 0.3818522095680237, 0.4057040810585022, 0.4295559525489807, 0.45340782403945923, 0.47725969552993774, 0.5011115670204163]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 5.0, 11.0, 20.0, 17.0, 31.0, 31.0, 40.0, 39.0, 37.0, 39.0, 30.0, 34.0, 45.0, 50.0, 40.0, 44.0, 59.0, 47.0, 31.0, 35.0, 43.0, 36.0, 22.0, 36.0, 16.0, 24.0, 13.0, 15.0, 9.0, 15.0, 9.0, 16.0, 10.0, 4.0, 7.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.45454877614974976, -0.4400072693824768, -0.42546579241752625, -0.4109243154525757, -0.39638280868530273, -0.3818413019180298, -0.3672998249530792, -0.35275834798812866, -0.3382168412208557, -0.32367533445358276, -0.3091338574886322, -0.29459238052368164, -0.2800508737564087, -0.26550936698913574, -0.2509678900241852, -0.23642639815807343, -0.22188490629196167, -0.20734341442584991, -0.19280192255973816, -0.1782604306936264, -0.16371893882751465, -0.1491774469614029, -0.13463595509529114, -0.12009446322917938, -0.10555297136306763, -0.09101147949695587, -0.07646998763084412, -0.06192849576473236, -0.047387003898620605, -0.03284551203250885, -0.018304020166397095, -0.0037625283002853394, 0.010778933763504028, 0.025320425629615784, 0.03986191749572754, 0.054403409361839294, 0.06894490122795105, 0.0834863930940628, 0.09802788496017456, 0.11256937682628632, 0.12711086869239807, 0.14165236055850983, 0.15619385242462158, 0.17073534429073334, 0.1852768361568451, 0.19981832802295685, 0.2143598198890686, 0.22890131175518036, 0.24344280362129211, 0.2579842805862427, 0.2725257873535156, 0.2870672941207886, 0.30160877108573914, 0.3161502480506897, 0.33069175481796265, 0.3452332615852356, 0.35977473855018616, 0.3743162155151367, 0.38885772228240967, 0.4033992290496826, 0.4179407060146332, 0.43248218297958374, 0.4470236897468567, 0.46156519651412964, 0.4761066734790802]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 15.0, 14.0, 35.0, 56.0, 96.0, 167.0, 313.0, 554.0, 1221.0, 2992.0, 7898.0, 24763.0, 87801.0, 481227.0, 345999.0, 65264.0, 19017.0, 6603.0, 2398.0, 1070.0, 470.0, 222.0, 142.0, 79.0, 49.0, 21.0, 20.0, 14.0, 7.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60302734375, -0.5846939086914062, -0.5663604736328125, -0.5480270385742188, -0.529693603515625, -0.5113601684570312, -0.4930267333984375, -0.47469329833984375, -0.45635986328125, -0.43802642822265625, -0.4196929931640625, -0.40135955810546875, -0.383026123046875, -0.36469268798828125, -0.3463592529296875, -0.32802581787109375, -0.3096923828125, -0.29135894775390625, -0.2730255126953125, -0.25469207763671875, -0.236358642578125, -0.21802520751953125, -0.1996917724609375, -0.18135833740234375, -0.16302490234375, -0.14469146728515625, -0.1263580322265625, -0.10802459716796875, -0.089691162109375, -0.07135772705078125, -0.0530242919921875, -0.03469085693359375, -0.016357421875, 0.00197601318359375, 0.0203094482421875, 0.03864288330078125, 0.056976318359375, 0.07530975341796875, 0.0936431884765625, 0.11197662353515625, 0.13031005859375, 0.14864349365234375, 0.1669769287109375, 0.18531036376953125, 0.203643798828125, 0.22197723388671875, 0.2403106689453125, 0.25864410400390625, 0.2769775390625, 0.29531097412109375, 0.3136444091796875, 0.33197784423828125, 0.350311279296875, 0.36864471435546875, 0.3869781494140625, 0.40531158447265625, 0.42364501953125, 0.44197845458984375, 0.4603118896484375, 0.47864532470703125, 0.496978759765625, 0.5153121948242188, 0.5336456298828125, 0.5519790649414062, 0.5703125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 10.0, 8.0, 11.0, 16.0, 14.0, 16.0, 20.0, 18.0, 27.0, 31.0, 32.0, 32.0, 44.0, 49.0, 36.0, 42.0, 51.0, 44.0, 42.0, 44.0, 48.0, 29.0, 36.0, 30.0, 22.0, 27.0, 36.0, 25.0, 19.0, 17.0, 28.0, 17.0, 7.0, 13.0, 8.0, 9.0, 4.0, 8.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.396484375, -1.3516082763671875, -1.306732177734375, -1.2618560791015625, -1.21697998046875, -1.1721038818359375, -1.127227783203125, -1.0823516845703125, -1.0374755859375, -0.9925994873046875, -0.947723388671875, -0.9028472900390625, -0.85797119140625, -0.8130950927734375, -0.768218994140625, -0.7233428955078125, -0.678466796875, -0.6335906982421875, -0.588714599609375, -0.5438385009765625, -0.49896240234375, -0.4540863037109375, -0.409210205078125, -0.3643341064453125, -0.3194580078125, -0.2745819091796875, -0.229705810546875, -0.1848297119140625, -0.13995361328125, -0.0950775146484375, -0.050201416015625, -0.0053253173828125, 0.03955078125, 0.0844268798828125, 0.129302978515625, 0.1741790771484375, 0.21905517578125, 0.2639312744140625, 0.308807373046875, 0.3536834716796875, 0.3985595703125, 0.4434356689453125, 0.488311767578125, 0.5331878662109375, 0.57806396484375, 0.6229400634765625, 0.667816162109375, 0.7126922607421875, 0.757568359375, 0.8024444580078125, 0.847320556640625, 0.8921966552734375, 0.93707275390625, 0.9819488525390625, 1.026824951171875, 1.0717010498046875, 1.1165771484375, 1.1614532470703125, 1.206329345703125, 1.2512054443359375, 1.29608154296875, 1.3409576416015625, 1.385833740234375, 1.4307098388671875, 1.4755859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 12.0, 15.0, 20.0, 22.0, 38.0, 35.0, 55.0, 82.0, 109.0, 222.0, 1913.0, 1043327.0, 2063.0, 221.0, 90.0, 88.0, 55.0, 42.0, 32.0, 28.0, 14.0, 19.0, 10.0, 9.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.37890625, -6.1697998046875, -5.960693359375, -5.7515869140625, -5.54248046875, -5.3333740234375, -5.124267578125, -4.9151611328125, -4.7060546875, -4.4969482421875, -4.287841796875, -4.0787353515625, -3.86962890625, -3.6605224609375, -3.451416015625, -3.2423095703125, -3.033203125, -2.8240966796875, -2.614990234375, -2.4058837890625, -2.19677734375, -1.9876708984375, -1.778564453125, -1.5694580078125, -1.3603515625, -1.1512451171875, -0.942138671875, -0.7330322265625, -0.52392578125, -0.3148193359375, -0.105712890625, 0.1033935546875, 0.3125, 0.5216064453125, 0.730712890625, 0.9398193359375, 1.14892578125, 1.3580322265625, 1.567138671875, 1.7762451171875, 1.9853515625, 2.1944580078125, 2.403564453125, 2.6126708984375, 2.82177734375, 3.0308837890625, 3.239990234375, 3.4490966796875, 3.658203125, 3.8673095703125, 4.076416015625, 4.2855224609375, 4.49462890625, 4.7037353515625, 4.912841796875, 5.1219482421875, 5.3310546875, 5.5401611328125, 5.749267578125, 5.9583740234375, 6.16748046875, 6.3765869140625, 6.585693359375, 6.7947998046875, 7.00390625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 5.0, 8.0, 18.0, 15.0, 15.0, 37.0, 33.0, 41.0, 61.0, 68.0, 82.0, 70.0, 80.0, 81.0, 65.0, 51.0, 52.0, 42.0, 44.0, 37.0, 22.0, 12.0, 18.0, 9.0, 4.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.55859375, -2.47479248046875, -2.3909912109375, -2.30718994140625, -2.223388671875, -2.13958740234375, -2.0557861328125, -1.97198486328125, -1.88818359375, -1.80438232421875, -1.7205810546875, -1.63677978515625, -1.552978515625, -1.46917724609375, -1.3853759765625, -1.30157470703125, -1.2177734375, -1.13397216796875, -1.0501708984375, -0.96636962890625, -0.882568359375, -0.79876708984375, -0.7149658203125, -0.63116455078125, -0.54736328125, -0.46356201171875, -0.3797607421875, -0.29595947265625, -0.212158203125, -0.12835693359375, -0.0445556640625, 0.03924560546875, 0.123046875, 0.20684814453125, 0.2906494140625, 0.37445068359375, 0.458251953125, 0.54205322265625, 0.6258544921875, 0.70965576171875, 0.79345703125, 0.87725830078125, 0.9610595703125, 1.04486083984375, 1.128662109375, 1.21246337890625, 1.2962646484375, 1.38006591796875, 1.4638671875, 1.54766845703125, 1.6314697265625, 1.71527099609375, 1.799072265625, 1.88287353515625, 1.9666748046875, 2.05047607421875, 2.13427734375, 2.21807861328125, 2.3018798828125, 2.38568115234375, 2.469482421875, 2.55328369140625, 2.6370849609375, 2.72088623046875, 2.8046875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 10.0, 11.0, 13.0, 11.0, 18.0, 29.0, 42.0, 63.0, 114.0, 238.0, 797.0, 5797.0, 157307.0, 857988.0, 23437.0, 1853.0, 389.0, 160.0, 82.0, 62.0, 26.0, 16.0, 16.0, 17.0, 11.0, 6.0, 7.0, 5.0, 6.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.3671417236328125, -0.353668212890625, -0.3401947021484375, -0.32672119140625, -0.3132476806640625, -0.299774169921875, -0.2863006591796875, -0.2728271484375, -0.2593536376953125, -0.245880126953125, -0.2324066162109375, -0.21893310546875, -0.2054595947265625, -0.191986083984375, -0.1785125732421875, -0.1650390625, -0.1515655517578125, -0.138092041015625, -0.1246185302734375, -0.11114501953125, -0.0976715087890625, -0.084197998046875, -0.0707244873046875, -0.0572509765625, -0.0437774658203125, -0.030303955078125, -0.0168304443359375, -0.00335693359375, 0.0101165771484375, 0.023590087890625, 0.0370635986328125, 0.050537109375, 0.0640106201171875, 0.077484130859375, 0.0909576416015625, 0.10443115234375, 0.1179046630859375, 0.131378173828125, 0.1448516845703125, 0.1583251953125, 0.1717987060546875, 0.185272216796875, 0.1987457275390625, 0.21221923828125, 0.2256927490234375, 0.239166259765625, 0.2526397705078125, 0.26611328125, 0.2795867919921875, 0.293060302734375, 0.3065338134765625, 0.32000732421875, 0.3334808349609375, 0.346954345703125, 0.3604278564453125, 0.3739013671875, 0.3873748779296875, 0.400848388671875, 0.4143218994140625, 0.42779541015625, 0.4412689208984375, 0.454742431640625, 0.4682159423828125, 0.481689453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 7.0, 4.0, 6.0, 10.0, 12.0, 11.0, 13.0, 20.0, 28.0, 33.0, 41.0, 54.0, 80.0, 117.0, 101.0, 118.0, 94.0, 57.0, 46.0, 36.0, 29.0, 21.0, 15.0, 16.0, 10.0, 3.0, 5.0, 1.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.300739288330078e-05, -2.220459282398224e-05, -2.1401792764663696e-05, -2.0598992705345154e-05, -1.979619264602661e-05, -1.899339258670807e-05, -1.8190592527389526e-05, -1.7387792468070984e-05, -1.658499240875244e-05, -1.57821923494339e-05, -1.4979392290115356e-05, -1.4176592230796814e-05, -1.3373792171478271e-05, -1.2570992112159729e-05, -1.1768192052841187e-05, -1.0965391993522644e-05, -1.0162591934204102e-05, -9.359791874885559e-06, -8.556991815567017e-06, -7.754191756248474e-06, -6.951391696929932e-06, -6.148591637611389e-06, -5.345791578292847e-06, -4.542991518974304e-06, -3.7401914596557617e-06, -2.9373914003372192e-06, -2.1345913410186768e-06, -1.3317912817001343e-06, -5.289912223815918e-07, 2.738088369369507e-07, 1.0766088962554932e-06, 1.8794089555740356e-06, 2.682209014892578e-06, 3.4850090742111206e-06, 4.287809133529663e-06, 5.0906091928482056e-06, 5.893409252166748e-06, 6.6962093114852905e-06, 7.499009370803833e-06, 8.301809430122375e-06, 9.104609489440918e-06, 9.90740954875946e-06, 1.0710209608078003e-05, 1.1513009667396545e-05, 1.2315809726715088e-05, 1.311860978603363e-05, 1.3921409845352173e-05, 1.4724209904670715e-05, 1.5527009963989258e-05, 1.63298100233078e-05, 1.7132610082626343e-05, 1.7935410141944885e-05, 1.8738210201263428e-05, 1.954101026058197e-05, 2.0343810319900513e-05, 2.1146610379219055e-05, 2.1949410438537598e-05, 2.275221049785614e-05, 2.3555010557174683e-05, 2.4357810616493225e-05, 2.5160610675811768e-05, 2.596341073513031e-05, 2.6766210794448853e-05, 2.7569010853767395e-05, 2.8371810913085938e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 8.0, 7.0, 3.0, 7.0, 12.0, 15.0, 28.0, 26.0, 46.0, 77.0, 155.0, 347.0, 1138.0, 7145.0, 125331.0, 863951.0, 45007.0, 3894.0, 769.0, 261.0, 128.0, 75.0, 43.0, 25.0, 19.0, 12.0, 5.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.41667938232421875, -0.4048919677734375, -0.39310455322265625, -0.381317138671875, -0.36952972412109375, -0.3577423095703125, -0.34595489501953125, -0.33416748046875, -0.32238006591796875, -0.3105926513671875, -0.29880523681640625, -0.287017822265625, -0.27523040771484375, -0.2634429931640625, -0.25165557861328125, -0.2398681640625, -0.22808074951171875, -0.2162933349609375, -0.20450592041015625, -0.192718505859375, -0.18093109130859375, -0.1691436767578125, -0.15735626220703125, -0.14556884765625, -0.13378143310546875, -0.1219940185546875, -0.11020660400390625, -0.098419189453125, -0.08663177490234375, -0.0748443603515625, -0.06305694580078125, -0.05126953125, -0.03948211669921875, -0.0276947021484375, -0.01590728759765625, -0.004119873046875, 0.00766754150390625, 0.0194549560546875, 0.03124237060546875, 0.04302978515625, 0.05481719970703125, 0.0666046142578125, 0.07839202880859375, 0.090179443359375, 0.10196685791015625, 0.1137542724609375, 0.12554168701171875, 0.1373291015625, 0.14911651611328125, 0.1609039306640625, 0.17269134521484375, 0.184478759765625, 0.19626617431640625, 0.2080535888671875, 0.21984100341796875, 0.23162841796875, 0.24341583251953125, 0.2552032470703125, 0.26699066162109375, 0.278778076171875, 0.29056549072265625, 0.3023529052734375, 0.31414031982421875, 0.325927734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 2.0, 6.0, 6.0, 14.0, 14.0, 30.0, 42.0, 50.0, 100.0, 134.0, 154.0, 156.0, 94.0, 69.0, 41.0, 31.0, 14.0, 10.0, 9.0, 5.0, 5.0, 8.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.082275390625, -0.07939910888671875, -0.0765228271484375, -0.07364654541015625, -0.070770263671875, -0.06789398193359375, -0.0650177001953125, -0.06214141845703125, -0.05926513671875, -0.05638885498046875, -0.0535125732421875, -0.05063629150390625, -0.047760009765625, -0.04488372802734375, -0.0420074462890625, -0.03913116455078125, -0.0362548828125, -0.03337860107421875, -0.0305023193359375, -0.02762603759765625, -0.024749755859375, -0.02187347412109375, -0.0189971923828125, -0.01612091064453125, -0.01324462890625, -0.01036834716796875, -0.0074920654296875, -0.00461578369140625, -0.001739501953125, 0.00113677978515625, 0.0040130615234375, 0.00688934326171875, 0.009765625, 0.01264190673828125, 0.0155181884765625, 0.01839447021484375, 0.021270751953125, 0.02414703369140625, 0.0270233154296875, 0.02989959716796875, 0.03277587890625, 0.03565216064453125, 0.0385284423828125, 0.04140472412109375, 0.044281005859375, 0.04715728759765625, 0.0500335693359375, 0.05290985107421875, 0.0557861328125, 0.05866241455078125, 0.0615386962890625, 0.06441497802734375, 0.067291259765625, 0.07016754150390625, 0.0730438232421875, 0.07592010498046875, 0.07879638671875, 0.08167266845703125, 0.0845489501953125, 0.08742523193359375, 0.090301513671875, 0.09317779541015625, 0.0960540771484375, 0.09893035888671875, 0.101806640625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 69.0, 222.0, 442.0, 224.0, 46.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.404793620109558, -1.185573697090149, -0.9663538932800293, -0.7471339702606201, -0.5279141068458557, -0.3086942434310913, -0.08947432041168213, 0.1297454833984375, 0.3489654064178467, 0.5681852698326111, 0.7874051332473755, 1.0066250562667847, 1.2258448600769043, 1.4450647830963135, 1.6642847061157227, 1.8835045099258423, 2.102724552154541, 2.32194447517395, 2.5411643981933594, 2.7603840827941895, 2.9796040058135986, 3.198823928833008, 3.418043851852417, 3.637263774871826, 3.8564834594726562, 4.075703144073486, 4.294923305511475, 4.514142990112305, 4.733363151550293, 4.952582836151123, 5.171802520751953, 5.391022682189941, 5.6102423667907715, 5.829462051391602, 6.04868221282959, 6.26790189743042, 6.487122058868408, 6.706341743469238, 6.925561904907227, 7.144781589508057, 7.364001274108887, 7.583220958709717, 7.802441120147705, 8.021660804748535, 8.240880966186523, 8.460100173950195, 8.679320335388184, 8.898540496826172, 9.11776065826416, 9.336980819702148, 9.55620002746582, 9.775420188903809, 9.994640350341797, 10.213859558105469, 10.433079719543457, 10.652299880981445, 10.871519088745117, 11.090739250183105, 11.309958457946777, 11.529178619384766, 11.748398780822754, 11.967618942260742, 12.186838150024414, 12.406058311462402, 12.62527847290039]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 7.0, 4.0, 9.0, 6.0, 9.0, 10.0, 19.0, 18.0, 24.0, 17.0, 21.0, 26.0, 30.0, 29.0, 26.0, 43.0, 37.0, 37.0, 44.0, 47.0, 57.0, 35.0, 39.0, 26.0, 34.0, 32.0, 36.0, 28.0, 31.0, 25.0, 29.0, 28.0, 25.0, 13.0, 15.0, 15.0, 9.0, 17.0, 8.0, 7.0, 7.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.481558084487915, -2.410348892211914, -2.339139461517334, -2.267930269241333, -2.196721076965332, -2.125511646270752, -2.054302453994751, -1.98309326171875, -1.9118839502334595, -1.840674638748169, -1.769465446472168, -1.6982561349868774, -1.627046823501587, -1.555837631225586, -1.4846283197402954, -1.4134190082550049, -1.342209815979004, -1.2710005044937134, -1.1997913122177124, -1.1285820007324219, -1.057372808456421, -0.9861634969711304, -0.9149541854858398, -0.8437449336051941, -0.7725356817245483, -0.7013264298439026, -0.6301171779632568, -0.5589078664779663, -0.48769861459732056, -0.4164893627166748, -0.34528008103370667, -0.2740707993507385, -0.20286154747009277, -0.13165228068828583, -0.06044301390647888, 0.010766252875328064, 0.08197551965713501, 0.15318477153778076, 0.2243940532207489, 0.29560333490371704, 0.3668125867843628, 0.43802183866500854, 0.5092310905456543, 0.5804404020309448, 0.6516496539115906, 0.7228589057922363, 0.7940682172775269, 0.8652774691581726, 0.9364867210388184, 1.0076960325241089, 1.0789052248001099, 1.1501145362854004, 1.2213237285614014, 1.292533040046692, 1.3637423515319824, 1.4349515438079834, 1.506160855293274, 1.5773701667785645, 1.6485793590545654, 1.719788670539856, 1.7909979820251465, 1.8622071743011475, 1.933416485786438, 2.0046257972717285, 2.0758349895477295]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 5.0, 5.0, 1.0, 10.0, 10.0, 19.0, 18.0, 17.0, 18.0, 28.0, 33.0, 43.0, 48.0, 91.0, 207.0, 725.0, 3338.0, 36439.0, 868158.0, 2988759.0, 279235.0, 14102.0, 2051.0, 480.0, 143.0, 65.0, 48.0, 31.0, 14.0, 27.0, 20.0, 20.0, 11.0, 10.0, 11.0, 8.0, 10.0, 4.0, 7.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2.0390625, -1.9858551025390625, -1.932647705078125, -1.8794403076171875, -1.82623291015625, -1.7730255126953125, -1.719818115234375, -1.6666107177734375, -1.6134033203125, -1.5601959228515625, -1.506988525390625, -1.4537811279296875, -1.40057373046875, -1.3473663330078125, -1.294158935546875, -1.2409515380859375, -1.187744140625, -1.1345367431640625, -1.081329345703125, -1.0281219482421875, -0.97491455078125, -0.9217071533203125, -0.868499755859375, -0.8152923583984375, -0.7620849609375, -0.7088775634765625, -0.655670166015625, -0.6024627685546875, -0.54925537109375, -0.4960479736328125, -0.442840576171875, -0.3896331787109375, -0.33642578125, -0.2832183837890625, -0.230010986328125, -0.1768035888671875, -0.12359619140625, -0.0703887939453125, -0.017181396484375, 0.0360260009765625, 0.0892333984375, 0.1424407958984375, 0.195648193359375, 0.2488555908203125, 0.30206298828125, 0.3552703857421875, 0.408477783203125, 0.4616851806640625, 0.514892578125, 0.5680999755859375, 0.621307373046875, 0.6745147705078125, 0.72772216796875, 0.7809295654296875, 0.834136962890625, 0.8873443603515625, 0.9405517578125, 0.9937591552734375, 1.046966552734375, 1.1001739501953125, 1.15338134765625, 1.2065887451171875, 1.259796142578125, 1.3130035400390625, 1.3662109375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 9.0, 12.0, 17.0, 9.0, 14.0, 17.0, 21.0, 31.0, 36.0, 45.0, 39.0, 48.0, 46.0, 46.0, 43.0, 50.0, 52.0, 49.0, 42.0, 42.0, 48.0, 42.0, 26.0, 34.0, 25.0, 24.0, 19.0, 17.0, 18.0, 8.0, 11.0, 13.0, 6.0, 11.0, 9.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0], "bins": [-0.740234375, -0.7199249267578125, -0.699615478515625, -0.6793060302734375, -0.65899658203125, -0.6386871337890625, -0.618377685546875, -0.5980682373046875, -0.5777587890625, -0.5574493408203125, -0.537139892578125, -0.5168304443359375, -0.49652099609375, -0.4762115478515625, -0.455902099609375, -0.4355926513671875, -0.415283203125, -0.3949737548828125, -0.374664306640625, -0.3543548583984375, -0.33404541015625, -0.3137359619140625, -0.293426513671875, -0.2731170654296875, -0.2528076171875, -0.2324981689453125, -0.212188720703125, -0.1918792724609375, -0.17156982421875, -0.1512603759765625, -0.130950927734375, -0.1106414794921875, -0.09033203125, -0.0700225830078125, -0.049713134765625, -0.0294036865234375, -0.00909423828125, 0.0112152099609375, 0.031524658203125, 0.0518341064453125, 0.0721435546875, 0.0924530029296875, 0.112762451171875, 0.1330718994140625, 0.15338134765625, 0.1736907958984375, 0.194000244140625, 0.2143096923828125, 0.234619140625, 0.2549285888671875, 0.275238037109375, 0.2955474853515625, 0.31585693359375, 0.3361663818359375, 0.356475830078125, 0.3767852783203125, 0.3970947265625, 0.4174041748046875, 0.437713623046875, 0.4580230712890625, 0.47833251953125, 0.4986419677734375, 0.518951416015625, 0.5392608642578125, 0.5595703125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 7.0, 4.0, 12.0, 11.0, 13.0, 21.0, 41.0, 54.0, 58.0, 94.0, 157.0, 221.0, 413.0, 1681.0, 2390954.0, 1797857.0, 1569.0, 402.0, 257.0, 153.0, 97.0, 58.0, 55.0, 34.0, 12.0, 8.0, 11.0, 6.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.37725830078125, -5.2037353515625, -5.03021240234375, -4.856689453125, -4.68316650390625, -4.5096435546875, -4.33612060546875, -4.16259765625, -3.98907470703125, -3.8155517578125, -3.64202880859375, -3.468505859375, -3.29498291015625, -3.1214599609375, -2.94793701171875, -2.7744140625, -2.60089111328125, -2.4273681640625, -2.25384521484375, -2.080322265625, -1.90679931640625, -1.7332763671875, -1.55975341796875, -1.38623046875, -1.21270751953125, -1.0391845703125, -0.86566162109375, -0.692138671875, -0.51861572265625, -0.3450927734375, -0.17156982421875, 0.001953125, 0.17547607421875, 0.3489990234375, 0.52252197265625, 0.696044921875, 0.86956787109375, 1.0430908203125, 1.21661376953125, 1.39013671875, 1.56365966796875, 1.7371826171875, 1.91070556640625, 2.084228515625, 2.25775146484375, 2.4312744140625, 2.60479736328125, 2.7783203125, 2.95184326171875, 3.1253662109375, 3.29888916015625, 3.472412109375, 3.64593505859375, 3.8194580078125, 3.99298095703125, 4.16650390625, 4.34002685546875, 4.5135498046875, 4.68707275390625, 4.860595703125, 5.03411865234375, 5.2076416015625, 5.38116455078125, 5.5546875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 11.0, 5.0, 11.0, 21.0, 19.0, 28.0, 34.0, 47.0, 74.0, 119.0, 162.0, 249.0, 339.0, 544.0, 603.0, 542.0, 395.0, 284.0, 179.0, 123.0, 84.0, 68.0, 52.0, 31.0, 19.0, 12.0, 4.0, 8.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.323486328125, -0.3128814697265625, -0.302276611328125, -0.2916717529296875, -0.28106689453125, -0.2704620361328125, -0.259857177734375, -0.2492523193359375, -0.2386474609375, -0.2280426025390625, -0.217437744140625, -0.2068328857421875, -0.19622802734375, -0.1856231689453125, -0.175018310546875, -0.1644134521484375, -0.15380859375, -0.1432037353515625, -0.132598876953125, -0.1219940185546875, -0.11138916015625, -0.1007843017578125, -0.090179443359375, -0.0795745849609375, -0.0689697265625, -0.0583648681640625, -0.047760009765625, -0.0371551513671875, -0.02655029296875, -0.0159454345703125, -0.005340576171875, 0.0052642822265625, 0.015869140625, 0.0264739990234375, 0.037078857421875, 0.0476837158203125, 0.05828857421875, 0.0688934326171875, 0.079498291015625, 0.0901031494140625, 0.1007080078125, 0.1113128662109375, 0.121917724609375, 0.1325225830078125, 0.14312744140625, 0.1537322998046875, 0.164337158203125, 0.1749420166015625, 0.185546875, 0.1961517333984375, 0.206756591796875, 0.2173614501953125, 0.22796630859375, 0.2385711669921875, 0.249176025390625, 0.2597808837890625, 0.2703857421875, 0.2809906005859375, 0.291595458984375, 0.3022003173828125, 0.31280517578125, 0.3234100341796875, 0.334014892578125, 0.3446197509765625, 0.355224609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 11.0, 5.0, 13.0, 10.0, 30.0, 27.0, 56.0, 69.0, 62.0, 90.0, 99.0, 109.0, 96.0, 95.0, 76.0, 49.0, 37.0, 22.0, 15.0, 7.0, 7.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7718772888183594, -1.7314456701278687, -1.691014051437378, -1.6505823135375977, -1.610150694847107, -1.5697190761566162, -1.5292874574661255, -1.4888558387756348, -1.4484241008758545, -1.4079924821853638, -1.367560863494873, -1.3271291255950928, -1.286697506904602, -1.2462658882141113, -1.2058342695236206, -1.1654026508331299, -1.1249709129333496, -1.0845392942428589, -1.0441076755523682, -1.003675937652588, -0.9632443189620972, -0.9228127002716064, -0.8823810815811157, -0.8419494032859802, -0.8015178442001343, -0.7610862255096436, -0.7206545472145081, -0.6802229285240173, -0.6397912502288818, -0.5993596315383911, -0.5589280128479004, -0.5184963345527649, -0.4780645966529846, -0.4376329481601715, -0.3972012996673584, -0.3567696809768677, -0.3163380026817322, -0.27590638399124146, -0.23547473549842834, -0.19504308700561523, -0.15461143851280212, -0.11417979001998901, -0.0737481489777565, -0.03331650793552399, 0.0071151405572891235, 0.047546789050102234, 0.08797842264175415, 0.12841007113456726, 0.16884171962738037, 0.20927336812019348, 0.2497050166130066, 0.2901366353034973, 0.3305683135986328, 0.37099993228912354, 0.41143158078193665, 0.45186322927474976, 0.49229487776756287, 0.532726526260376, 0.5731581449508667, 0.6135898232460022, 0.6540214419364929, 0.6944531202316284, 0.7348847389221191, 0.7753163576126099, 0.8157480359077454]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 22.0, 16.0, 16.0, 17.0, 21.0, 21.0, 22.0, 32.0, 33.0, 38.0, 30.0, 41.0, 33.0, 30.0, 41.0, 37.0, 38.0, 44.0, 34.0, 37.0, 34.0, 38.0, 27.0, 33.0, 22.0, 24.0, 24.0, 30.0, 16.0, 11.0, 21.0, 10.0, 13.0, 5.0, 11.0, 5.0, 9.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.529818594455719, -0.511722207069397, -0.49362581968307495, -0.47552940249443054, -0.4574330151081085, -0.4393366277217865, -0.4212402105331421, -0.40314382314682007, -0.38504743576049805, -0.366951048374176, -0.348854660987854, -0.3307582437992096, -0.3126618564128876, -0.29456546902656555, -0.27646905183792114, -0.2583726644515991, -0.2402762770652771, -0.22217988967895508, -0.20408348739147186, -0.18598708510398865, -0.16789069771766663, -0.1497943103313446, -0.1316979080438614, -0.11360150575637817, -0.09550511837005615, -0.07740872353315353, -0.059312328696250916, -0.0412159338593483, -0.02311953902244568, -0.00502314418554306, 0.013073250651359558, 0.031169652938842773, 0.04926598072052002, 0.06736237555742264, 0.08545877039432526, 0.10355516523122787, 0.1216515600681305, 0.13974794745445251, 0.15784434974193573, 0.17594075202941895, 0.19403713941574097, 0.212133526802063, 0.2302299290895462, 0.24832633137702942, 0.26642271876335144, 0.28451910614967346, 0.30261552333831787, 0.3207119107246399, 0.3388082981109619, 0.35690468549728394, 0.37500107288360596, 0.39309749007225037, 0.4111938774585724, 0.4292902648448944, 0.4473866820335388, 0.46548306941986084, 0.48357945680618286, 0.5016758441925049, 0.5197722315788269, 0.5378686189651489, 0.5559650659561157, 0.5740614533424377, 0.5921578407287598, 0.6102542281150818, 0.6283506155014038]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 13.0, 7.0, 21.0, 17.0, 24.0, 64.0, 69.0, 115.0, 176.0, 292.0, 554.0, 1079.0, 2232.0, 4918.0, 12375.0, 34794.0, 111923.0, 323503.0, 355895.0, 134446.0, 40860.0, 14307.0, 5687.0, 2476.0, 1189.0, 628.0, 352.0, 201.0, 100.0, 68.0, 52.0, 29.0, 16.0, 19.0, 7.0, 11.0, 9.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.290771484375, -0.2822380065917969, -0.27370452880859375, -0.2651710510253906, -0.2566375732421875, -0.24810409545898438, -0.23957061767578125, -0.23103713989257812, -0.222503662109375, -0.21397018432617188, -0.20543670654296875, -0.19690322875976562, -0.1883697509765625, -0.17983627319335938, -0.17130279541015625, -0.16276931762695312, -0.15423583984375, -0.14570236206054688, -0.13716888427734375, -0.12863540649414062, -0.1201019287109375, -0.11156845092773438, -0.10303497314453125, -0.09450149536132812, -0.085968017578125, -0.07743453979492188, -0.06890106201171875, -0.060367584228515625, -0.0518341064453125, -0.043300628662109375, -0.03476715087890625, -0.026233673095703125, -0.0177001953125, -0.009166717529296875, -0.00063323974609375, 0.007900238037109375, 0.0164337158203125, 0.024967193603515625, 0.03350067138671875, 0.042034149169921875, 0.050567626953125, 0.059101104736328125, 0.06763458251953125, 0.07616806030273438, 0.0847015380859375, 0.09323501586914062, 0.10176849365234375, 0.11030197143554688, 0.11883544921875, 0.12736892700195312, 0.13590240478515625, 0.14443588256835938, 0.1529693603515625, 0.16150283813476562, 0.17003631591796875, 0.17856979370117188, 0.187103271484375, 0.19563674926757812, 0.20417022705078125, 0.21270370483398438, 0.2212371826171875, 0.22977066040039062, 0.23830413818359375, 0.24683761596679688, 0.25537109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 2.0, 12.0, 11.0, 16.0, 22.0, 32.0, 22.0, 35.0, 44.0, 49.0, 60.0, 52.0, 59.0, 53.0, 55.0, 67.0, 44.0, 42.0, 48.0, 52.0, 34.0, 34.0, 25.0, 24.0, 22.0, 23.0, 16.0, 9.0, 8.0, 3.0, 8.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5341796875, -0.518310546875, -0.50244140625, -0.486572265625, -0.470703125, -0.454833984375, -0.43896484375, -0.423095703125, -0.4072265625, -0.391357421875, -0.37548828125, -0.359619140625, -0.34375, -0.327880859375, -0.31201171875, -0.296142578125, -0.2802734375, -0.264404296875, -0.24853515625, -0.232666015625, -0.216796875, -0.200927734375, -0.18505859375, -0.169189453125, -0.1533203125, -0.137451171875, -0.12158203125, -0.105712890625, -0.08984375, -0.073974609375, -0.05810546875, -0.042236328125, -0.0263671875, -0.010498046875, 0.00537109375, 0.021240234375, 0.037109375, 0.052978515625, 0.06884765625, 0.084716796875, 0.1005859375, 0.116455078125, 0.13232421875, 0.148193359375, 0.1640625, 0.179931640625, 0.19580078125, 0.211669921875, 0.2275390625, 0.243408203125, 0.25927734375, 0.275146484375, 0.291015625, 0.306884765625, 0.32275390625, 0.338623046875, 0.3544921875, 0.370361328125, 0.38623046875, 0.402099609375, 0.41796875, 0.433837890625, 0.44970703125, 0.465576171875, 0.4814453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 11.0, 16.0, 16.0, 29.0, 32.0, 60.0, 65.0, 101.0, 141.0, 232.0, 358.0, 666.0, 1180.0, 2272.0, 4653.0, 9945.0, 23500.0, 60956.0, 159110.0, 299690.0, 273060.0, 128722.0, 48323.0, 18990.0, 8138.0, 3870.0, 1836.0, 1037.0, 559.0, 353.0, 206.0, 108.0, 79.0, 53.0, 48.0, 32.0, 30.0, 24.0, 8.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.226806640625, -0.22048568725585938, -0.21416473388671875, -0.20784378051757812, -0.2015228271484375, -0.19520187377929688, -0.18888092041015625, -0.18255996704101562, -0.176239013671875, -0.16991806030273438, -0.16359710693359375, -0.15727615356445312, -0.1509552001953125, -0.14463424682617188, -0.13831329345703125, -0.13199234008789062, -0.12567138671875, -0.11935043334960938, -0.11302947998046875, -0.10670852661132812, -0.1003875732421875, -0.09406661987304688, -0.08774566650390625, -0.08142471313476562, -0.075103759765625, -0.06878280639648438, -0.06246185302734375, -0.056140899658203125, -0.0498199462890625, -0.043498992919921875, -0.03717803955078125, -0.030857086181640625, -0.0245361328125, -0.018215179443359375, -0.01189422607421875, -0.005573272705078125, 0.0007476806640625, 0.007068634033203125, 0.01338958740234375, 0.019710540771484375, 0.026031494140625, 0.032352447509765625, 0.03867340087890625, 0.044994354248046875, 0.0513153076171875, 0.057636260986328125, 0.06395721435546875, 0.07027816772460938, 0.07659912109375, 0.08292007446289062, 0.08924102783203125, 0.09556198120117188, 0.1018829345703125, 0.10820388793945312, 0.11452484130859375, 0.12084579467773438, 0.127166748046875, 0.13348770141601562, 0.13980865478515625, 0.14612960815429688, 0.1524505615234375, 0.15877151489257812, 0.16509246826171875, 0.17141342163085938, 0.177734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 6.0, 8.0, 21.0, 13.0, 27.0, 24.0, 23.0, 28.0, 27.0, 28.0, 29.0, 50.0, 43.0, 38.0, 45.0, 55.0, 35.0, 43.0, 39.0, 50.0, 32.0, 41.0, 39.0, 39.0, 30.0, 24.0, 26.0, 23.0, 26.0, 18.0, 8.0, 8.0, 6.0, 5.0, 8.0, 6.0, 6.0, 5.0, 0.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75634765625, -0.73394775390625, -0.7115478515625, -0.68914794921875, -0.666748046875, -0.64434814453125, -0.6219482421875, -0.59954833984375, -0.5771484375, -0.55474853515625, -0.5323486328125, -0.50994873046875, -0.487548828125, -0.46514892578125, -0.4427490234375, -0.42034912109375, -0.39794921875, -0.37554931640625, -0.3531494140625, -0.33074951171875, -0.308349609375, -0.28594970703125, -0.2635498046875, -0.24114990234375, -0.21875, -0.19635009765625, -0.1739501953125, -0.15155029296875, -0.129150390625, -0.10675048828125, -0.0843505859375, -0.06195068359375, -0.03955078125, -0.01715087890625, 0.0052490234375, 0.02764892578125, 0.050048828125, 0.07244873046875, 0.0948486328125, 0.11724853515625, 0.1396484375, 0.16204833984375, 0.1844482421875, 0.20684814453125, 0.229248046875, 0.25164794921875, 0.2740478515625, 0.29644775390625, 0.31884765625, 0.34124755859375, 0.3636474609375, 0.38604736328125, 0.408447265625, 0.43084716796875, 0.4532470703125, 0.47564697265625, 0.498046875, 0.52044677734375, 0.5428466796875, 0.56524658203125, 0.587646484375, 0.61004638671875, 0.6324462890625, 0.65484619140625, 0.67724609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 16.0, 19.0, 27.0, 40.0, 35.0, 75.0, 119.0, 159.0, 280.0, 435.0, 753.0, 1406.0, 2595.0, 5296.0, 11821.0, 29889.0, 86641.0, 258426.0, 381891.0, 174126.0, 56296.0, 20449.0, 8735.0, 4094.0, 2106.0, 1146.0, 599.0, 368.0, 248.0, 134.0, 101.0, 48.0, 47.0, 35.0, 22.0, 16.0, 15.0, 9.0, 5.0, 5.0, 2.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.080078125, -0.07752037048339844, -0.07496261596679688, -0.07240486145019531, -0.06984710693359375, -0.06728935241699219, -0.06473159790039062, -0.06217384338378906, -0.0596160888671875, -0.05705833435058594, -0.054500579833984375, -0.05194282531738281, -0.04938507080078125, -0.04682731628417969, -0.044269561767578125, -0.04171180725097656, -0.039154052734375, -0.03659629821777344, -0.034038543701171875, -0.03148078918457031, -0.02892303466796875, -0.026365280151367188, -0.023807525634765625, -0.021249771118164062, -0.0186920166015625, -0.016134262084960938, -0.013576507568359375, -0.011018753051757812, -0.00846099853515625, -0.0059032440185546875, -0.003345489501953125, -0.0007877349853515625, 0.00177001953125, 0.0043277740478515625, 0.006885528564453125, 0.009443283081054688, 0.01200103759765625, 0.014558792114257812, 0.017116546630859375, 0.019674301147460938, 0.0222320556640625, 0.024789810180664062, 0.027347564697265625, 0.029905319213867188, 0.03246307373046875, 0.03502082824707031, 0.037578582763671875, 0.04013633728027344, 0.042694091796875, 0.04525184631347656, 0.047809600830078125, 0.05036735534667969, 0.05292510986328125, 0.05548286437988281, 0.058040618896484375, 0.06059837341308594, 0.0631561279296875, 0.06571388244628906, 0.06827163696289062, 0.07082939147949219, 0.07338714599609375, 0.07594490051269531, 0.07850265502929688, 0.08106040954589844, 0.0836181640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 13.0, 13.0, 22.0, 27.0, 33.0, 48.0, 58.0, 64.0, 80.0, 82.0, 102.0, 87.0, 78.0, 74.0, 63.0, 40.0, 30.0, 19.0, 9.0, 10.0, 11.0, 4.0, 5.0, 6.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.143880844116211e-05, -4.984065890312195e-05, -4.824250936508179e-05, -4.6644359827041626e-05, -4.5046210289001465e-05, -4.3448060750961304e-05, -4.184991121292114e-05, -4.025176167488098e-05, -3.865361213684082e-05, -3.705546259880066e-05, -3.54573130607605e-05, -3.385916352272034e-05, -3.2261013984680176e-05, -3.0662864446640015e-05, -2.9064714908599854e-05, -2.7466565370559692e-05, -2.586841583251953e-05, -2.427026629447937e-05, -2.267211675643921e-05, -2.1073967218399048e-05, -1.9475817680358887e-05, -1.7877668142318726e-05, -1.6279518604278564e-05, -1.4681369066238403e-05, -1.3083219528198242e-05, -1.1485069990158081e-05, -9.88692045211792e-06, -8.288770914077759e-06, -6.690621376037598e-06, -5.0924718379974365e-06, -3.4943222999572754e-06, -1.8961727619171143e-06, -2.980232238769531e-07, 1.300126314163208e-06, 2.898275852203369e-06, 4.49642539024353e-06, 6.094574928283691e-06, 7.692724466323853e-06, 9.290874004364014e-06, 1.0889023542404175e-05, 1.2487173080444336e-05, 1.4085322618484497e-05, 1.5683472156524658e-05, 1.728162169456482e-05, 1.887977123260498e-05, 2.047792077064514e-05, 2.2076070308685303e-05, 2.3674219846725464e-05, 2.5272369384765625e-05, 2.6870518922805786e-05, 2.8468668460845947e-05, 3.006681799888611e-05, 3.166496753692627e-05, 3.326311707496643e-05, 3.486126661300659e-05, 3.645941615104675e-05, 3.8057565689086914e-05, 3.9655715227127075e-05, 4.1253864765167236e-05, 4.28520143032074e-05, 4.445016384124756e-05, 4.604831337928772e-05, 4.764646291732788e-05, 4.924461245536804e-05, 5.08427619934082e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 12.0, 17.0, 25.0, 56.0, 160.0, 638.0, 7256.0, 411791.0, 617014.0, 10438.0, 833.0, 157.0, 59.0, 36.0, 19.0, 12.0, 11.0, 9.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.414306640625, -0.4028167724609375, -0.391326904296875, -0.3798370361328125, -0.36834716796875, -0.3568572998046875, -0.345367431640625, -0.3338775634765625, -0.3223876953125, -0.3108978271484375, -0.299407958984375, -0.2879180908203125, -0.27642822265625, -0.2649383544921875, -0.253448486328125, -0.2419586181640625, -0.23046875, -0.2189788818359375, -0.207489013671875, -0.1959991455078125, -0.18450927734375, -0.1730194091796875, -0.161529541015625, -0.1500396728515625, -0.1385498046875, -0.1270599365234375, -0.115570068359375, -0.1040802001953125, -0.09259033203125, -0.0811004638671875, -0.069610595703125, -0.0581207275390625, -0.046630859375, -0.0351409912109375, -0.023651123046875, -0.0121612548828125, -0.00067138671875, 0.0108184814453125, 0.022308349609375, 0.0337982177734375, 0.0452880859375, 0.0567779541015625, 0.068267822265625, 0.0797576904296875, 0.09124755859375, 0.1027374267578125, 0.114227294921875, 0.1257171630859375, 0.13720703125, 0.1486968994140625, 0.160186767578125, 0.1716766357421875, 0.18316650390625, 0.1946563720703125, 0.206146240234375, 0.2176361083984375, 0.2291259765625, 0.2406158447265625, 0.252105712890625, 0.2635955810546875, 0.27508544921875, 0.2865753173828125, 0.298065185546875, 0.3095550537109375, 0.321044921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 6.0, 6.0, 3.0, 10.0, 11.0, 13.0, 17.0, 17.0, 31.0, 15.0, 25.0, 35.0, 40.0, 42.0, 39.0, 51.0, 37.0, 44.0, 53.0, 51.0, 52.0, 55.0, 48.0, 39.0, 36.0, 32.0, 16.0, 27.0, 24.0, 16.0, 17.0, 13.0, 12.0, 11.0, 4.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0], "bins": [-0.0187530517578125, -0.0182039737701416, -0.017654895782470703, -0.017105817794799805, -0.016556739807128906, -0.016007661819458008, -0.01545858383178711, -0.014909505844116211, -0.014360427856445312, -0.013811349868774414, -0.013262271881103516, -0.012713193893432617, -0.012164115905761719, -0.01161503791809082, -0.011065959930419922, -0.010516881942749023, -0.009967803955078125, -0.009418725967407227, -0.008869647979736328, -0.00832056999206543, -0.007771492004394531, -0.007222414016723633, -0.006673336029052734, -0.006124258041381836, -0.0055751800537109375, -0.005026102066040039, -0.004477024078369141, -0.003927946090698242, -0.0033788681030273438, -0.0028297901153564453, -0.002280712127685547, -0.0017316341400146484, -0.00118255615234375, -0.0006334781646728516, -8.440017700195312e-05, 0.0004646778106689453, 0.0010137557983398438, 0.0015628337860107422, 0.0021119117736816406, 0.002660989761352539, 0.0032100677490234375, 0.003759145736694336, 0.004308223724365234, 0.004857301712036133, 0.005406379699707031, 0.00595545768737793, 0.006504535675048828, 0.0070536136627197266, 0.007602691650390625, 0.008151769638061523, 0.008700847625732422, 0.00924992561340332, 0.009799003601074219, 0.010348081588745117, 0.010897159576416016, 0.011446237564086914, 0.011995315551757812, 0.012544393539428711, 0.01309347152709961, 0.013642549514770508, 0.014191627502441406, 0.014740705490112305, 0.015289783477783203, 0.0158388614654541, 0.016387939453125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 11.0, 7.0, 5.0, 7.0, 10.0, 14.0, 17.0, 31.0, 42.0, 67.0, 54.0, 73.0, 91.0, 102.0, 95.0, 91.0, 70.0, 62.0, 47.0, 29.0, 29.0, 14.0, 12.0, 6.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7695910930633545, -0.7489527463912964, -0.7283143401145935, -0.7076759934425354, -0.6870375871658325, -0.6663992404937744, -0.6457608342170715, -0.6251224875450134, -0.6044840812683105, -0.5838457345962524, -0.5632073283195496, -0.5425689816474915, -0.5219305753707886, -0.5012922286987305, -0.48065385222435, -0.4600154757499695, -0.4393771290779114, -0.4187387526035309, -0.3981003761291504, -0.3774619996547699, -0.3568236231803894, -0.3361852765083313, -0.3155469000339508, -0.2949085235595703, -0.2742701470851898, -0.2536317706108093, -0.23299339413642883, -0.21235503256320953, -0.19171665608882904, -0.17107827961444855, -0.15043991804122925, -0.12980154156684875, -0.10916322469711304, -0.08852484822273254, -0.06788647919893265, -0.04724810644984245, -0.02660973370075226, -0.005971357226371765, 0.014667011797428131, 0.03530538082122803, 0.05594375729560852, 0.07658213376998901, 0.09722050279378891, 0.1178588718175888, 0.1384972482919693, 0.1591356247663498, 0.1797739863395691, 0.20041236281394958, 0.22105073928833008, 0.24168911576271057, 0.26232749223709106, 0.28296586871147156, 0.30360424518585205, 0.32424259185791016, 0.34488096833229065, 0.36551934480667114, 0.38615772128105164, 0.40679609775543213, 0.4274344742298126, 0.4480728507041931, 0.4687111973762512, 0.4893496036529541, 0.5099879503250122, 0.5306262969970703, 0.5512647032737732]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 5.0, 3.0, 2.0, 9.0, 9.0, 16.0, 20.0, 19.0, 19.0, 25.0, 27.0, 42.0, 36.0, 34.0, 49.0, 39.0, 52.0, 38.0, 55.0, 53.0, 42.0, 56.0, 32.0, 39.0, 37.0, 34.0, 31.0, 27.0, 30.0, 21.0, 15.0, 16.0, 12.0, 8.0, 15.0, 8.0, 2.0, 6.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.4578585922718048, -0.4452306628227234, -0.43260273337364197, -0.41997480392456055, -0.40734684467315674, -0.3947189152240753, -0.3820909857749939, -0.3694630563259125, -0.35683512687683105, -0.34420719742774963, -0.3315792679786682, -0.3189513087272644, -0.306323379278183, -0.29369544982910156, -0.28106752038002014, -0.2684395909309387, -0.2558116316795349, -0.2431837022304535, -0.23055575788021088, -0.21792782843112946, -0.20529988408088684, -0.19267195463180542, -0.180044025182724, -0.16741609573364258, -0.15478815138339996, -0.14216022193431854, -0.12953227758407593, -0.1169043481349945, -0.10427641123533249, -0.09164847433567047, -0.07902054488658905, -0.06639260798692703, -0.05376464128494263, -0.04113670438528061, -0.02850877121090889, -0.01588083803653717, -0.0032529011368751526, 0.009375035762786865, 0.022002965211868286, 0.034630902111530304, 0.04725883901119232, 0.05988677591085434, 0.07251471281051636, 0.08514264225959778, 0.0977705791592598, 0.11039851605892181, 0.12302644550800323, 0.13565438985824585, 0.14828231930732727, 0.1609102487564087, 0.1735381931066513, 0.18616612255573273, 0.19879406690597534, 0.21142199635505676, 0.22404992580413818, 0.2366778552532196, 0.24930579960346222, 0.26193374395370483, 0.27456167340278625, 0.2871896028518677, 0.2998175323009491, 0.3124454617500305, 0.3250734210014343, 0.33770135045051575, 0.35032927989959717]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 9.0, 22.0, 25.0, 32.0, 46.0, 80.0, 172.0, 323.0, 649.0, 1437.0, 3674.0, 10147.0, 34505.0, 165257.0, 575628.0, 198774.0, 39231.0, 11307.0, 4126.0, 1654.0, 698.0, 348.0, 164.0, 101.0, 48.0, 31.0, 17.0, 17.0, 7.0, 5.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55078125, -0.5327529907226562, -0.5147247314453125, -0.49669647216796875, -0.478668212890625, -0.46063995361328125, -0.4426116943359375, -0.42458343505859375, -0.40655517578125, -0.38852691650390625, -0.3704986572265625, -0.35247039794921875, -0.334442138671875, -0.31641387939453125, -0.2983856201171875, -0.28035736083984375, -0.2623291015625, -0.24430084228515625, -0.2262725830078125, -0.20824432373046875, -0.190216064453125, -0.17218780517578125, -0.1541595458984375, -0.13613128662109375, -0.11810302734375, -0.10007476806640625, -0.0820465087890625, -0.06401824951171875, -0.045989990234375, -0.02796173095703125, -0.0099334716796875, 0.00809478759765625, 0.026123046875, 0.04415130615234375, 0.0621795654296875, 0.08020782470703125, 0.098236083984375, 0.11626434326171875, 0.1342926025390625, 0.15232086181640625, 0.17034912109375, 0.18837738037109375, 0.2064056396484375, 0.22443389892578125, 0.242462158203125, 0.26049041748046875, 0.2785186767578125, 0.29654693603515625, 0.3145751953125, 0.33260345458984375, 0.3506317138671875, 0.36865997314453125, 0.386688232421875, 0.40471649169921875, 0.4227447509765625, 0.44077301025390625, 0.45880126953125, 0.47682952880859375, 0.4948577880859375, 0.5128860473632812, 0.530914306640625, 0.5489425659179688, 0.5669708251953125, 0.5849990844726562, 0.60302734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 12.0, 3.0, 8.0, 8.0, 26.0, 12.0, 24.0, 35.0, 23.0, 33.0, 32.0, 35.0, 47.0, 50.0, 57.0, 43.0, 61.0, 51.0, 46.0, 58.0, 37.0, 35.0, 45.0, 35.0, 27.0, 26.0, 19.0, 20.0, 20.0, 9.0, 6.0, 17.0, 11.0, 10.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0], "bins": [-1.0927734375, -1.0632858276367188, -1.0337982177734375, -1.0043106079101562, -0.974822998046875, -0.9453353881835938, -0.9158477783203125, -0.8863601684570312, -0.85687255859375, -0.8273849487304688, -0.7978973388671875, -0.7684097290039062, -0.738922119140625, -0.7094345092773438, -0.6799468994140625, -0.6504592895507812, -0.6209716796875, -0.5914840698242188, -0.5619964599609375, -0.5325088500976562, -0.503021240234375, -0.47353363037109375, -0.4440460205078125, -0.41455841064453125, -0.38507080078125, -0.35558319091796875, -0.3260955810546875, -0.29660797119140625, -0.267120361328125, -0.23763275146484375, -0.2081451416015625, -0.17865753173828125, -0.149169921875, -0.11968231201171875, -0.0901947021484375, -0.06070709228515625, -0.031219482421875, -0.00173187255859375, 0.0277557373046875, 0.05724334716796875, 0.08673095703125, 0.11621856689453125, 0.1457061767578125, 0.17519378662109375, 0.204681396484375, 0.23416900634765625, 0.2636566162109375, 0.29314422607421875, 0.3226318359375, 0.35211944580078125, 0.3816070556640625, 0.41109466552734375, 0.440582275390625, 0.47006988525390625, 0.4995574951171875, 0.5290451049804688, 0.55853271484375, 0.5880203247070312, 0.6175079345703125, 0.6469955444335938, 0.676483154296875, 0.7059707641601562, 0.7354583740234375, 0.7649459838867188, 0.79443359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 8.0, 19.0, 12.0, 15.0, 17.0, 11.0, 22.0, 17.0, 23.0, 22.0, 30.0, 34.0, 42.0, 39.0, 53.0, 95.0, 464.0, 41114.0, 1003683.0, 2213.0, 167.0, 69.0, 69.0, 45.0, 34.0, 30.0, 25.0, 18.0, 21.0, 19.0, 16.0, 21.0, 8.0, 10.0, 9.0, 9.0, 3.0, 8.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.4453125, -3.3350830078125, -3.224853515625, -3.1146240234375, -3.00439453125, -2.8941650390625, -2.783935546875, -2.6737060546875, -2.5634765625, -2.4532470703125, -2.343017578125, -2.2327880859375, -2.12255859375, -2.0123291015625, -1.902099609375, -1.7918701171875, -1.681640625, -1.5714111328125, -1.461181640625, -1.3509521484375, -1.24072265625, -1.1304931640625, -1.020263671875, -0.9100341796875, -0.7998046875, -0.6895751953125, -0.579345703125, -0.4691162109375, -0.35888671875, -0.2486572265625, -0.138427734375, -0.0281982421875, 0.08203125, 0.1922607421875, 0.302490234375, 0.4127197265625, 0.52294921875, 0.6331787109375, 0.743408203125, 0.8536376953125, 0.9638671875, 1.0740966796875, 1.184326171875, 1.2945556640625, 1.40478515625, 1.5150146484375, 1.625244140625, 1.7354736328125, 1.845703125, 1.9559326171875, 2.066162109375, 2.1763916015625, 2.28662109375, 2.3968505859375, 2.507080078125, 2.6173095703125, 2.7275390625, 2.8377685546875, 2.947998046875, 3.0582275390625, 3.16845703125, 3.2786865234375, 3.388916015625, 3.4991455078125, 3.609375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 10.0, 16.0, 10.0, 10.0, 12.0, 25.0, 13.0, 21.0, 24.0, 29.0, 24.0, 32.0, 30.0, 52.0, 29.0, 33.0, 35.0, 48.0, 46.0, 30.0, 48.0, 29.0, 40.0, 45.0, 39.0, 38.0, 29.0, 27.0, 19.0, 18.0, 24.0, 12.0, 12.0, 13.0, 16.0, 6.0, 8.0, 3.0, 7.0, 7.0, 2.0, 4.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7724609375, -0.747314453125, -0.72216796875, -0.697021484375, -0.671875, -0.646728515625, -0.62158203125, -0.596435546875, -0.5712890625, -0.546142578125, -0.52099609375, -0.495849609375, -0.470703125, -0.445556640625, -0.42041015625, -0.395263671875, -0.3701171875, -0.344970703125, -0.31982421875, -0.294677734375, -0.26953125, -0.244384765625, -0.21923828125, -0.194091796875, -0.1689453125, -0.143798828125, -0.11865234375, -0.093505859375, -0.068359375, -0.043212890625, -0.01806640625, 0.007080078125, 0.0322265625, 0.057373046875, 0.08251953125, 0.107666015625, 0.1328125, 0.157958984375, 0.18310546875, 0.208251953125, 0.2333984375, 0.258544921875, 0.28369140625, 0.308837890625, 0.333984375, 0.359130859375, 0.38427734375, 0.409423828125, 0.4345703125, 0.459716796875, 0.48486328125, 0.510009765625, 0.53515625, 0.560302734375, 0.58544921875, 0.610595703125, 0.6357421875, 0.660888671875, 0.68603515625, 0.711181640625, 0.736328125, 0.761474609375, 0.78662109375, 0.811767578125, 0.8369140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 5.0, 2.0, 7.0, 4.0, 8.0, 12.0, 21.0, 50.0, 71.0, 129.0, 336.0, 1209.0, 8953.0, 267491.0, 745744.0, 21480.0, 2117.0, 505.0, 204.0, 86.0, 49.0, 24.0, 21.0, 10.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.62109375, -0.6063613891601562, -0.5916290283203125, -0.5768966674804688, -0.562164306640625, -0.5474319458007812, -0.5326995849609375, -0.5179672241210938, -0.50323486328125, -0.48850250244140625, -0.4737701416015625, -0.45903778076171875, -0.444305419921875, -0.42957305908203125, -0.4148406982421875, -0.40010833740234375, -0.3853759765625, -0.37064361572265625, -0.3559112548828125, -0.34117889404296875, -0.326446533203125, -0.31171417236328125, -0.2969818115234375, -0.28224945068359375, -0.26751708984375, -0.25278472900390625, -0.2380523681640625, -0.22332000732421875, -0.208587646484375, -0.19385528564453125, -0.1791229248046875, -0.16439056396484375, -0.149658203125, -0.13492584228515625, -0.1201934814453125, -0.10546112060546875, -0.090728759765625, -0.07599639892578125, -0.0612640380859375, -0.04653167724609375, -0.03179931640625, -0.01706695556640625, -0.0023345947265625, 0.01239776611328125, 0.027130126953125, 0.04186248779296875, 0.0565948486328125, 0.07132720947265625, 0.0860595703125, 0.10079193115234375, 0.1155242919921875, 0.13025665283203125, 0.144989013671875, 0.15972137451171875, 0.1744537353515625, 0.18918609619140625, 0.20391845703125, 0.21865081787109375, 0.2333831787109375, 0.24811553955078125, 0.262847900390625, 0.27758026123046875, 0.2923126220703125, 0.30704498291015625, 0.32177734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 10.0, 19.0, 37.0, 34.0, 45.0, 59.0, 98.0, 105.0, 131.0, 111.0, 103.0, 69.0, 43.0, 35.0, 24.0, 16.0, 14.0, 11.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.473592758178711e-05, -2.367887645959854e-05, -2.2621825337409973e-05, -2.1564774215221405e-05, -2.0507723093032837e-05, -1.945067197084427e-05, -1.83936208486557e-05, -1.7336569726467133e-05, -1.6279518604278564e-05, -1.5222467482089996e-05, -1.4165416359901428e-05, -1.310836523771286e-05, -1.2051314115524292e-05, -1.0994262993335724e-05, -9.937211871147156e-06, -8.880160748958588e-06, -7.82310962677002e-06, -6.766058504581451e-06, -5.709007382392883e-06, -4.651956260204315e-06, -3.594905138015747e-06, -2.537854015827179e-06, -1.4808028936386108e-06, -4.237517714500427e-07, 6.332993507385254e-07, 1.6903504729270935e-06, 2.7474015951156616e-06, 3.8044527173042297e-06, 4.861503839492798e-06, 5.918554961681366e-06, 6.975606083869934e-06, 8.032657206058502e-06, 9.08970832824707e-06, 1.0146759450435638e-05, 1.1203810572624207e-05, 1.2260861694812775e-05, 1.3317912817001343e-05, 1.4374963939189911e-05, 1.543201506137848e-05, 1.6489066183567047e-05, 1.7546117305755615e-05, 1.8603168427944183e-05, 1.966021955013275e-05, 2.071727067232132e-05, 2.1774321794509888e-05, 2.2831372916698456e-05, 2.3888424038887024e-05, 2.4945475161075592e-05, 2.600252628326416e-05, 2.7059577405452728e-05, 2.8116628527641296e-05, 2.9173679649829865e-05, 3.0230730772018433e-05, 3.1287781894207e-05, 3.234483301639557e-05, 3.340188413858414e-05, 3.4458935260772705e-05, 3.551598638296127e-05, 3.657303750514984e-05, 3.763008862733841e-05, 3.868713974952698e-05, 3.9744190871715546e-05, 4.0801241993904114e-05, 4.185829311609268e-05, 4.291534423828125e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 2.0, 7.0, 11.0, 9.0, 14.0, 11.0, 26.0, 31.0, 58.0, 71.0, 115.0, 232.0, 354.0, 794.0, 1570.0, 3912.0, 11426.0, 46652.0, 276876.0, 559407.0, 113028.0, 22418.0, 6582.0, 2418.0, 1137.0, 581.0, 308.0, 184.0, 100.0, 54.0, 46.0, 34.0, 16.0, 14.0, 10.0, 8.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.19580078125, -0.18973159790039062, -0.18366241455078125, -0.17759323120117188, -0.1715240478515625, -0.16545486450195312, -0.15938568115234375, -0.15331649780273438, -0.147247314453125, -0.14117813110351562, -0.13510894775390625, -0.12903976440429688, -0.1229705810546875, -0.11690139770507812, -0.11083221435546875, -0.10476303100585938, -0.09869384765625, -0.09262466430664062, -0.08655548095703125, -0.08048629760742188, -0.0744171142578125, -0.06834793090820312, -0.06227874755859375, -0.056209564208984375, -0.050140380859375, -0.044071197509765625, -0.03800201416015625, -0.031932830810546875, -0.0258636474609375, -0.019794464111328125, -0.01372528076171875, -0.007656097412109375, -0.0015869140625, 0.004482269287109375, 0.01055145263671875, 0.016620635986328125, 0.0226898193359375, 0.028759002685546875, 0.03482818603515625, 0.040897369384765625, 0.046966552734375, 0.053035736083984375, 0.05910491943359375, 0.06517410278320312, 0.0712432861328125, 0.07731246948242188, 0.08338165283203125, 0.08945083618164062, 0.09552001953125, 0.10158920288085938, 0.10765838623046875, 0.11372756958007812, 0.1197967529296875, 0.12586593627929688, 0.13193511962890625, 0.13800430297851562, 0.144073486328125, 0.15014266967773438, 0.15621185302734375, 0.16228103637695312, 0.1683502197265625, 0.17441940307617188, 0.18048858642578125, 0.18655776977539062, 0.192626953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 8.0, 13.0, 10.0, 19.0, 23.0, 22.0, 30.0, 37.0, 59.0, 58.0, 77.0, 80.0, 85.0, 87.0, 69.0, 61.0, 60.0, 46.0, 39.0, 29.0, 18.0, 10.0, 15.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.088623046875, -0.08614444732666016, -0.08366584777832031, -0.08118724822998047, -0.07870864868164062, -0.07623004913330078, -0.07375144958496094, -0.0712728500366211, -0.06879425048828125, -0.0663156509399414, -0.06383705139160156, -0.06135845184326172, -0.058879852294921875, -0.05640125274658203, -0.05392265319824219, -0.051444053649902344, -0.0489654541015625, -0.046486854553222656, -0.04400825500488281, -0.04152965545654297, -0.039051055908203125, -0.03657245635986328, -0.03409385681152344, -0.031615257263183594, -0.02913665771484375, -0.026658058166503906, -0.024179458618164062, -0.02170085906982422, -0.019222259521484375, -0.01674365997314453, -0.014265060424804688, -0.011786460876464844, -0.009307861328125, -0.006829261779785156, -0.0043506622314453125, -0.0018720626831054688, 0.000606536865234375, 0.0030851364135742188, 0.0055637359619140625, 0.008042335510253906, 0.01052093505859375, 0.012999534606933594, 0.015478134155273438, 0.01795673370361328, 0.020435333251953125, 0.02291393280029297, 0.025392532348632812, 0.027871131896972656, 0.0303497314453125, 0.032828330993652344, 0.03530693054199219, 0.03778553009033203, 0.040264129638671875, 0.04274272918701172, 0.04522132873535156, 0.047699928283691406, 0.05017852783203125, 0.052657127380371094, 0.05513572692871094, 0.05761432647705078, 0.060092926025390625, 0.06257152557373047, 0.06505012512207031, 0.06752872467041016, 0.07000732421875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 30.0, 65.0, 186.0, 317.0, 270.0, 96.0, 30.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.866697072982788, -1.718356966972351, -1.5700169801712036, -1.4216768741607666, -1.2733368873596191, -1.1249967813491821, -0.9766566753387451, -0.8283166885375977, -0.6799765825271606, -0.5316365361213684, -0.3832964599132538, -0.23495638370513916, -0.08661633729934692, 0.06172370910644531, 0.21006381511688232, 0.3584038019180298, 0.5067439079284668, 0.655083954334259, 0.8034240007400513, 0.9517641067504883, 1.1001040935516357, 1.2484441995620728, 1.3967843055725098, 1.5451242923736572, 1.6934643983840942, 1.8418045043945312, 1.9901444911956787, 2.138484477996826, 2.2868247032165527, 2.4351646900177, 2.5835046768188477, 2.731844902038574, 2.8801846504211426, 3.02852463722229, 3.1768648624420166, 3.325204849243164, 3.4735448360443115, 3.621884822845459, 3.7702250480651855, 3.918565034866333, 4.0669050216674805, 4.215245246887207, 4.363584995269775, 4.511925220489502, 4.6602654457092285, 4.808605194091797, 4.956945419311523, 5.10528564453125, 5.253625869750977, 5.401966094970703, 5.5503058433532715, 5.698646068572998, 5.846986293792725, 5.995326042175293, 6.1436662673950195, 6.292006492614746, 6.4403462409973145, 6.588686466217041, 6.737026214599609, 6.885366439819336, 7.0337066650390625, 7.182046413421631, 7.330386638641357, 7.478726387023926, 7.627066612243652]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 8.0, 21.0, 12.0, 18.0, 20.0, 30.0, 21.0, 32.0, 31.0, 37.0, 44.0, 36.0, 35.0, 40.0, 54.0, 44.0, 48.0, 36.0, 34.0, 49.0, 38.0, 22.0, 37.0, 28.0, 29.0, 33.0, 32.0, 22.0, 21.0, 20.0, 14.0, 3.0, 8.0, 9.0, 5.0, 6.0, 3.0, 1.0, 7.0, 7.0, 1.0, 4.0], "bins": [-1.5705806016921997, -1.5312174558639526, -1.4918543100357056, -1.452491044998169, -1.4131278991699219, -1.3737647533416748, -1.3344016075134277, -1.2950384616851807, -1.2556753158569336, -1.2163121700286865, -1.1769490242004395, -1.1375857591629028, -1.0982226133346558, -1.0588594675064087, -1.0194963216781616, -0.9801331758499146, -0.9407699108123779, -0.9014067649841309, -0.862043559551239, -0.8226804137229919, -0.7833172082901001, -0.743954062461853, -0.704590916633606, -0.6652277708053589, -0.625864565372467, -0.58650141954422, -0.5471382141113281, -0.507775068283081, -0.4684118926525116, -0.42904871702194214, -0.38968557119369507, -0.3503223955631256, -0.3109592795372009, -0.27159610390663147, -0.2322329431772232, -0.19286978244781494, -0.15350660681724548, -0.11414343118667603, -0.07478027045726776, -0.0354171097278595, 0.003946065902709961, 0.04330923408269882, 0.08267240226268768, 0.12203557044267654, 0.1613987386226654, 0.20076191425323486, 0.24012507498264313, 0.2794882357120514, 0.31885141134262085, 0.3582145869731903, 0.39757776260375977, 0.43694090843200684, 0.4763040840625763, 0.5156672596931458, 0.5550304055213928, 0.5943936109542847, 0.6337567567825317, 0.6731199026107788, 0.7124831080436707, 0.7518462538719177, 0.7912094593048096, 0.8305726051330566, 0.8699357509613037, 0.9092988967895508, 0.9486621022224426]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 2.0, 6.0, 4.0, 7.0, 13.0, 10.0, 20.0, 16.0, 25.0, 33.0, 37.0, 62.0, 100.0, 117.0, 211.0, 402.0, 755.0, 1639.0, 3867.0, 10631.0, 37752.0, 161126.0, 634401.0, 1622708.0, 1251378.0, 356881.0, 78183.0, 20939.0, 7156.0, 2875.0, 1278.0, 628.0, 354.0, 226.0, 123.0, 95.0, 52.0, 43.0, 30.0, 27.0, 10.0, 8.0, 18.0, 4.0, 9.0, 5.0, 6.0, 2.0, 4.0, 4.0, 2.0], "bins": [-0.77880859375, -0.7576370239257812, -0.7364654541015625, -0.7152938842773438, -0.694122314453125, -0.6729507446289062, -0.6517791748046875, -0.6306076049804688, -0.60943603515625, -0.5882644653320312, -0.5670928955078125, -0.5459213256835938, -0.524749755859375, -0.5035781860351562, -0.4824066162109375, -0.46123504638671875, -0.4400634765625, -0.41889190673828125, -0.3977203369140625, -0.37654876708984375, -0.355377197265625, -0.33420562744140625, -0.3130340576171875, -0.29186248779296875, -0.27069091796875, -0.24951934814453125, -0.2283477783203125, -0.20717620849609375, -0.186004638671875, -0.16483306884765625, -0.1436614990234375, -0.12248992919921875, -0.101318359375, -0.08014678955078125, -0.0589752197265625, -0.03780364990234375, -0.016632080078125, 0.00453948974609375, 0.0257110595703125, 0.04688262939453125, 0.06805419921875, 0.08922576904296875, 0.1103973388671875, 0.13156890869140625, 0.152740478515625, 0.17391204833984375, 0.1950836181640625, 0.21625518798828125, 0.2374267578125, 0.25859832763671875, 0.2797698974609375, 0.30094146728515625, 0.322113037109375, 0.34328460693359375, 0.3644561767578125, 0.38562774658203125, 0.40679931640625, 0.42797088623046875, 0.4491424560546875, 0.47031402587890625, 0.491485595703125, 0.5126571655273438, 0.5338287353515625, 0.5550003051757812, 0.576171875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 8.0, 10.0, 7.0, 10.0, 16.0, 21.0, 19.0, 18.0, 23.0, 26.0, 34.0, 25.0, 33.0, 41.0, 41.0, 40.0, 43.0, 39.0, 43.0, 40.0, 32.0, 41.0, 45.0, 43.0, 41.0, 34.0, 22.0, 24.0, 27.0, 31.0, 10.0, 11.0, 18.0, 13.0, 12.0, 9.0, 6.0, 7.0, 7.0, 6.0, 4.0, 9.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.50244140625, -0.48583221435546875, -0.4692230224609375, -0.45261383056640625, -0.436004638671875, -0.41939544677734375, -0.4027862548828125, -0.38617706298828125, -0.36956787109375, -0.35295867919921875, -0.3363494873046875, -0.31974029541015625, -0.303131103515625, -0.28652191162109375, -0.2699127197265625, -0.25330352783203125, -0.2366943359375, -0.22008514404296875, -0.2034759521484375, -0.18686676025390625, -0.170257568359375, -0.15364837646484375, -0.1370391845703125, -0.12042999267578125, -0.10382080078125, -0.08721160888671875, -0.0706024169921875, -0.05399322509765625, -0.037384033203125, -0.02077484130859375, -0.0041656494140625, 0.01244354248046875, 0.029052734375, 0.04566192626953125, 0.0622711181640625, 0.07888031005859375, 0.095489501953125, 0.11209869384765625, 0.1287078857421875, 0.14531707763671875, 0.16192626953125, 0.17853546142578125, 0.1951446533203125, 0.21175384521484375, 0.228363037109375, 0.24497222900390625, 0.2615814208984375, 0.27819061279296875, 0.2947998046875, 0.31140899658203125, 0.3280181884765625, 0.34462738037109375, 0.361236572265625, 0.37784576416015625, 0.3944549560546875, 0.41106414794921875, 0.42767333984375, 0.44428253173828125, 0.4608917236328125, 0.47750091552734375, 0.494110107421875, 0.5107192993164062, 0.5273284912109375, 0.5439376831054688, 0.560546875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 0.0, 6.0, 2.0, 5.0, 7.0, 11.0, 14.0, 20.0, 24.0, 38.0, 95.0, 247.0, 887.0, 11384.0, 3667564.0, 508921.0, 4136.0, 553.0, 173.0, 77.0, 43.0, 26.0, 18.0, 7.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.974609375, -2.881195068359375, -2.78778076171875, -2.694366455078125, -2.6009521484375, -2.507537841796875, -2.41412353515625, -2.320709228515625, -2.227294921875, -2.133880615234375, -2.04046630859375, -1.947052001953125, -1.8536376953125, -1.760223388671875, -1.66680908203125, -1.573394775390625, -1.47998046875, -1.386566162109375, -1.29315185546875, -1.199737548828125, -1.1063232421875, -1.012908935546875, -0.91949462890625, -0.826080322265625, -0.732666015625, -0.639251708984375, -0.54583740234375, -0.452423095703125, -0.3590087890625, -0.265594482421875, -0.17218017578125, -0.078765869140625, 0.0146484375, 0.108062744140625, 0.20147705078125, 0.294891357421875, 0.3883056640625, 0.481719970703125, 0.57513427734375, 0.668548583984375, 0.761962890625, 0.855377197265625, 0.94879150390625, 1.042205810546875, 1.1356201171875, 1.229034423828125, 1.32244873046875, 1.415863037109375, 1.50927734375, 1.602691650390625, 1.69610595703125, 1.789520263671875, 1.8829345703125, 1.976348876953125, 2.06976318359375, 2.163177490234375, 2.256591796875, 2.350006103515625, 2.44342041015625, 2.536834716796875, 2.6302490234375, 2.723663330078125, 2.81707763671875, 2.910491943359375, 3.00390625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 14.0, 14.0, 17.0, 32.0, 48.0, 62.0, 99.0, 150.0, 243.0, 348.0, 529.0, 624.0, 582.0, 435.0, 318.0, 187.0, 128.0, 79.0, 63.0, 33.0, 18.0, 10.0, 8.0, 8.0, 5.0, 5.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2958984375, -0.28562164306640625, -0.2753448486328125, -0.26506805419921875, -0.254791259765625, -0.24451446533203125, -0.2342376708984375, -0.22396087646484375, -0.21368408203125, -0.20340728759765625, -0.1931304931640625, -0.18285369873046875, -0.172576904296875, -0.16230010986328125, -0.1520233154296875, -0.14174652099609375, -0.1314697265625, -0.12119293212890625, -0.1109161376953125, -0.10063934326171875, -0.090362548828125, -0.08008575439453125, -0.0698089599609375, -0.05953216552734375, -0.04925537109375, -0.03897857666015625, -0.0287017822265625, -0.01842498779296875, -0.008148193359375, 0.00212860107421875, 0.0124053955078125, 0.02268218994140625, 0.032958984375, 0.04323577880859375, 0.0535125732421875, 0.06378936767578125, 0.074066162109375, 0.08434295654296875, 0.0946197509765625, 0.10489654541015625, 0.11517333984375, 0.12545013427734375, 0.1357269287109375, 0.14600372314453125, 0.156280517578125, 0.16655731201171875, 0.1768341064453125, 0.18711090087890625, 0.1973876953125, 0.20766448974609375, 0.2179412841796875, 0.22821807861328125, 0.238494873046875, 0.24877166748046875, 0.2590484619140625, 0.26932525634765625, 0.27960205078125, 0.28987884521484375, 0.3001556396484375, 0.31043243408203125, 0.320709228515625, 0.33098602294921875, 0.3412628173828125, 0.35153961181640625, 0.36181640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 8.0, 6.0, 8.0, 17.0, 10.0, 30.0, 46.0, 48.0, 55.0, 79.0, 79.0, 83.0, 92.0, 76.0, 81.0, 75.0, 49.0, 39.0, 34.0, 14.0, 23.0, 10.0, 7.0, 7.0, 4.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8511802554130554, -0.8184229731559753, -0.7856656312942505, -0.7529083490371704, -0.7201510071754456, -0.6873937249183655, -0.6546363830566406, -0.6218791007995605, -0.5891218185424805, -0.5563645362854004, -0.5236071944236755, -0.49084991216659546, -0.4580925703048706, -0.4253352880477905, -0.39257797598838806, -0.3598206639289856, -0.32706332206726074, -0.2943060100078583, -0.2615486979484558, -0.22879140079021454, -0.19603408873081207, -0.1632767766714096, -0.13051947951316833, -0.09776216745376587, -0.0650048553943634, -0.032247547060251236, 0.0005097612738609314, 0.0332670658826828, 0.06602437794208527, 0.09878169000148773, 0.131538987159729, 0.16429629921913147, 0.1970536708831787, 0.22981098294258118, 0.26256829500198364, 0.2953255772590637, 0.3280829191207886, 0.36084020137786865, 0.3935975134372711, 0.4263548254966736, 0.45911213755607605, 0.4918694496154785, 0.5246267318725586, 0.5573840737342834, 0.5901413559913635, 0.6228986978530884, 0.6556559801101685, 0.6884132623672485, 0.7211706042289734, 0.7539278864860535, 0.7866852283477783, 0.8194425106048584, 0.8521998524665833, 0.8849571347236633, 0.9177144765853882, 0.9504717588424683, 0.9832290410995483, 1.0159863233566284, 1.0487436056137085, 1.0815010070800781, 1.1142582893371582, 1.1470155715942383, 1.1797728538513184, 1.2125301361083984, 1.245287537574768]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 6.0, 7.0, 13.0, 5.0, 13.0, 15.0, 14.0, 21.0, 18.0, 18.0, 30.0, 30.0, 20.0, 33.0, 36.0, 42.0, 35.0, 38.0, 29.0, 35.0, 42.0, 30.0, 33.0, 34.0, 31.0, 42.0, 39.0, 27.0, 42.0, 34.0, 28.0, 12.0, 26.0, 20.0, 14.0, 12.0, 10.0, 9.0, 15.0, 4.0, 10.0, 6.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.5185228586196899, -0.5017445087432861, -0.4849661886692047, -0.4681878387928009, -0.4514095187187195, -0.4346311688423157, -0.41785281896591187, -0.40107449889183044, -0.384296178817749, -0.3675178289413452, -0.3507395088672638, -0.33396115899086, -0.31718283891677856, -0.30040448904037476, -0.28362613916397095, -0.2668478190898895, -0.2500694692134857, -0.2332911342382431, -0.2165127992630005, -0.19973444938659668, -0.18295612931251526, -0.16617777943611145, -0.14939944446086884, -0.13262110948562622, -0.1158427745103836, -0.09906443953514099, -0.08228610455989838, -0.06550776213407516, -0.04872942715883255, -0.031951092183589935, -0.015172749757766724, 0.0016055852174758911, 0.018383920192718506, 0.03516225516796112, 0.051940593868494034, 0.06871893256902695, 0.08549726754426956, 0.10227560251951218, 0.11905394494533539, 0.135832279920578, 0.15261061489582062, 0.16938894987106323, 0.18616728484630585, 0.20294561982154846, 0.21972396969795227, 0.2365022897720337, 0.2532806396484375, 0.2700589895248413, 0.28683730959892273, 0.30361565947532654, 0.32039397954940796, 0.33717232942581177, 0.3539506494998932, 0.370728999376297, 0.3875073194503784, 0.4042856693267822, 0.42106401920318604, 0.43784236907958984, 0.45462068915367126, 0.4713990390300751, 0.4881773591041565, 0.5049557089805603, 0.5217340588569641, 0.5385123491287231, 0.555290699005127]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 12.0, 20.0, 21.0, 37.0, 72.0, 97.0, 176.0, 373.0, 735.0, 1642.0, 3897.0, 11171.0, 42439.0, 214452.0, 542285.0, 178330.0, 36270.0, 10069.0, 3461.0, 1475.0, 715.0, 358.0, 169.0, 104.0, 62.0, 43.0, 21.0, 15.0, 13.0, 8.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3232421875, -0.3138580322265625, -0.304473876953125, -0.2950897216796875, -0.28570556640625, -0.2763214111328125, -0.266937255859375, -0.2575531005859375, -0.2481689453125, -0.2387847900390625, -0.229400634765625, -0.2200164794921875, -0.21063232421875, -0.2012481689453125, -0.191864013671875, -0.1824798583984375, -0.173095703125, -0.1637115478515625, -0.154327392578125, -0.1449432373046875, -0.13555908203125, -0.1261749267578125, -0.116790771484375, -0.1074066162109375, -0.0980224609375, -0.0886383056640625, -0.079254150390625, -0.0698699951171875, -0.06048583984375, -0.0511016845703125, -0.041717529296875, -0.0323333740234375, -0.02294921875, -0.0135650634765625, -0.004180908203125, 0.0052032470703125, 0.01458740234375, 0.0239715576171875, 0.033355712890625, 0.0427398681640625, 0.0521240234375, 0.0615081787109375, 0.070892333984375, 0.0802764892578125, 0.08966064453125, 0.0990447998046875, 0.108428955078125, 0.1178131103515625, 0.127197265625, 0.1365814208984375, 0.145965576171875, 0.1553497314453125, 0.16473388671875, 0.1741180419921875, 0.183502197265625, 0.1928863525390625, 0.2022705078125, 0.2116546630859375, 0.221038818359375, 0.2304229736328125, 0.23980712890625, 0.2491912841796875, 0.258575439453125, 0.2679595947265625, 0.27734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 13.0, 16.0, 14.0, 19.0, 14.0, 23.0, 38.0, 46.0, 30.0, 39.0, 32.0, 41.0, 49.0, 46.0, 38.0, 50.0, 37.0, 52.0, 47.0, 43.0, 41.0, 35.0, 29.0, 38.0, 21.0, 24.0, 22.0, 22.0, 13.0, 13.0, 4.0, 10.0, 11.0, 7.0, 7.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4228515625, -0.4109535217285156, -0.39905548095703125, -0.3871574401855469, -0.3752593994140625, -0.3633613586425781, -0.35146331787109375, -0.3395652770996094, -0.327667236328125, -0.3157691955566406, -0.30387115478515625, -0.2919731140136719, -0.2800750732421875, -0.2681770324707031, -0.25627899169921875, -0.24438095092773438, -0.23248291015625, -0.22058486938476562, -0.20868682861328125, -0.19678878784179688, -0.1848907470703125, -0.17299270629882812, -0.16109466552734375, -0.14919662475585938, -0.137298583984375, -0.12540054321289062, -0.11350250244140625, -0.10160446166992188, -0.0897064208984375, -0.07780838012695312, -0.06591033935546875, -0.054012298583984375, -0.0421142578125, -0.030216217041015625, -0.01831817626953125, -0.006420135498046875, 0.0054779052734375, 0.017375946044921875, 0.02927398681640625, 0.041172027587890625, 0.053070068359375, 0.06496810913085938, 0.07686614990234375, 0.08876419067382812, 0.1006622314453125, 0.11256027221679688, 0.12445831298828125, 0.13635635375976562, 0.14825439453125, 0.16015243530273438, 0.17205047607421875, 0.18394851684570312, 0.1958465576171875, 0.20774459838867188, 0.21964263916015625, 0.23154067993164062, 0.243438720703125, 0.2553367614746094, 0.26723480224609375, 0.2791328430175781, 0.2910308837890625, 0.3029289245605469, 0.31482696533203125, 0.3267250061035156, 0.338623046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 6.0, 11.0, 8.0, 15.0, 11.0, 20.0, 37.0, 39.0, 54.0, 82.0, 104.0, 127.0, 198.0, 258.0, 443.0, 659.0, 1146.0, 1939.0, 3555.0, 6500.0, 12991.0, 26670.0, 57439.0, 121500.0, 225691.0, 263449.0, 167863.0, 82192.0, 37751.0, 18020.0, 8790.0, 4565.0, 2548.0, 1410.0, 800.0, 524.0, 306.0, 243.0, 171.0, 112.0, 70.0, 46.0, 45.0, 34.0, 19.0, 22.0, 14.0, 16.0, 12.0, 12.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.126953125, -0.12301445007324219, -0.11907577514648438, -0.11513710021972656, -0.11119842529296875, -0.10725975036621094, -0.10332107543945312, -0.09938240051269531, -0.0954437255859375, -0.09150505065917969, -0.08756637573242188, -0.08362770080566406, -0.07968902587890625, -0.07575035095214844, -0.07181167602539062, -0.06787300109863281, -0.063934326171875, -0.05999565124511719, -0.056056976318359375, -0.05211830139160156, -0.04817962646484375, -0.04424095153808594, -0.040302276611328125, -0.03636360168457031, -0.0324249267578125, -0.028486251831054688, -0.024547576904296875, -0.020608901977539062, -0.01667022705078125, -0.012731552124023438, -0.008792877197265625, -0.0048542022705078125, -0.00091552734375, 0.0030231475830078125, 0.006961822509765625, 0.010900497436523438, 0.01483917236328125, 0.018777847290039062, 0.022716522216796875, 0.026655197143554688, 0.0305938720703125, 0.03453254699707031, 0.038471221923828125, 0.04240989685058594, 0.04634857177734375, 0.05028724670410156, 0.054225921630859375, 0.05816459655761719, 0.062103271484375, 0.06604194641113281, 0.06998062133789062, 0.07391929626464844, 0.07785797119140625, 0.08179664611816406, 0.08573532104492188, 0.08967399597167969, 0.0936126708984375, 0.09755134582519531, 0.10149002075195312, 0.10542869567871094, 0.10936737060546875, 0.11330604553222656, 0.11724472045898438, 0.12118339538574219, 0.1251220703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 4.0, 8.0, 12.0, 12.0, 18.0, 18.0, 18.0, 23.0, 34.0, 33.0, 33.0, 42.0, 41.0, 47.0, 46.0, 52.0, 52.0, 50.0, 50.0, 60.0, 49.0, 37.0, 37.0, 33.0, 27.0, 25.0, 28.0, 28.0, 17.0, 20.0, 17.0, 7.0, 8.0, 5.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88525390625, -0.8594894409179688, -0.8337249755859375, -0.8079605102539062, -0.782196044921875, -0.7564315795898438, -0.7306671142578125, -0.7049026489257812, -0.67913818359375, -0.6533737182617188, -0.6276092529296875, -0.6018447875976562, -0.576080322265625, -0.5503158569335938, -0.5245513916015625, -0.49878692626953125, -0.4730224609375, -0.44725799560546875, -0.4214935302734375, -0.39572906494140625, -0.369964599609375, -0.34420013427734375, -0.3184356689453125, -0.29267120361328125, -0.26690673828125, -0.24114227294921875, -0.2153778076171875, -0.18961334228515625, -0.163848876953125, -0.13808441162109375, -0.1123199462890625, -0.08655548095703125, -0.060791015625, -0.03502655029296875, -0.0092620849609375, 0.01650238037109375, 0.042266845703125, 0.06803131103515625, 0.0937957763671875, 0.11956024169921875, 0.14532470703125, 0.17108917236328125, 0.1968536376953125, 0.22261810302734375, 0.248382568359375, 0.27414703369140625, 0.2999114990234375, 0.32567596435546875, 0.3514404296875, 0.37720489501953125, 0.4029693603515625, 0.42873382568359375, 0.454498291015625, 0.48026275634765625, 0.5060272216796875, 0.5317916870117188, 0.55755615234375, 0.5833206176757812, 0.6090850830078125, 0.6348495483398438, 0.660614013671875, 0.6863784790039062, 0.7121429443359375, 0.7379074096679688, 0.763671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 10.0, 6.0, 6.0, 9.0, 18.0, 22.0, 49.0, 64.0, 100.0, 158.0, 232.0, 464.0, 773.0, 1458.0, 2794.0, 6185.0, 15956.0, 52279.0, 251472.0, 527223.0, 135476.0, 32943.0, 11193.0, 4710.0, 2247.0, 1118.0, 625.0, 366.0, 202.0, 124.0, 80.0, 65.0, 43.0, 28.0, 15.0, 11.0, 9.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09442138671875, -0.09130668640136719, -0.08819198608398438, -0.08507728576660156, -0.08196258544921875, -0.07884788513183594, -0.07573318481445312, -0.07261848449707031, -0.0695037841796875, -0.06638908386230469, -0.06327438354492188, -0.06015968322753906, -0.05704498291015625, -0.05393028259277344, -0.050815582275390625, -0.04770088195800781, -0.044586181640625, -0.04147148132324219, -0.038356781005859375, -0.03524208068847656, -0.03212738037109375, -0.029012680053710938, -0.025897979736328125, -0.022783279418945312, -0.0196685791015625, -0.016553878784179688, -0.013439178466796875, -0.010324478149414062, -0.00720977783203125, -0.0040950775146484375, -0.000980377197265625, 0.0021343231201171875, 0.0052490234375, 0.008363723754882812, 0.011478424072265625, 0.014593124389648438, 0.01770782470703125, 0.020822525024414062, 0.023937225341796875, 0.027051925659179688, 0.0301666259765625, 0.03328132629394531, 0.036396026611328125, 0.03951072692871094, 0.04262542724609375, 0.04574012756347656, 0.048854827880859375, 0.05196952819824219, 0.055084228515625, 0.05819892883300781, 0.061313629150390625, 0.06442832946777344, 0.06754302978515625, 0.07065773010253906, 0.07377243041992188, 0.07688713073730469, 0.0800018310546875, 0.08311653137207031, 0.08623123168945312, 0.08934593200683594, 0.09246063232421875, 0.09557533264160156, 0.09869003295898438, 0.10180473327636719, 0.10491943359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 8.0, 7.0, 2.0, 6.0, 10.0, 15.0, 17.0, 26.0, 32.0, 36.0, 52.0, 76.0, 88.0, 101.0, 116.0, 88.0, 66.0, 71.0, 33.0, 36.0, 29.0, 25.0, 17.0, 9.0, 8.0, 5.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.029273986816406e-05, -3.9070844650268555e-05, -3.784894943237305e-05, -3.662705421447754e-05, -3.540515899658203e-05, -3.4183263778686523e-05, -3.2961368560791016e-05, -3.173947334289551e-05, -3.0517578125e-05, -2.9295682907104492e-05, -2.8073787689208984e-05, -2.6851892471313477e-05, -2.562999725341797e-05, -2.440810203552246e-05, -2.3186206817626953e-05, -2.1964311599731445e-05, -2.0742416381835938e-05, -1.952052116394043e-05, -1.8298625946044922e-05, -1.7076730728149414e-05, -1.5854835510253906e-05, -1.4632940292358398e-05, -1.341104507446289e-05, -1.2189149856567383e-05, -1.0967254638671875e-05, -9.745359420776367e-06, -8.52346420288086e-06, -7.3015689849853516e-06, -6.079673767089844e-06, -4.857778549194336e-06, -3.635883331298828e-06, -2.4139881134033203e-06, -1.1920928955078125e-06, 2.9802322387695312e-08, 1.2516975402832031e-06, 2.473592758178711e-06, 3.6954879760742188e-06, 4.9173831939697266e-06, 6.139278411865234e-06, 7.361173629760742e-06, 8.58306884765625e-06, 9.804964065551758e-06, 1.1026859283447266e-05, 1.2248754501342773e-05, 1.3470649719238281e-05, 1.4692544937133789e-05, 1.5914440155029297e-05, 1.7136335372924805e-05, 1.8358230590820312e-05, 1.958012580871582e-05, 2.0802021026611328e-05, 2.2023916244506836e-05, 2.3245811462402344e-05, 2.446770668029785e-05, 2.568960189819336e-05, 2.6911497116088867e-05, 2.8133392333984375e-05, 2.9355287551879883e-05, 3.057718276977539e-05, 3.17990779876709e-05, 3.3020973205566406e-05, 3.4242868423461914e-05, 3.546476364135742e-05, 3.668665885925293e-05, 3.790855407714844e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 9.0, 7.0, 8.0, 15.0, 24.0, 16.0, 31.0, 27.0, 61.0, 71.0, 125.0, 205.0, 367.0, 831.0, 1722.0, 3892.0, 10159.0, 32736.0, 142787.0, 540271.0, 241091.0, 49782.0, 14516.0, 5313.0, 2228.0, 1051.0, 496.0, 261.0, 119.0, 102.0, 65.0, 27.0, 27.0, 23.0, 16.0, 14.0, 11.0, 6.0, 12.0, 7.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1136474609375, -0.1101675033569336, -0.10668754577636719, -0.10320758819580078, -0.09972763061523438, -0.09624767303466797, -0.09276771545410156, -0.08928775787353516, -0.08580780029296875, -0.08232784271240234, -0.07884788513183594, -0.07536792755126953, -0.07188796997070312, -0.06840801239013672, -0.06492805480957031, -0.061448097229003906, -0.0579681396484375, -0.054488182067871094, -0.05100822448730469, -0.04752826690673828, -0.044048309326171875, -0.04056835174560547, -0.03708839416503906, -0.033608436584472656, -0.03012847900390625, -0.026648521423339844, -0.023168563842773438, -0.01968860626220703, -0.016208648681640625, -0.012728691101074219, -0.009248733520507812, -0.005768775939941406, -0.002288818359375, 0.0011911392211914062, 0.0046710968017578125, 0.008151054382324219, 0.011631011962890625, 0.015110969543457031, 0.018590927124023438, 0.022070884704589844, 0.02555084228515625, 0.029030799865722656, 0.03251075744628906, 0.03599071502685547, 0.039470672607421875, 0.04295063018798828, 0.04643058776855469, 0.049910545349121094, 0.0533905029296875, 0.056870460510253906, 0.06035041809082031, 0.06383037567138672, 0.06731033325195312, 0.07079029083251953, 0.07427024841308594, 0.07775020599365234, 0.08123016357421875, 0.08471012115478516, 0.08819007873535156, 0.09167003631591797, 0.09514999389648438, 0.09862995147705078, 0.10210990905761719, 0.1055898666381836, 0.10906982421875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 10.0, 18.0, 24.0, 24.0, 44.0, 52.0, 60.0, 89.0, 90.0, 103.0, 109.0, 88.0, 69.0, 56.0, 33.0, 26.0, 19.0, 7.0, 12.0, 12.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02734375, -0.026418685913085938, -0.025493621826171875, -0.024568557739257812, -0.02364349365234375, -0.022718429565429688, -0.021793365478515625, -0.020868301391601562, -0.0199432373046875, -0.019018173217773438, -0.018093109130859375, -0.017168045043945312, -0.01624298095703125, -0.015317916870117188, -0.014392852783203125, -0.013467788696289062, -0.012542724609375, -0.011617660522460938, -0.010692596435546875, -0.009767532348632812, -0.00884246826171875, -0.007917404174804688, -0.006992340087890625, -0.0060672760009765625, -0.0051422119140625, -0.0042171478271484375, -0.003292083740234375, -0.0023670196533203125, -0.00144195556640625, -0.0005168914794921875, 0.000408172607421875, 0.0013332366943359375, 0.00225830078125, 0.0031833648681640625, 0.004108428955078125, 0.0050334930419921875, 0.00595855712890625, 0.0068836212158203125, 0.007808685302734375, 0.008733749389648438, 0.0096588134765625, 0.010583877563476562, 0.011508941650390625, 0.012434005737304688, 0.01335906982421875, 0.014284133911132812, 0.015209197998046875, 0.016134262084960938, 0.017059326171875, 0.017984390258789062, 0.018909454345703125, 0.019834518432617188, 0.02075958251953125, 0.021684646606445312, 0.022609710693359375, 0.023534774780273438, 0.0244598388671875, 0.025384902954101562, 0.026309967041015625, 0.027235031127929688, 0.02816009521484375, 0.029085159301757812, 0.030010223388671875, 0.030935287475585938, 0.0318603515625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 5.0, 8.0, 7.0, 7.0, 11.0, 11.0, 19.0, 30.0, 51.0, 62.0, 101.0, 107.0, 121.0, 100.0, 99.0, 86.0, 68.0, 32.0, 28.0, 25.0, 9.0, 5.0, 2.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.640224277973175, -0.6162078976631165, -0.5921915173530579, -0.5681751370429993, -0.5441587567329407, -0.5201423764228821, -0.4961259663105011, -0.4721095860004425, -0.4480932056903839, -0.4240768253803253, -0.4000604450702667, -0.37604403495788574, -0.35202765464782715, -0.32801127433776855, -0.30399489402770996, -0.27997851371765137, -0.2559621334075928, -0.23194575309753418, -0.20792937278747559, -0.1839129775762558, -0.1598965972661972, -0.1358802169561386, -0.11186382174491882, -0.08784744143486023, -0.06383106112480164, -0.039814677089452744, -0.01579829305410385, 0.00821809470653534, 0.03223447501659393, 0.05625085532665253, 0.08026725053787231, 0.10428363084793091, 0.1283000111579895, 0.1523163914680481, 0.1763327717781067, 0.20034916698932648, 0.22436554729938507, 0.24838192760944366, 0.27239832282066345, 0.29641470313072205, 0.32043108344078064, 0.34444746375083923, 0.3684638440608978, 0.3924802541732788, 0.4164966344833374, 0.440513014793396, 0.4645293951034546, 0.4885457754135132, 0.5125621557235718, 0.5365785360336304, 0.560594916343689, 0.5846112966537476, 0.6086276769638062, 0.6326440572738647, 0.6566604375839233, 0.6806768178939819, 0.7046931982040405, 0.7287095785140991, 0.7527259588241577, 0.7767423391342163, 0.8007587194442749, 0.8247750997543335, 0.8487914800643921, 0.8728078603744507, 0.896824300289154]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 7.0, 9.0, 8.0, 4.0, 15.0, 11.0, 24.0, 15.0, 26.0, 30.0, 31.0, 29.0, 41.0, 33.0, 48.0, 38.0, 37.0, 47.0, 45.0, 38.0, 35.0, 38.0, 40.0, 46.0, 50.0, 40.0, 38.0, 21.0, 20.0, 25.0, 12.0, 23.0, 14.0, 11.0, 11.0, 11.0, 7.0, 8.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.3793233633041382, -0.36853253841400146, -0.35774171352386475, -0.346950888633728, -0.3361600637435913, -0.3253692388534546, -0.31457841396331787, -0.30378758907318115, -0.29299676418304443, -0.2822059392929077, -0.271415114402771, -0.2606242895126343, -0.24983346462249756, -0.23904263973236084, -0.22825182974338531, -0.2174610048532486, -0.20667019486427307, -0.19587936997413635, -0.18508854508399963, -0.17429772019386292, -0.1635068953037262, -0.15271607041358948, -0.14192526042461395, -0.13113443553447723, -0.12034361064434052, -0.1095527857542038, -0.09876196086406708, -0.08797114342451096, -0.07718031853437424, -0.06638949364423752, -0.055598676204681396, -0.04480785131454468, -0.03401699662208557, -0.023226173594594002, -0.012435350567102432, -0.001644529402256012, 0.009146295487880707, 0.019937120378017426, 0.030727937817573547, 0.041518762707710266, 0.052309587597846985, 0.0631004124879837, 0.07389123737812042, 0.08468205481767654, 0.09547287970781326, 0.10626370459794998, 0.1170545220375061, 0.12784534692764282, 0.13863617181777954, 0.14942699670791626, 0.16021782159805298, 0.1710086464881897, 0.18179947137832642, 0.19259029626846313, 0.20338110625743866, 0.21417193114757538, 0.2249627560377121, 0.23575358092784882, 0.24654440581798553, 0.25733521580696106, 0.2681260406970978, 0.2789168655872345, 0.2897076904773712, 0.30049851536750793, 0.31128934025764465]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 6.0, 11.0, 13.0, 17.0, 31.0, 44.0, 89.0, 148.0, 291.0, 543.0, 1118.0, 2534.0, 6316.0, 18711.0, 74946.0, 360513.0, 443783.0, 102408.0, 23876.0, 7557.0, 2940.0, 1283.0, 648.0, 298.0, 148.0, 92.0, 57.0, 36.0, 30.0, 17.0, 8.0, 7.0, 9.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.64697265625, -0.6299896240234375, -0.613006591796875, -0.5960235595703125, -0.57904052734375, -0.5620574951171875, -0.545074462890625, -0.5280914306640625, -0.5111083984375, -0.4941253662109375, -0.477142333984375, -0.4601593017578125, -0.44317626953125, -0.4261932373046875, -0.409210205078125, -0.3922271728515625, -0.375244140625, -0.3582611083984375, -0.341278076171875, -0.3242950439453125, -0.30731201171875, -0.2903289794921875, -0.273345947265625, -0.2563629150390625, -0.2393798828125, -0.2223968505859375, -0.205413818359375, -0.1884307861328125, -0.17144775390625, -0.1544647216796875, -0.137481689453125, -0.1204986572265625, -0.103515625, -0.0865325927734375, -0.069549560546875, -0.0525665283203125, -0.03558349609375, -0.0186004638671875, -0.001617431640625, 0.0153656005859375, 0.0323486328125, 0.0493316650390625, 0.066314697265625, 0.0832977294921875, 0.10028076171875, 0.1172637939453125, 0.134246826171875, 0.1512298583984375, 0.168212890625, 0.1851959228515625, 0.202178955078125, 0.2191619873046875, 0.23614501953125, 0.2531280517578125, 0.270111083984375, 0.2870941162109375, 0.3040771484375, 0.3210601806640625, 0.338043212890625, 0.3550262451171875, 0.37200927734375, 0.3889923095703125, 0.405975341796875, 0.4229583740234375, 0.43994140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 9.0, 14.0, 14.0, 24.0, 25.0, 28.0, 31.0, 36.0, 40.0, 44.0, 49.0, 38.0, 46.0, 44.0, 58.0, 45.0, 54.0, 53.0, 44.0, 50.0, 42.0, 38.0, 42.0, 14.0, 18.0, 18.0, 15.0, 9.0, 5.0, 12.0, 10.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.98828125, -0.9619369506835938, -0.9355926513671875, -0.9092483520507812, -0.882904052734375, -0.8565597534179688, -0.8302154541015625, -0.8038711547851562, -0.77752685546875, -0.7511825561523438, -0.7248382568359375, -0.6984939575195312, -0.672149658203125, -0.6458053588867188, -0.6194610595703125, -0.5931167602539062, -0.5667724609375, -0.5404281616210938, -0.5140838623046875, -0.48773956298828125, -0.461395263671875, -0.43505096435546875, -0.4087066650390625, -0.38236236572265625, -0.35601806640625, -0.32967376708984375, -0.3033294677734375, -0.27698516845703125, -0.250640869140625, -0.22429656982421875, -0.1979522705078125, -0.17160797119140625, -0.145263671875, -0.11891937255859375, -0.0925750732421875, -0.06623077392578125, -0.039886474609375, -0.01354217529296875, 0.0128021240234375, 0.03914642333984375, 0.06549072265625, 0.09183502197265625, 0.1181793212890625, 0.14452362060546875, 0.170867919921875, 0.19721221923828125, 0.2235565185546875, 0.24990081787109375, 0.2762451171875, 0.30258941650390625, 0.3289337158203125, 0.35527801513671875, 0.381622314453125, 0.40796661376953125, 0.4343109130859375, 0.46065521240234375, 0.48699951171875, 0.5133438110351562, 0.5396881103515625, 0.5660324096679688, 0.592376708984375, 0.6187210083007812, 0.6450653076171875, 0.6714096069335938, 0.69775390625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 5.0, 6.0, 8.0, 9.0, 14.0, 8.0, 13.0, 21.0, 22.0, 16.0, 20.0, 42.0, 39.0, 48.0, 72.0, 102.0, 175.0, 412.0, 2527.0, 436067.0, 604778.0, 3116.0, 393.0, 195.0, 117.0, 67.0, 42.0, 34.0, 27.0, 26.0, 26.0, 18.0, 15.0, 18.0, 15.0, 8.0, 5.0, 6.0, 7.0, 4.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8544921875, -1.7832489013671875, -1.712005615234375, -1.6407623291015625, -1.56951904296875, -1.4982757568359375, -1.427032470703125, -1.3557891845703125, -1.2845458984375, -1.2133026123046875, -1.142059326171875, -1.0708160400390625, -0.99957275390625, -0.9283294677734375, -0.857086181640625, -0.7858428955078125, -0.714599609375, -0.6433563232421875, -0.572113037109375, -0.5008697509765625, -0.42962646484375, -0.3583831787109375, -0.287139892578125, -0.2158966064453125, -0.1446533203125, -0.0734100341796875, -0.002166748046875, 0.0690765380859375, 0.14031982421875, 0.2115631103515625, 0.282806396484375, 0.3540496826171875, 0.42529296875, 0.4965362548828125, 0.567779541015625, 0.6390228271484375, 0.71026611328125, 0.7815093994140625, 0.852752685546875, 0.9239959716796875, 0.9952392578125, 1.0664825439453125, 1.137725830078125, 1.2089691162109375, 1.28021240234375, 1.3514556884765625, 1.422698974609375, 1.4939422607421875, 1.565185546875, 1.6364288330078125, 1.707672119140625, 1.7789154052734375, 1.85015869140625, 1.9214019775390625, 1.992645263671875, 2.0638885498046875, 2.1351318359375, 2.2063751220703125, 2.277618408203125, 2.3488616943359375, 2.42010498046875, 2.4913482666015625, 2.562591552734375, 2.6338348388671875, 2.705078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 2.0, 4.0, 9.0, 6.0, 10.0, 13.0, 14.0, 12.0, 21.0, 22.0, 19.0, 25.0, 36.0, 28.0, 35.0, 33.0, 34.0, 37.0, 43.0, 38.0, 36.0, 45.0, 42.0, 56.0, 49.0, 41.0, 33.0, 29.0, 29.0, 30.0, 27.0, 23.0, 22.0, 19.0, 8.0, 17.0, 11.0, 10.0, 8.0, 4.0, 5.0, 10.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6103515625, -0.5878219604492188, -0.5652923583984375, -0.5427627563476562, -0.520233154296875, -0.49770355224609375, -0.4751739501953125, -0.45264434814453125, -0.43011474609375, -0.40758514404296875, -0.3850555419921875, -0.36252593994140625, -0.339996337890625, -0.31746673583984375, -0.2949371337890625, -0.27240753173828125, -0.2498779296875, -0.22734832763671875, -0.2048187255859375, -0.18228912353515625, -0.159759521484375, -0.13722991943359375, -0.1147003173828125, -0.09217071533203125, -0.06964111328125, -0.04711151123046875, -0.0245819091796875, -0.00205230712890625, 0.020477294921875, 0.04300689697265625, 0.0655364990234375, 0.08806610107421875, 0.110595703125, 0.13312530517578125, 0.1556549072265625, 0.17818450927734375, 0.200714111328125, 0.22324371337890625, 0.2457733154296875, 0.26830291748046875, 0.29083251953125, 0.31336212158203125, 0.3358917236328125, 0.35842132568359375, 0.380950927734375, 0.40348052978515625, 0.4260101318359375, 0.44853973388671875, 0.4710693359375, 0.49359893798828125, 0.5161285400390625, 0.5386581420898438, 0.561187744140625, 0.5837173461914062, 0.6062469482421875, 0.6287765502929688, 0.65130615234375, 0.6738357543945312, 0.6963653564453125, 0.7188949584960938, 0.741424560546875, 0.7639541625976562, 0.7864837646484375, 0.8090133666992188, 0.83154296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 3.0, 4.0, 8.0, 4.0, 5.0, 6.0, 14.0, 16.0, 18.0, 20.0, 48.0, 64.0, 115.0, 185.0, 363.0, 978.0, 3424.0, 20922.0, 227741.0, 688270.0, 92504.0, 10286.0, 2137.0, 659.0, 304.0, 157.0, 98.0, 59.0, 51.0, 29.0, 23.0, 13.0, 8.0, 3.0, 0.0, 6.0, 4.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2427978515625, -0.23551177978515625, -0.2282257080078125, -0.22093963623046875, -0.213653564453125, -0.20636749267578125, -0.1990814208984375, -0.19179534912109375, -0.18450927734375, -0.17722320556640625, -0.1699371337890625, -0.16265106201171875, -0.155364990234375, -0.14807891845703125, -0.1407928466796875, -0.13350677490234375, -0.126220703125, -0.11893463134765625, -0.1116485595703125, -0.10436248779296875, -0.097076416015625, -0.08979034423828125, -0.0825042724609375, -0.07521820068359375, -0.06793212890625, -0.06064605712890625, -0.0533599853515625, -0.04607391357421875, -0.038787841796875, -0.03150177001953125, -0.0242156982421875, -0.01692962646484375, -0.0096435546875, -0.00235748291015625, 0.0049285888671875, 0.01221466064453125, 0.019500732421875, 0.02678680419921875, 0.0340728759765625, 0.04135894775390625, 0.04864501953125, 0.05593109130859375, 0.0632171630859375, 0.07050323486328125, 0.077789306640625, 0.08507537841796875, 0.0923614501953125, 0.09964752197265625, 0.10693359375, 0.11421966552734375, 0.1215057373046875, 0.12879180908203125, 0.136077880859375, 0.14336395263671875, 0.1506500244140625, 0.15793609619140625, 0.16522216796875, 0.17250823974609375, 0.1797943115234375, 0.18708038330078125, 0.194366455078125, 0.20165252685546875, 0.2089385986328125, 0.21622467041015625, 0.2235107421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 6.0, 7.0, 9.0, 6.0, 11.0, 11.0, 18.0, 23.0, 28.0, 33.0, 41.0, 66.0, 68.0, 85.0, 73.0, 87.0, 85.0, 55.0, 59.0, 50.0, 39.0, 32.0, 21.0, 18.0, 22.0, 13.0, 11.0, 8.0, 6.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.0384788513183594e-05, -1.9783154129981995e-05, -1.9181519746780396e-05, -1.8579885363578796e-05, -1.7978250980377197e-05, -1.7376616597175598e-05, -1.6774982213974e-05, -1.61733478307724e-05, -1.55717134475708e-05, -1.4970079064369202e-05, -1.4368444681167603e-05, -1.3766810297966003e-05, -1.3165175914764404e-05, -1.2563541531562805e-05, -1.1961907148361206e-05, -1.1360272765159607e-05, -1.0758638381958008e-05, -1.0157003998756409e-05, -9.55536961555481e-06, -8.95373523235321e-06, -8.352100849151611e-06, -7.750466465950012e-06, -7.148832082748413e-06, -6.547197699546814e-06, -5.945563316345215e-06, -5.343928933143616e-06, -4.742294549942017e-06, -4.1406601667404175e-06, -3.5390257835388184e-06, -2.9373914003372192e-06, -2.33575701713562e-06, -1.734122633934021e-06, -1.1324882507324219e-06, -5.308538675308228e-07, 7.078051567077637e-08, 6.724148988723755e-07, 1.2740492820739746e-06, 1.8756836652755737e-06, 2.477318048477173e-06, 3.078952431678772e-06, 3.680586814880371e-06, 4.28222119808197e-06, 4.883855581283569e-06, 5.4854899644851685e-06, 6.087124347686768e-06, 6.688758730888367e-06, 7.290393114089966e-06, 7.892027497291565e-06, 8.493661880493164e-06, 9.095296263694763e-06, 9.696930646896362e-06, 1.0298565030097961e-05, 1.090019941329956e-05, 1.150183379650116e-05, 1.2103468179702759e-05, 1.2705102562904358e-05, 1.3306736946105957e-05, 1.3908371329307556e-05, 1.4510005712509155e-05, 1.5111640095710754e-05, 1.5713274478912354e-05, 1.6314908862113953e-05, 1.6916543245315552e-05, 1.751817762851715e-05, 1.811981201171875e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 10.0, 8.0, 17.0, 17.0, 28.0, 39.0, 90.0, 121.0, 244.0, 507.0, 1457.0, 5766.0, 38865.0, 432503.0, 510913.0, 48250.0, 6854.0, 1678.0, 608.0, 244.0, 135.0, 68.0, 39.0, 34.0, 19.0, 9.0, 8.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.24290847778320312, -0.23532867431640625, -0.22774887084960938, -0.2201690673828125, -0.21258926391601562, -0.20500946044921875, -0.19742965698242188, -0.189849853515625, -0.18227005004882812, -0.17469024658203125, -0.16711044311523438, -0.1595306396484375, -0.15195083618164062, -0.14437103271484375, -0.13679122924804688, -0.12921142578125, -0.12163162231445312, -0.11405181884765625, -0.10647201538085938, -0.0988922119140625, -0.09131240844726562, -0.08373260498046875, -0.07615280151367188, -0.068572998046875, -0.060993194580078125, -0.05341339111328125, -0.045833587646484375, -0.0382537841796875, -0.030673980712890625, -0.02309417724609375, -0.015514373779296875, -0.0079345703125, -0.000354766845703125, 0.00722503662109375, 0.014804840087890625, 0.0223846435546875, 0.029964447021484375, 0.03754425048828125, 0.045124053955078125, 0.052703857421875, 0.060283660888671875, 0.06786346435546875, 0.07544326782226562, 0.0830230712890625, 0.09060287475585938, 0.09818267822265625, 0.10576248168945312, 0.11334228515625, 0.12092208862304688, 0.12850189208984375, 0.13608169555664062, 0.1436614990234375, 0.15124130249023438, 0.15882110595703125, 0.16640090942382812, 0.173980712890625, 0.18156051635742188, 0.18914031982421875, 0.19672012329101562, 0.2042999267578125, 0.21187973022460938, 0.21945953369140625, 0.22703933715820312, 0.234619140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 9.0, 9.0, 11.0, 16.0, 15.0, 31.0, 32.0, 60.0, 69.0, 96.0, 95.0, 103.0, 94.0, 90.0, 74.0, 41.0, 41.0, 23.0, 23.0, 19.0, 14.0, 7.0, 5.0, 5.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.095947265625, -0.09324359893798828, -0.09053993225097656, -0.08783626556396484, -0.08513259887695312, -0.0824289321899414, -0.07972526550292969, -0.07702159881591797, -0.07431793212890625, -0.07161426544189453, -0.06891059875488281, -0.0662069320678711, -0.06350326538085938, -0.060799598693847656, -0.05809593200683594, -0.05539226531982422, -0.0526885986328125, -0.04998493194580078, -0.04728126525878906, -0.044577598571777344, -0.041873931884765625, -0.039170265197753906, -0.03646659851074219, -0.03376293182373047, -0.03105926513671875, -0.02835559844970703, -0.025651931762695312, -0.022948265075683594, -0.020244598388671875, -0.017540931701660156, -0.014837265014648438, -0.012133598327636719, -0.009429931640625, -0.006726264953613281, -0.0040225982666015625, -0.0013189315795898438, 0.001384735107421875, 0.004088401794433594, 0.0067920684814453125, 0.009495735168457031, 0.01219940185546875, 0.014903068542480469, 0.017606735229492188, 0.020310401916503906, 0.023014068603515625, 0.025717735290527344, 0.028421401977539062, 0.03112506866455078, 0.0338287353515625, 0.03653240203857422, 0.03923606872558594, 0.041939735412597656, 0.044643402099609375, 0.047347068786621094, 0.05005073547363281, 0.05275440216064453, 0.05545806884765625, 0.05816173553466797, 0.06086540222167969, 0.0635690689086914, 0.06627273559570312, 0.06897640228271484, 0.07168006896972656, 0.07438373565673828, 0.07708740234375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 9.0, 9.0, 12.0, 21.0, 39.0, 59.0, 97.0, 124.0, 155.0, 136.0, 119.0, 86.0, 56.0, 33.0, 20.0, 10.0, 6.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.120443820953369, -2.0594565868377686, -1.998469352722168, -1.9374819993972778, -1.8764947652816772, -1.8155075311660767, -1.7545201778411865, -1.693532943725586, -1.6325457096099854, -1.5715584754943848, -1.5105712413787842, -1.449583888053894, -1.3885966539382935, -1.3276094198226929, -1.2666220664978027, -1.2056348323822021, -1.1446475982666016, -1.083660364151001, -1.0226731300354004, -0.9616857767105103, -0.9006985425949097, -0.8397113084793091, -0.7787240147590637, -0.7177367210388184, -0.6567494869232178, -0.5957622528076172, -0.5347749590873718, -0.47378769516944885, -0.4128004312515259, -0.3518131673336029, -0.29082590341567993, -0.22983863949775696, -0.16885149478912354, -0.10786423087120056, -0.04687696695327759, 0.014110296964645386, 0.07509756088256836, 0.13608482480049133, 0.1970720887184143, 0.2580593526363373, 0.31904661655426025, 0.3800338804721832, 0.4410211443901062, 0.5020084381103516, 0.5629956722259521, 0.6239829063415527, 0.6849702000617981, 0.7459574937820435, 0.806944727897644, 0.8679319620132446, 0.92891925573349, 0.9899065494537354, 1.050893783569336, 1.1118810176849365, 1.172868251800537, 1.2338556051254272, 1.2948428392410278, 1.3558300733566284, 1.4168174266815186, 1.4778046607971191, 1.5387918949127197, 1.5997791290283203, 1.660766363143921, 1.721753716468811, 1.7827409505844116]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 7.0, 4.0, 8.0, 7.0, 11.0, 10.0, 14.0, 15.0, 19.0, 18.0, 20.0, 24.0, 26.0, 33.0, 29.0, 22.0, 43.0, 41.0, 34.0, 38.0, 34.0, 43.0, 40.0, 45.0, 38.0, 33.0, 34.0, 38.0, 34.0, 33.0, 23.0, 30.0, 22.0, 21.0, 19.0, 16.0, 16.0, 8.0, 10.0, 8.0, 5.0, 8.0, 7.0, 9.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.0975044965744019, -1.0619765520095825, -1.0264486074447632, -0.9909206628799438, -0.9553927183151245, -0.9198647737503052, -0.8843368291854858, -0.8488088846206665, -0.8132809400558472, -0.7777529954910278, -0.7422250509262085, -0.7066971063613892, -0.6711691617965698, -0.6356412172317505, -0.6001132726669312, -0.5645853281021118, -0.5290573835372925, -0.49352943897247314, -0.4580014944076538, -0.4224735498428345, -0.38694560527801514, -0.3514176607131958, -0.31588971614837646, -0.28036177158355713, -0.2448338270187378, -0.20930588245391846, -0.17377793788909912, -0.13824999332427979, -0.10272204875946045, -0.06719410419464111, -0.03166615962982178, 0.0038617849349975586, 0.039389848709106445, 0.07491779327392578, 0.11044573783874512, 0.14597368240356445, 0.1815016269683838, 0.21702957153320312, 0.25255751609802246, 0.2880854606628418, 0.32361340522766113, 0.35914134979248047, 0.3946692943572998, 0.43019723892211914, 0.4657251834869385, 0.5012531280517578, 0.5367810726165771, 0.5723090171813965, 0.6078369617462158, 0.6433649063110352, 0.6788928508758545, 0.7144207954406738, 0.7499487400054932, 0.7854766845703125, 0.8210046291351318, 0.8565325736999512, 0.8920605182647705, 0.9275884628295898, 0.9631164073944092, 0.9986443519592285, 1.0341722965240479, 1.0697002410888672, 1.1052281856536865, 1.1407561302185059, 1.1762840747833252]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 13.0, 9.0, 11.0, 10.0, 21.0, 20.0, 36.0, 38.0, 47.0, 82.0, 111.0, 169.0, 333.0, 658.0, 1611.0, 4309.0, 15341.0, 79019.0, 492022.0, 1958639.0, 1346955.0, 240984.0, 39026.0, 9359.0, 3025.0, 1161.0, 523.0, 281.0, 144.0, 93.0, 59.0, 38.0, 29.0, 17.0, 15.0, 12.0, 17.0, 9.0, 10.0, 7.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80517578125, -0.7798614501953125, -0.754547119140625, -0.7292327880859375, -0.70391845703125, -0.6786041259765625, -0.653289794921875, -0.6279754638671875, -0.6026611328125, -0.5773468017578125, -0.552032470703125, -0.5267181396484375, -0.50140380859375, -0.4760894775390625, -0.450775146484375, -0.4254608154296875, -0.400146484375, -0.3748321533203125, -0.349517822265625, -0.3242034912109375, -0.29888916015625, -0.2735748291015625, -0.248260498046875, -0.2229461669921875, -0.1976318359375, -0.1723175048828125, -0.147003173828125, -0.1216888427734375, -0.09637451171875, -0.0710601806640625, -0.045745849609375, -0.0204315185546875, 0.0048828125, 0.0301971435546875, 0.055511474609375, 0.0808258056640625, 0.10614013671875, 0.1314544677734375, 0.156768798828125, 0.1820831298828125, 0.2073974609375, 0.2327117919921875, 0.258026123046875, 0.2833404541015625, 0.30865478515625, 0.3339691162109375, 0.359283447265625, 0.3845977783203125, 0.409912109375, 0.4352264404296875, 0.460540771484375, 0.4858551025390625, 0.51116943359375, 0.5364837646484375, 0.561798095703125, 0.5871124267578125, 0.6124267578125, 0.6377410888671875, 0.663055419921875, 0.6883697509765625, 0.71368408203125, 0.7389984130859375, 0.764312744140625, 0.7896270751953125, 0.81494140625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 7.0, 5.0, 16.0, 11.0, 15.0, 15.0, 20.0, 19.0, 35.0, 31.0, 40.0, 46.0, 36.0, 44.0, 54.0, 36.0, 35.0, 40.0, 52.0, 42.0, 53.0, 46.0, 39.0, 29.0, 37.0, 21.0, 28.0, 20.0, 23.0, 14.0, 12.0, 10.0, 12.0, 9.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 6.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.60986328125, -0.5925750732421875, -0.575286865234375, -0.5579986572265625, -0.54071044921875, -0.5234222412109375, -0.506134033203125, -0.4888458251953125, -0.4715576171875, -0.4542694091796875, -0.436981201171875, -0.4196929931640625, -0.40240478515625, -0.3851165771484375, -0.367828369140625, -0.3505401611328125, -0.333251953125, -0.3159637451171875, -0.298675537109375, -0.2813873291015625, -0.26409912109375, -0.2468109130859375, -0.229522705078125, -0.2122344970703125, -0.1949462890625, -0.1776580810546875, -0.160369873046875, -0.1430816650390625, -0.12579345703125, -0.1085052490234375, -0.091217041015625, -0.0739288330078125, -0.056640625, -0.0393524169921875, -0.022064208984375, -0.0047760009765625, 0.01251220703125, 0.0298004150390625, 0.047088623046875, 0.0643768310546875, 0.0816650390625, 0.0989532470703125, 0.116241455078125, 0.1335296630859375, 0.15081787109375, 0.1681060791015625, 0.185394287109375, 0.2026824951171875, 0.219970703125, 0.2372589111328125, 0.254547119140625, 0.2718353271484375, 0.28912353515625, 0.3064117431640625, 0.323699951171875, 0.3409881591796875, 0.3582763671875, 0.3755645751953125, 0.392852783203125, 0.4101409912109375, 0.42742919921875, 0.4447174072265625, 0.462005615234375, 0.4792938232421875, 0.49658203125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 13.0, 6.0, 8.0, 16.0, 14.0, 23.0, 24.0, 35.0, 61.0, 89.0, 139.0, 296.0, 802.0, 5189.0, 243191.0, 3897024.0, 43932.0, 2277.0, 510.0, 219.0, 114.0, 77.0, 66.0, 38.0, 28.0, 21.0, 7.0, 14.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8583984375, -1.7950286865234375, -1.731658935546875, -1.6682891845703125, -1.60491943359375, -1.5415496826171875, -1.478179931640625, -1.4148101806640625, -1.3514404296875, -1.2880706787109375, -1.224700927734375, -1.1613311767578125, -1.09796142578125, -1.0345916748046875, -0.971221923828125, -0.9078521728515625, -0.844482421875, -0.7811126708984375, -0.717742919921875, -0.6543731689453125, -0.59100341796875, -0.5276336669921875, -0.464263916015625, -0.4008941650390625, -0.3375244140625, -0.2741546630859375, -0.210784912109375, -0.1474151611328125, -0.08404541015625, -0.0206756591796875, 0.042694091796875, 0.1060638427734375, 0.16943359375, 0.2328033447265625, 0.296173095703125, 0.3595428466796875, 0.42291259765625, 0.4862823486328125, 0.549652099609375, 0.6130218505859375, 0.6763916015625, 0.7397613525390625, 0.803131103515625, 0.8665008544921875, 0.92987060546875, 0.9932403564453125, 1.056610107421875, 1.1199798583984375, 1.183349609375, 1.2467193603515625, 1.310089111328125, 1.3734588623046875, 1.43682861328125, 1.5001983642578125, 1.563568115234375, 1.6269378662109375, 1.6903076171875, 1.7536773681640625, 1.817047119140625, 1.8804168701171875, 1.94378662109375, 2.0071563720703125, 2.070526123046875, 2.1338958740234375, 2.197265625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 13.0, 17.0, 19.0, 23.0, 35.0, 45.0, 45.0, 73.0, 122.0, 154.0, 226.0, 297.0, 428.0, 535.0, 510.0, 404.0, 321.0, 234.0, 165.0, 112.0, 91.0, 56.0, 35.0, 23.0, 26.0, 17.0, 7.0, 9.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1866455078125, -0.17945289611816406, -0.17226028442382812, -0.1650676727294922, -0.15787506103515625, -0.1506824493408203, -0.14348983764648438, -0.13629722595214844, -0.1291046142578125, -0.12191200256347656, -0.11471939086914062, -0.10752677917480469, -0.10033416748046875, -0.09314155578613281, -0.08594894409179688, -0.07875633239746094, -0.071563720703125, -0.06437110900878906, -0.057178497314453125, -0.04998588562011719, -0.04279327392578125, -0.03560066223144531, -0.028408050537109375, -0.021215438842773438, -0.0140228271484375, -0.0068302154541015625, 0.000362396240234375, 0.0075550079345703125, 0.01474761962890625, 0.021940231323242188, 0.029132843017578125, 0.03632545471191406, 0.04351806640625, 0.05071067810058594, 0.057903289794921875, 0.06509590148925781, 0.07228851318359375, 0.07948112487792969, 0.08667373657226562, 0.09386634826660156, 0.1010589599609375, 0.10825157165527344, 0.11544418334960938, 0.12263679504394531, 0.12982940673828125, 0.1370220184326172, 0.14421463012695312, 0.15140724182128906, 0.158599853515625, 0.16579246520996094, 0.17298507690429688, 0.1801776885986328, 0.18737030029296875, 0.1945629119873047, 0.20175552368164062, 0.20894813537597656, 0.2161407470703125, 0.22333335876464844, 0.23052597045898438, 0.2377185821533203, 0.24491119384765625, 0.2521038055419922, 0.2592964172363281, 0.26648902893066406, 0.273681640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 3.0, 7.0, 11.0, 8.0, 24.0, 34.0, 38.0, 67.0, 93.0, 98.0, 125.0, 134.0, 95.0, 70.0, 53.0, 45.0, 39.0, 15.0, 17.0, 6.0, 4.0, 6.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9110559225082397, -0.8727821111679077, -0.8345083594322205, -0.7962346076965332, -0.7579607963562012, -0.7196869850158691, -0.6814132332801819, -0.6431394815444946, -0.6048656702041626, -0.5665918588638306, -0.5283181071281433, -0.49004432559013367, -0.451770544052124, -0.4134967625141144, -0.37522298097610474, -0.3369491994380951, -0.29867541790008545, -0.2604016363620758, -0.22212785482406616, -0.18385407328605652, -0.14558029174804688, -0.10730651021003723, -0.06903272867202759, -0.030758947134017944, 0.007514834403991699, 0.04578861594200134, 0.08406239748001099, 0.12233617901802063, 0.16060996055603027, 0.19888374209403992, 0.23715752363204956, 0.2754313051700592, 0.3137049674987793, 0.35197874903678894, 0.3902525305747986, 0.4285263121128082, 0.46680009365081787, 0.5050739049911499, 0.5433476567268372, 0.5816214084625244, 0.6198952198028564, 0.6581690311431885, 0.6964427828788757, 0.734716534614563, 0.772990345954895, 0.811264157295227, 0.8495379090309143, 0.8878116607666016, 0.9260854721069336, 0.9643592834472656, 1.0026330947875977, 1.0409067869186401, 1.0791805982589722, 1.1174544095993042, 1.1557281017303467, 1.1940019130706787, 1.2322757244110107, 1.2705495357513428, 1.3088233470916748, 1.3470970392227173, 1.3853708505630493, 1.4236446619033813, 1.4619183540344238, 1.5001921653747559, 1.538465976715088]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 3.0, 4.0, 3.0, 4.0, 7.0, 5.0, 6.0, 8.0, 17.0, 21.0, 24.0, 16.0, 14.0, 21.0, 31.0, 25.0, 22.0, 31.0, 28.0, 36.0, 35.0, 41.0, 39.0, 32.0, 40.0, 30.0, 48.0, 30.0, 32.0, 31.0, 23.0, 21.0, 26.0, 37.0, 28.0, 27.0, 21.0, 14.0, 20.0, 9.0, 17.0, 8.0, 8.0, 10.0, 4.0, 6.0, 5.0, 7.0, 5.0, 3.0, 7.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.45690181851387024, -0.4425037205219269, -0.4281056523323059, -0.41370755434036255, -0.3993094861507416, -0.3849113881587982, -0.37051331996917725, -0.3561152219772339, -0.3417171239852905, -0.32731902599334717, -0.3129209578037262, -0.29852285981178284, -0.28412479162216187, -0.2697266936302185, -0.25532859563827515, -0.24093052744865417, -0.226532444357872, -0.21213436126708984, -0.19773627817630768, -0.1833381950855255, -0.16894009709358215, -0.1545420140028, -0.14014393091201782, -0.12574583292007446, -0.1113477572798729, -0.09694967418909073, -0.08255158364772797, -0.0681535005569458, -0.05375541374087334, -0.03935732692480087, -0.024959243834018707, -0.010561153292655945, 0.0038369297981262207, 0.018235016614198685, 0.03263310343027115, 0.047031186521053314, 0.06142927333712578, 0.07582736015319824, 0.09022544324398041, 0.10462353378534317, 0.11902161687612534, 0.1334197074174881, 0.14781779050827026, 0.16221587359905243, 0.1766139566898346, 0.19101205468177795, 0.20541012287139893, 0.21980822086334229, 0.23420630395412445, 0.24860438704490662, 0.26300248503685, 0.27740055322647095, 0.2917986512184143, 0.30619674921035767, 0.32059481739997864, 0.334992915391922, 0.34939098358154297, 0.36378908157348633, 0.3781871497631073, 0.39258524775505066, 0.40698331594467163, 0.421381413936615, 0.43577951192855835, 0.4501775801181793, 0.4645756781101227]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 6.0, 11.0, 19.0, 20.0, 40.0, 85.0, 189.0, 426.0, 1794.0, 11772.0, 134190.0, 736437.0, 147911.0, 12897.0, 1887.0, 473.0, 184.0, 93.0, 49.0, 29.0, 19.0, 6.0, 7.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35302734375, -0.3424949645996094, -0.33196258544921875, -0.3214302062988281, -0.3108978271484375, -0.3003654479980469, -0.28983306884765625, -0.2793006896972656, -0.268768310546875, -0.2582359313964844, -0.24770355224609375, -0.23717117309570312, -0.2266387939453125, -0.21610641479492188, -0.20557403564453125, -0.19504165649414062, -0.18450927734375, -0.17397689819335938, -0.16344451904296875, -0.15291213989257812, -0.1423797607421875, -0.13184738159179688, -0.12131500244140625, -0.11078262329101562, -0.100250244140625, -0.08971786499023438, -0.07918548583984375, -0.06865310668945312, -0.0581207275390625, -0.047588348388671875, -0.03705596923828125, -0.026523590087890625, -0.0159912109375, -0.005458831787109375, 0.00507354736328125, 0.015605926513671875, 0.0261383056640625, 0.036670684814453125, 0.04720306396484375, 0.057735443115234375, 0.068267822265625, 0.07880020141601562, 0.08933258056640625, 0.09986495971679688, 0.1103973388671875, 0.12092971801757812, 0.13146209716796875, 0.14199447631835938, 0.15252685546875, 0.16305923461914062, 0.17359161376953125, 0.18412399291992188, 0.1946563720703125, 0.20518875122070312, 0.21572113037109375, 0.22625350952148438, 0.236785888671875, 0.24731826782226562, 0.25785064697265625, 0.2683830261230469, 0.2789154052734375, 0.2894477844238281, 0.29998016357421875, 0.3105125427246094, 0.321044921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 4.0, 3.0, 7.0, 10.0, 9.0, 11.0, 23.0, 17.0, 22.0, 28.0, 33.0, 39.0, 45.0, 47.0, 54.0, 58.0, 45.0, 59.0, 58.0, 45.0, 47.0, 42.0, 44.0, 41.0, 40.0, 29.0, 31.0, 23.0, 19.0, 15.0, 10.0, 7.0, 11.0, 5.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.4765625, -0.4632568359375, -0.449951171875, -0.4366455078125, -0.42333984375, -0.4100341796875, -0.396728515625, -0.3834228515625, -0.3701171875, -0.3568115234375, -0.343505859375, -0.3302001953125, -0.31689453125, -0.3035888671875, -0.290283203125, -0.2769775390625, -0.263671875, -0.2503662109375, -0.237060546875, -0.2237548828125, -0.21044921875, -0.1971435546875, -0.183837890625, -0.1705322265625, -0.1572265625, -0.1439208984375, -0.130615234375, -0.1173095703125, -0.10400390625, -0.0906982421875, -0.077392578125, -0.0640869140625, -0.05078125, -0.0374755859375, -0.024169921875, -0.0108642578125, 0.00244140625, 0.0157470703125, 0.029052734375, 0.0423583984375, 0.0556640625, 0.0689697265625, 0.082275390625, 0.0955810546875, 0.10888671875, 0.1221923828125, 0.135498046875, 0.1488037109375, 0.162109375, 0.1754150390625, 0.188720703125, 0.2020263671875, 0.21533203125, 0.2286376953125, 0.241943359375, 0.2552490234375, 0.2685546875, 0.2818603515625, 0.295166015625, 0.3084716796875, 0.32177734375, 0.3350830078125, 0.348388671875, 0.3616943359375, 0.375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 13.0, 9.0, 6.0, 8.0, 22.0, 24.0, 32.0, 56.0, 73.0, 110.0, 182.0, 242.0, 428.0, 694.0, 1366.0, 2864.0, 6578.0, 16814.0, 46302.0, 127870.0, 287929.0, 313299.0, 153183.0, 55964.0, 20068.0, 7533.0, 3237.0, 1529.0, 839.0, 440.0, 280.0, 169.0, 104.0, 77.0, 57.0, 45.0, 23.0, 25.0, 15.0, 10.0, 5.0, 8.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11260986328125, -0.10860157012939453, -0.10459327697753906, -0.1005849838256836, -0.09657669067382812, -0.09256839752197266, -0.08856010437011719, -0.08455181121826172, -0.08054351806640625, -0.07653522491455078, -0.07252693176269531, -0.06851863861083984, -0.06451034545898438, -0.060502052307128906, -0.05649375915527344, -0.05248546600341797, -0.0484771728515625, -0.04446887969970703, -0.04046058654785156, -0.036452293395996094, -0.032444000244140625, -0.028435707092285156, -0.024427413940429688, -0.02041912078857422, -0.01641082763671875, -0.012402534484863281, -0.008394241333007812, -0.004385948181152344, -0.000377655029296875, 0.0036306381225585938, 0.0076389312744140625, 0.011647224426269531, 0.015655517578125, 0.01966381072998047, 0.023672103881835938, 0.027680397033691406, 0.031688690185546875, 0.035696983337402344, 0.03970527648925781, 0.04371356964111328, 0.04772186279296875, 0.05173015594482422, 0.05573844909667969, 0.059746742248535156, 0.06375503540039062, 0.0677633285522461, 0.07177162170410156, 0.07577991485595703, 0.0797882080078125, 0.08379650115966797, 0.08780479431152344, 0.0918130874633789, 0.09582138061523438, 0.09982967376708984, 0.10383796691894531, 0.10784626007080078, 0.11185455322265625, 0.11586284637451172, 0.11987113952636719, 0.12387943267822266, 0.12788772583007812, 0.1318960189819336, 0.13590431213378906, 0.13991260528564453, 0.1439208984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 1.0, 4.0, 5.0, 5.0, 11.0, 11.0, 12.0, 20.0, 9.0, 23.0, 17.0, 22.0, 22.0, 30.0, 31.0, 23.0, 38.0, 45.0, 51.0, 28.0, 47.0, 46.0, 50.0, 43.0, 42.0, 59.0, 41.0, 33.0, 36.0, 22.0, 28.0, 32.0, 25.0, 16.0, 15.0, 16.0, 8.0, 12.0, 6.0, 9.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.619781494140625, -0.59747314453125, -0.575164794921875, -0.5528564453125, -0.530548095703125, -0.50823974609375, -0.485931396484375, -0.463623046875, -0.441314697265625, -0.41900634765625, -0.396697998046875, -0.3743896484375, -0.352081298828125, -0.32977294921875, -0.307464599609375, -0.28515625, -0.262847900390625, -0.24053955078125, -0.218231201171875, -0.1959228515625, -0.173614501953125, -0.15130615234375, -0.128997802734375, -0.106689453125, -0.084381103515625, -0.06207275390625, -0.039764404296875, -0.0174560546875, 0.004852294921875, 0.02716064453125, 0.049468994140625, 0.07177734375, 0.094085693359375, 0.11639404296875, 0.138702392578125, 0.1610107421875, 0.183319091796875, 0.20562744140625, 0.227935791015625, 0.250244140625, 0.272552490234375, 0.29486083984375, 0.317169189453125, 0.3394775390625, 0.361785888671875, 0.38409423828125, 0.406402587890625, 0.4287109375, 0.451019287109375, 0.47332763671875, 0.495635986328125, 0.5179443359375, 0.540252685546875, 0.56256103515625, 0.584869384765625, 0.607177734375, 0.629486083984375, 0.65179443359375, 0.674102783203125, 0.6964111328125, 0.718719482421875, 0.74102783203125, 0.763336181640625, 0.78564453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 10.0, 19.0, 35.0, 47.0, 85.0, 142.0, 233.0, 403.0, 846.0, 1865.0, 4684.0, 14723.0, 58215.0, 274625.0, 496409.0, 149104.0, 32217.0, 9032.0, 3133.0, 1304.0, 646.0, 318.0, 164.0, 113.0, 66.0, 39.0, 16.0, 10.0, 6.0, 5.0, 9.0, 5.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0615234375, -0.059493064880371094, -0.05746269226074219, -0.05543231964111328, -0.053401947021484375, -0.05137157440185547, -0.04934120178222656, -0.047310829162597656, -0.04528045654296875, -0.043250083923339844, -0.04121971130371094, -0.03918933868408203, -0.037158966064453125, -0.03512859344482422, -0.03309822082519531, -0.031067848205566406, -0.0290374755859375, -0.027007102966308594, -0.024976730346679688, -0.02294635772705078, -0.020915985107421875, -0.01888561248779297, -0.016855239868164062, -0.014824867248535156, -0.01279449462890625, -0.010764122009277344, -0.008733749389648438, -0.006703376770019531, -0.004673004150390625, -0.0026426315307617188, -0.0006122589111328125, 0.0014181137084960938, 0.003448486328125, 0.005478858947753906, 0.0075092315673828125, 0.009539604187011719, 0.011569976806640625, 0.013600349426269531, 0.015630722045898438, 0.017661094665527344, 0.01969146728515625, 0.021721839904785156, 0.023752212524414062, 0.02578258514404297, 0.027812957763671875, 0.02984333038330078, 0.03187370300292969, 0.033904075622558594, 0.0359344482421875, 0.037964820861816406, 0.03999519348144531, 0.04202556610107422, 0.044055938720703125, 0.04608631134033203, 0.04811668395996094, 0.050147056579589844, 0.05217742919921875, 0.054207801818847656, 0.05623817443847656, 0.05826854705810547, 0.060298919677734375, 0.06232929229736328, 0.06435966491699219, 0.0663900375366211, 0.06842041015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 3.0, 8.0, 3.0, 15.0, 10.0, 19.0, 39.0, 34.0, 37.0, 51.0, 47.0, 82.0, 82.0, 71.0, 89.0, 85.0, 89.0, 53.0, 41.0, 33.0, 23.0, 20.0, 16.0, 10.0, 10.0, 6.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.913309097290039e-05, -1.8431805074214935e-05, -1.773051917552948e-05, -1.7029233276844025e-05, -1.632794737815857e-05, -1.5626661479473114e-05, -1.4925375580787659e-05, -1.4224089682102203e-05, -1.3522803783416748e-05, -1.2821517884731293e-05, -1.2120231986045837e-05, -1.1418946087360382e-05, -1.0717660188674927e-05, -1.0016374289989471e-05, -9.315088391304016e-06, -8.61380249261856e-06, -7.912516593933105e-06, -7.21123069524765e-06, -6.509944796562195e-06, -5.8086588978767395e-06, -5.107372999191284e-06, -4.406087100505829e-06, -3.7048012018203735e-06, -3.0035153031349182e-06, -2.302229404449463e-06, -1.6009435057640076e-06, -8.996576070785522e-07, -1.9837170839309692e-07, 5.029141902923584e-07, 1.2042000889778137e-06, 1.905485987663269e-06, 2.6067718863487244e-06, 3.3080577850341797e-06, 4.009343683719635e-06, 4.71062958240509e-06, 5.411915481090546e-06, 6.113201379776001e-06, 6.814487278461456e-06, 7.515773177146912e-06, 8.217059075832367e-06, 8.918344974517822e-06, 9.619630873203278e-06, 1.0320916771888733e-05, 1.1022202670574188e-05, 1.1723488569259644e-05, 1.2424774467945099e-05, 1.3126060366630554e-05, 1.382734626531601e-05, 1.4528632164001465e-05, 1.522991806268692e-05, 1.5931203961372375e-05, 1.663248986005783e-05, 1.7333775758743286e-05, 1.803506165742874e-05, 1.8736347556114197e-05, 1.9437633454799652e-05, 2.0138919353485107e-05, 2.0840205252170563e-05, 2.1541491150856018e-05, 2.2242777049541473e-05, 2.294406294822693e-05, 2.3645348846912384e-05, 2.434663474559784e-05, 2.5047920644283295e-05, 2.574920654296875e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 8.0, 7.0, 7.0, 11.0, 7.0, 16.0, 25.0, 30.0, 45.0, 59.0, 81.0, 123.0, 203.0, 423.0, 894.0, 2348.0, 6912.0, 23209.0, 88493.0, 323779.0, 415026.0, 136397.0, 34999.0, 9858.0, 3155.0, 1190.0, 502.0, 263.0, 148.0, 85.0, 64.0, 45.0, 25.0, 22.0, 22.0, 16.0, 7.0, 7.0, 13.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.060089111328125, -0.05827665328979492, -0.056464195251464844, -0.054651737213134766, -0.05283927917480469, -0.05102682113647461, -0.04921436309814453, -0.04740190505981445, -0.045589447021484375, -0.0437769889831543, -0.04196453094482422, -0.04015207290649414, -0.03833961486816406, -0.036527156829833984, -0.034714698791503906, -0.03290224075317383, -0.03108978271484375, -0.029277324676513672, -0.027464866638183594, -0.025652408599853516, -0.023839950561523438, -0.02202749252319336, -0.02021503448486328, -0.018402576446533203, -0.016590118408203125, -0.014777660369873047, -0.012965202331542969, -0.01115274429321289, -0.009340286254882812, -0.007527828216552734, -0.005715370178222656, -0.003902912139892578, -0.0020904541015625, -0.0002779960632324219, 0.0015344619750976562, 0.0033469200134277344, 0.0051593780517578125, 0.006971836090087891, 0.008784294128417969, 0.010596752166748047, 0.012409210205078125, 0.014221668243408203, 0.01603412628173828, 0.01784658432006836, 0.019659042358398438, 0.021471500396728516, 0.023283958435058594, 0.025096416473388672, 0.02690887451171875, 0.028721332550048828, 0.030533790588378906, 0.032346248626708984, 0.03415870666503906, 0.03597116470336914, 0.03778362274169922, 0.0395960807800293, 0.041408538818359375, 0.04322099685668945, 0.04503345489501953, 0.04684591293334961, 0.04865837097167969, 0.050470829010009766, 0.052283287048339844, 0.05409574508666992, 0.055908203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 6.0, 8.0, 17.0, 22.0, 14.0, 17.0, 20.0, 19.0, 35.0, 36.0, 43.0, 58.0, 79.0, 64.0, 65.0, 76.0, 63.0, 56.0, 50.0, 31.0, 40.0, 25.0, 28.0, 20.0, 27.0, 11.0, 13.0, 11.0, 6.0, 4.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014404296875, -0.013987421989440918, -0.013570547103881836, -0.013153672218322754, -0.012736797332763672, -0.01231992244720459, -0.011903047561645508, -0.011486172676086426, -0.011069297790527344, -0.010652422904968262, -0.01023554801940918, -0.009818673133850098, -0.009401798248291016, -0.008984923362731934, -0.008568048477172852, -0.00815117359161377, -0.0077342987060546875, -0.0073174238204956055, -0.0069005489349365234, -0.006483674049377441, -0.006066799163818359, -0.005649924278259277, -0.005233049392700195, -0.004816174507141113, -0.004399299621582031, -0.003982424736022949, -0.003565549850463867, -0.003148674964904785, -0.002731800079345703, -0.002314925193786621, -0.001898050308227539, -0.001481175422668457, -0.001064300537109375, -0.000647425651550293, -0.00023055076599121094, 0.0001863241195678711, 0.0006031990051269531, 0.0010200738906860352, 0.0014369487762451172, 0.0018538236618041992, 0.0022706985473632812, 0.0026875734329223633, 0.0031044483184814453, 0.0035213232040405273, 0.003938198089599609, 0.004355072975158691, 0.0047719478607177734, 0.0051888227462768555, 0.0056056976318359375, 0.0060225725173950195, 0.0064394474029541016, 0.006856322288513184, 0.007273197174072266, 0.007690072059631348, 0.00810694694519043, 0.008523821830749512, 0.008940696716308594, 0.009357571601867676, 0.009774446487426758, 0.01019132137298584, 0.010608196258544922, 0.011025071144104004, 0.011441946029663086, 0.011858820915222168, 0.01227569580078125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 10.0, 10.0, 17.0, 42.0, 70.0, 118.0, 171.0, 201.0, 141.0, 85.0, 59.0, 30.0, 16.0, 13.0, 9.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.970798134803772, -0.9376470446586609, -0.904495894908905, -0.871344804763794, -0.8381936550140381, -0.805042564868927, -0.7718914747238159, -0.7387403249740601, -0.705589234828949, -0.6724381446838379, -0.639286994934082, -0.606135904788971, -0.5729848146438599, -0.539833664894104, -0.5066825747489929, -0.47353145480155945, -0.440380334854126, -0.4072292149066925, -0.37407809495925903, -0.34092700481414795, -0.3077758848667145, -0.274624764919281, -0.24147365987300873, -0.20832255482673645, -0.17517143487930298, -0.1420203149318695, -0.10886920988559723, -0.07571809738874435, -0.04256698489189148, -0.009415864944458008, 0.02373524010181427, 0.05688634514808655, 0.09003746509552002, 0.1231885775923729, 0.15633969008922577, 0.18949079513549805, 0.22264191508293152, 0.255793035030365, 0.2889441251754761, 0.32209524512290955, 0.355246365070343, 0.3883974850177765, 0.42154860496520996, 0.45469969511032104, 0.4878508150577545, 0.521001935005188, 0.5541530251502991, 0.5873041152954102, 0.620455265045166, 0.6536063551902771, 0.686757504940033, 0.719908595085144, 0.7530597448348999, 0.786210834980011, 0.8193619251251221, 0.8525130748748779, 0.885664165019989, 0.9188152551651001, 0.951966404914856, 0.985117495059967, 1.0182685852050781, 1.051419734954834, 1.0845708847045898, 1.1177219152450562, 1.150873064994812]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 10.0, 7.0, 8.0, 5.0, 17.0, 18.0, 27.0, 30.0, 25.0, 35.0, 41.0, 42.0, 42.0, 60.0, 56.0, 60.0, 46.0, 50.0, 61.0, 50.0, 33.0, 41.0, 40.0, 46.0, 24.0, 27.0, 19.0, 14.0, 11.0, 10.0, 5.0, 10.0, 8.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.4869082570075989, -0.4742285907268524, -0.46154892444610596, -0.4488692283630371, -0.43618956208229065, -0.4235098958015442, -0.41083022952079773, -0.39815056324005127, -0.3854708671569824, -0.37279120087623596, -0.3601115345954895, -0.34743183851242065, -0.3347521722316742, -0.32207250595092773, -0.3093928396701813, -0.2967131733894348, -0.28403347730636597, -0.2713538110256195, -0.25867414474487305, -0.2459944635629654, -0.23331478238105774, -0.22063511610031128, -0.20795544981956482, -0.19527576863765717, -0.1825961172580719, -0.16991645097732544, -0.15723676979541779, -0.14455710351467133, -0.13187742233276367, -0.11919775605201721, -0.10651808232069016, -0.0938384085893631, -0.08115872740745544, -0.06847905367612839, -0.05579937994480133, -0.04311970993876457, -0.030440036207437515, -0.017760366201400757, -0.0050806924700737, 0.007598981261253357, 0.020278654992580414, 0.03295832872390747, 0.04563800245523453, 0.058317672461271286, 0.07099734246730804, 0.0836770161986351, 0.09635668992996216, 0.10903636366128922, 0.12171603739261627, 0.13439570367336273, 0.14707538485527039, 0.15975505113601685, 0.1724347323179245, 0.18511439859867096, 0.1977940797805786, 0.21047374606132507, 0.22315341234207153, 0.235833078622818, 0.24851275980472565, 0.2611924409866333, 0.27387210726737976, 0.2865517735481262, 0.2992314398288727, 0.31191110610961914, 0.324590802192688]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 6.0, 16.0, 19.0, 35.0, 39.0, 86.0, 370.0, 3843.0, 470761.0, 568387.0, 4371.0, 383.0, 98.0, 49.0, 22.0, 18.0, 13.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.12890625, -2.0644378662109375, -1.999969482421875, -1.9355010986328125, -1.87103271484375, -1.8065643310546875, -1.742095947265625, -1.6776275634765625, -1.6131591796875, -1.5486907958984375, -1.484222412109375, -1.4197540283203125, -1.35528564453125, -1.2908172607421875, -1.226348876953125, -1.1618804931640625, -1.097412109375, -1.0329437255859375, -0.968475341796875, -0.9040069580078125, -0.83953857421875, -0.7750701904296875, -0.710601806640625, -0.6461334228515625, -0.5816650390625, -0.5171966552734375, -0.452728271484375, -0.3882598876953125, -0.32379150390625, -0.2593231201171875, -0.194854736328125, -0.1303863525390625, -0.06591796875, -0.0014495849609375, 0.063018798828125, 0.1274871826171875, 0.19195556640625, 0.2564239501953125, 0.320892333984375, 0.3853607177734375, 0.4498291015625, 0.5142974853515625, 0.578765869140625, 0.6432342529296875, 0.70770263671875, 0.7721710205078125, 0.836639404296875, 0.9011077880859375, 0.965576171875, 1.0300445556640625, 1.094512939453125, 1.1589813232421875, 1.22344970703125, 1.2879180908203125, 1.352386474609375, 1.4168548583984375, 1.4813232421875, 1.5457916259765625, 1.610260009765625, 1.6747283935546875, 1.73919677734375, 1.8036651611328125, 1.868133544921875, 1.9326019287109375, 1.9970703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 16.0, 25.0, 30.0, 43.0, 76.0, 102.0, 124.0, 133.0, 115.0, 102.0, 86.0, 60.0, 36.0, 25.0, 22.0, 10.0, 8.0, 2.0, 2.0], "bins": [-3.03125, -2.9737701416015625, -2.916290283203125, -2.8588104248046875, -2.80133056640625, -2.7438507080078125, -2.686370849609375, -2.6288909912109375, -2.5714111328125, -2.5139312744140625, -2.456451416015625, -2.3989715576171875, -2.34149169921875, -2.2840118408203125, -2.226531982421875, -2.1690521240234375, -2.111572265625, -2.0540924072265625, -1.996612548828125, -1.9391326904296875, -1.88165283203125, -1.8241729736328125, -1.766693115234375, -1.7092132568359375, -1.6517333984375, -1.5942535400390625, -1.536773681640625, -1.4792938232421875, -1.42181396484375, -1.3643341064453125, -1.306854248046875, -1.2493743896484375, -1.19189453125, -1.1344146728515625, -1.076934814453125, -1.0194549560546875, -0.96197509765625, -0.9044952392578125, -0.847015380859375, -0.7895355224609375, -0.7320556640625, -0.6745758056640625, -0.617095947265625, -0.5596160888671875, -0.50213623046875, -0.4446563720703125, -0.387176513671875, -0.3296966552734375, -0.272216796875, -0.2147369384765625, -0.157257080078125, -0.0997772216796875, -0.04229736328125, 0.0151824951171875, 0.072662353515625, 0.1301422119140625, 0.1876220703125, 0.2451019287109375, 0.302581787109375, 0.3600616455078125, 0.41754150390625, 0.4750213623046875, 0.532501220703125, 0.5899810791015625, 0.6474609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 9.0, 7.0, 13.0, 7.0, 18.0, 15.0, 22.0, 42.0, 59.0, 70.0, 106.0, 117.0, 127.0, 216.0, 291.0, 555.0, 2601.0, 33212.0, 734423.0, 264754.0, 9416.0, 1126.0, 385.0, 243.0, 180.0, 122.0, 96.0, 79.0, 66.0, 49.0, 45.0, 14.0, 22.0, 13.0, 11.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.2431640625, -1.2093734741210938, -1.1755828857421875, -1.1417922973632812, -1.108001708984375, -1.0742111206054688, -1.0404205322265625, -1.0066299438476562, -0.97283935546875, -0.9390487670898438, -0.9052581787109375, -0.8714675903320312, -0.837677001953125, -0.8038864135742188, -0.7700958251953125, -0.7363052368164062, -0.7025146484375, -0.6687240600585938, -0.6349334716796875, -0.6011428833007812, -0.567352294921875, -0.5335617065429688, -0.4997711181640625, -0.46598052978515625, -0.43218994140625, -0.39839935302734375, -0.3646087646484375, -0.33081817626953125, -0.297027587890625, -0.26323699951171875, -0.2294464111328125, -0.19565582275390625, -0.161865234375, -0.12807464599609375, -0.0942840576171875, -0.06049346923828125, -0.026702880859375, 0.00708770751953125, 0.0408782958984375, 0.07466888427734375, 0.10845947265625, 0.14225006103515625, 0.1760406494140625, 0.20983123779296875, 0.243621826171875, 0.27741241455078125, 0.3112030029296875, 0.34499359130859375, 0.3787841796875, 0.41257476806640625, 0.4463653564453125, 0.48015594482421875, 0.513946533203125, 0.5477371215820312, 0.5815277099609375, 0.6153182983398438, 0.64910888671875, 0.6828994750976562, 0.7166900634765625, 0.7504806518554688, 0.784271240234375, 0.8180618286132812, 0.8518524169921875, 0.8856430053710938, 0.91943359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 7.0, 6.0, 7.0, 10.0, 16.0, 13.0, 17.0, 20.0, 16.0, 22.0, 25.0, 22.0, 30.0, 25.0, 39.0, 38.0, 38.0, 38.0, 40.0, 36.0, 31.0, 34.0, 45.0, 35.0, 42.0, 41.0, 33.0, 31.0, 35.0, 26.0, 31.0, 19.0, 17.0, 17.0, 15.0, 19.0, 9.0, 8.0, 8.0, 5.0, 5.0, 5.0, 4.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6005859375, -0.5823593139648438, -0.5641326904296875, -0.5459060668945312, -0.527679443359375, -0.5094528198242188, -0.4912261962890625, -0.47299957275390625, -0.45477294921875, -0.43654632568359375, -0.4183197021484375, -0.40009307861328125, -0.381866455078125, -0.36363983154296875, -0.3454132080078125, -0.32718658447265625, -0.3089599609375, -0.29073333740234375, -0.2725067138671875, -0.25428009033203125, -0.236053466796875, -0.21782684326171875, -0.1996002197265625, -0.18137359619140625, -0.16314697265625, -0.14492034912109375, -0.1266937255859375, -0.10846710205078125, -0.090240478515625, -0.07201385498046875, -0.0537872314453125, -0.03556060791015625, -0.017333984375, 0.00089263916015625, 0.0191192626953125, 0.03734588623046875, 0.055572509765625, 0.07379913330078125, 0.0920257568359375, 0.11025238037109375, 0.12847900390625, 0.14670562744140625, 0.1649322509765625, 0.18315887451171875, 0.201385498046875, 0.21961212158203125, 0.2378387451171875, 0.25606536865234375, 0.2742919921875, 0.29251861572265625, 0.3107452392578125, 0.32897186279296875, 0.347198486328125, 0.36542510986328125, 0.3836517333984375, 0.40187835693359375, 0.42010498046875, 0.43833160400390625, 0.4565582275390625, 0.47478485107421875, 0.493011474609375, 0.5112380981445312, 0.5294647216796875, 0.5476913452148438, 0.56591796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 10.0, 10.0, 11.0, 8.0, 18.0, 27.0, 36.0, 42.0, 63.0, 100.0, 161.0, 304.0, 665.0, 1864.0, 7142.0, 36723.0, 244075.0, 572795.0, 153429.0, 23449.0, 4904.0, 1453.0, 515.0, 253.0, 138.0, 114.0, 62.0, 49.0, 28.0, 18.0, 17.0, 14.0, 8.0, 11.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.162109375, -0.15677261352539062, -0.15143585205078125, -0.14609909057617188, -0.1407623291015625, -0.13542556762695312, -0.13008880615234375, -0.12475204467773438, -0.119415283203125, -0.11407852172851562, -0.10874176025390625, -0.10340499877929688, -0.0980682373046875, -0.09273147583007812, -0.08739471435546875, -0.08205795288085938, -0.07672119140625, -0.07138442993164062, -0.06604766845703125, -0.060710906982421875, -0.0553741455078125, -0.050037384033203125, -0.04470062255859375, -0.039363861083984375, -0.034027099609375, -0.028690338134765625, -0.02335357666015625, -0.018016815185546875, -0.0126800537109375, -0.007343292236328125, -0.00200653076171875, 0.003330230712890625, 0.0086669921875, 0.014003753662109375, 0.01934051513671875, 0.024677276611328125, 0.0300140380859375, 0.035350799560546875, 0.04068756103515625, 0.046024322509765625, 0.051361083984375, 0.056697845458984375, 0.06203460693359375, 0.06737136840820312, 0.0727081298828125, 0.07804489135742188, 0.08338165283203125, 0.08871841430664062, 0.09405517578125, 0.09939193725585938, 0.10472869873046875, 0.11006546020507812, 0.1154022216796875, 0.12073898315429688, 0.12607574462890625, 0.13141250610351562, 0.136749267578125, 0.14208602905273438, 0.14742279052734375, 0.15275955200195312, 0.1580963134765625, 0.16343307495117188, 0.16876983642578125, 0.17410659790039062, 0.179443359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 9.0, 11.0, 14.0, 19.0, 21.0, 42.0, 43.0, 68.0, 80.0, 98.0, 115.0, 103.0, 82.0, 95.0, 53.0, 46.0, 45.0, 18.0, 13.0, 4.0, 2.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.528594970703125e-05, -3.437511622905731e-05, -3.3464282751083374e-05, -3.2553449273109436e-05, -3.16426157951355e-05, -3.073178231716156e-05, -2.9820948839187622e-05, -2.8910115361213684e-05, -2.7999281883239746e-05, -2.7088448405265808e-05, -2.617761492729187e-05, -2.5266781449317932e-05, -2.4355947971343994e-05, -2.3445114493370056e-05, -2.2534281015396118e-05, -2.162344753742218e-05, -2.0712614059448242e-05, -1.9801780581474304e-05, -1.8890947103500366e-05, -1.7980113625526428e-05, -1.706928014755249e-05, -1.6158446669578552e-05, -1.5247613191604614e-05, -1.4336779713630676e-05, -1.3425946235656738e-05, -1.25151127576828e-05, -1.1604279279708862e-05, -1.0693445801734924e-05, -9.782612323760986e-06, -8.871778845787048e-06, -7.96094536781311e-06, -7.050111889839172e-06, -6.139278411865234e-06, -5.228444933891296e-06, -4.317611455917358e-06, -3.4067779779434204e-06, -2.4959444999694824e-06, -1.5851110219955444e-06, -6.742775440216064e-07, 2.3655593395233154e-07, 1.1473894119262695e-06, 2.0582228899002075e-06, 2.9690563678741455e-06, 3.8798898458480835e-06, 4.7907233238220215e-06, 5.7015568017959595e-06, 6.6123902797698975e-06, 7.5232237577438354e-06, 8.434057235717773e-06, 9.344890713691711e-06, 1.025572419166565e-05, 1.1166557669639587e-05, 1.2077391147613525e-05, 1.2988224625587463e-05, 1.3899058103561401e-05, 1.480989158153534e-05, 1.5720725059509277e-05, 1.6631558537483215e-05, 1.7542392015457153e-05, 1.845322549343109e-05, 1.936405897140503e-05, 2.0274892449378967e-05, 2.1185725927352905e-05, 2.2096559405326843e-05, 2.300739288330078e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 12.0, 7.0, 14.0, 16.0, 28.0, 51.0, 67.0, 110.0, 251.0, 516.0, 1706.0, 8177.0, 83566.0, 729317.0, 204609.0, 15988.0, 2730.0, 729.0, 293.0, 137.0, 89.0, 46.0, 24.0, 22.0, 14.0, 8.0, 9.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.2811851501464844, -0.27257537841796875, -0.2639656066894531, -0.2553558349609375, -0.24674606323242188, -0.23813629150390625, -0.22952651977539062, -0.220916748046875, -0.21230697631835938, -0.20369720458984375, -0.19508743286132812, -0.1864776611328125, -0.17786788940429688, -0.16925811767578125, -0.16064834594726562, -0.15203857421875, -0.14342880249023438, -0.13481903076171875, -0.12620925903320312, -0.1175994873046875, -0.10898971557617188, -0.10037994384765625, -0.09177017211914062, -0.083160400390625, -0.07455062866210938, -0.06594085693359375, -0.057331085205078125, -0.0487213134765625, -0.040111541748046875, -0.03150177001953125, -0.022891998291015625, -0.0142822265625, -0.005672454833984375, 0.00293731689453125, 0.011547088623046875, 0.0201568603515625, 0.028766632080078125, 0.03737640380859375, 0.045986175537109375, 0.054595947265625, 0.06320571899414062, 0.07181549072265625, 0.08042526245117188, 0.0890350341796875, 0.09764480590820312, 0.10625457763671875, 0.11486434936523438, 0.12347412109375, 0.13208389282226562, 0.14069366455078125, 0.14930343627929688, 0.1579132080078125, 0.16652297973632812, 0.17513275146484375, 0.18374252319335938, 0.192352294921875, 0.20096206665039062, 0.20957183837890625, 0.21818161010742188, 0.2267913818359375, 0.23540115356445312, 0.24401092529296875, 0.2526206970214844, 0.26123046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 6.0, 12.0, 9.0, 17.0, 27.0, 33.0, 45.0, 44.0, 46.0, 61.0, 65.0, 63.0, 84.0, 88.0, 67.0, 45.0, 47.0, 47.0, 41.0, 34.0, 23.0, 18.0, 18.0, 17.0, 11.0, 9.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07257080078125, -0.07035064697265625, -0.0681304931640625, -0.06591033935546875, -0.063690185546875, -0.06147003173828125, -0.0592498779296875, -0.05702972412109375, -0.0548095703125, -0.05258941650390625, -0.0503692626953125, -0.04814910888671875, -0.045928955078125, -0.04370880126953125, -0.0414886474609375, -0.03926849365234375, -0.03704833984375, -0.03482818603515625, -0.0326080322265625, -0.03038787841796875, -0.028167724609375, -0.02594757080078125, -0.0237274169921875, -0.02150726318359375, -0.019287109375, -0.01706695556640625, -0.0148468017578125, -0.01262664794921875, -0.010406494140625, -0.00818634033203125, -0.0059661865234375, -0.00374603271484375, -0.00152587890625, 0.00069427490234375, 0.0029144287109375, 0.00513458251953125, 0.007354736328125, 0.00957489013671875, 0.0117950439453125, 0.01401519775390625, 0.0162353515625, 0.01845550537109375, 0.0206756591796875, 0.02289581298828125, 0.025115966796875, 0.02733612060546875, 0.0295562744140625, 0.03177642822265625, 0.03399658203125, 0.03621673583984375, 0.0384368896484375, 0.04065704345703125, 0.042877197265625, 0.04509735107421875, 0.0473175048828125, 0.04953765869140625, 0.0517578125, 0.05397796630859375, 0.0561981201171875, 0.05841827392578125, 0.060638427734375, 0.06285858154296875, 0.0650787353515625, 0.06729888916015625, 0.06951904296875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 14.0, 49.0, 254.0, 436.0, 194.0, 49.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.422909736633301, -4.248702049255371, -4.074494361877441, -3.9002864360809326, -3.726078510284424, -3.551870822906494, -3.3776631355285645, -3.2034554481506348, -3.029247522354126, -2.8550398349761963, -2.6808319091796875, -2.506624221801758, -2.332416534423828, -2.1582086086273193, -1.9840009212493896, -1.8097931146621704, -1.6355853080749512, -1.461377501487732, -1.2871696949005127, -1.112962007522583, -0.9387542009353638, -0.7645463943481445, -0.5903387069702148, -0.4161309003829956, -0.24192309379577637, -0.06771531701087952, 0.10649245977401733, 0.2807002067565918, 0.45490801334381104, 0.6291158199310303, 0.80332350730896, 0.9775313138961792, 1.1517391204833984, 1.3259469270706177, 1.500154733657837, 1.6743624210357666, 1.8485702276229858, 2.022778034210205, 2.1969857215881348, 2.3711934089660645, 2.5454013347625732, 2.719609022140503, 2.8938169479370117, 3.0680246353149414, 3.242232322692871, 3.41644024848938, 3.5906479358673096, 3.7648558616638184, 3.939063549041748, 4.113271236419678, 4.287478923797607, 4.461687088012695, 4.635894775390625, 4.810102462768555, 4.984310150146484, 5.158517837524414, 5.332725524902344, 5.506933212280273, 5.681140899658203, 5.855348587036133, 6.029556751251221, 6.20376443862915, 6.37797212600708, 6.55217981338501, 6.726387977600098]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 12.0, 12.0, 16.0, 30.0, 36.0, 33.0, 26.0, 43.0, 45.0, 52.0, 51.0, 70.0, 63.0, 58.0, 61.0, 47.0, 59.0, 41.0, 45.0, 42.0, 33.0, 26.0, 30.0, 16.0, 10.0, 15.0, 8.0, 7.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0], "bins": [-2.1548409461975098, -2.104698896408081, -2.0545566082000732, -2.0044145584106445, -1.9542725086212158, -1.9041303396224976, -1.8539881706237793, -1.8038461208343506, -1.7537039518356323, -1.703561782836914, -1.6534197330474854, -1.603277564048767, -1.5531355142593384, -1.5029933452606201, -1.4528512954711914, -1.4027091264724731, -1.3525669574737549, -1.3024247884750366, -1.252282738685608, -1.2021405696868896, -1.151998519897461, -1.1018563508987427, -1.0517141819000244, -1.0015721321105957, -0.951430082321167, -0.9012879729270935, -0.85114586353302, -0.8010036945343018, -0.7508615851402283, -0.7007194757461548, -0.6505773663520813, -0.6004352569580078, -0.5502930879592896, -0.5001509785652161, -0.4500088393688202, -0.3998667299747467, -0.34972459077835083, -0.29958248138427734, -0.24944037199020386, -0.19929823279380798, -0.1491561233997345, -0.09901399910449982, -0.048871882259845734, 0.0012702345848083496, 0.05141235888004303, 0.10155448317527771, 0.1516965925693512, 0.20183873176574707, 0.25198084115982056, 0.30212295055389404, 0.3522650897502899, 0.4024071991443634, 0.4525493383407593, 0.5026914477348328, 0.5528335571289062, 0.6029757261276245, 0.6531177759170532, 0.7032598853111267, 0.7534019947052002, 0.8035441637039185, 0.8536862730979919, 0.9038283824920654, 0.9539704918861389, 1.0041126012802124, 1.0542547702789307]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 14.0, 8.0, 18.0, 17.0, 22.0, 49.0, 57.0, 95.0, 161.0, 258.0, 451.0, 856.0, 1619.0, 3725.0, 8922.0, 26944.0, 103671.0, 436046.0, 1433083.0, 1533489.0, 486195.0, 111491.0, 29328.0, 9631.0, 3793.0, 1919.0, 992.0, 539.0, 329.0, 184.0, 126.0, 70.0, 52.0, 41.0, 20.0, 26.0, 12.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5667800903320312, -0.5490875244140625, -0.5313949584960938, -0.513702392578125, -0.49600982666015625, -0.4783172607421875, -0.46062469482421875, -0.44293212890625, -0.42523956298828125, -0.4075469970703125, -0.38985443115234375, -0.372161865234375, -0.35446929931640625, -0.3367767333984375, -0.31908416748046875, -0.3013916015625, -0.28369903564453125, -0.2660064697265625, -0.24831390380859375, -0.230621337890625, -0.21292877197265625, -0.1952362060546875, -0.17754364013671875, -0.15985107421875, -0.14215850830078125, -0.1244659423828125, -0.10677337646484375, -0.089080810546875, -0.07138824462890625, -0.0536956787109375, -0.03600311279296875, -0.018310546875, -0.00061798095703125, 0.0170745849609375, 0.03476715087890625, 0.052459716796875, 0.07015228271484375, 0.0878448486328125, 0.10553741455078125, 0.12322998046875, 0.14092254638671875, 0.1586151123046875, 0.17630767822265625, 0.194000244140625, 0.21169281005859375, 0.2293853759765625, 0.24707794189453125, 0.2647705078125, 0.28246307373046875, 0.3001556396484375, 0.31784820556640625, 0.335540771484375, 0.35323333740234375, 0.3709259033203125, 0.38861846923828125, 0.40631103515625, 0.42400360107421875, 0.4416961669921875, 0.45938873291015625, 0.477081298828125, 0.49477386474609375, 0.5124664306640625, 0.5301589965820312, 0.5478515625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 12.0, 9.0, 16.0, 14.0, 17.0, 24.0, 22.0, 44.0, 26.0, 36.0, 40.0, 44.0, 52.0, 39.0, 51.0, 55.0, 41.0, 46.0, 54.0, 49.0, 44.0, 33.0, 37.0, 29.0, 26.0, 28.0, 26.0, 14.0, 15.0, 8.0, 16.0, 5.0, 4.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6513671875, -0.633209228515625, -0.61505126953125, -0.596893310546875, -0.5787353515625, -0.560577392578125, -0.54241943359375, -0.524261474609375, -0.506103515625, -0.487945556640625, -0.46978759765625, -0.451629638671875, -0.4334716796875, -0.415313720703125, -0.39715576171875, -0.378997802734375, -0.36083984375, -0.342681884765625, -0.32452392578125, -0.306365966796875, -0.2882080078125, -0.270050048828125, -0.25189208984375, -0.233734130859375, -0.215576171875, -0.197418212890625, -0.17926025390625, -0.161102294921875, -0.1429443359375, -0.124786376953125, -0.10662841796875, -0.088470458984375, -0.0703125, -0.052154541015625, -0.03399658203125, -0.015838623046875, 0.0023193359375, 0.020477294921875, 0.03863525390625, 0.056793212890625, 0.074951171875, 0.093109130859375, 0.11126708984375, 0.129425048828125, 0.1475830078125, 0.165740966796875, 0.18389892578125, 0.202056884765625, 0.22021484375, 0.238372802734375, 0.25653076171875, 0.274688720703125, 0.2928466796875, 0.311004638671875, 0.32916259765625, 0.347320556640625, 0.365478515625, 0.383636474609375, 0.40179443359375, 0.419952392578125, 0.4381103515625, 0.456268310546875, 0.47442626953125, 0.492584228515625, 0.5107421875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 13.0, 12.0, 17.0, 29.0, 68.0, 139.0, 271.0, 615.0, 2707.0, 40349.0, 3943700.0, 199586.0, 5217.0, 920.0, 315.0, 157.0, 78.0, 27.0, 26.0, 15.0, 4.0, 5.0, 7.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4287109375, -1.3656768798828125, -1.302642822265625, -1.2396087646484375, -1.17657470703125, -1.1135406494140625, -1.050506591796875, -0.9874725341796875, -0.9244384765625, -0.8614044189453125, -0.798370361328125, -0.7353363037109375, -0.67230224609375, -0.6092681884765625, -0.546234130859375, -0.4832000732421875, -0.420166015625, -0.3571319580078125, -0.294097900390625, -0.2310638427734375, -0.16802978515625, -0.1049957275390625, -0.041961669921875, 0.0210723876953125, 0.0841064453125, 0.1471405029296875, 0.210174560546875, 0.2732086181640625, 0.33624267578125, 0.3992767333984375, 0.462310791015625, 0.5253448486328125, 0.58837890625, 0.6514129638671875, 0.714447021484375, 0.7774810791015625, 0.84051513671875, 0.9035491943359375, 0.966583251953125, 1.0296173095703125, 1.0926513671875, 1.1556854248046875, 1.218719482421875, 1.2817535400390625, 1.34478759765625, 1.4078216552734375, 1.470855712890625, 1.5338897705078125, 1.596923828125, 1.6599578857421875, 1.722991943359375, 1.7860260009765625, 1.84906005859375, 1.9120941162109375, 1.975128173828125, 2.0381622314453125, 2.1011962890625, 2.1642303466796875, 2.227264404296875, 2.2902984619140625, 2.35333251953125, 2.4163665771484375, 2.479400634765625, 2.5424346923828125, 2.60546875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 12.0, 4.0, 11.0, 15.0, 23.0, 38.0, 45.0, 65.0, 116.0, 152.0, 268.0, 424.0, 522.0, 591.0, 534.0, 396.0, 278.0, 181.0, 129.0, 93.0, 52.0, 37.0, 22.0, 19.0, 11.0, 12.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.270751953125, -0.26291847229003906, -0.2550849914550781, -0.2472515106201172, -0.23941802978515625, -0.2315845489501953, -0.22375106811523438, -0.21591758728027344, -0.2080841064453125, -0.20025062561035156, -0.19241714477539062, -0.1845836639404297, -0.17675018310546875, -0.1689167022705078, -0.16108322143554688, -0.15324974060058594, -0.145416259765625, -0.13758277893066406, -0.12974929809570312, -0.12191581726074219, -0.11408233642578125, -0.10624885559082031, -0.09841537475585938, -0.09058189392089844, -0.0827484130859375, -0.07491493225097656, -0.06708145141601562, -0.05924797058105469, -0.05141448974609375, -0.04358100891113281, -0.035747528076171875, -0.027914047241210938, -0.02008056640625, -0.012247085571289062, -0.004413604736328125, 0.0034198760986328125, 0.01125335693359375, 0.019086837768554688, 0.026920318603515625, 0.03475379943847656, 0.0425872802734375, 0.05042076110839844, 0.058254241943359375, 0.06608772277832031, 0.07392120361328125, 0.08175468444824219, 0.08958816528320312, 0.09742164611816406, 0.105255126953125, 0.11308860778808594, 0.12092208862304688, 0.1287555694580078, 0.13658905029296875, 0.1444225311279297, 0.15225601196289062, 0.16008949279785156, 0.1679229736328125, 0.17575645446777344, 0.18358993530273438, 0.1914234161376953, 0.19925689697265625, 0.2070903778076172, 0.21492385864257812, 0.22275733947753906, 0.2305908203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 8.0, 16.0, 30.0, 48.0, 68.0, 80.0, 132.0, 129.0, 157.0, 87.0, 86.0, 57.0, 52.0, 21.0, 10.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0451819896697998, -1.0011907815933228, -0.9571995735168457, -0.9132083654403687, -0.8692171573638916, -0.8252259492874146, -0.7812348008155823, -0.7372435927391052, -0.6932523846626282, -0.6492611765861511, -0.6052699685096741, -0.5612788200378418, -0.5172876119613647, -0.4732963740825653, -0.42930519580841064, -0.3853139877319336, -0.34132277965545654, -0.2973315715789795, -0.25334036350250244, -0.20934918522834778, -0.16535797715187073, -0.12136676907539368, -0.07737559080123901, -0.03338438272476196, 0.010606825351715088, 0.05459802597761154, 0.098589226603508, 0.14258041977882385, 0.1865716278553009, 0.23056283593177795, 0.2745540142059326, 0.31854522228240967, 0.36253654956817627, 0.4065277576446533, 0.45051896572113037, 0.49451014399528503, 0.5385013818740845, 0.5824925899505615, 0.6264837384223938, 0.6704749464988708, 0.7144661545753479, 0.758457362651825, 0.802448570728302, 0.8464397192001343, 0.8904309272766113, 0.9344221353530884, 0.9784133434295654, 1.0224045515060425, 1.0663957595825195, 1.1103869676589966, 1.1543781757354736, 1.1983693838119507, 1.2423605918884277, 1.2863517999649048, 1.3303430080413818, 1.3743340969085693, 1.418325424194336, 1.462316632270813, 1.50630784034729, 1.550299048423767, 1.5942902565002441, 1.6382814645767212, 1.6822726726531982, 1.7262637615203857, 1.7702549695968628]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 7.0, 17.0, 8.0, 12.0, 15.0, 19.0, 22.0, 27.0, 21.0, 21.0, 31.0, 40.0, 33.0, 38.0, 39.0, 36.0, 37.0, 52.0, 41.0, 45.0, 35.0, 37.0, 52.0, 33.0, 23.0, 30.0, 36.0, 20.0, 16.0, 35.0, 12.0, 16.0, 12.0, 7.0, 11.0, 9.0, 10.0, 5.0, 6.0, 2.0, 5.0, 3.0, 7.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5159679055213928, -0.49996817111968994, -0.48396843671798706, -0.46796873211860657, -0.4519689977169037, -0.4359692633152008, -0.4199695587158203, -0.40396982431411743, -0.38797008991241455, -0.37197035551071167, -0.3559706211090088, -0.3399709165096283, -0.3239711821079254, -0.30797144770622253, -0.29197174310684204, -0.27597200870513916, -0.2599722743034363, -0.2439725399017334, -0.2279728204011917, -0.21197310090065002, -0.19597336649894714, -0.17997363209724426, -0.16397391259670258, -0.1479741930961609, -0.131974458694458, -0.11597473174333572, -0.09997500479221344, -0.08397527784109116, -0.06797555088996887, -0.05197582393884659, -0.035976096987724304, -0.01997637003660202, -0.003976583480834961, 0.012023143470287323, 0.028022870421409607, 0.04402259737253189, 0.060022324323654175, 0.07602205127477646, 0.09202177822589874, 0.10802150517702103, 0.12402123212814331, 0.1400209665298462, 0.15602068603038788, 0.17202040553092957, 0.18802013993263245, 0.20401987433433533, 0.22001959383487701, 0.2360193133354187, 0.2520190477371216, 0.26801878213882446, 0.28401851654052734, 0.30001822113990784, 0.3160179555416107, 0.3320176899433136, 0.3480173945426941, 0.364017128944397, 0.38001686334609985, 0.39601659774780273, 0.4120163321495056, 0.4280160367488861, 0.444015771150589, 0.46001550555229187, 0.47601521015167236, 0.49201494455337524, 0.5080146789550781]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 9.0, 10.0, 7.0, 11.0, 10.0, 21.0, 39.0, 76.0, 182.0, 566.0, 1834.0, 7969.0, 43595.0, 529377.0, 419081.0, 36288.0, 6944.0, 1698.0, 507.0, 142.0, 79.0, 34.0, 20.0, 13.0, 9.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.320556640625, -0.3101997375488281, -0.29984283447265625, -0.2894859313964844, -0.2791290283203125, -0.2687721252441406, -0.25841522216796875, -0.24805831909179688, -0.237701416015625, -0.22734451293945312, -0.21698760986328125, -0.20663070678710938, -0.1962738037109375, -0.18591690063476562, -0.17555999755859375, -0.16520309448242188, -0.15484619140625, -0.14448928833007812, -0.13413238525390625, -0.12377548217773438, -0.1134185791015625, -0.10306167602539062, -0.09270477294921875, -0.08234786987304688, -0.071990966796875, -0.061634063720703125, -0.05127716064453125, -0.040920257568359375, -0.0305633544921875, -0.020206451416015625, -0.00984954833984375, 0.000507354736328125, 0.0108642578125, 0.021221160888671875, 0.03157806396484375, 0.041934967041015625, 0.0522918701171875, 0.06264877319335938, 0.07300567626953125, 0.08336257934570312, 0.093719482421875, 0.10407638549804688, 0.11443328857421875, 0.12479019165039062, 0.1351470947265625, 0.14550399780273438, 0.15586090087890625, 0.16621780395507812, 0.17657470703125, 0.18693161010742188, 0.19728851318359375, 0.20764541625976562, 0.2180023193359375, 0.22835922241210938, 0.23871612548828125, 0.24907302856445312, 0.259429931640625, 0.2697868347167969, 0.28014373779296875, 0.2905006408691406, 0.3008575439453125, 0.3112144470214844, 0.32157135009765625, 0.3319282531738281, 0.34228515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 9.0, 4.0, 16.0, 16.0, 21.0, 15.0, 27.0, 22.0, 30.0, 30.0, 35.0, 43.0, 43.0, 40.0, 51.0, 34.0, 52.0, 50.0, 50.0, 42.0, 43.0, 37.0, 39.0, 36.0, 36.0, 27.0, 16.0, 17.0, 20.0, 12.0, 22.0, 7.0, 12.0, 9.0, 5.0, 7.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4013671875, -0.3894157409667969, -0.37746429443359375, -0.3655128479003906, -0.3535614013671875, -0.3416099548339844, -0.32965850830078125, -0.3177070617675781, -0.305755615234375, -0.2938041687011719, -0.28185272216796875, -0.2699012756347656, -0.2579498291015625, -0.24599838256835938, -0.23404693603515625, -0.22209548950195312, -0.21014404296875, -0.19819259643554688, -0.18624114990234375, -0.17428970336914062, -0.1623382568359375, -0.15038681030273438, -0.13843536376953125, -0.12648391723632812, -0.114532470703125, -0.10258102416992188, -0.09062957763671875, -0.07867813110351562, -0.0667266845703125, -0.054775238037109375, -0.04282379150390625, -0.030872344970703125, -0.0189208984375, -0.006969451904296875, 0.00498199462890625, 0.016933441162109375, 0.0288848876953125, 0.040836334228515625, 0.05278778076171875, 0.06473922729492188, 0.076690673828125, 0.08864212036132812, 0.10059356689453125, 0.11254501342773438, 0.1244964599609375, 0.13644790649414062, 0.14839935302734375, 0.16035079956054688, 0.17230224609375, 0.18425369262695312, 0.19620513916015625, 0.20815658569335938, 0.2201080322265625, 0.23205947875976562, 0.24401092529296875, 0.2559623718261719, 0.267913818359375, 0.2798652648925781, 0.29181671142578125, 0.3037681579589844, 0.3157196044921875, 0.3276710510253906, 0.33962249755859375, 0.3515739440917969, 0.363525390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 7.0, 13.0, 11.0, 23.0, 29.0, 40.0, 53.0, 88.0, 119.0, 211.0, 362.0, 769.0, 1511.0, 3481.0, 8365.0, 22948.0, 75238.0, 307181.0, 441503.0, 129968.0, 35254.0, 12231.0, 4956.0, 2027.0, 917.0, 481.0, 268.0, 162.0, 97.0, 66.0, 39.0, 34.0, 20.0, 17.0, 18.0, 6.0, 3.0, 8.0, 8.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.149169921875, -0.14438819885253906, -0.13960647583007812, -0.1348247528076172, -0.13004302978515625, -0.1252613067626953, -0.12047958374023438, -0.11569786071777344, -0.1109161376953125, -0.10613441467285156, -0.10135269165039062, -0.09657096862792969, -0.09178924560546875, -0.08700752258300781, -0.08222579956054688, -0.07744407653808594, -0.072662353515625, -0.06788063049316406, -0.06309890747070312, -0.05831718444824219, -0.05353546142578125, -0.04875373840332031, -0.043972015380859375, -0.03919029235839844, -0.0344085693359375, -0.029626846313476562, -0.024845123291015625, -0.020063400268554688, -0.01528167724609375, -0.010499954223632812, -0.005718231201171875, -0.0009365081787109375, 0.00384521484375, 0.008626937866210938, 0.013408660888671875, 0.018190383911132812, 0.02297210693359375, 0.027753829956054688, 0.032535552978515625, 0.03731727600097656, 0.0420989990234375, 0.04688072204589844, 0.051662445068359375, 0.05644416809082031, 0.06122589111328125, 0.06600761413574219, 0.07078933715820312, 0.07557106018066406, 0.080352783203125, 0.08513450622558594, 0.08991622924804688, 0.09469795227050781, 0.09947967529296875, 0.10426139831542969, 0.10904312133789062, 0.11382484436035156, 0.1186065673828125, 0.12338829040527344, 0.12817001342773438, 0.1329517364501953, 0.13773345947265625, 0.1425151824951172, 0.14729690551757812, 0.15207862854003906, 0.1568603515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 8.0, 8.0, 7.0, 7.0, 15.0, 11.0, 17.0, 9.0, 17.0, 21.0, 19.0, 32.0, 26.0, 34.0, 28.0, 40.0, 35.0, 33.0, 54.0, 38.0, 32.0, 50.0, 55.0, 37.0, 43.0, 35.0, 28.0, 34.0, 21.0, 31.0, 19.0, 21.0, 16.0, 22.0, 18.0, 17.0, 7.0, 12.0, 10.0, 8.0, 6.0, 4.0, 2.0, 8.0, 4.0, 1.0, 2.0, 4.0, 1.0, 3.0], "bins": [-0.73974609375, -0.718994140625, -0.6982421875, -0.677490234375, -0.65673828125, -0.635986328125, -0.615234375, -0.594482421875, -0.57373046875, -0.552978515625, -0.5322265625, -0.511474609375, -0.49072265625, -0.469970703125, -0.44921875, -0.428466796875, -0.40771484375, -0.386962890625, -0.3662109375, -0.345458984375, -0.32470703125, -0.303955078125, -0.283203125, -0.262451171875, -0.24169921875, -0.220947265625, -0.2001953125, -0.179443359375, -0.15869140625, -0.137939453125, -0.1171875, -0.096435546875, -0.07568359375, -0.054931640625, -0.0341796875, -0.013427734375, 0.00732421875, 0.028076171875, 0.048828125, 0.069580078125, 0.09033203125, 0.111083984375, 0.1318359375, 0.152587890625, 0.17333984375, 0.194091796875, 0.21484375, 0.235595703125, 0.25634765625, 0.277099609375, 0.2978515625, 0.318603515625, 0.33935546875, 0.360107421875, 0.380859375, 0.401611328125, 0.42236328125, 0.443115234375, 0.4638671875, 0.484619140625, 0.50537109375, 0.526123046875, 0.546875, 0.567626953125, 0.58837890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 3.0, 9.0, 8.0, 14.0, 15.0, 21.0, 44.0, 52.0, 96.0, 169.0, 282.0, 524.0, 1029.0, 2141.0, 5028.0, 13299.0, 45940.0, 238273.0, 549462.0, 143729.0, 30834.0, 9811.0, 4024.0, 1793.0, 861.0, 421.0, 270.0, 150.0, 82.0, 54.0, 27.0, 23.0, 9.0, 18.0, 9.0, 13.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061553955078125, -0.05965137481689453, -0.05774879455566406, -0.055846214294433594, -0.053943634033203125, -0.052041053771972656, -0.05013847351074219, -0.04823589324951172, -0.04633331298828125, -0.04443073272705078, -0.04252815246582031, -0.040625572204589844, -0.038722991943359375, -0.036820411682128906, -0.03491783142089844, -0.03301525115966797, -0.0311126708984375, -0.02921009063720703, -0.027307510375976562, -0.025404930114746094, -0.023502349853515625, -0.021599769592285156, -0.019697189331054688, -0.01779460906982422, -0.01589202880859375, -0.013989448547363281, -0.012086868286132812, -0.010184288024902344, -0.008281707763671875, -0.006379127502441406, -0.0044765472412109375, -0.0025739669799804688, -0.00067138671875, 0.0012311935424804688, 0.0031337738037109375, 0.005036354064941406, 0.006938934326171875, 0.008841514587402344, 0.010744094848632812, 0.012646675109863281, 0.01454925537109375, 0.01645183563232422, 0.018354415893554688, 0.020256996154785156, 0.022159576416015625, 0.024062156677246094, 0.025964736938476562, 0.02786731719970703, 0.0297698974609375, 0.03167247772216797, 0.03357505798339844, 0.035477638244628906, 0.037380218505859375, 0.039282798767089844, 0.04118537902832031, 0.04308795928955078, 0.04499053955078125, 0.04689311981201172, 0.04879570007324219, 0.050698280334472656, 0.052600860595703125, 0.054503440856933594, 0.05640602111816406, 0.05830860137939453, 0.060211181640625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 15.0, 11.0, 16.0, 24.0, 39.0, 41.0, 58.0, 64.0, 88.0, 100.0, 97.0, 95.0, 85.0, 68.0, 57.0, 28.0, 31.0, 20.0, 17.0, 14.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.199411392211914e-05, -2.1243467926979065e-05, -2.049282193183899e-05, -1.9742175936698914e-05, -1.8991529941558838e-05, -1.8240883946418762e-05, -1.7490237951278687e-05, -1.673959195613861e-05, -1.5988945960998535e-05, -1.523829996585846e-05, -1.4487653970718384e-05, -1.3737007975578308e-05, -1.2986361980438232e-05, -1.2235715985298157e-05, -1.1485069990158081e-05, -1.0734423995018005e-05, -9.98377799987793e-06, -9.233132004737854e-06, -8.482486009597778e-06, -7.731840014457703e-06, -6.981194019317627e-06, -6.230548024177551e-06, -5.479902029037476e-06, -4.7292560338974e-06, -3.978610038757324e-06, -3.2279640436172485e-06, -2.477318048477173e-06, -1.7266720533370972e-06, -9.760260581970215e-07, -2.253800630569458e-07, 5.252659320831299e-07, 1.2759119272232056e-06, 2.0265579223632812e-06, 2.777203917503357e-06, 3.5278499126434326e-06, 4.278495907783508e-06, 5.029141902923584e-06, 5.77978789806366e-06, 6.530433893203735e-06, 7.281079888343811e-06, 8.031725883483887e-06, 8.782371878623962e-06, 9.533017873764038e-06, 1.0283663868904114e-05, 1.103430986404419e-05, 1.1784955859184265e-05, 1.253560185432434e-05, 1.3286247849464417e-05, 1.4036893844604492e-05, 1.4787539839744568e-05, 1.5538185834884644e-05, 1.628883183002472e-05, 1.7039477825164795e-05, 1.779012382030487e-05, 1.8540769815444946e-05, 1.9291415810585022e-05, 2.0042061805725098e-05, 2.0792707800865173e-05, 2.154335379600525e-05, 2.2293999791145325e-05, 2.30446457862854e-05, 2.3795291781425476e-05, 2.4545937776565552e-05, 2.5296583771705627e-05, 2.6047229766845703e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 8.0, 8.0, 15.0, 17.0, 20.0, 27.0, 56.0, 81.0, 138.0, 304.0, 788.0, 2078.0, 6620.0, 26345.0, 185276.0, 691526.0, 108995.0, 18507.0, 4943.0, 1525.0, 631.0, 280.0, 139.0, 64.0, 29.0, 27.0, 21.0, 16.0, 13.0, 12.0, 6.0, 6.0, 5.0, 4.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09796142578125, -0.09519290924072266, -0.09242439270019531, -0.08965587615966797, -0.08688735961914062, -0.08411884307861328, -0.08135032653808594, -0.0785818099975586, -0.07581329345703125, -0.0730447769165039, -0.07027626037597656, -0.06750774383544922, -0.06473922729492188, -0.06197071075439453, -0.05920219421386719, -0.056433677673339844, -0.0536651611328125, -0.050896644592285156, -0.04812812805175781, -0.04535961151123047, -0.042591094970703125, -0.03982257843017578, -0.03705406188964844, -0.034285545349121094, -0.03151702880859375, -0.028748512268066406, -0.025979995727539062, -0.02321147918701172, -0.020442962646484375, -0.01767444610595703, -0.014905929565429688, -0.012137413024902344, -0.009368896484375, -0.006600379943847656, -0.0038318634033203125, -0.0010633468627929688, 0.001705169677734375, 0.004473686218261719, 0.0072422027587890625, 0.010010719299316406, 0.01277923583984375, 0.015547752380371094, 0.018316268920898438, 0.02108478546142578, 0.023853302001953125, 0.02662181854248047, 0.029390335083007812, 0.032158851623535156, 0.0349273681640625, 0.037695884704589844, 0.04046440124511719, 0.04323291778564453, 0.046001434326171875, 0.04876995086669922, 0.05153846740722656, 0.054306983947753906, 0.05707550048828125, 0.059844017028808594, 0.06261253356933594, 0.06538105010986328, 0.06814956665039062, 0.07091808319091797, 0.07368659973144531, 0.07645511627197266, 0.0792236328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 6.0, 7.0, 8.0, 7.0, 8.0, 21.0, 30.0, 32.0, 45.0, 59.0, 73.0, 94.0, 111.0, 108.0, 89.0, 83.0, 56.0, 40.0, 27.0, 25.0, 17.0, 12.0, 9.0, 5.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01519775390625, -0.014630556106567383, -0.014063358306884766, -0.013496160507202148, -0.012928962707519531, -0.012361764907836914, -0.011794567108154297, -0.01122736930847168, -0.010660171508789062, -0.010092973709106445, -0.009525775909423828, -0.008958578109741211, -0.008391380310058594, -0.007824182510375977, -0.007256984710693359, -0.006689786911010742, -0.006122589111328125, -0.005555391311645508, -0.004988193511962891, -0.0044209957122802734, -0.0038537979125976562, -0.003286600112915039, -0.002719402313232422, -0.0021522045135498047, -0.0015850067138671875, -0.0010178089141845703, -0.0004506111145019531, 0.00011658668518066406, 0.0006837844848632812, 0.0012509822845458984, 0.0018181800842285156, 0.002385377883911133, 0.00295257568359375, 0.003519773483276367, 0.004086971282958984, 0.0046541690826416016, 0.005221366882324219, 0.005788564682006836, 0.006355762481689453, 0.00692296028137207, 0.0074901580810546875, 0.008057355880737305, 0.008624553680419922, 0.009191751480102539, 0.009758949279785156, 0.010326147079467773, 0.01089334487915039, 0.011460542678833008, 0.012027740478515625, 0.012594938278198242, 0.01316213607788086, 0.013729333877563477, 0.014296531677246094, 0.014863729476928711, 0.015430927276611328, 0.015998125076293945, 0.016565322875976562, 0.01713252067565918, 0.017699718475341797, 0.018266916275024414, 0.01883411407470703, 0.01940131187438965, 0.019968509674072266, 0.020535707473754883, 0.0211029052734375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 7.0, 37.0, 76.0, 111.0, 177.0, 215.0, 166.0, 88.0, 61.0, 25.0, 16.0, 8.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1612666845321655, -1.1230378150939941, -1.0848090648651123, -1.046580195426941, -1.0083513259887695, -0.9701225757598877, -0.9318937063217163, -0.8936648964881897, -0.8554360866546631, -0.8172072768211365, -0.7789784669876099, -0.7407495975494385, -0.7025207877159119, -0.6642919778823853, -0.6260631084442139, -0.5878342986106873, -0.5496054887771606, -0.511376678943634, -0.47314783930778503, -0.43491899967193604, -0.3966901898384094, -0.3584613800048828, -0.3202325403690338, -0.2820037007331848, -0.2437748908996582, -0.2055460661649704, -0.1673172414302826, -0.1290884166955948, -0.09085959196090698, -0.05263076722621918, -0.014401942491531372, 0.023826897144317627, 0.06205570697784424, 0.10028453171253204, 0.13851335644721985, 0.17674218118190765, 0.21497100591659546, 0.25319981575012207, 0.29142865538597107, 0.32965749502182007, 0.3678863048553467, 0.4061151146888733, 0.4443439543247223, 0.4825727939605713, 0.5208016037940979, 0.5590304136276245, 0.5972592830657959, 0.6354880928993225, 0.6737169027328491, 0.7119457125663757, 0.7501745223999023, 0.7884033918380737, 0.8266322016716003, 0.864861011505127, 0.9030898809432983, 0.941318690776825, 0.9795475006103516, 1.017776370048523, 1.0560051202774048, 1.0942339897155762, 1.132462739944458, 1.1706916093826294, 1.2089204788208008, 1.2471492290496826, 1.285378098487854]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 11.0, 10.0, 11.0, 16.0, 15.0, 18.0, 16.0, 22.0, 22.0, 31.0, 30.0, 24.0, 44.0, 37.0, 36.0, 45.0, 47.0, 46.0, 47.0, 39.0, 36.0, 44.0, 48.0, 41.0, 18.0, 40.0, 25.0, 24.0, 26.0, 17.0, 16.0, 16.0, 11.0, 11.0, 13.0, 9.0, 5.0, 4.0, 4.0, 4.0, 7.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.3482048809528351, -0.3377043604850769, -0.3272038400173187, -0.31670331954956055, -0.30620282888412476, -0.2957023084163666, -0.2852017879486084, -0.2747012674808502, -0.26420074701309204, -0.25370022654533386, -0.24319970607757568, -0.2326992005109787, -0.22219868004322052, -0.21169815957546234, -0.20119765400886536, -0.19069713354110718, -0.180196613073349, -0.16969609260559082, -0.15919557213783264, -0.14869506657123566, -0.13819454610347748, -0.1276940256357193, -0.11719351261854172, -0.10669299960136414, -0.09619247913360596, -0.08569195866584778, -0.0751914456486702, -0.06469093263149261, -0.054190412163734436, -0.043689895421266556, -0.033189378678798676, -0.022688865661621094, -0.012188374996185303, -0.0016878582537174225, 0.008812658488750458, 0.019313175231218338, 0.029813691973686218, 0.0403142087161541, 0.05081472545862198, 0.06131523847579956, 0.07181575894355774, 0.08231627941131592, 0.0928167924284935, 0.10331730544567108, 0.11381782591342926, 0.12431834638118744, 0.13481885194778442, 0.1453193724155426, 0.15581989288330078, 0.16632041335105896, 0.17682093381881714, 0.18732143938541412, 0.1978219598531723, 0.20832248032093048, 0.21882298588752747, 0.22932350635528564, 0.23982402682304382, 0.250324547290802, 0.2608250677585602, 0.27132558822631836, 0.28182607889175415, 0.29232659935951233, 0.3028271198272705, 0.3133276402950287, 0.32382816076278687]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 2.0, 5.0, 5.0, 12.0, 19.0, 26.0, 58.0, 115.0, 646.0, 23300.0, 1011200.0, 12386.0, 535.0, 110.0, 43.0, 30.0, 11.0, 11.0, 12.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.267913818359375, -2.18817138671875, -2.108428955078125, -2.0286865234375, -1.948944091796875, -1.86920166015625, -1.789459228515625, -1.709716796875, -1.629974365234375, -1.55023193359375, -1.470489501953125, -1.3907470703125, -1.311004638671875, -1.23126220703125, -1.151519775390625, -1.07177734375, -0.992034912109375, -0.91229248046875, -0.832550048828125, -0.7528076171875, -0.673065185546875, -0.59332275390625, -0.513580322265625, -0.433837890625, -0.354095458984375, -0.27435302734375, -0.194610595703125, -0.1148681640625, -0.035125732421875, 0.04461669921875, 0.124359130859375, 0.2041015625, 0.283843994140625, 0.36358642578125, 0.443328857421875, 0.5230712890625, 0.602813720703125, 0.68255615234375, 0.762298583984375, 0.842041015625, 0.921783447265625, 1.00152587890625, 1.081268310546875, 1.1610107421875, 1.240753173828125, 1.32049560546875, 1.400238037109375, 1.47998046875, 1.559722900390625, 1.63946533203125, 1.719207763671875, 1.7989501953125, 1.878692626953125, 1.95843505859375, 2.038177490234375, 2.117919921875, 2.197662353515625, 2.27740478515625, 2.357147216796875, 2.4368896484375, 2.516632080078125, 2.59637451171875, 2.676116943359375, 2.755859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 12.0, 7.0, 15.0, 17.0, 30.0, 30.0, 50.0, 47.0, 62.0, 61.0, 81.0, 67.0, 86.0, 86.0, 71.0, 54.0, 53.0, 43.0, 32.0, 25.0, 15.0, 15.0, 16.0, 10.0, 8.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.583984375, -1.5479888916015625, -1.511993408203125, -1.4759979248046875, -1.44000244140625, -1.4040069580078125, -1.368011474609375, -1.3320159912109375, -1.2960205078125, -1.2600250244140625, -1.224029541015625, -1.1880340576171875, -1.15203857421875, -1.1160430908203125, -1.080047607421875, -1.0440521240234375, -1.008056640625, -0.9720611572265625, -0.936065673828125, -0.9000701904296875, -0.86407470703125, -0.8280792236328125, -0.792083740234375, -0.7560882568359375, -0.7200927734375, -0.6840972900390625, -0.648101806640625, -0.6121063232421875, -0.57611083984375, -0.5401153564453125, -0.504119873046875, -0.4681243896484375, -0.43212890625, -0.3961334228515625, -0.360137939453125, -0.3241424560546875, -0.28814697265625, -0.2521514892578125, -0.216156005859375, -0.1801605224609375, -0.1441650390625, -0.1081695556640625, -0.072174072265625, -0.0361785888671875, -0.00018310546875, 0.0358123779296875, 0.071807861328125, 0.1078033447265625, 0.143798828125, 0.1797943115234375, 0.215789794921875, 0.2517852783203125, 0.28778076171875, 0.3237762451171875, 0.359771728515625, 0.3957672119140625, 0.4317626953125, 0.4677581787109375, 0.503753662109375, 0.5397491455078125, 0.57574462890625, 0.6117401123046875, 0.647735595703125, 0.6837310791015625, 0.7197265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 8.0, 15.0, 17.0, 29.0, 33.0, 63.0, 73.0, 149.0, 201.0, 398.0, 953.0, 5971.0, 158974.0, 847629.0, 30258.0, 2413.0, 565.0, 280.0, 175.0, 113.0, 60.0, 54.0, 33.0, 33.0, 13.0, 15.0, 7.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1328125, -1.0954132080078125, -1.058013916015625, -1.0206146240234375, -0.98321533203125, -0.9458160400390625, -0.908416748046875, -0.8710174560546875, -0.8336181640625, -0.7962188720703125, -0.758819580078125, -0.7214202880859375, -0.68402099609375, -0.6466217041015625, -0.609222412109375, -0.5718231201171875, -0.534423828125, -0.4970245361328125, -0.459625244140625, -0.4222259521484375, -0.38482666015625, -0.3474273681640625, -0.310028076171875, -0.2726287841796875, -0.2352294921875, -0.1978302001953125, -0.160430908203125, -0.1230316162109375, -0.08563232421875, -0.0482330322265625, -0.010833740234375, 0.0265655517578125, 0.06396484375, 0.1013641357421875, 0.138763427734375, 0.1761627197265625, 0.21356201171875, 0.2509613037109375, 0.288360595703125, 0.3257598876953125, 0.3631591796875, 0.4005584716796875, 0.437957763671875, 0.4753570556640625, 0.51275634765625, 0.5501556396484375, 0.587554931640625, 0.6249542236328125, 0.662353515625, 0.6997528076171875, 0.737152099609375, 0.7745513916015625, 0.81195068359375, 0.8493499755859375, 0.886749267578125, 0.9241485595703125, 0.9615478515625, 0.9989471435546875, 1.036346435546875, 1.0737457275390625, 1.11114501953125, 1.1485443115234375, 1.185943603515625, 1.2233428955078125, 1.2607421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 5.0, 6.0, 8.0, 8.0, 8.0, 12.0, 15.0, 20.0, 31.0, 14.0, 20.0, 33.0, 39.0, 30.0, 39.0, 34.0, 48.0, 33.0, 48.0, 45.0, 59.0, 39.0, 44.0, 37.0, 45.0, 27.0, 28.0, 36.0, 29.0, 29.0, 19.0, 13.0, 18.0, 12.0, 13.0, 10.0, 6.0, 8.0, 12.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65771484375, -0.6344833374023438, -0.6112518310546875, -0.5880203247070312, -0.564788818359375, -0.5415573120117188, -0.5183258056640625, -0.49509429931640625, -0.47186279296875, -0.44863128662109375, -0.4253997802734375, -0.40216827392578125, -0.378936767578125, -0.35570526123046875, -0.3324737548828125, -0.30924224853515625, -0.2860107421875, -0.26277923583984375, -0.2395477294921875, -0.21631622314453125, -0.193084716796875, -0.16985321044921875, -0.1466217041015625, -0.12339019775390625, -0.10015869140625, -0.07692718505859375, -0.0536956787109375, -0.03046417236328125, -0.007232666015625, 0.01599884033203125, 0.0392303466796875, 0.06246185302734375, 0.085693359375, 0.10892486572265625, 0.1321563720703125, 0.15538787841796875, 0.178619384765625, 0.20185089111328125, 0.2250823974609375, 0.24831390380859375, 0.27154541015625, 0.29477691650390625, 0.3180084228515625, 0.34123992919921875, 0.364471435546875, 0.38770294189453125, 0.4109344482421875, 0.43416595458984375, 0.4573974609375, 0.48062896728515625, 0.5038604736328125, 0.5270919799804688, 0.550323486328125, 0.5735549926757812, 0.5967864990234375, 0.6200180053710938, 0.64324951171875, 0.6664810180664062, 0.6897125244140625, 0.7129440307617188, 0.736175537109375, 0.7594070434570312, 0.7826385498046875, 0.8058700561523438, 0.8291015625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 5.0, 9.0, 22.0, 49.0, 66.0, 140.0, 342.0, 1168.0, 6458.0, 102913.0, 868121.0, 62837.0, 4871.0, 995.0, 302.0, 111.0, 58.0, 27.0, 17.0, 10.0, 8.0, 6.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.350341796875, -0.33882904052734375, -0.3273162841796875, -0.31580352783203125, -0.304290771484375, -0.29277801513671875, -0.2812652587890625, -0.26975250244140625, -0.25823974609375, -0.24672698974609375, -0.2352142333984375, -0.22370147705078125, -0.212188720703125, -0.20067596435546875, -0.1891632080078125, -0.17765045166015625, -0.1661376953125, -0.15462493896484375, -0.1431121826171875, -0.13159942626953125, -0.120086669921875, -0.10857391357421875, -0.0970611572265625, -0.08554840087890625, -0.07403564453125, -0.06252288818359375, -0.0510101318359375, -0.03949737548828125, -0.027984619140625, -0.01647186279296875, -0.0049591064453125, 0.00655364990234375, 0.01806640625, 0.02957916259765625, 0.0410919189453125, 0.05260467529296875, 0.064117431640625, 0.07563018798828125, 0.0871429443359375, 0.09865570068359375, 0.11016845703125, 0.12168121337890625, 0.1331939697265625, 0.14470672607421875, 0.156219482421875, 0.16773223876953125, 0.1792449951171875, 0.19075775146484375, 0.2022705078125, 0.21378326416015625, 0.2252960205078125, 0.23680877685546875, 0.248321533203125, 0.25983428955078125, 0.2713470458984375, 0.28285980224609375, 0.29437255859375, 0.30588531494140625, 0.3173980712890625, 0.32891082763671875, 0.340423583984375, 0.35193634033203125, 0.3634490966796875, 0.37496185302734375, 0.386474609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 6.0, 14.0, 15.0, 23.0, 20.0, 47.0, 49.0, 58.0, 62.0, 102.0, 93.0, 86.0, 94.0, 77.0, 62.0, 36.0, 36.0, 25.0, 21.0, 19.0, 9.0, 16.0, 3.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8014183044433594e-05, -2.721603959798813e-05, -2.6417896151542664e-05, -2.56197527050972e-05, -2.4821609258651733e-05, -2.402346581220627e-05, -2.3225322365760803e-05, -2.2427178919315338e-05, -2.1629035472869873e-05, -2.0830892026424408e-05, -2.0032748579978943e-05, -1.9234605133533478e-05, -1.8436461687088013e-05, -1.7638318240642548e-05, -1.6840174794197083e-05, -1.6042031347751617e-05, -1.5243887901306152e-05, -1.4445744454860687e-05, -1.3647601008415222e-05, -1.2849457561969757e-05, -1.2051314115524292e-05, -1.1253170669078827e-05, -1.0455027222633362e-05, -9.656883776187897e-06, -8.858740329742432e-06, -8.060596883296967e-06, -7.2624534368515015e-06, -6.464309990406036e-06, -5.666166543960571e-06, -4.868023097515106e-06, -4.069879651069641e-06, -3.271736204624176e-06, -2.473592758178711e-06, -1.6754493117332458e-06, -8.773058652877808e-07, -7.916241884231567e-08, 7.189810276031494e-07, 1.5171244740486145e-06, 2.3152679204940796e-06, 3.1134113669395447e-06, 3.91155481338501e-06, 4.709698259830475e-06, 5.50784170627594e-06, 6.305985152721405e-06, 7.10412859916687e-06, 7.902272045612335e-06, 8.7004154920578e-06, 9.498558938503265e-06, 1.029670238494873e-05, 1.1094845831394196e-05, 1.189298927783966e-05, 1.2691132724285126e-05, 1.348927617073059e-05, 1.4287419617176056e-05, 1.5085563063621521e-05, 1.5883706510066986e-05, 1.668184995651245e-05, 1.7479993402957916e-05, 1.827813684940338e-05, 1.9076280295848846e-05, 1.987442374229431e-05, 2.0672567188739777e-05, 2.1470710635185242e-05, 2.2268854081630707e-05, 2.3066997528076172e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 16.0, 21.0, 53.0, 73.0, 145.0, 378.0, 1572.0, 13677.0, 599576.0, 421089.0, 10002.0, 1263.0, 362.0, 130.0, 84.0, 37.0, 18.0, 21.0, 13.0, 7.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.454833984375, -0.4405975341796875, -0.426361083984375, -0.4121246337890625, -0.39788818359375, -0.3836517333984375, -0.369415283203125, -0.3551788330078125, -0.3409423828125, -0.3267059326171875, -0.312469482421875, -0.2982330322265625, -0.28399658203125, -0.2697601318359375, -0.255523681640625, -0.2412872314453125, -0.22705078125, -0.2128143310546875, -0.198577880859375, -0.1843414306640625, -0.17010498046875, -0.1558685302734375, -0.141632080078125, -0.1273956298828125, -0.1131591796875, -0.0989227294921875, -0.084686279296875, -0.0704498291015625, -0.05621337890625, -0.0419769287109375, -0.027740478515625, -0.0135040283203125, 0.000732421875, 0.0149688720703125, 0.029205322265625, 0.0434417724609375, 0.05767822265625, 0.0719146728515625, 0.086151123046875, 0.1003875732421875, 0.1146240234375, 0.1288604736328125, 0.143096923828125, 0.1573333740234375, 0.17156982421875, 0.1858062744140625, 0.200042724609375, 0.2142791748046875, 0.228515625, 0.2427520751953125, 0.256988525390625, 0.2712249755859375, 0.28546142578125, 0.2996978759765625, 0.313934326171875, 0.3281707763671875, 0.3424072265625, 0.3566436767578125, 0.370880126953125, 0.3851165771484375, 0.39935302734375, 0.4135894775390625, 0.427825927734375, 0.4420623779296875, 0.456298828125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 11.0, 15.0, 16.0, 26.0, 37.0, 80.0, 111.0, 150.0, 135.0, 137.0, 109.0, 57.0, 35.0, 26.0, 13.0, 9.0, 12.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13623046875, -0.13201522827148438, -0.12779998779296875, -0.12358474731445312, -0.1193695068359375, -0.11515426635742188, -0.11093902587890625, -0.10672378540039062, -0.102508544921875, -0.09829330444335938, -0.09407806396484375, -0.08986282348632812, -0.0856475830078125, -0.08143234252929688, -0.07721710205078125, -0.07300186157226562, -0.06878662109375, -0.06457138061523438, -0.06035614013671875, -0.056140899658203125, -0.0519256591796875, -0.047710418701171875, -0.04349517822265625, -0.039279937744140625, -0.035064697265625, -0.030849456787109375, -0.02663421630859375, -0.022418975830078125, -0.0182037353515625, -0.013988494873046875, -0.00977325439453125, -0.005558013916015625, -0.0013427734375, 0.002872467041015625, 0.00708770751953125, 0.011302947998046875, 0.0155181884765625, 0.019733428955078125, 0.02394866943359375, 0.028163909912109375, 0.032379150390625, 0.036594390869140625, 0.04080963134765625, 0.045024871826171875, 0.0492401123046875, 0.053455352783203125, 0.05767059326171875, 0.061885833740234375, 0.06610107421875, 0.07031631469726562, 0.07453155517578125, 0.07874679565429688, 0.0829620361328125, 0.08717727661132812, 0.09139251708984375, 0.09560775756835938, 0.099822998046875, 0.10403823852539062, 0.10825347900390625, 0.11246871948242188, 0.1166839599609375, 0.12089920043945312, 0.12511444091796875, 0.12932968139648438, 0.133544921875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 11.0, 17.0, 59.0, 162.0, 261.0, 250.0, 145.0, 70.0, 18.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.296754240989685, -1.188986897468567, -1.0812195539474487, -0.9734522104263306, -0.8656848669052124, -0.757917582988739, -0.6501502394676208, -0.5423828959465027, -0.4346155524253845, -0.32684820890426636, -0.2190808802843094, -0.11131355166435242, -0.003546208143234253, 0.10422110557556152, 0.2119884490966797, 0.31975579261779785, 0.427523136138916, 0.5352904796600342, 0.6430578231811523, 0.7508251667022705, 0.8585925102233887, 0.9663597941398621, 1.074127197265625, 1.1818945407867432, 1.2896618843078613, 1.3974292278289795, 1.5051965713500977, 1.6129639148712158, 1.720731258392334, 1.8284986019134521, 1.9362659454345703, 2.0440332889556885, 2.1518003940582275, 2.2595677375793457, 2.367335081100464, 2.475102424621582, 2.5828697681427, 2.6906371116638184, 2.7984044551849365, 2.9061717987060547, 3.013939142227173, 3.121706485748291, 3.229473829269409, 3.3372411727905273, 3.4450085163116455, 3.5527758598327637, 3.660543203353882, 3.768310546875, 3.876077651977539, 3.9838449954986572, 4.091612339019775, 4.1993794441223145, 4.307147026062012, 4.414914131164551, 4.522681713104248, 4.630448818206787, 4.738216400146484, 4.845983505249023, 4.953751087188721, 5.06151819229126, 5.169285774230957, 5.277052879333496, 5.384820461273193, 5.492587566375732, 5.60035514831543]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 1.0, 2.0, 4.0, 7.0, 8.0, 8.0, 8.0, 9.0, 14.0, 18.0, 10.0, 16.0, 17.0, 26.0, 20.0, 33.0, 20.0, 22.0, 35.0, 32.0, 35.0, 29.0, 38.0, 37.0, 42.0, 25.0, 37.0, 31.0, 38.0, 28.0, 33.0, 27.0, 30.0, 28.0, 29.0, 28.0, 22.0, 19.0, 16.0, 23.0, 8.0, 16.0, 13.0, 16.0, 8.0, 8.0, 7.0, 5.0, 8.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.0631518363952637, -1.030463457107544, -0.997775137424469, -0.965086817741394, -0.9323984980583191, -0.8997101783752441, -0.8670217990875244, -0.8343334794044495, -0.8016451597213745, -0.7689568400382996, -0.7362684607505798, -0.7035801410675049, -0.6708918213844299, -0.638203501701355, -0.6055151224136353, -0.5728268027305603, -0.5401384234428406, -0.5074501037597656, -0.4747617542743683, -0.44207340478897095, -0.409385085105896, -0.37669673562049866, -0.3440083861351013, -0.31132006645202637, -0.27863171696662903, -0.24594338238239288, -0.21325504779815674, -0.1805666983127594, -0.14787836372852325, -0.11519002914428711, -0.08250167965888977, -0.049813345074653625, -0.01712501049041748, 0.015563327819108963, 0.048251666128635406, 0.08094000816345215, 0.1136283427476883, 0.14631667733192444, 0.17900502681732178, 0.21169336140155792, 0.24438169598579407, 0.2770700454711914, 0.30975836515426636, 0.3424467146396637, 0.37513506412506104, 0.407823383808136, 0.4405117332935333, 0.47320008277893066, 0.5058884024620056, 0.5385767221450806, 0.5712651014328003, 0.6039534211158752, 0.6366417407989502, 0.6693301200866699, 0.7020184397697449, 0.7347067594528198, 0.7673951387405396, 0.8000834584236145, 0.8327718377113342, 0.8654601573944092, 0.8981484770774841, 0.9308367967605591, 0.9635251760482788, 0.9962134957313538, 1.0289018154144287]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 8.0, 10.0, 12.0, 23.0, 27.0, 40.0, 50.0, 101.0, 170.0, 342.0, 731.0, 1840.0, 5588.0, 24023.0, 164897.0, 1318892.0, 2248435.0, 370262.0, 44723.0, 9080.0, 2751.0, 1136.0, 530.0, 234.0, 137.0, 90.0, 54.0, 25.0, 27.0, 13.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.84130859375, -0.8159637451171875, -0.790618896484375, -0.7652740478515625, -0.73992919921875, -0.7145843505859375, -0.689239501953125, -0.6638946533203125, -0.6385498046875, -0.6132049560546875, -0.587860107421875, -0.5625152587890625, -0.53717041015625, -0.5118255615234375, -0.486480712890625, -0.4611358642578125, -0.435791015625, -0.4104461669921875, -0.385101318359375, -0.3597564697265625, -0.33441162109375, -0.3090667724609375, -0.283721923828125, -0.2583770751953125, -0.2330322265625, -0.2076873779296875, -0.182342529296875, -0.1569976806640625, -0.13165283203125, -0.1063079833984375, -0.080963134765625, -0.0556182861328125, -0.0302734375, -0.0049285888671875, 0.020416259765625, 0.0457611083984375, 0.07110595703125, 0.0964508056640625, 0.121795654296875, 0.1471405029296875, 0.1724853515625, 0.1978302001953125, 0.223175048828125, 0.2485198974609375, 0.27386474609375, 0.2992095947265625, 0.324554443359375, 0.3498992919921875, 0.375244140625, 0.4005889892578125, 0.425933837890625, 0.4512786865234375, 0.47662353515625, 0.5019683837890625, 0.527313232421875, 0.5526580810546875, 0.5780029296875, 0.6033477783203125, 0.628692626953125, 0.6540374755859375, 0.67938232421875, 0.7047271728515625, 0.730072021484375, 0.7554168701171875, 0.78076171875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 8.0, 15.0, 8.0, 13.0, 20.0, 28.0, 27.0, 26.0, 29.0, 43.0, 42.0, 36.0, 41.0, 35.0, 48.0, 43.0, 56.0, 51.0, 44.0, 36.0, 37.0, 31.0, 36.0, 24.0, 33.0, 23.0, 26.0, 19.0, 19.0, 19.0, 12.0, 12.0, 15.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.54052734375, -0.5247230529785156, -0.5089187622070312, -0.4931144714355469, -0.4773101806640625, -0.4615058898925781, -0.44570159912109375, -0.4298973083496094, -0.414093017578125, -0.3982887268066406, -0.38248443603515625, -0.3666801452636719, -0.3508758544921875, -0.3350715637207031, -0.31926727294921875, -0.3034629821777344, -0.28765869140625, -0.2718544006347656, -0.25605010986328125, -0.24024581909179688, -0.2244415283203125, -0.20863723754882812, -0.19283294677734375, -0.17702865600585938, -0.161224365234375, -0.14542007446289062, -0.12961578369140625, -0.11381149291992188, -0.0980072021484375, -0.08220291137695312, -0.06639862060546875, -0.050594329833984375, -0.0347900390625, -0.018985748291015625, -0.00318145751953125, 0.012622833251953125, 0.0284271240234375, 0.044231414794921875, 0.06003570556640625, 0.07583999633789062, 0.091644287109375, 0.10744857788085938, 0.12325286865234375, 0.13905715942382812, 0.1548614501953125, 0.17066574096679688, 0.18647003173828125, 0.20227432250976562, 0.21807861328125, 0.23388290405273438, 0.24968719482421875, 0.2654914855957031, 0.2812957763671875, 0.2971000671386719, 0.31290435791015625, 0.3287086486816406, 0.344512939453125, 0.3603172302246094, 0.37612152099609375, 0.3919258117675781, 0.4077301025390625, 0.4235343933105469, 0.43933868408203125, 0.4551429748535156, 0.470947265625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 9.0, 13.0, 17.0, 37.0, 61.0, 92.0, 178.0, 406.0, 1034.0, 3843.0, 29642.0, 1999498.0, 2123261.0, 30626.0, 3761.0, 1019.0, 378.0, 189.0, 74.0, 57.0, 27.0, 20.0, 12.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.677734375, -1.6335906982421875, -1.589447021484375, -1.5453033447265625, -1.50115966796875, -1.4570159912109375, -1.412872314453125, -1.3687286376953125, -1.3245849609375, -1.2804412841796875, -1.236297607421875, -1.1921539306640625, -1.14801025390625, -1.1038665771484375, -1.059722900390625, -1.0155792236328125, -0.971435546875, -0.9272918701171875, -0.883148193359375, -0.8390045166015625, -0.79486083984375, -0.7507171630859375, -0.706573486328125, -0.6624298095703125, -0.6182861328125, -0.5741424560546875, -0.529998779296875, -0.4858551025390625, -0.44171142578125, -0.3975677490234375, -0.353424072265625, -0.3092803955078125, -0.26513671875, -0.2209930419921875, -0.176849365234375, -0.1327056884765625, -0.08856201171875, -0.0444183349609375, -0.000274658203125, 0.0438690185546875, 0.0880126953125, 0.1321563720703125, 0.176300048828125, 0.2204437255859375, 0.26458740234375, 0.3087310791015625, 0.352874755859375, 0.3970184326171875, 0.441162109375, 0.4853057861328125, 0.529449462890625, 0.5735931396484375, 0.61773681640625, 0.6618804931640625, 0.706024169921875, 0.7501678466796875, 0.7943115234375, 0.8384552001953125, 0.882598876953125, 0.9267425537109375, 0.97088623046875, 1.0150299072265625, 1.059173583984375, 1.1033172607421875, 1.1474609375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 10.0, 8.0, 16.0, 28.0, 38.0, 50.0, 98.0, 180.0, 373.0, 647.0, 868.0, 744.0, 441.0, 257.0, 130.0, 82.0, 34.0, 31.0, 13.0, 17.0, 5.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24622344970703125, -0.2348785400390625, -0.22353363037109375, -0.212188720703125, -0.20084381103515625, -0.1894989013671875, -0.17815399169921875, -0.16680908203125, -0.15546417236328125, -0.1441192626953125, -0.13277435302734375, -0.121429443359375, -0.11008453369140625, -0.0987396240234375, -0.08739471435546875, -0.0760498046875, -0.06470489501953125, -0.0533599853515625, -0.04201507568359375, -0.030670166015625, -0.01932525634765625, -0.0079803466796875, 0.00336456298828125, 0.01470947265625, 0.02605438232421875, 0.0373992919921875, 0.04874420166015625, 0.060089111328125, 0.07143402099609375, 0.0827789306640625, 0.09412384033203125, 0.10546875, 0.11681365966796875, 0.1281585693359375, 0.13950347900390625, 0.150848388671875, 0.16219329833984375, 0.1735382080078125, 0.18488311767578125, 0.19622802734375, 0.20757293701171875, 0.2189178466796875, 0.23026275634765625, 0.241607666015625, 0.25295257568359375, 0.2642974853515625, 0.27564239501953125, 0.2869873046875, 0.29833221435546875, 0.3096771240234375, 0.32102203369140625, 0.332366943359375, 0.34371185302734375, 0.3550567626953125, 0.36640167236328125, 0.37774658203125, 0.38909149169921875, 0.4004364013671875, 0.41178131103515625, 0.423126220703125, 0.43447113037109375, 0.4458160400390625, 0.45716094970703125, 0.468505859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 5.0, 6.0, 9.0, 10.0, 22.0, 45.0, 58.0, 79.0, 113.0, 157.0, 121.0, 124.0, 86.0, 65.0, 52.0, 24.0, 12.0, 10.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.157740831375122, -1.1151161193847656, -1.0724912881851196, -1.0298665761947632, -0.987241804599762, -0.9446170330047607, -0.9019922614097595, -0.8593674898147583, -0.8167427778244019, -0.7741180062294006, -0.7314932346343994, -0.688868522644043, -0.6462437510490417, -0.6036189794540405, -0.5609942078590393, -0.5183694362640381, -0.47574466466903687, -0.43311989307403564, -0.3904951512813568, -0.3478703796863556, -0.30524563789367676, -0.26262086629867554, -0.21999609470367432, -0.17737135291099548, -0.13474658131599426, -0.09212182462215424, -0.04949706047773361, -0.006872296333312988, 0.03575246036052704, 0.07837721705436707, 0.12100198864936829, 0.16362673044204712, 0.20625150203704834, 0.24887625873088837, 0.2915010154247284, 0.3341257870197296, 0.37675052881240845, 0.41937530040740967, 0.4620000720024109, 0.5046248435974121, 0.5472495555877686, 0.5898743271827698, 0.632499098777771, 0.6751238107681274, 0.7177485823631287, 0.7603733539581299, 0.8029981255531311, 0.8456228971481323, 0.8882476687431335, 0.9308724403381348, 0.973497211933136, 1.0161219835281372, 1.0587466955184937, 1.1013715267181396, 1.143996238708496, 1.1866209506988525, 1.2292457818984985, 1.271870493888855, 1.314495325088501, 1.3571200370788574, 1.3997448682785034, 1.4423695802688599, 1.4849944114685059, 1.5276191234588623, 1.5702438354492188]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 4.0, 6.0, 13.0, 13.0, 18.0, 16.0, 14.0, 15.0, 11.0, 29.0, 25.0, 34.0, 27.0, 25.0, 44.0, 37.0, 49.0, 36.0, 51.0, 37.0, 45.0, 35.0, 36.0, 36.0, 24.0, 39.0, 35.0, 32.0, 32.0, 26.0, 19.0, 14.0, 19.0, 9.0, 16.0, 18.0, 14.0, 10.0, 7.0, 4.0, 5.0, 6.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5457444787025452, -0.5296576619148254, -0.5135709047317505, -0.49748408794403076, -0.48139727115631104, -0.4653104841709137, -0.44922369718551636, -0.43313688039779663, -0.4170500934123993, -0.40096330642700195, -0.3848764896392822, -0.3687897026538849, -0.35270291566848755, -0.3366160988807678, -0.3205293118953705, -0.30444252490997314, -0.2883557081222534, -0.2722689211368561, -0.25618210434913635, -0.240095317363739, -0.22400851547718048, -0.20792171359062195, -0.1918349266052246, -0.17574812471866608, -0.15966132283210754, -0.143574520945549, -0.12748771905899048, -0.11140093207359314, -0.0953141301870346, -0.07922732830047607, -0.06314053386449814, -0.0470537394285202, -0.030966997146606445, -0.014880198985338211, 0.0012065991759300232, 0.017293397337198257, 0.03338019549846649, 0.049466997385025024, 0.06555379182100296, 0.0816405862569809, 0.09772738814353943, 0.11381419003009796, 0.1299009919166565, 0.14598777890205383, 0.16207458078861237, 0.1781613826751709, 0.19424816966056824, 0.21033497154712677, 0.2264217734336853, 0.24250857532024384, 0.25859537720680237, 0.2746821641921997, 0.29076898097991943, 0.3068557679653168, 0.3229425549507141, 0.33902937173843384, 0.3551161587238312, 0.3712029457092285, 0.38728976249694824, 0.4033765494823456, 0.4194633364677429, 0.43555015325546265, 0.45163694024086, 0.4677237272262573, 0.48381054401397705]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 9.0, 8.0, 10.0, 16.0, 31.0, 45.0, 75.0, 122.0, 289.0, 765.0, 2631.0, 9783.0, 47223.0, 241313.0, 515732.0, 184080.0, 35484.0, 7617.0, 2140.0, 654.0, 244.0, 100.0, 59.0, 35.0, 18.0, 22.0, 17.0, 8.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.132659912109375, -0.12799072265625, -0.123321533203125, -0.11865234375, -0.113983154296875, -0.10931396484375, -0.104644775390625, -0.0999755859375, -0.095306396484375, -0.09063720703125, -0.085968017578125, -0.081298828125, -0.076629638671875, -0.07196044921875, -0.067291259765625, -0.0626220703125, -0.057952880859375, -0.05328369140625, -0.048614501953125, -0.0439453125, -0.039276123046875, -0.03460693359375, -0.029937744140625, -0.0252685546875, -0.020599365234375, -0.01593017578125, -0.011260986328125, -0.006591796875, -0.001922607421875, 0.00274658203125, 0.007415771484375, 0.0120849609375, 0.016754150390625, 0.02142333984375, 0.026092529296875, 0.03076171875, 0.035430908203125, 0.04010009765625, 0.044769287109375, 0.0494384765625, 0.054107666015625, 0.05877685546875, 0.063446044921875, 0.068115234375, 0.072784423828125, 0.07745361328125, 0.082122802734375, 0.0867919921875, 0.091461181640625, 0.09613037109375, 0.100799560546875, 0.10546875, 0.110137939453125, 0.11480712890625, 0.119476318359375, 0.1241455078125, 0.128814697265625, 0.13348388671875, 0.138153076171875, 0.142822265625, 0.147491455078125, 0.15216064453125, 0.156829833984375, 0.1614990234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 8.0, 8.0, 12.0, 11.0, 24.0, 26.0, 20.0, 24.0, 26.0, 40.0, 35.0, 43.0, 53.0, 65.0, 48.0, 59.0, 61.0, 40.0, 48.0, 41.0, 43.0, 47.0, 31.0, 38.0, 23.0, 19.0, 16.0, 22.0, 21.0, 9.0, 12.0, 7.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.44384765625, -0.4308204650878906, -0.41779327392578125, -0.4047660827636719, -0.3917388916015625, -0.3787117004394531, -0.36568450927734375, -0.3526573181152344, -0.339630126953125, -0.3266029357910156, -0.31357574462890625, -0.3005485534667969, -0.2875213623046875, -0.2744941711425781, -0.26146697998046875, -0.24843978881835938, -0.23541259765625, -0.22238540649414062, -0.20935821533203125, -0.19633102416992188, -0.1833038330078125, -0.17027664184570312, -0.15724945068359375, -0.14422225952148438, -0.131195068359375, -0.11816787719726562, -0.10514068603515625, -0.09211349487304688, -0.0790863037109375, -0.06605911254882812, -0.05303192138671875, -0.040004730224609375, -0.0269775390625, -0.013950347900390625, -0.00092315673828125, 0.012104034423828125, 0.0251312255859375, 0.038158416748046875, 0.05118560791015625, 0.06421279907226562, 0.077239990234375, 0.09026718139648438, 0.10329437255859375, 0.11632156372070312, 0.1293487548828125, 0.14237594604492188, 0.15540313720703125, 0.16843032836914062, 0.18145751953125, 0.19448471069335938, 0.20751190185546875, 0.22053909301757812, 0.2335662841796875, 0.24659347534179688, 0.25962066650390625, 0.2726478576660156, 0.285675048828125, 0.2987022399902344, 0.31172943115234375, 0.3247566223144531, 0.3377838134765625, 0.3508110046386719, 0.36383819580078125, 0.3768653869628906, 0.389892578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 11.0, 20.0, 17.0, 15.0, 39.0, 41.0, 61.0, 108.0, 146.0, 211.0, 408.0, 706.0, 1524.0, 3720.0, 9859.0, 29533.0, 92137.0, 246128.0, 350523.0, 205045.0, 71917.0, 22911.0, 7794.0, 2877.0, 1265.0, 569.0, 344.0, 199.0, 127.0, 86.0, 64.0, 48.0, 36.0, 21.0, 15.0, 7.0, 11.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09136962890625, -0.08854866027832031, -0.08572769165039062, -0.08290672302246094, -0.08008575439453125, -0.07726478576660156, -0.07444381713867188, -0.07162284851074219, -0.0688018798828125, -0.06598091125488281, -0.06315994262695312, -0.06033897399902344, -0.05751800537109375, -0.05469703674316406, -0.051876068115234375, -0.04905509948730469, -0.046234130859375, -0.04341316223144531, -0.040592193603515625, -0.03777122497558594, -0.03495025634765625, -0.03212928771972656, -0.029308319091796875, -0.026487350463867188, -0.0236663818359375, -0.020845413208007812, -0.018024444580078125, -0.015203475952148438, -0.01238250732421875, -0.009561538696289062, -0.006740570068359375, -0.0039196014404296875, -0.0010986328125, 0.0017223358154296875, 0.004543304443359375, 0.0073642730712890625, 0.01018524169921875, 0.013006210327148438, 0.015827178955078125, 0.018648147583007812, 0.0214691162109375, 0.024290084838867188, 0.027111053466796875, 0.029932022094726562, 0.03275299072265625, 0.03557395935058594, 0.038394927978515625, 0.04121589660644531, 0.044036865234375, 0.04685783386230469, 0.049678802490234375, 0.05249977111816406, 0.05532073974609375, 0.05814170837402344, 0.060962677001953125, 0.06378364562988281, 0.0666046142578125, 0.06942558288574219, 0.07224655151367188, 0.07506752014160156, 0.07788848876953125, 0.08070945739746094, 0.08353042602539062, 0.08635139465332031, 0.08917236328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 5.0, 6.0, 9.0, 12.0, 14.0, 14.0, 18.0, 15.0, 27.0, 22.0, 29.0, 22.0, 38.0, 52.0, 36.0, 53.0, 47.0, 43.0, 42.0, 54.0, 53.0, 42.0, 38.0, 34.0, 41.0, 34.0, 31.0, 23.0, 20.0, 21.0, 20.0, 19.0, 10.0, 15.0, 12.0, 6.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69677734375, -0.6744918823242188, -0.6522064208984375, -0.6299209594726562, -0.607635498046875, -0.5853500366210938, -0.5630645751953125, -0.5407791137695312, -0.51849365234375, -0.49620819091796875, -0.4739227294921875, -0.45163726806640625, -0.429351806640625, -0.40706634521484375, -0.3847808837890625, -0.36249542236328125, -0.3402099609375, -0.31792449951171875, -0.2956390380859375, -0.27335357666015625, -0.251068115234375, -0.22878265380859375, -0.2064971923828125, -0.18421173095703125, -0.16192626953125, -0.13964080810546875, -0.1173553466796875, -0.09506988525390625, -0.072784423828125, -0.05049896240234375, -0.0282135009765625, -0.00592803955078125, 0.016357421875, 0.03864288330078125, 0.0609283447265625, 0.08321380615234375, 0.105499267578125, 0.12778472900390625, 0.1500701904296875, 0.17235565185546875, 0.19464111328125, 0.21692657470703125, 0.2392120361328125, 0.26149749755859375, 0.283782958984375, 0.30606842041015625, 0.3283538818359375, 0.35063934326171875, 0.3729248046875, 0.39521026611328125, 0.4174957275390625, 0.43978118896484375, 0.462066650390625, 0.48435211181640625, 0.5066375732421875, 0.5289230346679688, 0.55120849609375, 0.5734939575195312, 0.5957794189453125, 0.6180648803710938, 0.640350341796875, 0.6626358032226562, 0.6849212646484375, 0.7072067260742188, 0.7294921875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 9.0, 9.0, 21.0, 20.0, 34.0, 71.0, 135.0, 171.0, 271.0, 475.0, 957.0, 1896.0, 4547.0, 14045.0, 58106.0, 283479.0, 496991.0, 142935.0, 30054.0, 8158.0, 2990.0, 1377.0, 681.0, 427.0, 275.0, 133.0, 90.0, 56.0, 47.0, 23.0, 15.0, 5.0, 12.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.047760009765625, -0.0462803840637207, -0.044800758361816406, -0.04332113265991211, -0.04184150695800781, -0.040361881256103516, -0.03888225555419922, -0.03740262985229492, -0.035923004150390625, -0.03444337844848633, -0.03296375274658203, -0.031484127044677734, -0.030004501342773438, -0.02852487564086914, -0.027045249938964844, -0.025565624237060547, -0.02408599853515625, -0.022606372833251953, -0.021126747131347656, -0.01964712142944336, -0.018167495727539062, -0.016687870025634766, -0.015208244323730469, -0.013728618621826172, -0.012248992919921875, -0.010769367218017578, -0.009289741516113281, -0.007810115814208984, -0.0063304901123046875, -0.004850864410400391, -0.0033712387084960938, -0.0018916130065917969, -0.0004119873046875, 0.0010676383972167969, 0.0025472640991210938, 0.004026889801025391, 0.0055065155029296875, 0.006986141204833984, 0.008465766906738281, 0.009945392608642578, 0.011425018310546875, 0.012904644012451172, 0.014384269714355469, 0.015863895416259766, 0.017343521118164062, 0.01882314682006836, 0.020302772521972656, 0.021782398223876953, 0.02326202392578125, 0.024741649627685547, 0.026221275329589844, 0.02770090103149414, 0.029180526733398438, 0.030660152435302734, 0.03213977813720703, 0.03361940383911133, 0.035099029541015625, 0.03657865524291992, 0.03805828094482422, 0.039537906646728516, 0.04101753234863281, 0.04249715805053711, 0.043976783752441406, 0.0454564094543457, 0.04693603515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 4.0, 10.0, 8.0, 15.0, 24.0, 23.0, 26.0, 30.0, 36.0, 59.0, 69.0, 86.0, 85.0, 63.0, 90.0, 80.0, 54.0, 56.0, 39.0, 36.0, 20.0, 21.0, 21.0, 14.0, 11.0, 4.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5079975128173828e-05, -1.4600344002246857e-05, -1.4120712876319885e-05, -1.3641081750392914e-05, -1.3161450624465942e-05, -1.2681819498538971e-05, -1.2202188372612e-05, -1.1722557246685028e-05, -1.1242926120758057e-05, -1.0763294994831085e-05, -1.0283663868904114e-05, -9.804032742977142e-06, -9.324401617050171e-06, -8.8447704911232e-06, -8.365139365196228e-06, -7.885508239269257e-06, -7.405877113342285e-06, -6.926245987415314e-06, -6.446614861488342e-06, -5.966983735561371e-06, -5.487352609634399e-06, -5.007721483707428e-06, -4.5280903577804565e-06, -4.048459231853485e-06, -3.5688281059265137e-06, -3.0891969799995422e-06, -2.609565854072571e-06, -2.1299347281455994e-06, -1.650303602218628e-06, -1.1706724762916565e-06, -6.910413503646851e-07, -2.1141022443771362e-07, 2.682209014892578e-07, 7.478520274162292e-07, 1.2274831533432007e-06, 1.7071142792701721e-06, 2.1867454051971436e-06, 2.666376531124115e-06, 3.1460076570510864e-06, 3.625638782978058e-06, 4.105269908905029e-06, 4.584901034832001e-06, 5.064532160758972e-06, 5.544163286685944e-06, 6.023794412612915e-06, 6.5034255385398865e-06, 6.983056664466858e-06, 7.462687790393829e-06, 7.9423189163208e-06, 8.421950042247772e-06, 8.901581168174744e-06, 9.381212294101715e-06, 9.860843420028687e-06, 1.0340474545955658e-05, 1.082010567188263e-05, 1.12997367978096e-05, 1.1779367923736572e-05, 1.2258999049663544e-05, 1.2738630175590515e-05, 1.3218261301517487e-05, 1.3697892427444458e-05, 1.417752355337143e-05, 1.4657154679298401e-05, 1.5136785805225372e-05, 1.5616416931152344e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 1.0, 3.0, 3.0, 8.0, 10.0, 13.0, 15.0, 16.0, 27.0, 29.0, 39.0, 69.0, 93.0, 147.0, 282.0, 600.0, 1656.0, 5938.0, 29942.0, 217383.0, 615588.0, 147934.0, 21644.0, 4651.0, 1289.0, 501.0, 254.0, 125.0, 78.0, 53.0, 41.0, 34.0, 29.0, 13.0, 13.0, 9.0, 4.0, 5.0, 8.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.08038330078125, -0.07823419570922852, -0.07608509063720703, -0.07393598556518555, -0.07178688049316406, -0.06963777542114258, -0.0674886703491211, -0.06533956527709961, -0.06319046020507812, -0.06104135513305664, -0.058892250061035156, -0.05674314498901367, -0.05459403991699219, -0.0524449348449707, -0.05029582977294922, -0.048146724700927734, -0.04599761962890625, -0.043848514556884766, -0.04169940948486328, -0.0395503044128418, -0.03740119934082031, -0.03525209426879883, -0.033102989196777344, -0.03095388412475586, -0.028804779052734375, -0.02665567398071289, -0.024506568908691406, -0.022357463836669922, -0.020208358764648438, -0.018059253692626953, -0.01591014862060547, -0.013761043548583984, -0.0116119384765625, -0.009462833404541016, -0.007313728332519531, -0.005164623260498047, -0.0030155181884765625, -0.0008664131164550781, 0.0012826919555664062, 0.0034317970275878906, 0.005580902099609375, 0.007730007171630859, 0.009879112243652344, 0.012028217315673828, 0.014177322387695312, 0.016326427459716797, 0.01847553253173828, 0.020624637603759766, 0.02277374267578125, 0.024922847747802734, 0.02707195281982422, 0.029221057891845703, 0.03137016296386719, 0.03351926803588867, 0.035668373107910156, 0.03781747817993164, 0.039966583251953125, 0.04211568832397461, 0.044264793395996094, 0.04641389846801758, 0.04856300354003906, 0.05071210861206055, 0.05286121368408203, 0.055010318756103516, 0.057159423828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 4.0, 14.0, 19.0, 11.0, 10.0, 14.0, 30.0, 32.0, 41.0, 65.0, 64.0, 83.0, 99.0, 78.0, 68.0, 59.0, 59.0, 37.0, 47.0, 36.0, 21.0, 29.0, 13.0, 9.0, 7.0, 10.0, 7.0, 3.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0118408203125, -0.011399984359741211, -0.010959148406982422, -0.010518312454223633, -0.010077476501464844, -0.009636640548706055, -0.009195804595947266, -0.008754968643188477, -0.008314132690429688, -0.007873296737670898, -0.007432460784912109, -0.00699162483215332, -0.006550788879394531, -0.006109952926635742, -0.005669116973876953, -0.005228281021118164, -0.004787445068359375, -0.004346609115600586, -0.003905773162841797, -0.003464937210083008, -0.0030241012573242188, -0.0025832653045654297, -0.0021424293518066406, -0.0017015933990478516, -0.0012607574462890625, -0.0008199214935302734, -0.0003790855407714844, 6.175041198730469e-05, 0.0005025863647460938, 0.0009434223175048828, 0.0013842582702636719, 0.001825094223022461, 0.00226593017578125, 0.002706766128540039, 0.003147602081298828, 0.003588438034057617, 0.004029273986816406, 0.004470109939575195, 0.004910945892333984, 0.0053517818450927734, 0.0057926177978515625, 0.0062334537506103516, 0.006674289703369141, 0.00711512565612793, 0.007555961608886719, 0.007996797561645508, 0.008437633514404297, 0.008878469467163086, 0.009319305419921875, 0.009760141372680664, 0.010200977325439453, 0.010641813278198242, 0.011082649230957031, 0.01152348518371582, 0.01196432113647461, 0.012405157089233398, 0.012845993041992188, 0.013286828994750977, 0.013727664947509766, 0.014168500900268555, 0.014609336853027344, 0.015050172805786133, 0.015491008758544922, 0.01593184471130371, 0.0163726806640625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 15.0, 36.0, 60.0, 121.0, 177.0, 206.0, 150.0, 119.0, 56.0, 25.0, 17.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1063568592071533, -1.0711039304733276, -1.0358508825302124, -1.0005979537963867, -0.9653449058532715, -0.930091917514801, -0.8948389291763306, -0.8595860004425049, -0.8243329524993896, -0.7890799641609192, -0.7538269758224487, -0.7185739874839783, -0.6833209991455078, -0.6480680108070374, -0.6128150224685669, -0.5775620937347412, -0.5423091053962708, -0.5070561170578003, -0.47180312871932983, -0.4365501403808594, -0.4012971520423889, -0.36604416370391846, -0.3307912051677704, -0.2955382168292999, -0.26028522849082947, -0.225032240152359, -0.18977925181388855, -0.15452627837657928, -0.11927329003810883, -0.08402030169963837, -0.0487673282623291, -0.013514339923858643, 0.021738648414611816, 0.05699163302779198, 0.09224461764097214, 0.127497598528862, 0.16275058686733246, 0.19800357520580292, 0.23325654864311218, 0.26850953698158264, 0.3037625253200531, 0.33901551365852356, 0.374268501996994, 0.4095214605331421, 0.44477444887161255, 0.480027437210083, 0.5152804255485535, 0.5505334138870239, 0.5857864022254944, 0.6210393905639648, 0.6562923789024353, 0.6915453672409058, 0.7267983555793762, 0.7620513439178467, 0.7973042726516724, 0.8325573205947876, 0.8678102493286133, 0.9030632376670837, 0.9383162260055542, 0.9735692143440247, 1.0088222026824951, 1.0440751314163208, 1.079328179359436, 1.1145811080932617, 1.149834156036377]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 4.0, 5.0, 11.0, 17.0, 16.0, 15.0, 21.0, 27.0, 28.0, 35.0, 31.0, 32.0, 45.0, 50.0, 54.0, 49.0, 47.0, 46.0, 62.0, 42.0, 40.0, 42.0, 40.0, 40.0, 30.0, 33.0, 22.0, 13.0, 13.0, 13.0, 29.0, 5.0, 10.0, 8.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4031316637992859, -0.3914082944393158, -0.3796849250793457, -0.367961585521698, -0.3562382161617279, -0.3445148468017578, -0.3327914774417877, -0.3210681080818176, -0.3093447685241699, -0.29762139916419983, -0.28589802980422974, -0.27417469024658203, -0.26245132088661194, -0.25072795152664185, -0.23900458216667175, -0.22728121280670166, -0.21555784344673157, -0.20383447408676147, -0.19211111962795258, -0.18038775026798248, -0.16866439580917358, -0.1569410264492035, -0.1452176570892334, -0.1334942877292633, -0.1217709332704544, -0.11004757136106491, -0.09832420945167542, -0.08660084009170532, -0.07487747818231583, -0.06315411627292633, -0.05143074691295624, -0.03970738500356674, -0.027984023094177246, -0.0162606593221426, -0.004537295550107956, 0.007186070084571838, 0.018909431993961334, 0.03063279390335083, 0.04235616326332092, 0.05407952517271042, 0.06580288708209991, 0.07752624899148941, 0.0892496109008789, 0.100972980260849, 0.1126963421702385, 0.12441970407962799, 0.13614307343959808, 0.14786642789840698, 0.15958979725837708, 0.17131316661834717, 0.18303652107715607, 0.19475989043712616, 0.20648324489593506, 0.21820661425590515, 0.22992998361587524, 0.24165335297584534, 0.25337672233581543, 0.2651000916957855, 0.2768234610557556, 0.2885468006134033, 0.3002701699733734, 0.3119935393333435, 0.3237169086933136, 0.3354402780532837, 0.3471636176109314]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 5.0, 12.0, 23.0, 40.0, 33.0, 53.0, 76.0, 125.0, 197.0, 338.0, 670.0, 1199.0, 2632.0, 5935.0, 14758.0, 40763.0, 126765.0, 387263.0, 319054.0, 95520.0, 31548.0, 11919.0, 4974.0, 2139.0, 1065.0, 565.0, 318.0, 171.0, 106.0, 80.0, 53.0, 40.0, 30.0, 16.0, 13.0, 14.0, 9.0, 7.0, 5.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.343994140625, -0.3341331481933594, -0.32427215576171875, -0.3144111633300781, -0.3045501708984375, -0.2946891784667969, -0.28482818603515625, -0.2749671936035156, -0.265106201171875, -0.2552452087402344, -0.24538421630859375, -0.23552322387695312, -0.2256622314453125, -0.21580123901367188, -0.20594024658203125, -0.19607925415039062, -0.18621826171875, -0.17635726928710938, -0.16649627685546875, -0.15663528442382812, -0.1467742919921875, -0.13691329956054688, -0.12705230712890625, -0.11719131469726562, -0.107330322265625, -0.09746932983398438, -0.08760833740234375, -0.07774734497070312, -0.0678863525390625, -0.058025360107421875, -0.04816436767578125, -0.038303375244140625, -0.0284423828125, -0.018581390380859375, -0.00872039794921875, 0.001140594482421875, 0.0110015869140625, 0.020862579345703125, 0.03072357177734375, 0.040584564208984375, 0.050445556640625, 0.060306549072265625, 0.07016754150390625, 0.08002853393554688, 0.0898895263671875, 0.09975051879882812, 0.10961151123046875, 0.11947250366210938, 0.12933349609375, 0.13919448852539062, 0.14905548095703125, 0.15891647338867188, 0.1687774658203125, 0.17863845825195312, 0.18849945068359375, 0.19836044311523438, 0.208221435546875, 0.21808242797851562, 0.22794342041015625, 0.23780441284179688, 0.2476654052734375, 0.2575263977050781, 0.26738739013671875, 0.2772483825683594, 0.287109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 8.0, 10.0, 10.0, 3.0, 16.0, 20.0, 13.0, 18.0, 27.0, 33.0, 30.0, 27.0, 24.0, 41.0, 47.0, 47.0, 43.0, 39.0, 45.0, 47.0, 54.0, 35.0, 57.0, 32.0, 42.0, 34.0, 37.0, 27.0, 20.0, 16.0, 11.0, 14.0, 6.0, 12.0, 11.0, 8.0, 10.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7348556518554688, -0.7123870849609375, -0.6899185180664062, -0.667449951171875, -0.6449813842773438, -0.6225128173828125, -0.6000442504882812, -0.57757568359375, -0.5551071166992188, -0.5326385498046875, -0.5101699829101562, -0.487701416015625, -0.46523284912109375, -0.4427642822265625, -0.42029571533203125, -0.3978271484375, -0.37535858154296875, -0.3528900146484375, -0.33042144775390625, -0.307952880859375, -0.28548431396484375, -0.2630157470703125, -0.24054718017578125, -0.21807861328125, -0.19561004638671875, -0.1731414794921875, -0.15067291259765625, -0.128204345703125, -0.10573577880859375, -0.0832672119140625, -0.06079864501953125, -0.038330078125, -0.01586151123046875, 0.0066070556640625, 0.02907562255859375, 0.051544189453125, 0.07401275634765625, 0.0964813232421875, 0.11894989013671875, 0.14141845703125, 0.16388702392578125, 0.1863555908203125, 0.20882415771484375, 0.231292724609375, 0.25376129150390625, 0.2762298583984375, 0.29869842529296875, 0.3211669921875, 0.34363555908203125, 0.3661041259765625, 0.38857269287109375, 0.411041259765625, 0.43350982666015625, 0.4559783935546875, 0.47844696044921875, 0.50091552734375, 0.5233840942382812, 0.5458526611328125, 0.5683212280273438, 0.590789794921875, 0.6132583618164062, 0.6357269287109375, 0.6581954956054688, 0.6806640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 0.0, 8.0, 11.0, 13.0, 12.0, 23.0, 15.0, 41.0, 28.0, 54.0, 80.0, 94.0, 140.0, 195.0, 368.0, 652.0, 2524.0, 23424.0, 436296.0, 549268.0, 30359.0, 2958.0, 798.0, 367.0, 248.0, 138.0, 114.0, 85.0, 58.0, 54.0, 32.0, 19.0, 14.0, 9.0, 9.0, 15.0, 8.0, 0.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6923828125, -0.6700820922851562, -0.6477813720703125, -0.6254806518554688, -0.603179931640625, -0.5808792114257812, -0.5585784912109375, -0.5362777709960938, -0.51397705078125, -0.49167633056640625, -0.4693756103515625, -0.44707489013671875, -0.424774169921875, -0.40247344970703125, -0.3801727294921875, -0.35787200927734375, -0.3355712890625, -0.31327056884765625, -0.2909698486328125, -0.26866912841796875, -0.246368408203125, -0.22406768798828125, -0.2017669677734375, -0.17946624755859375, -0.15716552734375, -0.13486480712890625, -0.1125640869140625, -0.09026336669921875, -0.067962646484375, -0.04566192626953125, -0.0233612060546875, -0.00106048583984375, 0.021240234375, 0.04354095458984375, 0.0658416748046875, 0.08814239501953125, 0.110443115234375, 0.13274383544921875, 0.1550445556640625, 0.17734527587890625, 0.19964599609375, 0.22194671630859375, 0.2442474365234375, 0.26654815673828125, 0.288848876953125, 0.31114959716796875, 0.3334503173828125, 0.35575103759765625, 0.3780517578125, 0.40035247802734375, 0.4226531982421875, 0.44495391845703125, 0.467254638671875, 0.48955535888671875, 0.5118560791015625, 0.5341567993164062, 0.55645751953125, 0.5787582397460938, 0.6010589599609375, 0.6233596801757812, 0.645660400390625, 0.6679611206054688, 0.6902618408203125, 0.7125625610351562, 0.73486328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 4.0, 4.0, 19.0, 11.0, 10.0, 15.0, 17.0, 15.0, 25.0, 19.0, 22.0, 26.0, 39.0, 42.0, 44.0, 35.0, 37.0, 51.0, 38.0, 35.0, 44.0, 49.0, 32.0, 38.0, 44.0, 34.0, 31.0, 31.0, 27.0, 31.0, 19.0, 16.0, 16.0, 11.0, 10.0, 12.0, 11.0, 7.0, 8.0, 4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.79736328125, -0.772491455078125, -0.74761962890625, -0.722747802734375, -0.6978759765625, -0.673004150390625, -0.64813232421875, -0.623260498046875, -0.598388671875, -0.573516845703125, -0.54864501953125, -0.523773193359375, -0.4989013671875, -0.474029541015625, -0.44915771484375, -0.424285888671875, -0.3994140625, -0.374542236328125, -0.34967041015625, -0.324798583984375, -0.2999267578125, -0.275054931640625, -0.25018310546875, -0.225311279296875, -0.200439453125, -0.175567626953125, -0.15069580078125, -0.125823974609375, -0.1009521484375, -0.076080322265625, -0.05120849609375, -0.026336669921875, -0.00146484375, 0.023406982421875, 0.04827880859375, 0.073150634765625, 0.0980224609375, 0.122894287109375, 0.14776611328125, 0.172637939453125, 0.197509765625, 0.222381591796875, 0.24725341796875, 0.272125244140625, 0.2969970703125, 0.321868896484375, 0.34674072265625, 0.371612548828125, 0.396484375, 0.421356201171875, 0.44622802734375, 0.471099853515625, 0.4959716796875, 0.520843505859375, 0.54571533203125, 0.570587158203125, 0.595458984375, 0.620330810546875, 0.64520263671875, 0.670074462890625, 0.6949462890625, 0.719818115234375, 0.74468994140625, 0.769561767578125, 0.79443359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 4.0, 2.0, 7.0, 12.0, 10.0, 25.0, 31.0, 41.0, 63.0, 95.0, 174.0, 376.0, 929.0, 2940.0, 14993.0, 166586.0, 758063.0, 90472.0, 9887.0, 2325.0, 772.0, 300.0, 161.0, 90.0, 58.0, 39.0, 19.0, 16.0, 13.0, 9.0, 5.0, 4.0, 4.0, 10.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2225341796875, -0.21566390991210938, -0.20879364013671875, -0.20192337036132812, -0.1950531005859375, -0.18818283081054688, -0.18131256103515625, -0.17444229125976562, -0.167572021484375, -0.16070175170898438, -0.15383148193359375, -0.14696121215820312, -0.1400909423828125, -0.13322067260742188, -0.12635040283203125, -0.11948013305664062, -0.11260986328125, -0.10573959350585938, -0.09886932373046875, -0.09199905395507812, -0.0851287841796875, -0.07825851440429688, -0.07138824462890625, -0.06451797485351562, -0.057647705078125, -0.050777435302734375, -0.04390716552734375, -0.037036895751953125, -0.0301666259765625, -0.023296356201171875, -0.01642608642578125, -0.009555816650390625, -0.002685546875, 0.004184722900390625, 0.01105499267578125, 0.017925262451171875, 0.0247955322265625, 0.031665802001953125, 0.03853607177734375, 0.045406341552734375, 0.052276611328125, 0.059146881103515625, 0.06601715087890625, 0.07288742065429688, 0.0797576904296875, 0.08662796020507812, 0.09349822998046875, 0.10036849975585938, 0.10723876953125, 0.11410903930664062, 0.12097930908203125, 0.12784957885742188, 0.1347198486328125, 0.14159011840820312, 0.14846038818359375, 0.15533065795898438, 0.162200927734375, 0.16907119750976562, 0.17594146728515625, 0.18281173706054688, 0.1896820068359375, 0.19655227661132812, 0.20342254638671875, 0.21029281616210938, 0.2171630859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 8.0, 6.0, 7.0, 9.0, 11.0, 29.0, 35.0, 60.0, 71.0, 97.0, 94.0, 96.0, 99.0, 106.0, 71.0, 55.0, 53.0, 35.0, 13.0, 13.0, 9.0, 4.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.147125244140625e-05, -3.0734576284885406e-05, -2.9997900128364563e-05, -2.926122397184372e-05, -2.8524547815322876e-05, -2.7787871658802032e-05, -2.705119550228119e-05, -2.6314519345760345e-05, -2.5577843189239502e-05, -2.484116703271866e-05, -2.4104490876197815e-05, -2.336781471967697e-05, -2.2631138563156128e-05, -2.1894462406635284e-05, -2.115778625011444e-05, -2.0421110093593597e-05, -1.9684433937072754e-05, -1.894775778055191e-05, -1.8211081624031067e-05, -1.7474405467510223e-05, -1.673772931098938e-05, -1.6001053154468536e-05, -1.5264376997947693e-05, -1.452770084142685e-05, -1.3791024684906006e-05, -1.3054348528385162e-05, -1.2317672371864319e-05, -1.1580996215343475e-05, -1.0844320058822632e-05, -1.0107643902301788e-05, -9.370967745780945e-06, -8.634291589260101e-06, -7.897615432739258e-06, -7.160939276218414e-06, -6.424263119697571e-06, -5.687586963176727e-06, -4.950910806655884e-06, -4.21423465013504e-06, -3.4775584936141968e-06, -2.7408823370933533e-06, -2.0042061805725098e-06, -1.2675300240516663e-06, -5.308538675308228e-07, 2.0582228899002075e-07, 9.424984455108643e-07, 1.6791746020317078e-06, 2.4158507585525513e-06, 3.1525269150733948e-06, 3.889203071594238e-06, 4.625879228115082e-06, 5.362555384635925e-06, 6.099231541156769e-06, 6.835907697677612e-06, 7.572583854198456e-06, 8.3092600107193e-06, 9.045936167240143e-06, 9.782612323760986e-06, 1.051928848028183e-05, 1.1255964636802673e-05, 1.1992640793323517e-05, 1.272931694984436e-05, 1.3465993106365204e-05, 1.4202669262886047e-05, 1.4939345419406891e-05, 1.5676021575927734e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 16.0, 16.0, 27.0, 34.0, 48.0, 110.0, 181.0, 359.0, 970.0, 2677.0, 12807.0, 240403.0, 750084.0, 33701.0, 4627.0, 1394.0, 510.0, 243.0, 122.0, 75.0, 38.0, 21.0, 24.0, 16.0, 5.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.2856292724609375, -0.275848388671875, -0.2660675048828125, -0.25628662109375, -0.2465057373046875, -0.236724853515625, -0.2269439697265625, -0.2171630859375, -0.2073822021484375, -0.197601318359375, -0.1878204345703125, -0.17803955078125, -0.1682586669921875, -0.158477783203125, -0.1486968994140625, -0.138916015625, -0.1291351318359375, -0.119354248046875, -0.1095733642578125, -0.09979248046875, -0.0900115966796875, -0.080230712890625, -0.0704498291015625, -0.0606689453125, -0.0508880615234375, -0.041107177734375, -0.0313262939453125, -0.02154541015625, -0.0117645263671875, -0.001983642578125, 0.0077972412109375, 0.017578125, 0.0273590087890625, 0.037139892578125, 0.0469207763671875, 0.05670166015625, 0.0664825439453125, 0.076263427734375, 0.0860443115234375, 0.0958251953125, 0.1056060791015625, 0.115386962890625, 0.1251678466796875, 0.13494873046875, 0.1447296142578125, 0.154510498046875, 0.1642913818359375, 0.174072265625, 0.1838531494140625, 0.193634033203125, 0.2034149169921875, 0.21319580078125, 0.2229766845703125, 0.232757568359375, 0.2425384521484375, 0.2523193359375, 0.2621002197265625, 0.271881103515625, 0.2816619873046875, 0.29144287109375, 0.3012237548828125, 0.311004638671875, 0.3207855224609375, 0.33056640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 6.0, 10.0, 11.0, 27.0, 40.0, 54.0, 78.0, 87.0, 108.0, 130.0, 102.0, 91.0, 68.0, 47.0, 40.0, 23.0, 21.0, 14.0, 12.0, 4.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09625244140625, -0.09344673156738281, -0.09064102172851562, -0.08783531188964844, -0.08502960205078125, -0.08222389221191406, -0.07941818237304688, -0.07661247253417969, -0.0738067626953125, -0.07100105285644531, -0.06819534301757812, -0.06538963317871094, -0.06258392333984375, -0.05977821350097656, -0.056972503662109375, -0.05416679382324219, -0.051361083984375, -0.04855537414550781, -0.045749664306640625, -0.04294395446777344, -0.04013824462890625, -0.03733253479003906, -0.034526824951171875, -0.03172111511230469, -0.0289154052734375, -0.026109695434570312, -0.023303985595703125, -0.020498275756835938, -0.01769256591796875, -0.014886856079101562, -0.012081146240234375, -0.009275436401367188, -0.0064697265625, -0.0036640167236328125, -0.000858306884765625, 0.0019474029541015625, 0.00475311279296875, 0.0075588226318359375, 0.010364532470703125, 0.013170242309570312, 0.0159759521484375, 0.018781661987304688, 0.021587371826171875, 0.024393081665039062, 0.02719879150390625, 0.030004501342773438, 0.032810211181640625, 0.03561592102050781, 0.038421630859375, 0.04122734069824219, 0.044033050537109375, 0.04683876037597656, 0.04964447021484375, 0.05245018005371094, 0.055255889892578125, 0.05806159973144531, 0.0608673095703125, 0.06367301940917969, 0.06647872924804688, 0.06928443908691406, 0.07209014892578125, 0.07489585876464844, 0.07770156860351562, 0.08050727844238281, 0.08331298828125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 9.0, 32.0, 56.0, 79.0, 113.0, 166.0, 144.0, 106.0, 117.0, 63.0, 47.0, 25.0, 7.0, 10.0, 5.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8401200771331787, -1.7863998413085938, -1.7326794862747192, -1.6789592504501343, -1.6252390146255493, -1.5715186595916748, -1.5177984237670898, -1.4640781879425049, -1.41035795211792, -1.356637716293335, -1.3029173612594604, -1.2491971254348755, -1.1954768896102905, -1.141756534576416, -1.088036298751831, -1.034316062927246, -0.9805957078933716, -0.9268754124641418, -0.8731551766395569, -0.8194348812103271, -0.7657146453857422, -0.7119943499565125, -0.6582740545272827, -0.6045538187026978, -0.550833523273468, -0.49711325764656067, -0.4433929920196533, -0.3896726965904236, -0.33595243096351624, -0.2822321653366089, -0.22851186990737915, -0.1747916042804718, -0.1210712194442749, -0.06735094636678696, -0.013630673289299011, 0.04008960723876953, 0.09380987286567688, 0.14753013849258423, 0.20125043392181396, 0.2549706995487213, 0.30869096517562866, 0.362411230802536, 0.41613149642944336, 0.4698517918586731, 0.5235720872879028, 0.5772923231124878, 0.6310126185417175, 0.6847329139709473, 0.7384531497955322, 0.792173445224762, 0.8458936810493469, 0.8996139764785767, 0.9533342123031616, 1.0070545673370361, 1.060774803161621, 1.114495038986206, 1.168215274810791, 1.221935510635376, 1.2756558656692505, 1.3293761014938354, 1.3830963373184204, 1.436816692352295, 1.4905369281768799, 1.5442571640014648, 1.5979775190353394]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 10.0, 5.0, 7.0, 14.0, 12.0, 12.0, 19.0, 21.0, 24.0, 28.0, 30.0, 29.0, 34.0, 44.0, 45.0, 41.0, 43.0, 41.0, 47.0, 43.0, 46.0, 34.0, 36.0, 38.0, 42.0, 20.0, 25.0, 37.0, 24.0, 16.0, 26.0, 17.0, 19.0, 14.0, 8.0, 9.0, 2.0, 4.0, 7.0, 4.0, 4.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.43735933303833, -1.3946735858917236, -1.3519877195358276, -1.3093019723892212, -1.2666162252426147, -1.2239303588867188, -1.1812446117401123, -1.1385588645935059, -1.0958729982376099, -1.0531872510910034, -1.0105013847351074, -0.967815637588501, -0.9251298308372498, -0.8824440240859985, -0.8397582769393921, -0.7970724701881409, -0.7543867230415344, -0.7117009162902832, -0.6690151691436768, -0.6263293623924255, -0.5836435556411743, -0.5409578084945679, -0.49827200174331665, -0.45558619499206543, -0.4129004180431366, -0.37021464109420776, -0.32752883434295654, -0.2848430573940277, -0.24215726554393768, -0.19947147369384766, -0.15678569674491882, -0.1140998899936676, -0.07141411304473877, -0.02872832491993904, 0.013957463204860687, 0.05664324760437012, 0.09932903945446014, 0.14201483130455017, 0.184700608253479, 0.22738641500473022, 0.27007219195365906, 0.3127579689025879, 0.3554437756538391, 0.39812955260276794, 0.4408153295516968, 0.483501136302948, 0.5261869430541992, 0.5688726902008057, 0.6115584969520569, 0.6542443037033081, 0.6969300508499146, 0.7396158576011658, 0.782301664352417, 0.8249874114990234, 0.8676732182502747, 0.9103590250015259, 0.9530447721481323, 0.9957305788993835, 1.0384163856506348, 1.0811021327972412, 1.1237878799438477, 1.1664737462997437, 1.20915949344635, 1.251845359802246, 1.2945311069488525]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 10.0, 24.0, 26.0, 45.0, 99.0, 175.0, 295.0, 600.0, 1449.0, 3827.0, 12624.0, 67879.0, 457585.0, 2209829.0, 1238807.0, 162885.0, 26826.0, 6875.0, 2388.0, 927.0, 470.0, 218.0, 138.0, 96.0, 50.0, 34.0, 15.0, 19.0, 14.0, 11.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.56494140625, -0.5421218872070312, -0.5193023681640625, -0.49648284912109375, -0.473663330078125, -0.45084381103515625, -0.4280242919921875, -0.40520477294921875, -0.38238525390625, -0.35956573486328125, -0.3367462158203125, -0.31392669677734375, -0.291107177734375, -0.26828765869140625, -0.2454681396484375, -0.22264862060546875, -0.1998291015625, -0.17700958251953125, -0.1541900634765625, -0.13137054443359375, -0.108551025390625, -0.08573150634765625, -0.0629119873046875, -0.04009246826171875, -0.01727294921875, 0.00554656982421875, 0.0283660888671875, 0.05118560791015625, 0.074005126953125, 0.09682464599609375, 0.1196441650390625, 0.14246368408203125, 0.165283203125, 0.18810272216796875, 0.2109222412109375, 0.23374176025390625, 0.256561279296875, 0.27938079833984375, 0.3022003173828125, 0.32501983642578125, 0.34783935546875, 0.37065887451171875, 0.3934783935546875, 0.41629791259765625, 0.439117431640625, 0.46193695068359375, 0.4847564697265625, 0.5075759887695312, 0.5303955078125, 0.5532150268554688, 0.5760345458984375, 0.5988540649414062, 0.621673583984375, 0.6444931030273438, 0.6673126220703125, 0.6901321411132812, 0.71295166015625, 0.7357711791992188, 0.7585906982421875, 0.7814102172851562, 0.804229736328125, 0.8270492553710938, 0.8498687744140625, 0.8726882934570312, 0.8955078125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 1.0, 4.0, 5.0, 9.0, 9.0, 4.0, 14.0, 11.0, 17.0, 19.0, 35.0, 35.0, 35.0, 20.0, 40.0, 30.0, 40.0, 57.0, 46.0, 66.0, 56.0, 43.0, 62.0, 38.0, 43.0, 36.0, 31.0, 26.0, 29.0, 19.0, 19.0, 14.0, 13.0, 14.0, 16.0, 6.0, 6.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.52197265625, -0.5066871643066406, -0.49140167236328125, -0.4761161804199219, -0.4608306884765625, -0.4455451965332031, -0.43025970458984375, -0.4149742126464844, -0.399688720703125, -0.3844032287597656, -0.36911773681640625, -0.3538322448730469, -0.3385467529296875, -0.3232612609863281, -0.30797576904296875, -0.2926902770996094, -0.27740478515625, -0.2621192932128906, -0.24683380126953125, -0.23154830932617188, -0.2162628173828125, -0.20097732543945312, -0.18569183349609375, -0.17040634155273438, -0.155120849609375, -0.13983535766601562, -0.12454986572265625, -0.10926437377929688, -0.0939788818359375, -0.07869338989257812, -0.06340789794921875, -0.048122406005859375, -0.0328369140625, -0.017551422119140625, -0.00226593017578125, 0.013019561767578125, 0.0283050537109375, 0.043590545654296875, 0.05887603759765625, 0.07416152954101562, 0.089447021484375, 0.10473251342773438, 0.12001800537109375, 0.13530349731445312, 0.1505889892578125, 0.16587448120117188, 0.18115997314453125, 0.19644546508789062, 0.21173095703125, 0.22701644897460938, 0.24230194091796875, 0.2575874328613281, 0.2728729248046875, 0.2881584167480469, 0.30344390869140625, 0.3187294006347656, 0.334014892578125, 0.3493003845214844, 0.36458587646484375, 0.3798713684082031, 0.3951568603515625, 0.4104423522949219, 0.42572784423828125, 0.4410133361816406, 0.456298828125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 6.0, 11.0, 18.0, 39.0, 52.0, 55.0, 96.0, 187.0, 297.0, 667.0, 1284.0, 3738.0, 16474.0, 134279.0, 2860129.0, 1103352.0, 59501.0, 9272.0, 2598.0, 1018.0, 496.0, 267.0, 145.0, 97.0, 55.0, 45.0, 29.0, 21.0, 14.0, 9.0, 11.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.814453125, -0.7862014770507812, -0.7579498291015625, -0.7296981811523438, -0.701446533203125, -0.6731948852539062, -0.6449432373046875, -0.6166915893554688, -0.58843994140625, -0.5601882934570312, -0.5319366455078125, -0.5036849975585938, -0.475433349609375, -0.44718170166015625, -0.4189300537109375, -0.39067840576171875, -0.3624267578125, -0.33417510986328125, -0.3059234619140625, -0.27767181396484375, -0.249420166015625, -0.22116851806640625, -0.1929168701171875, -0.16466522216796875, -0.13641357421875, -0.10816192626953125, -0.0799102783203125, -0.05165863037109375, -0.023406982421875, 0.00484466552734375, 0.0330963134765625, 0.06134796142578125, 0.089599609375, 0.11785125732421875, 0.1461029052734375, 0.17435455322265625, 0.202606201171875, 0.23085784912109375, 0.2591094970703125, 0.28736114501953125, 0.31561279296875, 0.34386444091796875, 0.3721160888671875, 0.40036773681640625, 0.428619384765625, 0.45687103271484375, 0.4851226806640625, 0.5133743286132812, 0.5416259765625, 0.5698776245117188, 0.5981292724609375, 0.6263809204101562, 0.654632568359375, 0.6828842163085938, 0.7111358642578125, 0.7393875122070312, 0.76763916015625, 0.7958908081054688, 0.8241424560546875, 0.8523941040039062, 0.880645751953125, 0.9088973999023438, 0.9371490478515625, 0.9654006958007812, 0.99365234375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 13.0, 8.0, 19.0, 16.0, 26.0, 47.0, 53.0, 66.0, 132.0, 142.0, 247.0, 350.0, 495.0, 542.0, 522.0, 432.0, 315.0, 208.0, 142.0, 78.0, 63.0, 35.0, 33.0, 26.0, 14.0, 13.0, 5.0, 7.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2401123046875, -0.2329864501953125, -0.225860595703125, -0.2187347412109375, -0.21160888671875, -0.2044830322265625, -0.197357177734375, -0.1902313232421875, -0.18310546875, -0.1759796142578125, -0.168853759765625, -0.1617279052734375, -0.15460205078125, -0.1474761962890625, -0.140350341796875, -0.1332244873046875, -0.1260986328125, -0.1189727783203125, -0.111846923828125, -0.1047210693359375, -0.09759521484375, -0.0904693603515625, -0.083343505859375, -0.0762176513671875, -0.069091796875, -0.0619659423828125, -0.054840087890625, -0.0477142333984375, -0.04058837890625, -0.0334625244140625, -0.026336669921875, -0.0192108154296875, -0.0120849609375, -0.0049591064453125, 0.002166748046875, 0.0092926025390625, 0.01641845703125, 0.0235443115234375, 0.030670166015625, 0.0377960205078125, 0.044921875, 0.0520477294921875, 0.059173583984375, 0.0662994384765625, 0.07342529296875, 0.0805511474609375, 0.087677001953125, 0.0948028564453125, 0.1019287109375, 0.1090545654296875, 0.116180419921875, 0.1233062744140625, 0.13043212890625, 0.1375579833984375, 0.144683837890625, 0.1518096923828125, 0.158935546875, 0.1660614013671875, 0.173187255859375, 0.1803131103515625, 0.18743896484375, 0.1945648193359375, 0.201690673828125, 0.2088165283203125, 0.2159423828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 13.0, 17.0, 22.0, 39.0, 61.0, 112.0, 97.0, 137.0, 131.0, 119.0, 95.0, 46.0, 50.0, 24.0, 9.0, 14.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3122243881225586, -1.2723603248596191, -1.2324962615966797, -1.1926320791244507, -1.1527680158615112, -1.1129039525985718, -1.0730398893356323, -1.0331757068634033, -0.9933116436004639, -0.9534475803375244, -0.9135834574699402, -0.8737193942070007, -0.8338552713394165, -0.793991208076477, -0.7541271448135376, -0.7142630219459534, -0.6743989586830139, -0.6345348954200745, -0.5946707725524902, -0.5548067092895508, -0.5149425864219666, -0.4750785231590271, -0.43521443009376526, -0.3953503370285034, -0.3554862439632416, -0.31562215089797974, -0.2757580578327179, -0.23589397966861725, -0.1960298866033554, -0.15616579353809357, -0.11630171537399292, -0.07643762230873108, -0.03657352924346924, 0.003290560096502304, 0.043154649436473846, 0.08301873505115509, 0.12288282811641693, 0.16274692118167877, 0.20261099934577942, 0.24247509241104126, 0.2823391854763031, 0.32220327854156494, 0.3620673716068268, 0.4019314646720886, 0.4417955279350281, 0.4816596508026123, 0.5215237140655518, 0.5613877773284912, 0.6012519001960754, 0.6411159634590149, 0.6809800863265991, 0.7208441495895386, 0.7607082724571228, 0.8005723357200623, 0.8404364585876465, 0.8803005218505859, 0.9201645851135254, 0.9600286483764648, 0.9998927712440491, 1.0397568941116333, 1.0796209573745728, 1.1194850206375122, 1.1593490839004517, 1.1992132663726807, 1.2390773296356201]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 7.0, 10.0, 11.0, 14.0, 12.0, 10.0, 13.0, 16.0, 16.0, 20.0, 20.0, 27.0, 29.0, 27.0, 34.0, 32.0, 32.0, 35.0, 36.0, 37.0, 44.0, 43.0, 42.0, 46.0, 30.0, 38.0, 31.0, 38.0, 32.0, 23.0, 24.0, 22.0, 23.0, 19.0, 17.0, 7.0, 13.0, 14.0, 10.0, 10.0, 5.0, 7.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.41921043395996094, -0.40491753816604614, -0.39062461256980896, -0.3763316869735718, -0.362038791179657, -0.3477458953857422, -0.333452969789505, -0.3191600441932678, -0.304867148399353, -0.29057425260543823, -0.27628132700920105, -0.26198840141296387, -0.24769550561904907, -0.23340259492397308, -0.2191096842288971, -0.2048167735338211, -0.19052386283874512, -0.17623095214366913, -0.16193804144859314, -0.14764513075351715, -0.13335222005844116, -0.11905930936336517, -0.10476639866828918, -0.0904734879732132, -0.07618057727813721, -0.06188766658306122, -0.04759475588798523, -0.03330184519290924, -0.019008934497833252, -0.004716023802757263, 0.009576886892318726, 0.023869797587394714, 0.0381627082824707, 0.05245561897754669, 0.06674852967262268, 0.08104144036769867, 0.09533435106277466, 0.10962726175785065, 0.12392017245292664, 0.13821308314800262, 0.1525059938430786, 0.1667989045381546, 0.1810918152332306, 0.19538472592830658, 0.20967763662338257, 0.22397054731845856, 0.23826345801353455, 0.25255638360977173, 0.2668492794036865, 0.2811421751976013, 0.2954351007938385, 0.3097280263900757, 0.3240209221839905, 0.3383138179779053, 0.35260674357414246, 0.36689966917037964, 0.38119256496429443, 0.39548546075820923, 0.4097783863544464, 0.4240713119506836, 0.4383642077445984, 0.4526571035385132, 0.46695002913475037, 0.48124295473098755, 0.49553585052490234]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 8.0, 8.0, 16.0, 26.0, 35.0, 51.0, 67.0, 108.0, 214.0, 497.0, 1092.0, 2847.0, 9074.0, 32733.0, 134866.0, 420128.0, 327778.0, 87112.0, 21720.0, 6297.0, 2149.0, 809.0, 367.0, 210.0, 122.0, 65.0, 52.0, 32.0, 16.0, 15.0, 13.0, 3.0, 2.0, 6.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1307373046875, -0.12649917602539062, -0.12226104736328125, -0.11802291870117188, -0.1137847900390625, -0.10954666137695312, -0.10530853271484375, -0.10107040405273438, -0.096832275390625, -0.09259414672851562, -0.08835601806640625, -0.08411788940429688, -0.0798797607421875, -0.07564163208007812, -0.07140350341796875, -0.06716537475585938, -0.06292724609375, -0.058689117431640625, -0.05445098876953125, -0.050212860107421875, -0.0459747314453125, -0.041736602783203125, -0.03749847412109375, -0.033260345458984375, -0.029022216796875, -0.024784088134765625, -0.02054595947265625, -0.016307830810546875, -0.0120697021484375, -0.007831573486328125, -0.00359344482421875, 0.000644683837890625, 0.0048828125, 0.009120941162109375, 0.01335906982421875, 0.017597198486328125, 0.0218353271484375, 0.026073455810546875, 0.03031158447265625, 0.034549713134765625, 0.038787841796875, 0.043025970458984375, 0.04726409912109375, 0.051502227783203125, 0.0557403564453125, 0.059978485107421875, 0.06421661376953125, 0.06845474243164062, 0.07269287109375, 0.07693099975585938, 0.08116912841796875, 0.08540725708007812, 0.0896453857421875, 0.09388351440429688, 0.09812164306640625, 0.10235977172851562, 0.106597900390625, 0.11083602905273438, 0.11507415771484375, 0.11931228637695312, 0.1235504150390625, 0.12778854370117188, 0.13202667236328125, 0.13626480102539062, 0.1405029296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 10.0, 7.0, 14.0, 10.0, 11.0, 14.0, 15.0, 21.0, 25.0, 18.0, 20.0, 25.0, 26.0, 31.0, 31.0, 44.0, 32.0, 39.0, 41.0, 44.0, 42.0, 36.0, 38.0, 37.0, 45.0, 39.0, 29.0, 27.0, 22.0, 32.0, 20.0, 22.0, 25.0, 10.0, 16.0, 20.0, 12.0, 7.0, 5.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.30078125, -0.2908782958984375, -0.280975341796875, -0.2710723876953125, -0.26116943359375, -0.2512664794921875, -0.241363525390625, -0.2314605712890625, -0.2215576171875, -0.2116546630859375, -0.201751708984375, -0.1918487548828125, -0.18194580078125, -0.1720428466796875, -0.162139892578125, -0.1522369384765625, -0.142333984375, -0.1324310302734375, -0.122528076171875, -0.1126251220703125, -0.10272216796875, -0.0928192138671875, -0.082916259765625, -0.0730133056640625, -0.0631103515625, -0.0532073974609375, -0.043304443359375, -0.0334014892578125, -0.02349853515625, -0.0135955810546875, -0.003692626953125, 0.0062103271484375, 0.01611328125, 0.0260162353515625, 0.035919189453125, 0.0458221435546875, 0.05572509765625, 0.0656280517578125, 0.075531005859375, 0.0854339599609375, 0.0953369140625, 0.1052398681640625, 0.115142822265625, 0.1250457763671875, 0.13494873046875, 0.1448516845703125, 0.154754638671875, 0.1646575927734375, 0.174560546875, 0.1844635009765625, 0.194366455078125, 0.2042694091796875, 0.21417236328125, 0.2240753173828125, 0.233978271484375, 0.2438812255859375, 0.2537841796875, 0.2636871337890625, 0.273590087890625, 0.2834930419921875, 0.29339599609375, 0.3032989501953125, 0.313201904296875, 0.3231048583984375, 0.3330078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 7.0, 9.0, 15.0, 16.0, 21.0, 37.0, 45.0, 60.0, 96.0, 107.0, 165.0, 240.0, 346.0, 555.0, 1017.0, 1836.0, 3791.0, 8321.0, 19462.0, 48327.0, 116566.0, 238338.0, 289657.0, 182067.0, 79428.0, 32382.0, 13249.0, 5961.0, 2796.0, 1404.0, 791.0, 450.0, 290.0, 198.0, 144.0, 106.0, 68.0, 43.0, 31.0, 33.0, 18.0, 13.0, 12.0, 13.0, 7.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0806884765625, -0.07833480834960938, -0.07598114013671875, -0.07362747192382812, -0.0712738037109375, -0.06892013549804688, -0.06656646728515625, -0.06421279907226562, -0.061859130859375, -0.059505462646484375, -0.05715179443359375, -0.054798126220703125, -0.0524444580078125, -0.050090789794921875, -0.04773712158203125, -0.045383453369140625, -0.04302978515625, -0.040676116943359375, -0.03832244873046875, -0.035968780517578125, -0.0336151123046875, -0.031261444091796875, -0.02890777587890625, -0.026554107666015625, -0.024200439453125, -0.021846771240234375, -0.01949310302734375, -0.017139434814453125, -0.0147857666015625, -0.012432098388671875, -0.01007843017578125, -0.007724761962890625, -0.00537109375, -0.003017425537109375, -0.00066375732421875, 0.001689910888671875, 0.0040435791015625, 0.006397247314453125, 0.00875091552734375, 0.011104583740234375, 0.013458251953125, 0.015811920166015625, 0.01816558837890625, 0.020519256591796875, 0.0228729248046875, 0.025226593017578125, 0.02758026123046875, 0.029933929443359375, 0.03228759765625, 0.034641265869140625, 0.03699493408203125, 0.039348602294921875, 0.0417022705078125, 0.044055938720703125, 0.04640960693359375, 0.048763275146484375, 0.051116943359375, 0.053470611572265625, 0.05582427978515625, 0.058177947998046875, 0.0605316162109375, 0.06288528442382812, 0.06523895263671875, 0.06759262084960938, 0.0699462890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 5.0, 6.0, 8.0, 14.0, 14.0, 14.0, 21.0, 21.0, 24.0, 24.0, 30.0, 34.0, 35.0, 49.0, 40.0, 44.0, 40.0, 47.0, 45.0, 61.0, 53.0, 37.0, 39.0, 36.0, 42.0, 28.0, 33.0, 18.0, 25.0, 13.0, 14.0, 16.0, 13.0, 14.0, 5.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.693145751953125, -0.66949462890625, -0.645843505859375, -0.6221923828125, -0.598541259765625, -0.57489013671875, -0.551239013671875, -0.527587890625, -0.503936767578125, -0.48028564453125, -0.456634521484375, -0.4329833984375, -0.409332275390625, -0.38568115234375, -0.362030029296875, -0.33837890625, -0.314727783203125, -0.29107666015625, -0.267425537109375, -0.2437744140625, -0.220123291015625, -0.19647216796875, -0.172821044921875, -0.149169921875, -0.125518798828125, -0.10186767578125, -0.078216552734375, -0.0545654296875, -0.030914306640625, -0.00726318359375, 0.016387939453125, 0.0400390625, 0.063690185546875, 0.08734130859375, 0.110992431640625, 0.1346435546875, 0.158294677734375, 0.18194580078125, 0.205596923828125, 0.229248046875, 0.252899169921875, 0.27655029296875, 0.300201416015625, 0.3238525390625, 0.347503662109375, 0.37115478515625, 0.394805908203125, 0.41845703125, 0.442108154296875, 0.46575927734375, 0.489410400390625, 0.5130615234375, 0.536712646484375, 0.56036376953125, 0.584014892578125, 0.607666015625, 0.631317138671875, 0.65496826171875, 0.678619384765625, 0.7022705078125, 0.725921630859375, 0.74957275390625, 0.773223876953125, 0.796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 8.0, 8.0, 7.0, 14.0, 28.0, 45.0, 57.0, 117.0, 205.0, 363.0, 668.0, 1424.0, 3226.0, 8840.0, 29693.0, 122217.0, 401842.0, 348314.0, 95024.0, 23568.0, 7376.0, 2794.0, 1295.0, 616.0, 346.0, 183.0, 109.0, 59.0, 34.0, 24.0, 20.0, 6.0, 14.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04461669921875, -0.043261051177978516, -0.04190540313720703, -0.04054975509643555, -0.03919410705566406, -0.03783845901489258, -0.036482810974121094, -0.03512716293334961, -0.033771514892578125, -0.03241586685180664, -0.031060218811035156, -0.029704570770263672, -0.028348922729492188, -0.026993274688720703, -0.02563762664794922, -0.024281978607177734, -0.02292633056640625, -0.021570682525634766, -0.02021503448486328, -0.018859386444091797, -0.017503738403320312, -0.016148090362548828, -0.014792442321777344, -0.01343679428100586, -0.012081146240234375, -0.01072549819946289, -0.009369850158691406, -0.008014202117919922, -0.0066585540771484375, -0.005302906036376953, -0.003947257995605469, -0.0025916099548339844, -0.0012359619140625, 0.00011968612670898438, 0.0014753341674804688, 0.002830982208251953, 0.0041866302490234375, 0.005542278289794922, 0.006897926330566406, 0.00825357437133789, 0.009609222412109375, 0.01096487045288086, 0.012320518493652344, 0.013676166534423828, 0.015031814575195312, 0.016387462615966797, 0.01774311065673828, 0.019098758697509766, 0.02045440673828125, 0.021810054779052734, 0.02316570281982422, 0.024521350860595703, 0.025876998901367188, 0.027232646942138672, 0.028588294982910156, 0.02994394302368164, 0.031299591064453125, 0.03265523910522461, 0.034010887145996094, 0.03536653518676758, 0.03672218322753906, 0.03807783126831055, 0.03943347930908203, 0.040789127349853516, 0.042144775390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 12.0, 7.0, 9.0, 23.0, 28.0, 30.0, 52.0, 43.0, 67.0, 57.0, 68.0, 77.0, 67.0, 71.0, 75.0, 72.0, 46.0, 34.0, 37.0, 38.0, 27.0, 18.0, 14.0, 9.0, 3.0, 10.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6033649444580078e-05, -1.5533529222011566e-05, -1.5033408999443054e-05, -1.4533288776874542e-05, -1.403316855430603e-05, -1.3533048331737518e-05, -1.3032928109169006e-05, -1.2532807886600494e-05, -1.2032687664031982e-05, -1.153256744146347e-05, -1.1032447218894958e-05, -1.0532326996326447e-05, -1.0032206773757935e-05, -9.532086551189423e-06, -9.03196632862091e-06, -8.531846106052399e-06, -8.031725883483887e-06, -7.531605660915375e-06, -7.031485438346863e-06, -6.531365215778351e-06, -6.031244993209839e-06, -5.531124770641327e-06, -5.031004548072815e-06, -4.530884325504303e-06, -4.030764102935791e-06, -3.530643880367279e-06, -3.030523657798767e-06, -2.530403435230255e-06, -2.030283212661743e-06, -1.5301629900932312e-06, -1.0300427675247192e-06, -5.299225449562073e-07, -2.9802322387695312e-08, 4.7031790018081665e-07, 9.704381227493286e-07, 1.4705583453178406e-06, 1.9706785678863525e-06, 2.4707987904548645e-06, 2.9709190130233765e-06, 3.4710392355918884e-06, 3.9711594581604e-06, 4.471279680728912e-06, 4.971399903297424e-06, 5.471520125865936e-06, 5.971640348434448e-06, 6.47176057100296e-06, 6.971880793571472e-06, 7.472001016139984e-06, 7.972121238708496e-06, 8.472241461277008e-06, 8.97236168384552e-06, 9.472481906414032e-06, 9.972602128982544e-06, 1.0472722351551056e-05, 1.0972842574119568e-05, 1.147296279668808e-05, 1.1973083019256592e-05, 1.2473203241825104e-05, 1.2973323464393616e-05, 1.3473443686962128e-05, 1.397356390953064e-05, 1.4473684132099152e-05, 1.4973804354667664e-05, 1.5473924577236176e-05, 1.5974044799804688e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 13.0, 7.0, 8.0, 10.0, 13.0, 24.0, 27.0, 53.0, 61.0, 75.0, 119.0, 191.0, 265.0, 444.0, 738.0, 1553.0, 3151.0, 7388.0, 20451.0, 63694.0, 205962.0, 402738.0, 230457.0, 72356.0, 23173.0, 8148.0, 3445.0, 1705.0, 828.0, 508.0, 292.0, 189.0, 135.0, 94.0, 58.0, 42.0, 35.0, 28.0, 18.0, 8.0, 12.0, 8.0, 10.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.041107177734375, -0.039844512939453125, -0.03858184814453125, -0.037319183349609375, -0.0360565185546875, -0.034793853759765625, -0.03353118896484375, -0.032268524169921875, -0.031005859375, -0.029743194580078125, -0.02848052978515625, -0.027217864990234375, -0.0259552001953125, -0.024692535400390625, -0.02342987060546875, -0.022167205810546875, -0.020904541015625, -0.019641876220703125, -0.01837921142578125, -0.017116546630859375, -0.0158538818359375, -0.014591217041015625, -0.01332855224609375, -0.012065887451171875, -0.01080322265625, -0.009540557861328125, -0.00827789306640625, -0.007015228271484375, -0.0057525634765625, -0.004489898681640625, -0.00322723388671875, -0.001964569091796875, -0.000701904296875, 0.000560760498046875, 0.00182342529296875, 0.003086090087890625, 0.0043487548828125, 0.005611419677734375, 0.00687408447265625, 0.008136749267578125, 0.0093994140625, 0.010662078857421875, 0.01192474365234375, 0.013187408447265625, 0.0144500732421875, 0.015712738037109375, 0.01697540283203125, 0.018238067626953125, 0.019500732421875, 0.020763397216796875, 0.02202606201171875, 0.023288726806640625, 0.0245513916015625, 0.025814056396484375, 0.02707672119140625, 0.028339385986328125, 0.02960205078125, 0.030864715576171875, 0.03212738037109375, 0.033390045166015625, 0.0346527099609375, 0.035915374755859375, 0.03717803955078125, 0.038440704345703125, 0.039703369140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 11.0, 8.0, 15.0, 21.0, 22.0, 27.0, 41.0, 46.0, 37.0, 39.0, 61.0, 56.0, 62.0, 68.0, 58.0, 60.0, 61.0, 51.0, 33.0, 50.0, 34.0, 23.0, 25.0, 15.0, 16.0, 10.0, 9.0, 6.0, 4.0, 4.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00968170166015625, -0.009288549423217773, -0.008895397186279297, -0.00850224494934082, -0.008109092712402344, -0.007715940475463867, -0.007322788238525391, -0.006929636001586914, -0.0065364837646484375, -0.006143331527709961, -0.005750179290771484, -0.005357027053833008, -0.004963874816894531, -0.004570722579956055, -0.004177570343017578, -0.0037844181060791016, -0.003391265869140625, -0.0029981136322021484, -0.002604961395263672, -0.0022118091583251953, -0.0018186569213867188, -0.0014255046844482422, -0.0010323524475097656, -0.0006392002105712891, -0.0002460479736328125, 0.00014710426330566406, 0.0005402565002441406, 0.0009334087371826172, 0.0013265609741210938, 0.0017197132110595703, 0.002112865447998047, 0.0025060176849365234, 0.002899169921875, 0.0032923221588134766, 0.003685474395751953, 0.00407862663269043, 0.004471778869628906, 0.004864931106567383, 0.005258083343505859, 0.005651235580444336, 0.0060443878173828125, 0.006437540054321289, 0.006830692291259766, 0.007223844528198242, 0.007616996765136719, 0.008010149002075195, 0.008403301239013672, 0.008796453475952148, 0.009189605712890625, 0.009582757949829102, 0.009975910186767578, 0.010369062423706055, 0.010762214660644531, 0.011155366897583008, 0.011548519134521484, 0.011941671371459961, 0.012334823608398438, 0.012727975845336914, 0.01312112808227539, 0.013514280319213867, 0.013907432556152344, 0.01430058479309082, 0.014693737030029297, 0.015086889266967773, 0.01548004150390625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 13.0, 18.0, 31.0, 54.0, 80.0, 119.0, 137.0, 166.0, 142.0, 93.0, 67.0, 30.0, 18.0, 13.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.830352246761322, -0.802791953086853, -0.775231659412384, -0.747671365737915, -0.7201110124588013, -0.692550778388977, -0.6649904251098633, -0.6374301314353943, -0.6098698377609253, -0.5823095440864563, -0.5547492504119873, -0.5271889567375183, -0.49962863326072693, -0.47206833958625793, -0.44450801610946655, -0.41694772243499756, -0.38938742876052856, -0.36182713508605957, -0.3342668414115906, -0.3067065179347992, -0.2791462242603302, -0.2515859305858612, -0.22402562201023102, -0.19646531343460083, -0.16890501976013184, -0.14134472608566284, -0.11378441751003265, -0.08622411638498306, -0.05866381525993347, -0.031103521585464478, -0.0035432130098342896, 0.0240170955657959, 0.05157744884490967, 0.07913774996995926, 0.10669805109500885, 0.13425835967063904, 0.16181865334510803, 0.18937894701957703, 0.21693925559520721, 0.2444995641708374, 0.2720598578453064, 0.2996201515197754, 0.3271804451942444, 0.35474076867103577, 0.38230106234550476, 0.40986135601997375, 0.43742167949676514, 0.46498197317123413, 0.4925422668457031, 0.5201025605201721, 0.5476628541946411, 0.5752231478691101, 0.6027834415435791, 0.6303437948226929, 0.6579040884971619, 0.6854643821716309, 0.7130246758460999, 0.7405849695205688, 0.7681452631950378, 0.7957055568695068, 0.8232659101486206, 0.8508261442184448, 0.8783864974975586, 0.9059467911720276, 0.9335070848464966]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 9.0, 4.0, 6.0, 16.0, 14.0, 7.0, 19.0, 21.0, 15.0, 23.0, 21.0, 29.0, 31.0, 33.0, 37.0, 35.0, 42.0, 46.0, 37.0, 46.0, 51.0, 47.0, 39.0, 39.0, 37.0, 47.0, 36.0, 24.0, 31.0, 24.0, 17.0, 19.0, 12.0, 14.0, 16.0, 12.0, 8.0, 7.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30832287669181824, -0.2980031967163086, -0.28768354654312134, -0.2773638963699341, -0.26704421639442444, -0.2567245364189148, -0.24640488624572754, -0.2360852211713791, -0.22576555609703064, -0.2154458910226822, -0.20512622594833374, -0.1948065608739853, -0.18448689579963684, -0.1741672307252884, -0.16384756565093994, -0.1535279005765915, -0.14320823550224304, -0.1328885704278946, -0.12256890535354614, -0.11224924027919769, -0.10192957520484924, -0.0916099101305008, -0.08129024505615234, -0.0709705799818039, -0.060650914907455444, -0.050331249833106995, -0.040011584758758545, -0.029691919684410095, -0.019372254610061646, -0.009052589535713196, 0.001267075538635254, 0.011586740612983704, 0.021906375885009766, 0.032226040959358215, 0.042545706033706665, 0.052865371108055115, 0.06318503618240356, 0.07350470125675201, 0.08382436633110046, 0.09414403140544891, 0.10446369647979736, 0.11478336155414581, 0.12510302662849426, 0.1354226917028427, 0.14574235677719116, 0.1560620218515396, 0.16638168692588806, 0.1767013520002365, 0.18702101707458496, 0.1973406821489334, 0.20766034722328186, 0.2179800122976303, 0.22829967737197876, 0.2386193424463272, 0.24893900752067566, 0.2592586874961853, 0.26957833766937256, 0.2798979878425598, 0.29021766781806946, 0.3005373477935791, 0.31085699796676636, 0.3211766481399536, 0.33149632811546326, 0.3418160080909729, 0.35213565826416016]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 12.0, 15.0, 18.0, 26.0, 59.0, 78.0, 140.0, 197.0, 285.0, 586.0, 1002.0, 1893.0, 3630.0, 7239.0, 14951.0, 34291.0, 87687.0, 287252.0, 403923.0, 122534.0, 44832.0, 19209.0, 9009.0, 4471.0, 2262.0, 1269.0, 697.0, 376.0, 192.0, 141.0, 97.0, 59.0, 38.0, 35.0, 18.0, 11.0, 6.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.323486328125, -0.31453895568847656, -0.3055915832519531, -0.2966442108154297, -0.28769683837890625, -0.2787494659423828, -0.2698020935058594, -0.26085472106933594, -0.2519073486328125, -0.24295997619628906, -0.23401260375976562, -0.2250652313232422, -0.21611785888671875, -0.2071704864501953, -0.19822311401367188, -0.18927574157714844, -0.180328369140625, -0.17138099670410156, -0.16243362426757812, -0.1534862518310547, -0.14453887939453125, -0.1355915069580078, -0.12664413452148438, -0.11769676208496094, -0.1087493896484375, -0.09980201721191406, -0.09085464477539062, -0.08190727233886719, -0.07295989990234375, -0.06401252746582031, -0.055065155029296875, -0.04611778259277344, -0.03717041015625, -0.028223037719726562, -0.019275665283203125, -0.010328292846679688, -0.00138092041015625, 0.0075664520263671875, 0.016513824462890625, 0.025461196899414062, 0.0344085693359375, 0.04335594177246094, 0.052303314208984375, 0.06125068664550781, 0.07019805908203125, 0.07914543151855469, 0.08809280395507812, 0.09704017639160156, 0.105987548828125, 0.11493492126464844, 0.12388229370117188, 0.1328296661376953, 0.14177703857421875, 0.1507244110107422, 0.15967178344726562, 0.16861915588378906, 0.1775665283203125, 0.18651390075683594, 0.19546127319335938, 0.2044086456298828, 0.21335601806640625, 0.2223033905029297, 0.23125076293945312, 0.24019813537597656, 0.2491455078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 2.0, 2.0, 6.0, 5.0, 5.0, 11.0, 9.0, 16.0, 7.0, 16.0, 15.0, 21.0, 20.0, 22.0, 19.0, 29.0, 34.0, 37.0, 28.0, 36.0, 35.0, 38.0, 37.0, 38.0, 49.0, 42.0, 44.0, 33.0, 42.0, 34.0, 47.0, 24.0, 27.0, 21.0, 23.0, 23.0, 14.0, 13.0, 21.0, 9.0, 12.0, 5.0, 2.0, 9.0, 7.0, 1.0, 2.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.57373046875, -0.5545272827148438, -0.5353240966796875, -0.5161209106445312, -0.496917724609375, -0.47771453857421875, -0.4585113525390625, -0.43930816650390625, -0.42010498046875, -0.40090179443359375, -0.3816986083984375, -0.36249542236328125, -0.343292236328125, -0.32408905029296875, -0.3048858642578125, -0.28568267822265625, -0.2664794921875, -0.24727630615234375, -0.2280731201171875, -0.20886993408203125, -0.189666748046875, -0.17046356201171875, -0.1512603759765625, -0.13205718994140625, -0.11285400390625, -0.09365081787109375, -0.0744476318359375, -0.05524444580078125, -0.036041259765625, -0.01683807373046875, 0.0023651123046875, 0.02156829833984375, 0.040771484375, 0.05997467041015625, 0.0791778564453125, 0.09838104248046875, 0.117584228515625, 0.13678741455078125, 0.1559906005859375, 0.17519378662109375, 0.19439697265625, 0.21360015869140625, 0.2328033447265625, 0.25200653076171875, 0.271209716796875, 0.29041290283203125, 0.3096160888671875, 0.32881927490234375, 0.3480224609375, 0.36722564697265625, 0.3864288330078125, 0.40563201904296875, 0.424835205078125, 0.44403839111328125, 0.4632415771484375, 0.48244476318359375, 0.50164794921875, 0.5208511352539062, 0.5400543212890625, 0.5592575073242188, 0.578460693359375, 0.5976638793945312, 0.6168670654296875, 0.6360702514648438, 0.6552734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 8.0, 10.0, 6.0, 15.0, 18.0, 24.0, 45.0, 68.0, 96.0, 136.0, 267.0, 591.0, 2423.0, 21864.0, 696857.0, 310877.0, 12430.0, 1671.0, 521.0, 241.0, 142.0, 93.0, 43.0, 35.0, 18.0, 18.0, 14.0, 9.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0517578125, -1.0216140747070312, -0.9914703369140625, -0.9613265991210938, -0.931182861328125, -0.9010391235351562, -0.8708953857421875, -0.8407516479492188, -0.81060791015625, -0.7804641723632812, -0.7503204345703125, -0.7201766967773438, -0.690032958984375, -0.6598892211914062, -0.6297454833984375, -0.5996017456054688, -0.5694580078125, -0.5393142700195312, -0.5091705322265625, -0.47902679443359375, -0.448883056640625, -0.41873931884765625, -0.3885955810546875, -0.35845184326171875, -0.32830810546875, -0.29816436767578125, -0.2680206298828125, -0.23787689208984375, -0.207733154296875, -0.17758941650390625, -0.1474456787109375, -0.11730194091796875, -0.087158203125, -0.05701446533203125, -0.0268707275390625, 0.00327301025390625, 0.033416748046875, 0.06356048583984375, 0.0937042236328125, 0.12384796142578125, 0.15399169921875, 0.18413543701171875, 0.2142791748046875, 0.24442291259765625, 0.274566650390625, 0.30471038818359375, 0.3348541259765625, 0.36499786376953125, 0.3951416015625, 0.42528533935546875, 0.4554290771484375, 0.48557281494140625, 0.515716552734375, 0.5458602905273438, 0.5760040283203125, 0.6061477661132812, 0.63629150390625, 0.6664352416992188, 0.6965789794921875, 0.7267227172851562, 0.756866455078125, 0.7870101928710938, 0.8171539306640625, 0.8472976684570312, 0.87744140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 6.0, 6.0, 6.0, 7.0, 15.0, 12.0, 12.0, 15.0, 13.0, 26.0, 20.0, 30.0, 38.0, 36.0, 43.0, 49.0, 32.0, 52.0, 41.0, 44.0, 39.0, 41.0, 46.0, 55.0, 35.0, 50.0, 34.0, 29.0, 23.0, 21.0, 22.0, 17.0, 22.0, 10.0, 13.0, 4.0, 4.0, 4.0, 10.0, 3.0, 4.0, 4.0, 0.0, 3.0, 0.0, 3.0, 3.0], "bins": [-0.9736328125, -0.9471435546875, -0.920654296875, -0.8941650390625, -0.86767578125, -0.8411865234375, -0.814697265625, -0.7882080078125, -0.76171875, -0.7352294921875, -0.708740234375, -0.6822509765625, -0.65576171875, -0.6292724609375, -0.602783203125, -0.5762939453125, -0.5498046875, -0.5233154296875, -0.496826171875, -0.4703369140625, -0.44384765625, -0.4173583984375, -0.390869140625, -0.3643798828125, -0.337890625, -0.3114013671875, -0.284912109375, -0.2584228515625, -0.23193359375, -0.2054443359375, -0.178955078125, -0.1524658203125, -0.1259765625, -0.0994873046875, -0.072998046875, -0.0465087890625, -0.02001953125, 0.0064697265625, 0.032958984375, 0.0594482421875, 0.0859375, 0.1124267578125, 0.138916015625, 0.1654052734375, 0.19189453125, 0.2183837890625, 0.244873046875, 0.2713623046875, 0.2978515625, 0.3243408203125, 0.350830078125, 0.3773193359375, 0.40380859375, 0.4302978515625, 0.456787109375, 0.4832763671875, 0.509765625, 0.5362548828125, 0.562744140625, 0.5892333984375, 0.61572265625, 0.6422119140625, 0.668701171875, 0.6951904296875, 0.7216796875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 11.0, 15.0, 24.0, 44.0, 75.0, 154.0, 267.0, 611.0, 2062.0, 11138.0, 268824.0, 737544.0, 23060.0, 3045.0, 838.0, 394.0, 189.0, 84.0, 52.0, 35.0, 21.0, 18.0, 8.0, 3.0, 6.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.330322265625, -0.3197174072265625, -0.309112548828125, -0.2985076904296875, -0.28790283203125, -0.2772979736328125, -0.266693115234375, -0.2560882568359375, -0.2454833984375, -0.2348785400390625, -0.224273681640625, -0.2136688232421875, -0.20306396484375, -0.1924591064453125, -0.181854248046875, -0.1712493896484375, -0.16064453125, -0.1500396728515625, -0.139434814453125, -0.1288299560546875, -0.11822509765625, -0.1076202392578125, -0.097015380859375, -0.0864105224609375, -0.0758056640625, -0.0652008056640625, -0.054595947265625, -0.0439910888671875, -0.03338623046875, -0.0227813720703125, -0.012176513671875, -0.0015716552734375, 0.009033203125, 0.0196380615234375, 0.030242919921875, 0.0408477783203125, 0.05145263671875, 0.0620574951171875, 0.072662353515625, 0.0832672119140625, 0.0938720703125, 0.1044769287109375, 0.115081787109375, 0.1256866455078125, 0.13629150390625, 0.1468963623046875, 0.157501220703125, 0.1681060791015625, 0.1787109375, 0.1893157958984375, 0.199920654296875, 0.2105255126953125, 0.22113037109375, 0.2317352294921875, 0.242340087890625, 0.2529449462890625, 0.2635498046875, 0.2741546630859375, 0.284759521484375, 0.2953643798828125, 0.30596923828125, 0.3165740966796875, 0.327178955078125, 0.3377838134765625, 0.348388671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 2.0, 8.0, 12.0, 4.0, 20.0, 18.0, 28.0, 40.0, 52.0, 83.0, 87.0, 126.0, 125.0, 109.0, 81.0, 43.0, 38.0, 24.0, 19.0, 12.0, 14.0, 10.0, 12.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.002716064453125e-05, -1.9253231585025787e-05, -1.8479302525520325e-05, -1.7705373466014862e-05, -1.69314444065094e-05, -1.6157515347003937e-05, -1.5383586287498474e-05, -1.4609657227993011e-05, -1.3835728168487549e-05, -1.3061799108982086e-05, -1.2287870049476624e-05, -1.1513940989971161e-05, -1.0740011930465698e-05, -9.966082870960236e-06, -9.192153811454773e-06, -8.41822475194931e-06, -7.644295692443848e-06, -6.870366632938385e-06, -6.096437573432922e-06, -5.32250851392746e-06, -4.548579454421997e-06, -3.7746503949165344e-06, -3.0007213354110718e-06, -2.226792275905609e-06, -1.4528632164001465e-06, -6.789341568946838e-07, 9.499490261077881e-08, 8.689239621162415e-07, 1.642853021621704e-06, 2.4167820811271667e-06, 3.1907111406326294e-06, 3.964640200138092e-06, 4.738569259643555e-06, 5.512498319149017e-06, 6.28642737865448e-06, 7.060356438159943e-06, 7.834285497665405e-06, 8.608214557170868e-06, 9.38214361667633e-06, 1.0156072676181793e-05, 1.0930001735687256e-05, 1.1703930795192719e-05, 1.2477859854698181e-05, 1.3251788914203644e-05, 1.4025717973709106e-05, 1.4799647033214569e-05, 1.5573576092720032e-05, 1.6347505152225494e-05, 1.7121434211730957e-05, 1.789536327123642e-05, 1.8669292330741882e-05, 1.9443221390247345e-05, 2.0217150449752808e-05, 2.099107950925827e-05, 2.1765008568763733e-05, 2.2538937628269196e-05, 2.3312866687774658e-05, 2.408679574728012e-05, 2.4860724806785583e-05, 2.5634653866291046e-05, 2.640858292579651e-05, 2.718251198530197e-05, 2.7956441044807434e-05, 2.8730370104312897e-05, 2.950429916381836e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 3.0, 8.0, 6.0, 9.0, 16.0, 25.0, 42.0, 57.0, 137.0, 208.0, 368.0, 749.0, 2019.0, 7919.0, 117654.0, 865814.0, 45675.0, 4956.0, 1526.0, 611.0, 301.0, 173.0, 93.0, 68.0, 36.0, 16.0, 17.0, 6.0, 12.0, 5.0, 7.0, 3.0, 0.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.2836723327636719, -0.27291107177734375, -0.2621498107910156, -0.2513885498046875, -0.24062728881835938, -0.22986602783203125, -0.21910476684570312, -0.208343505859375, -0.19758224487304688, -0.18682098388671875, -0.17605972290039062, -0.1652984619140625, -0.15453720092773438, -0.14377593994140625, -0.13301467895507812, -0.12225341796875, -0.11149215698242188, -0.10073089599609375, -0.08996963500976562, -0.0792083740234375, -0.06844711303710938, -0.05768585205078125, -0.046924591064453125, -0.036163330078125, -0.025402069091796875, -0.01464080810546875, -0.003879547119140625, 0.0068817138671875, 0.017642974853515625, 0.02840423583984375, 0.039165496826171875, 0.0499267578125, 0.060688018798828125, 0.07144927978515625, 0.08221054077148438, 0.0929718017578125, 0.10373306274414062, 0.11449432373046875, 0.12525558471679688, 0.136016845703125, 0.14677810668945312, 0.15753936767578125, 0.16830062866210938, 0.1790618896484375, 0.18982315063476562, 0.20058441162109375, 0.21134567260742188, 0.22210693359375, 0.23286819458007812, 0.24362945556640625, 0.2543907165527344, 0.2651519775390625, 0.2759132385253906, 0.28667449951171875, 0.2974357604980469, 0.308197021484375, 0.3189582824707031, 0.32971954345703125, 0.3404808044433594, 0.3512420654296875, 0.3620033264160156, 0.37276458740234375, 0.3835258483886719, 0.394287109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 15.0, 13.0, 26.0, 28.0, 43.0, 80.0, 92.0, 128.0, 141.0, 128.0, 78.0, 68.0, 42.0, 44.0, 17.0, 10.0, 11.0, 7.0, 6.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140869140625, -0.13730716705322266, -0.1337451934814453, -0.13018321990966797, -0.12662124633789062, -0.12305927276611328, -0.11949729919433594, -0.1159353256225586, -0.11237335205078125, -0.1088113784790039, -0.10524940490722656, -0.10168743133544922, -0.09812545776367188, -0.09456348419189453, -0.09100151062011719, -0.08743953704833984, -0.0838775634765625, -0.08031558990478516, -0.07675361633300781, -0.07319164276123047, -0.06962966918945312, -0.06606769561767578, -0.06250572204589844, -0.058943748474121094, -0.05538177490234375, -0.051819801330566406, -0.04825782775878906, -0.04469585418701172, -0.041133880615234375, -0.03757190704345703, -0.03400993347167969, -0.030447959899902344, -0.026885986328125, -0.023324012756347656, -0.019762039184570312, -0.01620006561279297, -0.012638092041015625, -0.009076118469238281, -0.0055141448974609375, -0.0019521713256835938, 0.00160980224609375, 0.005171775817871094, 0.008733749389648438, 0.012295722961425781, 0.015857696533203125, 0.01941967010498047, 0.022981643676757812, 0.026543617248535156, 0.0301055908203125, 0.033667564392089844, 0.03722953796386719, 0.04079151153564453, 0.044353485107421875, 0.04791545867919922, 0.05147743225097656, 0.055039405822753906, 0.05860137939453125, 0.062163352966308594, 0.06572532653808594, 0.06928730010986328, 0.07284927368164062, 0.07641124725341797, 0.07997322082519531, 0.08353519439697266, 0.08709716796875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 10.0, 17.0, 30.0, 52.0, 86.0, 144.0, 194.0, 209.0, 127.0, 73.0, 33.0, 19.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3770989179611206, -1.3074686527252197, -1.2378385066986084, -1.1682082414627075, -1.0985779762268066, -1.0289478302001953, -0.9593175649642944, -0.8896872997283936, -0.8200570940971375, -0.7504268884658813, -0.6807966232299805, -0.6111664175987244, -0.5415362119674683, -0.4719059467315674, -0.4022757411003113, -0.3326455056667328, -0.2630152702331543, -0.1933850347995758, -0.12375481426715851, -0.05412459373474121, 0.01550564169883728, 0.08513587713241577, 0.15476608276367188, 0.22439631819725037, 0.29402655363082886, 0.36365678906440735, 0.43328702449798584, 0.5029172301292419, 0.572547435760498, 0.6421777009963989, 0.711807906627655, 0.7814381122589111, 0.8510684967041016, 0.9206987023353577, 0.9903289675712585, 1.0599591732025146, 1.1295894384384155, 1.1992197036743164, 1.2688498497009277, 1.3384801149368286, 1.4081103801727295, 1.4777406454086304, 1.5473707914352417, 1.6170010566711426, 1.6866313219070435, 1.7562615871429443, 1.8258917331695557, 1.8955219984054565, 1.9651521444320679, 2.0347824096679688, 2.10441255569458, 2.1740427017211914, 2.243673086166382, 2.313303232192993, 2.3829336166381836, 2.452563762664795, 2.5221939086914062, 2.5918240547180176, 2.661454439163208, 2.7310845851898193, 2.8007147312164307, 2.870345115661621, 2.9399752616882324, 3.0096054077148438, 3.079235792160034]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 4.0, 5.0, 7.0, 8.0, 13.0, 17.0, 10.0, 14.0, 19.0, 27.0, 25.0, 20.0, 34.0, 33.0, 37.0, 38.0, 35.0, 38.0, 41.0, 44.0, 43.0, 43.0, 46.0, 39.0, 37.0, 38.0, 41.0, 33.0, 32.0, 23.0, 18.0, 21.0, 12.0, 22.0, 15.0, 15.0, 14.0, 12.0, 7.0, 1.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.158236026763916, -1.1192200183868408, -1.080203890800476, -1.0411878824234009, -1.0021718740463257, -0.9631558060646057, -0.9241397380828857, -0.8851237297058105, -0.8461077213287354, -0.8070916533470154, -0.7680756449699402, -0.7290595769882202, -0.690043568611145, -0.651027500629425, -0.6120114326477051, -0.5729954242706299, -0.5339793562889099, -0.49496331810951233, -0.45594727993011475, -0.4169312119483948, -0.3779152035713196, -0.3388991355895996, -0.299883097410202, -0.26086705923080444, -0.22185102105140686, -0.18283498287200928, -0.1438189446926117, -0.10480289161205292, -0.06578685343265533, -0.02677081525325775, 0.012245237827301025, 0.05126127600669861, 0.09027731418609619, 0.12929335236549377, 0.16830939054489136, 0.20732544362545013, 0.24634148180484772, 0.2853575348854065, 0.3243735730648041, 0.36338961124420166, 0.40240564942359924, 0.4414216876029968, 0.4804377257823944, 0.519453763961792, 0.558469831943512, 0.5974858403205872, 0.6365019083023071, 0.6755179166793823, 0.7145339846611023, 0.7535500526428223, 0.7925660610198975, 0.8315821290016174, 0.8705981373786926, 0.9096142053604126, 0.9486302137374878, 0.9876462817192078, 1.0266623497009277, 1.065678358078003, 1.1046944856643677, 1.1437104940414429, 1.182726502418518, 1.2217425107955933, 1.260758638381958, 1.2997746467590332, 1.3387906551361084]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 6.0, 10.0, 12.0, 18.0, 26.0, 63.0, 78.0, 141.0, 264.0, 581.0, 1299.0, 3818.0, 14855.0, 104714.0, 1224940.0, 2498569.0, 303719.0, 30990.0, 6540.0, 2020.0, 781.0, 349.0, 167.0, 118.0, 59.0, 42.0, 31.0, 22.0, 12.0, 8.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.900390625, -0.8724441528320312, -0.8444976806640625, -0.8165512084960938, -0.788604736328125, -0.7606582641601562, -0.7327117919921875, -0.7047653198242188, -0.67681884765625, -0.6488723754882812, -0.6209259033203125, -0.5929794311523438, -0.565032958984375, -0.5370864868164062, -0.5091400146484375, -0.48119354248046875, -0.4532470703125, -0.42530059814453125, -0.3973541259765625, -0.36940765380859375, -0.341461181640625, -0.31351470947265625, -0.2855682373046875, -0.25762176513671875, -0.22967529296875, -0.20172882080078125, -0.1737823486328125, -0.14583587646484375, -0.117889404296875, -0.08994293212890625, -0.0619964599609375, -0.03404998779296875, -0.006103515625, 0.02184295654296875, 0.0497894287109375, 0.07773590087890625, 0.105682373046875, 0.13362884521484375, 0.1615753173828125, 0.18952178955078125, 0.21746826171875, 0.24541473388671875, 0.2733612060546875, 0.30130767822265625, 0.329254150390625, 0.35720062255859375, 0.3851470947265625, 0.41309356689453125, 0.4410400390625, 0.46898651123046875, 0.4969329833984375, 0.5248794555664062, 0.552825927734375, 0.5807723999023438, 0.6087188720703125, 0.6366653442382812, 0.66461181640625, 0.6925582885742188, 0.7205047607421875, 0.7484512329101562, 0.776397705078125, 0.8043441772460938, 0.8322906494140625, 0.8602371215820312, 0.88818359375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 6.0, 10.0, 6.0, 10.0, 8.0, 16.0, 17.0, 17.0, 20.0, 25.0, 19.0, 21.0, 29.0, 30.0, 54.0, 29.0, 45.0, 44.0, 35.0, 46.0, 42.0, 52.0, 35.0, 47.0, 35.0, 33.0, 38.0, 28.0, 27.0, 31.0, 22.0, 20.0, 13.0, 15.0, 15.0, 11.0, 13.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.435546875, -0.4223480224609375, -0.409149169921875, -0.3959503173828125, -0.38275146484375, -0.3695526123046875, -0.356353759765625, -0.3431549072265625, -0.3299560546875, -0.3167572021484375, -0.303558349609375, -0.2903594970703125, -0.27716064453125, -0.2639617919921875, -0.250762939453125, -0.2375640869140625, -0.224365234375, -0.2111663818359375, -0.197967529296875, -0.1847686767578125, -0.17156982421875, -0.1583709716796875, -0.145172119140625, -0.1319732666015625, -0.1187744140625, -0.1055755615234375, -0.092376708984375, -0.0791778564453125, -0.06597900390625, -0.0527801513671875, -0.039581298828125, -0.0263824462890625, -0.01318359375, 1.52587890625e-05, 0.013214111328125, 0.0264129638671875, 0.03961181640625, 0.0528106689453125, 0.066009521484375, 0.0792083740234375, 0.0924072265625, 0.1056060791015625, 0.118804931640625, 0.1320037841796875, 0.14520263671875, 0.1584014892578125, 0.171600341796875, 0.1847991943359375, 0.197998046875, 0.2111968994140625, 0.224395751953125, 0.2375946044921875, 0.25079345703125, 0.2639923095703125, 0.277191162109375, 0.2903900146484375, 0.3035888671875, 0.3167877197265625, 0.329986572265625, 0.3431854248046875, 0.35638427734375, 0.3695831298828125, 0.382781982421875, 0.3959808349609375, 0.4091796875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 5.0, 7.0, 8.0, 23.0, 32.0, 45.0, 71.0, 108.0, 197.0, 403.0, 911.0, 2615.0, 10420.0, 73120.0, 1918974.0, 2092384.0, 78789.0, 11244.0, 2873.0, 1008.0, 448.0, 218.0, 110.0, 92.0, 59.0, 44.0, 20.0, 7.0, 8.0, 5.0, 6.0, 8.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8125, -0.7812652587890625, -0.750030517578125, -0.7187957763671875, -0.68756103515625, -0.6563262939453125, -0.625091552734375, -0.5938568115234375, -0.5626220703125, -0.5313873291015625, -0.500152587890625, -0.4689178466796875, -0.43768310546875, -0.4064483642578125, -0.375213623046875, -0.3439788818359375, -0.312744140625, -0.2815093994140625, -0.250274658203125, -0.2190399169921875, -0.18780517578125, -0.1565704345703125, -0.125335693359375, -0.0941009521484375, -0.0628662109375, -0.0316314697265625, -0.000396728515625, 0.0308380126953125, 0.06207275390625, 0.0933074951171875, 0.124542236328125, 0.1557769775390625, 0.18701171875, 0.2182464599609375, 0.249481201171875, 0.2807159423828125, 0.31195068359375, 0.3431854248046875, 0.374420166015625, 0.4056549072265625, 0.4368896484375, 0.4681243896484375, 0.499359130859375, 0.5305938720703125, 0.56182861328125, 0.5930633544921875, 0.624298095703125, 0.6555328369140625, 0.686767578125, 0.7180023193359375, 0.749237060546875, 0.7804718017578125, 0.81170654296875, 0.8429412841796875, 0.874176025390625, 0.9054107666015625, 0.9366455078125, 0.9678802490234375, 0.999114990234375, 1.0303497314453125, 1.06158447265625, 1.0928192138671875, 1.124053955078125, 1.1552886962890625, 1.1865234375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 2.0, 2.0, 7.0, 9.0, 6.0, 9.0, 17.0, 32.0, 34.0, 46.0, 63.0, 73.0, 143.0, 210.0, 275.0, 450.0, 568.0, 545.0, 473.0, 345.0, 249.0, 150.0, 124.0, 68.0, 47.0, 32.0, 30.0, 26.0, 13.0, 10.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.2627696990966797, -0.2555198669433594, -0.24827003479003906, -0.24102020263671875, -0.23377037048339844, -0.22652053833007812, -0.2192707061767578, -0.2120208740234375, -0.2047710418701172, -0.19752120971679688, -0.19027137756347656, -0.18302154541015625, -0.17577171325683594, -0.16852188110351562, -0.1612720489501953, -0.154022216796875, -0.1467723846435547, -0.13952255249023438, -0.13227272033691406, -0.12502288818359375, -0.11777305603027344, -0.11052322387695312, -0.10327339172363281, -0.0960235595703125, -0.08877372741699219, -0.08152389526367188, -0.07427406311035156, -0.06702423095703125, -0.05977439880371094, -0.052524566650390625, -0.04527473449707031, -0.03802490234375, -0.030775070190429688, -0.023525238037109375, -0.016275405883789062, -0.00902557373046875, -0.0017757415771484375, 0.005474090576171875, 0.012723922729492188, 0.0199737548828125, 0.027223587036132812, 0.034473419189453125, 0.04172325134277344, 0.04897308349609375, 0.05622291564941406, 0.06347274780273438, 0.07072257995605469, 0.077972412109375, 0.08522224426269531, 0.09247207641601562, 0.09972190856933594, 0.10697174072265625, 0.11422157287597656, 0.12147140502929688, 0.1287212371826172, 0.1359710693359375, 0.1432209014892578, 0.15047073364257812, 0.15772056579589844, 0.16497039794921875, 0.17222023010253906, 0.17947006225585938, 0.1867198944091797, 0.1939697265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 14.0, 16.0, 27.0, 46.0, 77.0, 104.0, 131.0, 141.0, 145.0, 103.0, 81.0, 46.0, 38.0, 18.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5321861505508423, -1.486545205116272, -1.4409042596817017, -1.3952631950378418, -1.3496222496032715, -1.3039813041687012, -1.2583403587341309, -1.2126994132995605, -1.1670584678649902, -1.12141752243042, -1.0757765769958496, -1.0301356315612793, -0.9844945669174194, -0.9388536214828491, -0.8932126760482788, -0.8475717306137085, -0.8019306659698486, -0.7562897205352783, -0.7106487154960632, -0.6650077700614929, -0.6193667650222778, -0.5737258195877075, -0.5280848741531372, -0.4824438989162445, -0.4368029236793518, -0.3911619484424591, -0.3455209732055664, -0.2998800277709961, -0.2542390525341034, -0.2085980772972107, -0.16295713186264038, -0.11731615662574768, -0.07167518138885498, -0.026034213602542877, 0.019606754183769226, 0.06524771451950073, 0.11088868975639343, 0.15652966499328613, 0.20217061042785645, 0.24781158566474915, 0.29345256090164185, 0.33909353613853455, 0.38473451137542725, 0.43037545680999756, 0.47601643204689026, 0.521657407283783, 0.5672983527183533, 0.6129393577575684, 0.6585803031921387, 0.704221248626709, 0.7498622536659241, 0.7955031991004944, 0.8411442041397095, 0.8867851495742798, 0.9324260950088501, 0.9780670404434204, 1.0237081050872803, 1.0693490505218506, 1.114989995956421, 1.1606309413909912, 1.206272006034851, 1.2519129514694214, 1.2975538969039917, 1.343194842338562, 1.3888357877731323]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 10.0, 4.0, 4.0, 12.0, 10.0, 14.0, 15.0, 15.0, 19.0, 30.0, 26.0, 25.0, 35.0, 44.0, 37.0, 37.0, 34.0, 40.0, 34.0, 52.0, 46.0, 34.0, 37.0, 42.0, 34.0, 44.0, 35.0, 42.0, 26.0, 21.0, 25.0, 18.0, 11.0, 15.0, 14.0, 8.0, 7.0, 12.0, 9.0, 8.0, 5.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4953939616680145, -0.4797289967536926, -0.4640640318393707, -0.44839906692504883, -0.43273407220840454, -0.41706913709640503, -0.40140414237976074, -0.38573917746543884, -0.37007421255111694, -0.35440924763679504, -0.33874428272247314, -0.32307931780815125, -0.30741435289382935, -0.29174935817718506, -0.27608439326286316, -0.26041942834854126, -0.24475446343421936, -0.22908949851989746, -0.21342453360557556, -0.19775955379009247, -0.18209458887577057, -0.16642962396144867, -0.15076464414596558, -0.13509967923164368, -0.11943471431732178, -0.10376974940299988, -0.08810477703809738, -0.07243980467319489, -0.056774839758872986, -0.041109874844551086, -0.02544490247964859, -0.009779930114746094, 0.005885064601898193, 0.02155003324151039, 0.03721500188112259, 0.05287997052073479, 0.06854493916034698, 0.08420990407466888, 0.09987487643957138, 0.11553984880447388, 0.13120481371879578, 0.14686977863311768, 0.16253474354743958, 0.17819972336292267, 0.19386468827724457, 0.20952965319156647, 0.22519463300704956, 0.24085959792137146, 0.25652456283569336, 0.27218952775001526, 0.28785449266433716, 0.30351945757865906, 0.31918442249298096, 0.33484941720962524, 0.35051438212394714, 0.36617934703826904, 0.38184431195259094, 0.39750927686691284, 0.41317424178123474, 0.42883920669555664, 0.4445042014122009, 0.46016913652420044, 0.4758341312408447, 0.4914990961551666, 0.5071640610694885]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 8.0, 9.0, 8.0, 16.0, 22.0, 46.0, 88.0, 142.0, 315.0, 818.0, 2033.0, 6050.0, 23891.0, 155502.0, 656166.0, 168297.0, 25064.0, 6441.0, 2114.0, 815.0, 376.0, 154.0, 84.0, 35.0, 22.0, 9.0, 7.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.238037109375, -0.22997283935546875, -0.2219085693359375, -0.21384429931640625, -0.205780029296875, -0.19771575927734375, -0.1896514892578125, -0.18158721923828125, -0.17352294921875, -0.16545867919921875, -0.1573944091796875, -0.14933013916015625, -0.141265869140625, -0.13320159912109375, -0.1251373291015625, -0.11707305908203125, -0.1090087890625, -0.10094451904296875, -0.0928802490234375, -0.08481597900390625, -0.076751708984375, -0.06868743896484375, -0.0606231689453125, -0.05255889892578125, -0.04449462890625, -0.03643035888671875, -0.0283660888671875, -0.02030181884765625, -0.012237548828125, -0.00417327880859375, 0.0038909912109375, 0.01195526123046875, 0.02001953125, 0.02808380126953125, 0.0361480712890625, 0.04421234130859375, 0.052276611328125, 0.06034088134765625, 0.0684051513671875, 0.07646942138671875, 0.08453369140625, 0.09259796142578125, 0.1006622314453125, 0.10872650146484375, 0.116790771484375, 0.12485504150390625, 0.1329193115234375, 0.14098358154296875, 0.1490478515625, 0.15711212158203125, 0.1651763916015625, 0.17324066162109375, 0.181304931640625, 0.18936920166015625, 0.1974334716796875, 0.20549774169921875, 0.21356201171875, 0.22162628173828125, 0.2296905517578125, 0.23775482177734375, 0.245819091796875, 0.25388336181640625, 0.2619476318359375, 0.27001190185546875, 0.278076171875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 8.0, 10.0, 18.0, 15.0, 16.0, 20.0, 22.0, 25.0, 37.0, 40.0, 47.0, 38.0, 64.0, 51.0, 43.0, 40.0, 59.0, 53.0, 44.0, 51.0, 49.0, 43.0, 28.0, 32.0, 26.0, 17.0, 17.0, 11.0, 9.0, 12.0, 11.0, 3.0, 10.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.4306640625, -0.41888427734375, -0.4071044921875, -0.39532470703125, -0.383544921875, -0.37176513671875, -0.3599853515625, -0.34820556640625, -0.33642578125, -0.32464599609375, -0.3128662109375, -0.30108642578125, -0.289306640625, -0.27752685546875, -0.2657470703125, -0.25396728515625, -0.2421875, -0.23040771484375, -0.2186279296875, -0.20684814453125, -0.195068359375, -0.18328857421875, -0.1715087890625, -0.15972900390625, -0.14794921875, -0.13616943359375, -0.1243896484375, -0.11260986328125, -0.100830078125, -0.08905029296875, -0.0772705078125, -0.06549072265625, -0.0537109375, -0.04193115234375, -0.0301513671875, -0.01837158203125, -0.006591796875, 0.00518798828125, 0.0169677734375, 0.02874755859375, 0.04052734375, 0.05230712890625, 0.0640869140625, 0.07586669921875, 0.087646484375, 0.09942626953125, 0.1112060546875, 0.12298583984375, 0.134765625, 0.14654541015625, 0.1583251953125, 0.17010498046875, 0.181884765625, 0.19366455078125, 0.2054443359375, 0.21722412109375, 0.22900390625, 0.24078369140625, 0.2525634765625, 0.26434326171875, 0.276123046875, 0.28790283203125, 0.2996826171875, 0.31146240234375, 0.3232421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 10.0, 16.0, 14.0, 24.0, 38.0, 46.0, 77.0, 124.0, 231.0, 409.0, 802.0, 1562.0, 3326.0, 8273.0, 24915.0, 90688.0, 317496.0, 401396.0, 141848.0, 37096.0, 11567.0, 4441.0, 1958.0, 963.0, 516.0, 258.0, 172.0, 82.0, 59.0, 50.0, 21.0, 18.0, 21.0, 7.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1143798828125, -0.11058807373046875, -0.1067962646484375, -0.10300445556640625, -0.099212646484375, -0.09542083740234375, -0.0916290283203125, -0.08783721923828125, -0.08404541015625, -0.08025360107421875, -0.0764617919921875, -0.07266998291015625, -0.068878173828125, -0.06508636474609375, -0.0612945556640625, -0.05750274658203125, -0.0537109375, -0.04991912841796875, -0.0461273193359375, -0.04233551025390625, -0.038543701171875, -0.03475189208984375, -0.0309600830078125, -0.02716827392578125, -0.02337646484375, -0.01958465576171875, -0.0157928466796875, -0.01200103759765625, -0.008209228515625, -0.00441741943359375, -0.0006256103515625, 0.00316619873046875, 0.0069580078125, 0.01074981689453125, 0.0145416259765625, 0.01833343505859375, 0.022125244140625, 0.02591705322265625, 0.0297088623046875, 0.03350067138671875, 0.03729248046875, 0.04108428955078125, 0.0448760986328125, 0.04866790771484375, 0.052459716796875, 0.05625152587890625, 0.0600433349609375, 0.06383514404296875, 0.067626953125, 0.07141876220703125, 0.0752105712890625, 0.07900238037109375, 0.082794189453125, 0.08658599853515625, 0.0903778076171875, 0.09416961669921875, 0.09796142578125, 0.10175323486328125, 0.1055450439453125, 0.10933685302734375, 0.113128662109375, 0.11692047119140625, 0.1207122802734375, 0.12450408935546875, 0.1282958984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 6.0, 8.0, 4.0, 7.0, 9.0, 20.0, 17.0, 13.0, 21.0, 25.0, 19.0, 26.0, 30.0, 30.0, 37.0, 34.0, 29.0, 49.0, 54.0, 35.0, 35.0, 37.0, 35.0, 50.0, 40.0, 41.0, 36.0, 39.0, 30.0, 28.0, 24.0, 18.0, 22.0, 18.0, 11.0, 10.0, 7.0, 7.0, 5.0, 7.0, 5.0, 1.0, 10.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.60302734375, -0.5830841064453125, -0.563140869140625, -0.5431976318359375, -0.52325439453125, -0.5033111572265625, -0.483367919921875, -0.4634246826171875, -0.4434814453125, -0.4235382080078125, -0.403594970703125, -0.3836517333984375, -0.36370849609375, -0.3437652587890625, -0.323822021484375, -0.3038787841796875, -0.283935546875, -0.2639923095703125, -0.244049072265625, -0.2241058349609375, -0.20416259765625, -0.1842193603515625, -0.164276123046875, -0.1443328857421875, -0.1243896484375, -0.1044464111328125, -0.084503173828125, -0.0645599365234375, -0.04461669921875, -0.0246734619140625, -0.004730224609375, 0.0152130126953125, 0.03515625, 0.0550994873046875, 0.075042724609375, 0.0949859619140625, 0.11492919921875, 0.1348724365234375, 0.154815673828125, 0.1747589111328125, 0.1947021484375, 0.2146453857421875, 0.234588623046875, 0.2545318603515625, 0.27447509765625, 0.2944183349609375, 0.314361572265625, 0.3343048095703125, 0.354248046875, 0.3741912841796875, 0.394134521484375, 0.4140777587890625, 0.43402099609375, 0.4539642333984375, 0.473907470703125, 0.4938507080078125, 0.5137939453125, 0.5337371826171875, 0.553680419921875, 0.5736236572265625, 0.59356689453125, 0.6135101318359375, 0.633453369140625, 0.6533966064453125, 0.67333984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 15.0, 7.0, 11.0, 20.0, 26.0, 36.0, 62.0, 87.0, 131.0, 178.0, 307.0, 584.0, 1029.0, 1822.0, 3512.0, 7322.0, 16681.0, 46431.0, 201142.0, 533492.0, 165950.0, 40464.0, 15130.0, 6838.0, 3226.0, 1724.0, 912.0, 521.0, 292.0, 185.0, 134.0, 90.0, 55.0, 47.0, 20.0, 17.0, 19.0, 7.0, 6.0, 10.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.061553955078125, -0.059656620025634766, -0.05775928497314453, -0.0558619499206543, -0.05396461486816406, -0.05206727981567383, -0.050169944763183594, -0.04827260971069336, -0.046375274658203125, -0.04447793960571289, -0.042580604553222656, -0.04068326950073242, -0.03878593444824219, -0.03688859939575195, -0.03499126434326172, -0.033093929290771484, -0.03119659423828125, -0.029299259185791016, -0.02740192413330078, -0.025504589080810547, -0.023607254028320312, -0.021709918975830078, -0.019812583923339844, -0.01791524887084961, -0.016017913818359375, -0.01412057876586914, -0.012223243713378906, -0.010325908660888672, -0.008428573608398438, -0.006531238555908203, -0.004633903503417969, -0.0027365684509277344, -0.0008392333984375, 0.0010581016540527344, 0.0029554367065429688, 0.004852771759033203, 0.0067501068115234375, 0.008647441864013672, 0.010544776916503906, 0.01244211196899414, 0.014339447021484375, 0.01623678207397461, 0.018134117126464844, 0.020031452178955078, 0.021928787231445312, 0.023826122283935547, 0.02572345733642578, 0.027620792388916016, 0.02951812744140625, 0.031415462493896484, 0.03331279754638672, 0.03521013259887695, 0.03710746765136719, 0.03900480270385742, 0.040902137756347656, 0.04279947280883789, 0.044696807861328125, 0.04659414291381836, 0.048491477966308594, 0.05038881301879883, 0.05228614807128906, 0.0541834831237793, 0.05608081817626953, 0.057978153228759766, 0.05987548828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 10.0, 20.0, 25.0, 52.0, 71.0, 121.0, 140.0, 165.0, 137.0, 77.0, 60.0, 33.0, 20.0, 10.0, 9.0, 8.0, 1.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1113624572753906e-05, -3.001280128955841e-05, -2.8911978006362915e-05, -2.781115472316742e-05, -2.6710331439971924e-05, -2.5609508156776428e-05, -2.4508684873580933e-05, -2.3407861590385437e-05, -2.230703830718994e-05, -2.1206215023994446e-05, -2.010539174079895e-05, -1.9004568457603455e-05, -1.790374517440796e-05, -1.6802921891212463e-05, -1.5702098608016968e-05, -1.4601275324821472e-05, -1.3500452041625977e-05, -1.2399628758430481e-05, -1.1298805475234985e-05, -1.019798219203949e-05, -9.097158908843994e-06, -7.996335625648499e-06, -6.895512342453003e-06, -5.794689059257507e-06, -4.693865776062012e-06, -3.593042492866516e-06, -2.4922192096710205e-06, -1.391395926475525e-06, -2.905726432800293e-07, 8.102506399154663e-07, 1.911073923110962e-06, 3.0118972063064575e-06, 4.112720489501953e-06, 5.213543772697449e-06, 6.314367055892944e-06, 7.41519033908844e-06, 8.516013622283936e-06, 9.616836905479431e-06, 1.0717660188674927e-05, 1.1818483471870422e-05, 1.2919306755065918e-05, 1.4020130038261414e-05, 1.512095332145691e-05, 1.6221776604652405e-05, 1.73225998878479e-05, 1.8423423171043396e-05, 1.952424645423889e-05, 2.0625069737434387e-05, 2.1725893020629883e-05, 2.282671630382538e-05, 2.3927539587020874e-05, 2.502836287021637e-05, 2.6129186153411865e-05, 2.723000943660736e-05, 2.8330832719802856e-05, 2.9431656002998352e-05, 3.053247928619385e-05, 3.163330256938934e-05, 3.273412585258484e-05, 3.3834949135780334e-05, 3.493577241897583e-05, 3.6036595702171326e-05, 3.713741898536682e-05, 3.823824226856232e-05, 3.933906555175781e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 2.0, 10.0, 7.0, 11.0, 17.0, 19.0, 29.0, 30.0, 36.0, 48.0, 70.0, 140.0, 227.0, 428.0, 831.0, 1707.0, 3623.0, 8833.0, 24590.0, 99682.0, 549671.0, 283596.0, 48913.0, 15004.0, 5803.0, 2495.0, 1200.0, 619.0, 309.0, 204.0, 120.0, 70.0, 55.0, 33.0, 23.0, 18.0, 17.0, 11.0, 9.0, 9.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.07830810546875, -0.07567787170410156, -0.07304763793945312, -0.07041740417480469, -0.06778717041015625, -0.06515693664550781, -0.06252670288085938, -0.05989646911621094, -0.0572662353515625, -0.05463600158691406, -0.052005767822265625, -0.04937553405761719, -0.04674530029296875, -0.04411506652832031, -0.041484832763671875, -0.03885459899902344, -0.036224365234375, -0.03359413146972656, -0.030963897705078125, -0.028333663940429688, -0.02570343017578125, -0.023073196411132812, -0.020442962646484375, -0.017812728881835938, -0.0151824951171875, -0.012552261352539062, -0.009922027587890625, -0.0072917938232421875, -0.00466156005859375, -0.0020313262939453125, 0.000598907470703125, 0.0032291412353515625, 0.005859375, 0.008489608764648438, 0.011119842529296875, 0.013750076293945312, 0.01638031005859375, 0.019010543823242188, 0.021640777587890625, 0.024271011352539062, 0.0269012451171875, 0.029531478881835938, 0.032161712646484375, 0.03479194641113281, 0.03742218017578125, 0.04005241394042969, 0.042682647705078125, 0.04531288146972656, 0.047943115234375, 0.05057334899902344, 0.053203582763671875, 0.05583381652832031, 0.05846405029296875, 0.06109428405761719, 0.06372451782226562, 0.06635475158691406, 0.0689849853515625, 0.07161521911621094, 0.07424545288085938, 0.07687568664550781, 0.07950592041015625, 0.08213615417480469, 0.08476638793945312, 0.08739662170410156, 0.09002685546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 7.0, 9.0, 11.0, 5.0, 22.0, 22.0, 30.0, 61.0, 73.0, 95.0, 126.0, 117.0, 110.0, 99.0, 49.0, 40.0, 24.0, 16.0, 16.0, 14.0, 12.0, 8.0, 5.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03289794921875, -0.031966447830200195, -0.03103494644165039, -0.030103445053100586, -0.02917194366455078, -0.028240442276000977, -0.027308940887451172, -0.026377439498901367, -0.025445938110351562, -0.024514436721801758, -0.023582935333251953, -0.02265143394470215, -0.021719932556152344, -0.02078843116760254, -0.019856929779052734, -0.01892542839050293, -0.017993927001953125, -0.01706242561340332, -0.016130924224853516, -0.015199422836303711, -0.014267921447753906, -0.013336420059204102, -0.012404918670654297, -0.011473417282104492, -0.010541915893554688, -0.009610414505004883, -0.008678913116455078, -0.0077474117279052734, -0.006815910339355469, -0.005884408950805664, -0.004952907562255859, -0.004021406173706055, -0.00308990478515625, -0.0021584033966064453, -0.0012269020080566406, -0.00029540061950683594, 0.0006361007690429688, 0.0015676021575927734, 0.002499103546142578, 0.003430604934692383, 0.0043621063232421875, 0.005293607711791992, 0.006225109100341797, 0.0071566104888916016, 0.008088111877441406, 0.009019613265991211, 0.009951114654541016, 0.01088261604309082, 0.011814117431640625, 0.01274561882019043, 0.013677120208740234, 0.014608621597290039, 0.015540122985839844, 0.01647162437438965, 0.017403125762939453, 0.018334627151489258, 0.019266128540039062, 0.020197629928588867, 0.021129131317138672, 0.022060632705688477, 0.02299213409423828, 0.023923635482788086, 0.02485513687133789, 0.025786638259887695, 0.0267181396484375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 23.0, 35.0, 58.0, 84.0, 137.0, 161.0, 154.0, 140.0, 80.0, 54.0, 40.0, 12.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9094133377075195, -0.8789806365966797, -0.8485479354858398, -0.818115234375, -0.7876825332641602, -0.7572498321533203, -0.7268170714378357, -0.6963843703269958, -0.665951669216156, -0.6355189681053162, -0.6050862669944763, -0.5746535658836365, -0.5442208051681519, -0.513788104057312, -0.48335540294647217, -0.4529227018356323, -0.4224900007247925, -0.39205729961395264, -0.3616245985031128, -0.33119186758995056, -0.3007591664791107, -0.2703264653682709, -0.23989374935626984, -0.2094610333442688, -0.17902833223342896, -0.1485956311225891, -0.11816291511058807, -0.08773020654916763, -0.05729749798774719, -0.02686479687690735, 0.003567919135093689, 0.03400063514709473, 0.06443333625793457, 0.09486604481935501, 0.12529875338077545, 0.1557314693927765, 0.18616417050361633, 0.21659687161445618, 0.24702958762645721, 0.27746230363845825, 0.3078950047492981, 0.33832770586013794, 0.3687604069709778, 0.39919313788414, 0.42962583899497986, 0.4600585401058197, 0.49049127101898193, 0.5209239721298218, 0.5513566732406616, 0.5817893743515015, 0.6122220754623413, 0.6426547765731812, 0.673087477684021, 0.7035201787948608, 0.7339529395103455, 0.7643856406211853, 0.7948183417320251, 0.825251042842865, 0.8556837439537048, 0.8861164450645447, 0.9165492057800293, 0.9469819068908691, 0.977414608001709, 1.0078473091125488, 1.0382800102233887]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 3.0, 13.0, 13.0, 14.0, 13.0, 23.0, 25.0, 20.0, 26.0, 40.0, 41.0, 38.0, 49.0, 40.0, 34.0, 55.0, 48.0, 48.0, 39.0, 38.0, 50.0, 48.0, 37.0, 35.0, 31.0, 28.0, 26.0, 22.0, 13.0, 13.0, 10.0, 11.0, 8.0, 13.0, 6.0, 2.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0], "bins": [-0.4059903621673584, -0.3953148126602173, -0.38463926315307617, -0.37396374344825745, -0.36328819394111633, -0.3526126444339752, -0.3419370949268341, -0.3312615752220154, -0.32058602571487427, -0.30991047620773315, -0.29923492670059204, -0.2885594069957733, -0.2778838574886322, -0.2672083079814911, -0.25653275847435, -0.24585722386837006, -0.23518167436122894, -0.22450612485408783, -0.2138305902481079, -0.2031550407409668, -0.19247950613498688, -0.18180395662784576, -0.17112842202186584, -0.16045287251472473, -0.14977732300758362, -0.1391017735004425, -0.12842623889446259, -0.11775068938732147, -0.10707515478134155, -0.09639960527420044, -0.08572406321763992, -0.0750485211610794, -0.06437298655509949, -0.05369744449853897, -0.043021902441978455, -0.03234635666012764, -0.021670814603567123, -0.010995272547006607, -0.00031972676515579224, 0.010355815291404724, 0.02103135734796524, 0.03170689940452576, 0.04238244146108627, 0.05305798724293709, 0.0637335330247879, 0.07440906763076782, 0.08508461713790894, 0.09576015919446945, 0.10643570125102997, 0.11711124330759048, 0.127786785364151, 0.13846233487129211, 0.14913786947727203, 0.15981341898441315, 0.17048895359039307, 0.18116450309753418, 0.1918400526046753, 0.2025156021118164, 0.21319113671779633, 0.22386668622493744, 0.23454222083091736, 0.24521777033805847, 0.2558933198451996, 0.2665688395500183, 0.2772443890571594]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 7.0, 5.0, 17.0, 15.0, 17.0, 48.0, 55.0, 90.0, 122.0, 229.0, 382.0, 671.0, 1518.0, 3745.0, 10316.0, 32350.0, 155245.0, 665793.0, 132404.0, 29469.0, 9566.0, 3439.0, 1495.0, 614.0, 350.0, 217.0, 136.0, 65.0, 60.0, 35.0, 18.0, 22.0, 12.0, 7.0, 9.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.447265625, -0.43389892578125, -0.4205322265625, -0.40716552734375, -0.393798828125, -0.38043212890625, -0.3670654296875, -0.35369873046875, -0.34033203125, -0.32696533203125, -0.3135986328125, -0.30023193359375, -0.286865234375, -0.27349853515625, -0.2601318359375, -0.24676513671875, -0.2333984375, -0.22003173828125, -0.2066650390625, -0.19329833984375, -0.179931640625, -0.16656494140625, -0.1531982421875, -0.13983154296875, -0.12646484375, -0.11309814453125, -0.0997314453125, -0.08636474609375, -0.072998046875, -0.05963134765625, -0.0462646484375, -0.03289794921875, -0.01953125, -0.00616455078125, 0.0072021484375, 0.02056884765625, 0.033935546875, 0.04730224609375, 0.0606689453125, 0.07403564453125, 0.08740234375, 0.10076904296875, 0.1141357421875, 0.12750244140625, 0.140869140625, 0.15423583984375, 0.1676025390625, 0.18096923828125, 0.1943359375, 0.20770263671875, 0.2210693359375, 0.23443603515625, 0.247802734375, 0.26116943359375, 0.2745361328125, 0.28790283203125, 0.30126953125, 0.31463623046875, 0.3280029296875, 0.34136962890625, 0.354736328125, 0.36810302734375, 0.3814697265625, 0.39483642578125, 0.408203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 10.0, 4.0, 11.0, 11.0, 19.0, 20.0, 35.0, 20.0, 34.0, 33.0, 43.0, 46.0, 41.0, 50.0, 45.0, 47.0, 44.0, 52.0, 41.0, 56.0, 52.0, 44.0, 26.0, 39.0, 27.0, 26.0, 15.0, 20.0, 15.0, 17.0, 10.0, 15.0, 3.0, 12.0, 3.0, 0.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.755859375, -0.7333450317382812, -0.7108306884765625, -0.6883163452148438, -0.665802001953125, -0.6432876586914062, -0.6207733154296875, -0.5982589721679688, -0.57574462890625, -0.5532302856445312, -0.5307159423828125, -0.5082015991210938, -0.485687255859375, -0.46317291259765625, -0.4406585693359375, -0.41814422607421875, -0.3956298828125, -0.37311553955078125, -0.3506011962890625, -0.32808685302734375, -0.305572509765625, -0.28305816650390625, -0.2605438232421875, -0.23802947998046875, -0.21551513671875, -0.19300079345703125, -0.1704864501953125, -0.14797210693359375, -0.125457763671875, -0.10294342041015625, -0.0804290771484375, -0.05791473388671875, -0.035400390625, -0.01288604736328125, 0.0096282958984375, 0.03214263916015625, 0.054656982421875, 0.07717132568359375, 0.0996856689453125, 0.12220001220703125, 0.14471435546875, 0.16722869873046875, 0.1897430419921875, 0.21225738525390625, 0.234771728515625, 0.25728607177734375, 0.2798004150390625, 0.30231475830078125, 0.3248291015625, 0.34734344482421875, 0.3698577880859375, 0.39237213134765625, 0.414886474609375, 0.43740081787109375, 0.4599151611328125, 0.48242950439453125, 0.50494384765625, 0.5274581909179688, 0.5499725341796875, 0.5724868774414062, 0.595001220703125, 0.6175155639648438, 0.6400299072265625, 0.6625442504882812, 0.68505859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 1.0, 9.0, 3.0, 13.0, 3.0, 20.0, 23.0, 33.0, 30.0, 36.0, 60.0, 82.0, 113.0, 187.0, 292.0, 605.0, 1994.0, 16078.0, 631601.0, 381495.0, 12577.0, 1819.0, 565.0, 288.0, 156.0, 121.0, 86.0, 53.0, 46.0, 31.0, 19.0, 20.0, 16.0, 14.0, 11.0, 9.0, 13.0, 6.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0302734375, -0.9990081787109375, -0.967742919921875, -0.9364776611328125, -0.90521240234375, -0.8739471435546875, -0.842681884765625, -0.8114166259765625, -0.7801513671875, -0.7488861083984375, -0.717620849609375, -0.6863555908203125, -0.65509033203125, -0.6238250732421875, -0.592559814453125, -0.5612945556640625, -0.530029296875, -0.4987640380859375, -0.467498779296875, -0.4362335205078125, -0.40496826171875, -0.3737030029296875, -0.342437744140625, -0.3111724853515625, -0.2799072265625, -0.2486419677734375, -0.217376708984375, -0.1861114501953125, -0.15484619140625, -0.1235809326171875, -0.092315673828125, -0.0610504150390625, -0.02978515625, 0.0014801025390625, 0.032745361328125, 0.0640106201171875, 0.09527587890625, 0.1265411376953125, 0.157806396484375, 0.1890716552734375, 0.2203369140625, 0.2516021728515625, 0.282867431640625, 0.3141326904296875, 0.34539794921875, 0.3766632080078125, 0.407928466796875, 0.4391937255859375, 0.470458984375, 0.5017242431640625, 0.532989501953125, 0.5642547607421875, 0.59552001953125, 0.6267852783203125, 0.658050537109375, 0.6893157958984375, 0.7205810546875, 0.7518463134765625, 0.783111572265625, 0.8143768310546875, 0.84564208984375, 0.8769073486328125, 0.908172607421875, 0.9394378662109375, 0.970703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 8.0, 9.0, 7.0, 4.0, 6.0, 8.0, 12.0, 9.0, 10.0, 16.0, 26.0, 27.0, 33.0, 32.0, 31.0, 42.0, 33.0, 54.0, 45.0, 43.0, 48.0, 43.0, 37.0, 52.0, 47.0, 31.0, 24.0, 35.0, 19.0, 27.0, 32.0, 30.0, 18.0, 17.0, 10.0, 15.0, 13.0, 11.0, 7.0, 5.0, 5.0, 6.0, 3.0, 1.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.75634765625, -0.732391357421875, -0.70843505859375, -0.684478759765625, -0.6605224609375, -0.636566162109375, -0.61260986328125, -0.588653564453125, -0.564697265625, -0.540740966796875, -0.51678466796875, -0.492828369140625, -0.4688720703125, -0.444915771484375, -0.42095947265625, -0.397003173828125, -0.373046875, -0.349090576171875, -0.32513427734375, -0.301177978515625, -0.2772216796875, -0.253265380859375, -0.22930908203125, -0.205352783203125, -0.181396484375, -0.157440185546875, -0.13348388671875, -0.109527587890625, -0.0855712890625, -0.061614990234375, -0.03765869140625, -0.013702392578125, 0.01025390625, 0.034210205078125, 0.05816650390625, 0.082122802734375, 0.1060791015625, 0.130035400390625, 0.15399169921875, 0.177947998046875, 0.201904296875, 0.225860595703125, 0.24981689453125, 0.273773193359375, 0.2977294921875, 0.321685791015625, 0.34564208984375, 0.369598388671875, 0.3935546875, 0.417510986328125, 0.44146728515625, 0.465423583984375, 0.4893798828125, 0.513336181640625, 0.53729248046875, 0.561248779296875, 0.585205078125, 0.609161376953125, 0.63311767578125, 0.657073974609375, 0.6810302734375, 0.704986572265625, 0.72894287109375, 0.752899169921875, 0.77685546875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 15.0, 17.0, 23.0, 31.0, 48.0, 55.0, 88.0, 85.0, 146.0, 190.0, 319.0, 512.0, 878.0, 1603.0, 3271.0, 9185.0, 45765.0, 667927.0, 279945.0, 26064.0, 6465.0, 2600.0, 1293.0, 724.0, 408.0, 260.0, 187.0, 123.0, 83.0, 74.0, 35.0, 36.0, 18.0, 10.0, 16.0, 9.0, 12.0, 3.0, 3.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.173828125, -0.16800498962402344, -0.16218185424804688, -0.1563587188720703, -0.15053558349609375, -0.1447124481201172, -0.13888931274414062, -0.13306617736816406, -0.1272430419921875, -0.12141990661621094, -0.11559677124023438, -0.10977363586425781, -0.10395050048828125, -0.09812736511230469, -0.09230422973632812, -0.08648109436035156, -0.080657958984375, -0.07483482360839844, -0.06901168823242188, -0.06318855285644531, -0.05736541748046875, -0.05154228210449219, -0.045719146728515625, -0.03989601135253906, -0.0340728759765625, -0.028249740600585938, -0.022426605224609375, -0.016603469848632812, -0.01078033447265625, -0.0049571990966796875, 0.000865936279296875, 0.0066890716552734375, 0.01251220703125, 0.018335342407226562, 0.024158477783203125, 0.029981613159179688, 0.03580474853515625, 0.04162788391113281, 0.047451019287109375, 0.05327415466308594, 0.0590972900390625, 0.06492042541503906, 0.07074356079101562, 0.07656669616699219, 0.08238983154296875, 0.08821296691894531, 0.09403610229492188, 0.09985923767089844, 0.105682373046875, 0.11150550842285156, 0.11732864379882812, 0.12315177917480469, 0.12897491455078125, 0.1347980499267578, 0.14062118530273438, 0.14644432067871094, 0.1522674560546875, 0.15809059143066406, 0.16391372680664062, 0.1697368621826172, 0.17555999755859375, 0.1813831329345703, 0.18720626831054688, 0.19302940368652344, 0.1988525390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 8.0, 6.0, 5.0, 7.0, 16.0, 20.0, 36.0, 82.0, 136.0, 207.0, 202.0, 107.0, 74.0, 31.0, 22.0, 10.0, 11.0, 5.0, 8.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.522634506225586e-05, -3.4125521779060364e-05, -3.302469849586487e-05, -3.192387521266937e-05, -3.082305192947388e-05, -2.972222864627838e-05, -2.8621405363082886e-05, -2.752058207988739e-05, -2.6419758796691895e-05, -2.53189355134964e-05, -2.4218112230300903e-05, -2.3117288947105408e-05, -2.2016465663909912e-05, -2.0915642380714417e-05, -1.981481909751892e-05, -1.8713995814323425e-05, -1.761317253112793e-05, -1.6512349247932434e-05, -1.541152596473694e-05, -1.4310702681541443e-05, -1.3209879398345947e-05, -1.2109056115150452e-05, -1.1008232831954956e-05, -9.90740954875946e-06, -8.806586265563965e-06, -7.70576298236847e-06, -6.604939699172974e-06, -5.504116415977478e-06, -4.403293132781982e-06, -3.302469849586487e-06, -2.201646566390991e-06, -1.1008232831954956e-06, 0.0, 1.1008232831954956e-06, 2.201646566390991e-06, 3.302469849586487e-06, 4.403293132781982e-06, 5.504116415977478e-06, 6.604939699172974e-06, 7.70576298236847e-06, 8.806586265563965e-06, 9.90740954875946e-06, 1.1008232831954956e-05, 1.2109056115150452e-05, 1.3209879398345947e-05, 1.4310702681541443e-05, 1.541152596473694e-05, 1.6512349247932434e-05, 1.761317253112793e-05, 1.8713995814323425e-05, 1.981481909751892e-05, 2.0915642380714417e-05, 2.2016465663909912e-05, 2.3117288947105408e-05, 2.4218112230300903e-05, 2.53189355134964e-05, 2.6419758796691895e-05, 2.752058207988739e-05, 2.8621405363082886e-05, 2.972222864627838e-05, 3.082305192947388e-05, 3.192387521266937e-05, 3.302469849586487e-05, 3.4125521779060364e-05, 3.522634506225586e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 12.0, 11.0, 19.0, 28.0, 24.0, 49.0, 71.0, 97.0, 158.0, 241.0, 388.0, 626.0, 1075.0, 2058.0, 3882.0, 10605.0, 64264.0, 779484.0, 157199.0, 17291.0, 5049.0, 2434.0, 1319.0, 830.0, 472.0, 308.0, 167.0, 137.0, 84.0, 49.0, 29.0, 28.0, 17.0, 16.0, 4.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2291259765625, -0.2218914031982422, -0.21465682983398438, -0.20742225646972656, -0.20018768310546875, -0.19295310974121094, -0.18571853637695312, -0.1784839630126953, -0.1712493896484375, -0.1640148162841797, -0.15678024291992188, -0.14954566955566406, -0.14231109619140625, -0.13507652282714844, -0.12784194946289062, -0.12060737609863281, -0.113372802734375, -0.10613822937011719, -0.09890365600585938, -0.09166908264160156, -0.08443450927734375, -0.07719993591308594, -0.06996536254882812, -0.06273078918457031, -0.0554962158203125, -0.04826164245605469, -0.041027069091796875, -0.03379249572753906, -0.02655792236328125, -0.019323348999023438, -0.012088775634765625, -0.0048542022705078125, 0.00238037109375, 0.009614944458007812, 0.016849517822265625, 0.024084091186523438, 0.03131866455078125, 0.03855323791503906, 0.045787811279296875, 0.05302238464355469, 0.0602569580078125, 0.06749153137207031, 0.07472610473632812, 0.08196067810058594, 0.08919525146484375, 0.09642982482910156, 0.10366439819335938, 0.11089897155761719, 0.118133544921875, 0.1253681182861328, 0.13260269165039062, 0.13983726501464844, 0.14707183837890625, 0.15430641174316406, 0.16154098510742188, 0.1687755584716797, 0.1760101318359375, 0.1832447052001953, 0.19047927856445312, 0.19771385192871094, 0.20494842529296875, 0.21218299865722656, 0.21941757202148438, 0.2266521453857422, 0.23388671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 8.0, 8.0, 6.0, 19.0, 27.0, 36.0, 61.0, 106.0, 176.0, 203.0, 110.0, 86.0, 42.0, 35.0, 25.0, 16.0, 7.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0950927734375, -0.09182071685791016, -0.08854866027832031, -0.08527660369873047, -0.08200454711914062, -0.07873249053955078, -0.07546043395996094, -0.0721883773803711, -0.06891632080078125, -0.0656442642211914, -0.06237220764160156, -0.05910015106201172, -0.055828094482421875, -0.05255603790283203, -0.04928398132324219, -0.046011924743652344, -0.0427398681640625, -0.039467811584472656, -0.03619575500488281, -0.03292369842529297, -0.029651641845703125, -0.02637958526611328, -0.023107528686523438, -0.019835472106933594, -0.01656341552734375, -0.013291358947753906, -0.010019302368164062, -0.006747245788574219, -0.003475189208984375, -0.00020313262939453125, 0.0030689239501953125, 0.006340980529785156, 0.009613037109375, 0.012885093688964844, 0.016157150268554688, 0.01942920684814453, 0.022701263427734375, 0.02597332000732422, 0.029245376586914062, 0.032517433166503906, 0.03578948974609375, 0.039061546325683594, 0.04233360290527344, 0.04560565948486328, 0.048877716064453125, 0.05214977264404297, 0.05542182922363281, 0.058693885803222656, 0.0619659423828125, 0.06523799896240234, 0.06851005554199219, 0.07178211212158203, 0.07505416870117188, 0.07832622528076172, 0.08159828186035156, 0.0848703384399414, 0.08814239501953125, 0.0914144515991211, 0.09468650817871094, 0.09795856475830078, 0.10123062133789062, 0.10450267791748047, 0.10777473449707031, 0.11104679107666016, 0.11431884765625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 12.0, 14.0, 31.0, 30.0, 44.0, 57.0, 74.0, 117.0, 94.0, 112.0, 98.0, 93.0, 73.0, 51.0, 34.0, 24.0, 20.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3720266819000244, -1.329236388206482, -1.286446213722229, -1.2436559200286865, -1.2008657455444336, -1.1580754518508911, -1.1152851581573486, -1.0724949836730957, -1.0297046899795532, -0.9869144558906555, -0.9441242218017578, -0.9013339281082153, -0.8585436940193176, -0.8157534599304199, -0.7729632258415222, -0.7301729917526245, -0.6873827576637268, -0.6445925235748291, -0.6018022894859314, -0.5590120553970337, -0.5162217617034912, -0.4734315276145935, -0.4306412935256958, -0.3878510296344757, -0.345060795545578, -0.3022705614566803, -0.2594802975654602, -0.2166900634765625, -0.1738998144865036, -0.1311095654964447, -0.088319331407547, -0.045529067516326904, -0.0027388334274291992, 0.0400514118373394, 0.082841657102108, 0.1256318986415863, 0.1684221476316452, 0.2112123966217041, 0.2540026307106018, 0.2967928946018219, 0.3395831286907196, 0.3823733627796173, 0.4251636266708374, 0.4679538607597351, 0.5107440948486328, 0.5535343885421753, 0.5963245630264282, 0.6391148567199707, 0.6819050908088684, 0.7246953248977661, 0.7674855589866638, 0.8102757930755615, 0.853066086769104, 0.8958563208580017, 0.9386465549468994, 0.9814368486404419, 1.0242270231246948, 1.0670173168182373, 1.1098074913024902, 1.1525977849960327, 1.1953879594802856, 1.2381782531738281, 1.280968427658081, 1.3237587213516235, 1.366549015045166]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 1.0, 3.0, 6.0, 10.0, 12.0, 14.0, 15.0, 11.0, 17.0, 21.0, 28.0, 26.0, 31.0, 23.0, 33.0, 45.0, 36.0, 42.0, 42.0, 38.0, 44.0, 35.0, 32.0, 43.0, 48.0, 39.0, 33.0, 35.0, 34.0, 29.0, 27.0, 28.0, 18.0, 20.0, 17.0, 15.0, 16.0, 8.0, 4.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0769579410552979, -1.0398415327072144, -1.0027251243591309, -0.9656087756156921, -0.9284924268722534, -0.8913760185241699, -0.8542596101760864, -0.8171432018280029, -0.7800268530845642, -0.7429104447364807, -0.705794095993042, -0.6686776876449585, -0.631561279296875, -0.5944449305534363, -0.5573285222053528, -0.5202121734619141, -0.48309576511383057, -0.44597938656806946, -0.40886300802230835, -0.37174659967422485, -0.33463022112846375, -0.29751384258270264, -0.26039743423461914, -0.22328105568885803, -0.18616467714309692, -0.14904829859733582, -0.11193190515041351, -0.07481551915407181, -0.0376991331577301, -0.0005827546119689941, 0.03653363883495331, 0.07365003228187561, 0.11076641082763672, 0.14788278937339783, 0.18499918282032013, 0.22211557626724243, 0.25923195481300354, 0.29634833335876465, 0.33346474170684814, 0.37058112025260925, 0.40769749879837036, 0.44481387734413147, 0.4819302558898926, 0.5190466642379761, 0.5561630725860596, 0.5932794213294983, 0.6303958296775818, 0.6675121784210205, 0.704628586769104, 0.7417449951171875, 0.7788613438606262, 0.8159777522087097, 0.8530941009521484, 0.8902105093002319, 0.9273269176483154, 0.9644433259963989, 1.0015597343444824, 1.038676142692566, 1.0757925510406494, 1.1129088401794434, 1.1500252485275269, 1.1871416568756104, 1.2242580652236938, 1.2613744735717773, 1.2984907627105713]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 7.0, 4.0, 16.0, 11.0, 16.0, 21.0, 37.0, 46.0, 31.0, 45.0, 70.0, 159.0, 492.0, 2987.0, 54056.0, 3617311.0, 507969.0, 9221.0, 1111.0, 247.0, 104.0, 72.0, 34.0, 44.0, 35.0, 21.0, 31.0, 19.0, 12.0, 8.0, 2.0, 10.0, 8.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.052734375, -1.9918670654296875, -1.930999755859375, -1.8701324462890625, -1.80926513671875, -1.7483978271484375, -1.687530517578125, -1.6266632080078125, -1.5657958984375, -1.5049285888671875, -1.444061279296875, -1.3831939697265625, -1.32232666015625, -1.2614593505859375, -1.200592041015625, -1.1397247314453125, -1.078857421875, -1.0179901123046875, -0.957122802734375, -0.8962554931640625, -0.83538818359375, -0.7745208740234375, -0.713653564453125, -0.6527862548828125, -0.5919189453125, -0.5310516357421875, -0.470184326171875, -0.4093170166015625, -0.34844970703125, -0.2875823974609375, -0.226715087890625, -0.1658477783203125, -0.10498046875, -0.0441131591796875, 0.016754150390625, 0.0776214599609375, 0.13848876953125, 0.1993560791015625, 0.260223388671875, 0.3210906982421875, 0.3819580078125, 0.4428253173828125, 0.503692626953125, 0.5645599365234375, 0.62542724609375, 0.6862945556640625, 0.747161865234375, 0.8080291748046875, 0.868896484375, 0.9297637939453125, 0.990631103515625, 1.0514984130859375, 1.11236572265625, 1.1732330322265625, 1.234100341796875, 1.2949676513671875, 1.3558349609375, 1.4167022705078125, 1.477569580078125, 1.5384368896484375, 1.59930419921875, 1.6601715087890625, 1.721038818359375, 1.7819061279296875, 1.8427734375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 12.0, 14.0, 19.0, 23.0, 24.0, 30.0, 29.0, 28.0, 41.0, 41.0, 46.0, 39.0, 53.0, 59.0, 44.0, 56.0, 64.0, 46.0, 42.0, 43.0, 43.0, 43.0, 27.0, 23.0, 16.0, 18.0, 16.0, 13.0, 11.0, 8.0, 4.0, 1.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.488525390625, -0.4729728698730469, -0.45742034912109375, -0.4418678283691406, -0.4263153076171875, -0.4107627868652344, -0.39521026611328125, -0.3796577453613281, -0.364105224609375, -0.3485527038574219, -0.33300018310546875, -0.3174476623535156, -0.3018951416015625, -0.2863426208496094, -0.27079010009765625, -0.2552375793457031, -0.23968505859375, -0.22413253784179688, -0.20858001708984375, -0.19302749633789062, -0.1774749755859375, -0.16192245483398438, -0.14636993408203125, -0.13081741333007812, -0.115264892578125, -0.09971237182617188, -0.08415985107421875, -0.06860733032226562, -0.0530548095703125, -0.037502288818359375, -0.02194976806640625, -0.006397247314453125, 0.0091552734375, 0.024707794189453125, 0.04026031494140625, 0.055812835693359375, 0.0713653564453125, 0.08691787719726562, 0.10247039794921875, 0.11802291870117188, 0.133575439453125, 0.14912796020507812, 0.16468048095703125, 0.18023300170898438, 0.1957855224609375, 0.21133804321289062, 0.22689056396484375, 0.24244308471679688, 0.25799560546875, 0.2735481262207031, 0.28910064697265625, 0.3046531677246094, 0.3202056884765625, 0.3357582092285156, 0.35131072998046875, 0.3668632507324219, 0.382415771484375, 0.3979682922363281, 0.41352081298828125, 0.4290733337402344, 0.4446258544921875, 0.4601783752441406, 0.47573089599609375, 0.4912834167480469, 0.5068359375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 5.0, 4.0, 26.0, 26.0, 40.0, 76.0, 149.0, 325.0, 710.0, 2002.0, 8435.0, 86433.0, 3636868.0, 434598.0, 19168.0, 3464.0, 1049.0, 469.0, 204.0, 91.0, 50.0, 28.0, 20.0, 11.0, 7.0, 9.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.720703125, -1.673828125, -1.626953125, -1.580078125, -1.533203125, -1.486328125, -1.439453125, -1.392578125, -1.345703125, -1.298828125, -1.251953125, -1.205078125, -1.158203125, -1.111328125, -1.064453125, -1.017578125, -0.970703125, -0.923828125, -0.876953125, -0.830078125, -0.783203125, -0.736328125, -0.689453125, -0.642578125, -0.595703125, -0.548828125, -0.501953125, -0.455078125, -0.408203125, -0.361328125, -0.314453125, -0.267578125, -0.220703125, -0.173828125, -0.126953125, -0.080078125, -0.033203125, 0.013671875, 0.060546875, 0.107421875, 0.154296875, 0.201171875, 0.248046875, 0.294921875, 0.341796875, 0.388671875, 0.435546875, 0.482421875, 0.529296875, 0.576171875, 0.623046875, 0.669921875, 0.716796875, 0.763671875, 0.810546875, 0.857421875, 0.904296875, 0.951171875, 0.998046875, 1.044921875, 1.091796875, 1.138671875, 1.185546875, 1.232421875, 1.279296875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 16.0, 14.0, 22.0, 27.0, 50.0, 67.0, 107.0, 187.0, 279.0, 493.0, 636.0, 717.0, 546.0, 349.0, 210.0, 113.0, 77.0, 55.0, 35.0, 23.0, 15.0, 7.0, 3.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.384033203125, -0.37421417236328125, -0.3643951416015625, -0.35457611083984375, -0.344757080078125, -0.33493804931640625, -0.3251190185546875, -0.31529998779296875, -0.30548095703125, -0.29566192626953125, -0.2858428955078125, -0.27602386474609375, -0.266204833984375, -0.25638580322265625, -0.2465667724609375, -0.23674774169921875, -0.2269287109375, -0.21710968017578125, -0.2072906494140625, -0.19747161865234375, -0.187652587890625, -0.17783355712890625, -0.1680145263671875, -0.15819549560546875, -0.14837646484375, -0.13855743408203125, -0.1287384033203125, -0.11891937255859375, -0.109100341796875, -0.09928131103515625, -0.0894622802734375, -0.07964324951171875, -0.06982421875, -0.06000518798828125, -0.0501861572265625, -0.04036712646484375, -0.030548095703125, -0.02072906494140625, -0.0109100341796875, -0.00109100341796875, 0.00872802734375, 0.01854705810546875, 0.0283660888671875, 0.03818511962890625, 0.048004150390625, 0.05782318115234375, 0.0676422119140625, 0.07746124267578125, 0.0872802734375, 0.09709930419921875, 0.1069183349609375, 0.11673736572265625, 0.126556396484375, 0.13637542724609375, 0.1461944580078125, 0.15601348876953125, 0.16583251953125, 0.17565155029296875, 0.1854705810546875, 0.19528961181640625, 0.205108642578125, 0.21492767333984375, 0.2247467041015625, 0.23456573486328125, 0.244384765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 13.0, 27.0, 52.0, 76.0, 86.0, 105.0, 128.0, 136.0, 127.0, 88.0, 56.0, 45.0, 26.0, 10.0, 6.0, 9.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.057590961456299, -2.0117831230163574, -1.9659751653671265, -1.920167326927185, -1.874359369277954, -1.8285515308380127, -1.7827436923980713, -1.7369357347488403, -1.6911277770996094, -1.645319938659668, -1.599511981010437, -1.5537041425704956, -1.5078961849212646, -1.4620883464813232, -1.4162805080413818, -1.3704725503921509, -1.3246647119522095, -1.278856873512268, -1.233048915863037, -1.1872410774230957, -1.1414331197738647, -1.0956252813339233, -1.0498173236846924, -1.004009485244751, -0.9582015872001648, -0.9123936891555786, -0.8665857911109924, -0.8207778930664062, -0.7749700546264648, -0.7291620969772339, -0.6833542585372925, -0.6375463604927063, -0.5917384624481201, -0.5459305644035339, -0.5001226663589478, -0.45431479811668396, -0.4085069000720978, -0.3626990020275116, -0.3168911337852478, -0.2710832357406616, -0.22527533769607544, -0.17946743965148926, -0.13365955650806427, -0.08785167336463928, -0.0420437753200531, 0.003764122724533081, 0.049571990966796875, 0.09537988901138306, 0.14118778705596924, 0.18699568510055542, 0.2328035682439804, 0.2786114513874054, 0.3244193494319916, 0.37022724747657776, 0.41603511571884155, 0.46184301376342773, 0.5076509118080139, 0.5534588098526001, 0.5992667078971863, 0.6450746059417725, 0.6908824443817139, 0.7366904020309448, 0.7824982404708862, 0.8283061385154724, 0.8741140365600586]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 3.0, 5.0, 16.0, 10.0, 16.0, 34.0, 17.0, 19.0, 23.0, 20.0, 24.0, 30.0, 42.0, 41.0, 35.0, 38.0, 43.0, 32.0, 35.0, 33.0, 34.0, 39.0, 42.0, 37.0, 28.0, 31.0, 47.0, 26.0, 24.0, 28.0, 23.0, 28.0, 19.0, 19.0, 8.0, 6.0, 9.0, 6.0, 6.0, 5.0, 9.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5137552618980408, -0.4969230890274048, -0.4800908863544464, -0.4632587134838104, -0.44642651081085205, -0.42959433794021606, -0.4127621650695801, -0.3959299921989441, -0.3790977895259857, -0.36226561665534973, -0.34543341398239136, -0.32860124111175537, -0.3117690682411194, -0.294936865568161, -0.278104692697525, -0.26127249002456665, -0.24444031715393066, -0.22760812938213348, -0.2107759416103363, -0.19394376873970032, -0.17711158096790314, -0.16027939319610596, -0.14344722032546997, -0.1266150325536728, -0.10978284478187561, -0.09295065701007843, -0.07611847668886185, -0.059286292642354965, -0.042454108595848083, -0.025621920824050903, -0.00878974050283432, 0.008042439818382263, 0.024874567985534668, 0.04170675203204155, 0.05853893607854843, 0.07537111639976501, 0.0922033041715622, 0.10903549194335938, 0.12586766481399536, 0.14269985258579254, 0.15953204035758972, 0.1763642281293869, 0.19319641590118408, 0.21002858877182007, 0.22686077654361725, 0.24369296431541443, 0.2605251371860504, 0.2773573398590088, 0.2941895127296448, 0.31102168560028076, 0.32785388827323914, 0.3446860611438751, 0.3615182638168335, 0.3783504366874695, 0.39518260955810547, 0.41201478242874146, 0.42884698510169983, 0.4456791579723358, 0.4625113606452942, 0.4793435335159302, 0.49617570638656616, 0.5130078792572021, 0.5298401117324829, 0.5466722846031189, 0.5635044574737549]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 10.0, 15.0, 24.0, 54.0, 69.0, 119.0, 257.0, 602.0, 1671.0, 6031.0, 33947.0, 598491.0, 377202.0, 23076.0, 4584.0, 1398.0, 525.0, 214.0, 88.0, 53.0, 33.0, 32.0, 10.0, 10.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37939453125, -0.363525390625, -0.34765625, -0.331787109375, -0.31591796875, -0.300048828125, -0.2841796875, -0.268310546875, -0.25244140625, -0.236572265625, -0.220703125, -0.204833984375, -0.18896484375, -0.173095703125, -0.1572265625, -0.141357421875, -0.12548828125, -0.109619140625, -0.09375, -0.077880859375, -0.06201171875, -0.046142578125, -0.0302734375, -0.014404296875, 0.00146484375, 0.017333984375, 0.033203125, 0.049072265625, 0.06494140625, 0.080810546875, 0.0966796875, 0.112548828125, 0.12841796875, 0.144287109375, 0.16015625, 0.176025390625, 0.19189453125, 0.207763671875, 0.2236328125, 0.239501953125, 0.25537109375, 0.271240234375, 0.287109375, 0.302978515625, 0.31884765625, 0.334716796875, 0.3505859375, 0.366455078125, 0.38232421875, 0.398193359375, 0.4140625, 0.429931640625, 0.44580078125, 0.461669921875, 0.4775390625, 0.493408203125, 0.50927734375, 0.525146484375, 0.541015625, 0.556884765625, 0.57275390625, 0.588623046875, 0.6044921875, 0.620361328125, 0.63623046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 6.0, 12.0, 9.0, 13.0, 24.0, 18.0, 24.0, 37.0, 35.0, 37.0, 46.0, 57.0, 46.0, 46.0, 52.0, 52.0, 52.0, 56.0, 45.0, 37.0, 56.0, 43.0, 41.0, 26.0, 31.0, 22.0, 22.0, 13.0, 12.0, 10.0, 7.0, 6.0, 6.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3828125, -0.36733245849609375, -0.3518524169921875, -0.33637237548828125, -0.320892333984375, -0.30541229248046875, -0.2899322509765625, -0.27445220947265625, -0.25897216796875, -0.24349212646484375, -0.2280120849609375, -0.21253204345703125, -0.197052001953125, -0.18157196044921875, -0.1660919189453125, -0.15061187744140625, -0.1351318359375, -0.11965179443359375, -0.1041717529296875, -0.08869171142578125, -0.073211669921875, -0.05773162841796875, -0.0422515869140625, -0.02677154541015625, -0.01129150390625, 0.00418853759765625, 0.0196685791015625, 0.03514862060546875, 0.050628662109375, 0.06610870361328125, 0.0815887451171875, 0.09706878662109375, 0.112548828125, 0.12802886962890625, 0.1435089111328125, 0.15898895263671875, 0.174468994140625, 0.18994903564453125, 0.2054290771484375, 0.22090911865234375, 0.23638916015625, 0.25186920166015625, 0.2673492431640625, 0.28282928466796875, 0.298309326171875, 0.31378936767578125, 0.3292694091796875, 0.34474945068359375, 0.3602294921875, 0.37570953369140625, 0.3911895751953125, 0.40666961669921875, 0.422149658203125, 0.43762969970703125, 0.4531097412109375, 0.46858978271484375, 0.48406982421875, 0.49954986572265625, 0.5150299072265625, 0.5305099487304688, 0.545989990234375, 0.5614700317382812, 0.5769500732421875, 0.5924301147460938, 0.60791015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 10.0, 8.0, 12.0, 7.0, 18.0, 43.0, 53.0, 67.0, 101.0, 156.0, 272.0, 398.0, 738.0, 1222.0, 2235.0, 4453.0, 10070.0, 32382.0, 145275.0, 465817.0, 290053.0, 64592.0, 17034.0, 6359.0, 2995.0, 1635.0, 959.0, 607.0, 357.0, 208.0, 134.0, 91.0, 42.0, 44.0, 22.0, 23.0, 9.0, 13.0, 7.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1790771484375, -0.17343521118164062, -0.16779327392578125, -0.16215133666992188, -0.1565093994140625, -0.15086746215820312, -0.14522552490234375, -0.13958358764648438, -0.133941650390625, -0.12829971313476562, -0.12265777587890625, -0.11701583862304688, -0.1113739013671875, -0.10573196411132812, -0.10009002685546875, -0.09444808959960938, -0.08880615234375, -0.08316421508789062, -0.07752227783203125, -0.07188034057617188, -0.0662384033203125, -0.060596466064453125, -0.05495452880859375, -0.049312591552734375, -0.043670654296875, -0.038028717041015625, -0.03238677978515625, -0.026744842529296875, -0.0211029052734375, -0.015460968017578125, -0.00981903076171875, -0.004177093505859375, 0.00146484375, 0.007106781005859375, 0.01274871826171875, 0.018390655517578125, 0.0240325927734375, 0.029674530029296875, 0.03531646728515625, 0.040958404541015625, 0.046600341796875, 0.052242279052734375, 0.05788421630859375, 0.06352615356445312, 0.0691680908203125, 0.07481002807617188, 0.08045196533203125, 0.08609390258789062, 0.09173583984375, 0.09737777709960938, 0.10301971435546875, 0.10866165161132812, 0.1143035888671875, 0.11994552612304688, 0.12558746337890625, 0.13122940063476562, 0.136871337890625, 0.14251327514648438, 0.14815521240234375, 0.15379714965820312, 0.1594390869140625, 0.16508102416992188, 0.17072296142578125, 0.17636489868164062, 0.1820068359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 9.0, 5.0, 9.0, 7.0, 9.0, 16.0, 23.0, 19.0, 12.0, 13.0, 19.0, 32.0, 28.0, 28.0, 43.0, 29.0, 40.0, 47.0, 40.0, 32.0, 40.0, 38.0, 39.0, 41.0, 40.0, 37.0, 36.0, 34.0, 29.0, 31.0, 21.0, 27.0, 19.0, 14.0, 14.0, 15.0, 12.0, 10.0, 9.0, 6.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.7900390625, -0.7660903930664062, -0.7421417236328125, -0.7181930541992188, -0.694244384765625, -0.6702957153320312, -0.6463470458984375, -0.6223983764648438, -0.59844970703125, -0.5745010375976562, -0.5505523681640625, -0.5266036987304688, -0.502655029296875, -0.47870635986328125, -0.4547576904296875, -0.43080902099609375, -0.4068603515625, -0.38291168212890625, -0.3589630126953125, -0.33501434326171875, -0.311065673828125, -0.28711700439453125, -0.2631683349609375, -0.23921966552734375, -0.21527099609375, -0.19132232666015625, -0.1673736572265625, -0.14342498779296875, -0.119476318359375, -0.09552764892578125, -0.0715789794921875, -0.04763031005859375, -0.023681640625, 0.00026702880859375, 0.0242156982421875, 0.04816436767578125, 0.072113037109375, 0.09606170654296875, 0.1200103759765625, 0.14395904541015625, 0.16790771484375, 0.19185638427734375, 0.2158050537109375, 0.23975372314453125, 0.263702392578125, 0.28765106201171875, 0.3115997314453125, 0.33554840087890625, 0.3594970703125, 0.38344573974609375, 0.4073944091796875, 0.43134307861328125, 0.455291748046875, 0.47924041748046875, 0.5031890869140625, 0.5271377563476562, 0.55108642578125, 0.5750350952148438, 0.5989837646484375, 0.6229324340820312, 0.646881103515625, 0.6708297729492188, 0.6947784423828125, 0.7187271118164062, 0.74267578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 15.0, 18.0, 25.0, 34.0, 60.0, 137.0, 232.0, 454.0, 949.0, 2310.0, 6549.0, 29064.0, 435808.0, 526979.0, 33679.0, 7399.0, 2557.0, 1086.0, 554.0, 242.0, 148.0, 92.0, 58.0, 36.0, 24.0, 11.0, 7.0, 6.0, 8.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1551513671875, -0.15030860900878906, -0.14546585083007812, -0.1406230926513672, -0.13578033447265625, -0.1309375762939453, -0.12609481811523438, -0.12125205993652344, -0.1164093017578125, -0.11156654357910156, -0.10672378540039062, -0.10188102722167969, -0.09703826904296875, -0.09219551086425781, -0.08735275268554688, -0.08250999450683594, -0.077667236328125, -0.07282447814941406, -0.06798171997070312, -0.06313896179199219, -0.05829620361328125, -0.05345344543457031, -0.048610687255859375, -0.04376792907714844, -0.0389251708984375, -0.03408241271972656, -0.029239654541015625, -0.024396896362304688, -0.01955413818359375, -0.014711380004882812, -0.009868621826171875, -0.0050258636474609375, -0.00018310546875, 0.0046596527099609375, 0.009502410888671875, 0.014345169067382812, 0.01918792724609375, 0.024030685424804688, 0.028873443603515625, 0.03371620178222656, 0.0385589599609375, 0.04340171813964844, 0.048244476318359375, 0.05308723449707031, 0.05792999267578125, 0.06277275085449219, 0.06761550903320312, 0.07245826721191406, 0.077301025390625, 0.08214378356933594, 0.08698654174804688, 0.09182929992675781, 0.09667205810546875, 0.10151481628417969, 0.10635757446289062, 0.11120033264160156, 0.1160430908203125, 0.12088584899902344, 0.12572860717773438, 0.1305713653564453, 0.13541412353515625, 0.1402568817138672, 0.14509963989257812, 0.14994239807128906, 0.15478515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 10.0, 23.0, 27.0, 58.0, 98.0, 206.0, 233.0, 164.0, 72.0, 48.0, 25.0, 14.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.246566772460938e-05, -6.046891212463379e-05, -5.84721565246582e-05, -5.647540092468262e-05, -5.447864532470703e-05, -5.2481889724731445e-05, -5.048513412475586e-05, -4.8488378524780273e-05, -4.649162292480469e-05, -4.44948673248291e-05, -4.2498111724853516e-05, -4.050135612487793e-05, -3.8504600524902344e-05, -3.650784492492676e-05, -3.451108932495117e-05, -3.2514333724975586e-05, -3.0517578125e-05, -2.8520822525024414e-05, -2.6524066925048828e-05, -2.4527311325073242e-05, -2.2530555725097656e-05, -2.053380012512207e-05, -1.8537044525146484e-05, -1.65402889251709e-05, -1.4543533325195312e-05, -1.2546777725219727e-05, -1.055002212524414e-05, -8.553266525268555e-06, -6.556510925292969e-06, -4.559755325317383e-06, -2.562999725341797e-06, -5.662441253662109e-07, 1.430511474609375e-06, 3.427267074584961e-06, 5.424022674560547e-06, 7.420778274536133e-06, 9.417533874511719e-06, 1.1414289474487305e-05, 1.341104507446289e-05, 1.5407800674438477e-05, 1.7404556274414062e-05, 1.940131187438965e-05, 2.1398067474365234e-05, 2.339482307434082e-05, 2.5391578674316406e-05, 2.7388334274291992e-05, 2.9385089874267578e-05, 3.1381845474243164e-05, 3.337860107421875e-05, 3.5375356674194336e-05, 3.737211227416992e-05, 3.936886787414551e-05, 4.1365623474121094e-05, 4.336237907409668e-05, 4.5359134674072266e-05, 4.735589027404785e-05, 4.935264587402344e-05, 5.1349401473999023e-05, 5.334615707397461e-05, 5.5342912673950195e-05, 5.733966827392578e-05, 5.933642387390137e-05, 6.133317947387695e-05, 6.332993507385254e-05, 6.532669067382812e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 4.0, 9.0, 14.0, 10.0, 24.0, 36.0, 48.0, 82.0, 155.0, 378.0, 993.0, 3303.0, 12288.0, 75478.0, 753149.0, 175154.0, 20167.0, 4916.0, 1423.0, 470.0, 194.0, 85.0, 60.0, 36.0, 21.0, 14.0, 11.0, 4.0, 6.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174560546875, -0.16904640197753906, -0.16353225708007812, -0.1580181121826172, -0.15250396728515625, -0.1469898223876953, -0.14147567749023438, -0.13596153259277344, -0.1304473876953125, -0.12493324279785156, -0.11941909790039062, -0.11390495300292969, -0.10839080810546875, -0.10287666320800781, -0.09736251831054688, -0.09184837341308594, -0.086334228515625, -0.08082008361816406, -0.07530593872070312, -0.06979179382324219, -0.06427764892578125, -0.05876350402832031, -0.053249359130859375, -0.04773521423339844, -0.0422210693359375, -0.03670692443847656, -0.031192779541015625, -0.025678634643554688, -0.02016448974609375, -0.014650344848632812, -0.009136199951171875, -0.0036220550537109375, 0.00189208984375, 0.0074062347412109375, 0.012920379638671875, 0.018434524536132812, 0.02394866943359375, 0.029462814331054688, 0.034976959228515625, 0.04049110412597656, 0.0460052490234375, 0.05151939392089844, 0.057033538818359375, 0.06254768371582031, 0.06806182861328125, 0.07357597351074219, 0.07909011840820312, 0.08460426330566406, 0.090118408203125, 0.09563255310058594, 0.10114669799804688, 0.10666084289550781, 0.11217498779296875, 0.11768913269042969, 0.12320327758789062, 0.12871742248535156, 0.1342315673828125, 0.13974571228027344, 0.14525985717773438, 0.1507740020751953, 0.15628814697265625, 0.1618022918701172, 0.16731643676757812, 0.17283058166503906, 0.1783447265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 8.0, 6.0, 6.0, 12.0, 18.0, 17.0, 34.0, 41.0, 70.0, 105.0, 124.0, 132.0, 119.0, 89.0, 52.0, 50.0, 30.0, 20.0, 16.0, 12.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03448486328125, -0.033267974853515625, -0.03205108642578125, -0.030834197998046875, -0.0296173095703125, -0.028400421142578125, -0.02718353271484375, -0.025966644287109375, -0.024749755859375, -0.023532867431640625, -0.02231597900390625, -0.021099090576171875, -0.0198822021484375, -0.018665313720703125, -0.01744842529296875, -0.016231536865234375, -0.0150146484375, -0.013797760009765625, -0.01258087158203125, -0.011363983154296875, -0.0101470947265625, -0.008930206298828125, -0.00771331787109375, -0.006496429443359375, -0.005279541015625, -0.004062652587890625, -0.00284576416015625, -0.001628875732421875, -0.0004119873046875, 0.000804901123046875, 0.00202178955078125, 0.003238677978515625, 0.00445556640625, 0.005672454833984375, 0.00688934326171875, 0.008106231689453125, 0.0093231201171875, 0.010540008544921875, 0.01175689697265625, 0.012973785400390625, 0.014190673828125, 0.015407562255859375, 0.01662445068359375, 0.017841339111328125, 0.0190582275390625, 0.020275115966796875, 0.02149200439453125, 0.022708892822265625, 0.02392578125, 0.025142669677734375, 0.02635955810546875, 0.027576446533203125, 0.0287933349609375, 0.030010223388671875, 0.03122711181640625, 0.032444000244140625, 0.033660888671875, 0.034877777099609375, 0.03609466552734375, 0.037311553955078125, 0.0385284423828125, 0.039745330810546875, 0.04096221923828125, 0.042179107666015625, 0.04339599609375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 12.0, 8.0, 25.0, 44.0, 55.0, 62.0, 65.0, 81.0, 117.0, 110.0, 105.0, 80.0, 79.0, 57.0, 35.0, 25.0, 16.0, 5.0, 9.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8808908462524414, -0.856532633304596, -0.8321743607521057, -0.8078161478042603, -0.7834579348564148, -0.7590997219085693, -0.7347414493560791, -0.7103832364082336, -0.6860250234603882, -0.6616668105125427, -0.6373085379600525, -0.612950325012207, -0.5885921120643616, -0.5642338991165161, -0.5398756265640259, -0.5155174136161804, -0.4911591410636902, -0.46680089831352234, -0.4424426853656769, -0.41808444261550903, -0.3937262296676636, -0.3693679869174957, -0.3450097441673279, -0.3206515312194824, -0.2962932884693146, -0.27193504571914673, -0.24757683277130127, -0.22321859002113342, -0.19886036217212677, -0.17450213432312012, -0.15014389157295227, -0.12578566372394562, -0.10142743587493896, -0.07706920802593231, -0.05271097272634506, -0.028352737426757812, -0.00399450957775116, 0.020363718271255493, 0.04472196102142334, 0.06908018887042999, 0.09343841671943665, 0.1177966445684433, 0.14215487241744995, 0.1665131151676178, 0.19087134301662445, 0.2152295708656311, 0.23958781361579895, 0.2639460563659668, 0.28830426931381226, 0.3126625120639801, 0.33702072501182556, 0.3613789677619934, 0.38573718070983887, 0.4100954234600067, 0.43445366621017456, 0.45881187915802, 0.48317012190818787, 0.5075283646583557, 0.5318865776062012, 0.5562448501586914, 0.5806030631065369, 0.6049612760543823, 0.6293195486068726, 0.653677761554718, 0.6780359745025635]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 4.0, 8.0, 3.0, 13.0, 10.0, 22.0, 30.0, 17.0, 23.0, 27.0, 22.0, 29.0, 36.0, 36.0, 31.0, 32.0, 36.0, 53.0, 41.0, 29.0, 33.0, 37.0, 34.0, 31.0, 35.0, 45.0, 41.0, 36.0, 23.0, 25.0, 27.0, 20.0, 17.0, 17.0, 13.0, 14.0, 11.0, 7.0, 7.0, 4.0, 10.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32876482605934143, -0.31749704480171204, -0.30622926354408264, -0.29496151208877563, -0.28369373083114624, -0.27242594957351685, -0.26115816831588745, -0.24989038705825806, -0.23862262070178986, -0.22735483944416046, -0.21608707308769226, -0.20481929183006287, -0.19355151057243347, -0.18228374421596527, -0.17101596295833588, -0.15974819660186768, -0.14848041534423828, -0.1372126340866089, -0.12594486773014069, -0.11467708647251129, -0.1034093126654625, -0.0921415388584137, -0.0808737576007843, -0.0696059837937355, -0.05833820998668671, -0.04707043617963791, -0.03580265864729881, -0.024534881114959717, -0.01326710730791092, -0.0019993335008621216, 0.009268447756767273, 0.02053622156381607, 0.03180399537086487, 0.043071769177913666, 0.05433954671025276, 0.06560732424259186, 0.07687509804964066, 0.08814287185668945, 0.09941065311431885, 0.11067842692136765, 0.12194620072841644, 0.13321398198604584, 0.14448174834251404, 0.15574952960014343, 0.16701731085777283, 0.17828507721424103, 0.18955285847187042, 0.20082062482833862, 0.21208840608596802, 0.2233561873435974, 0.2346239537000656, 0.245891734957695, 0.2571595013141632, 0.2684272825717926, 0.279695063829422, 0.2909628450870514, 0.3022305965423584, 0.3134983777999878, 0.3247661590576172, 0.3360339403152466, 0.3473016917705536, 0.358569473028183, 0.3698372542858124, 0.3811050355434418, 0.39237281680107117]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 8.0, 12.0, 12.0, 20.0, 20.0, 45.0, 57.0, 86.0, 100.0, 179.0, 286.0, 409.0, 725.0, 1212.0, 2419.0, 4983.0, 11363.0, 29534.0, 97737.0, 484824.0, 307540.0, 67428.0, 22115.0, 8736.0, 3966.0, 2019.0, 1064.0, 550.0, 363.0, 235.0, 164.0, 115.0, 55.0, 59.0, 30.0, 19.0, 13.0, 20.0, 8.0, 8.0, 9.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.53173828125, -0.5160331726074219, -0.5003280639648438, -0.4846229553222656, -0.4689178466796875, -0.4532127380371094, -0.43750762939453125, -0.4218025207519531, -0.406097412109375, -0.3903923034667969, -0.37468719482421875, -0.3589820861816406, -0.3432769775390625, -0.3275718688964844, -0.31186676025390625, -0.2961616516113281, -0.28045654296875, -0.2647514343261719, -0.24904632568359375, -0.23334121704101562, -0.2176361083984375, -0.20193099975585938, -0.18622589111328125, -0.17052078247070312, -0.154815673828125, -0.13911056518554688, -0.12340545654296875, -0.10770034790039062, -0.0919952392578125, -0.07629013061523438, -0.06058502197265625, -0.044879913330078125, -0.0291748046875, -0.013469696044921875, 0.00223541259765625, 0.017940521240234375, 0.0336456298828125, 0.049350738525390625, 0.06505584716796875, 0.08076095581054688, 0.096466064453125, 0.11217117309570312, 0.12787628173828125, 0.14358139038085938, 0.1592864990234375, 0.17499160766601562, 0.19069671630859375, 0.20640182495117188, 0.22210693359375, 0.23781204223632812, 0.25351715087890625, 0.2692222595214844, 0.2849273681640625, 0.3006324768066406, 0.31633758544921875, 0.3320426940917969, 0.347747802734375, 0.3634529113769531, 0.37915802001953125, 0.3948631286621094, 0.4105682373046875, 0.4262733459472656, 0.44197845458984375, 0.4576835632324219, 0.473388671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 5.0, 6.0, 13.0, 10.0, 19.0, 23.0, 29.0, 30.0, 31.0, 49.0, 37.0, 43.0, 51.0, 56.0, 55.0, 55.0, 41.0, 56.0, 43.0, 45.0, 47.0, 30.0, 48.0, 35.0, 23.0, 26.0, 14.0, 21.0, 16.0, 10.0, 1.0, 7.0, 8.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8369140625, -0.8096694946289062, -0.7824249267578125, -0.7551803588867188, -0.727935791015625, -0.7006912231445312, -0.6734466552734375, -0.6462020874023438, -0.61895751953125, -0.5917129516601562, -0.5644683837890625, -0.5372238159179688, -0.509979248046875, -0.48273468017578125, -0.4554901123046875, -0.42824554443359375, -0.4010009765625, -0.37375640869140625, -0.3465118408203125, -0.31926727294921875, -0.292022705078125, -0.26477813720703125, -0.2375335693359375, -0.21028900146484375, -0.18304443359375, -0.15579986572265625, -0.1285552978515625, -0.10131072998046875, -0.074066162109375, -0.04682159423828125, -0.0195770263671875, 0.00766754150390625, 0.034912109375, 0.06215667724609375, 0.0894012451171875, 0.11664581298828125, 0.143890380859375, 0.17113494873046875, 0.1983795166015625, 0.22562408447265625, 0.25286865234375, 0.28011322021484375, 0.3073577880859375, 0.33460235595703125, 0.361846923828125, 0.38909149169921875, 0.4163360595703125, 0.44358062744140625, 0.4708251953125, 0.49806976318359375, 0.5253143310546875, 0.5525588989257812, 0.579803466796875, 0.6070480346679688, 0.6342926025390625, 0.6615371704101562, 0.68878173828125, 0.7160263061523438, 0.7432708740234375, 0.7705154418945312, 0.797760009765625, 0.8250045776367188, 0.8522491455078125, 0.8794937133789062, 0.90673828125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 4.0, 4.0, 11.0, 12.0, 15.0, 19.0, 23.0, 44.0, 62.0, 99.0, 159.0, 331.0, 988.0, 5693.0, 118651.0, 897729.0, 21380.0, 2156.0, 561.0, 203.0, 140.0, 76.0, 49.0, 38.0, 22.0, 14.0, 10.0, 11.0, 11.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.7665252685546875, -1.711761474609375, -1.6569976806640625, -1.60223388671875, -1.5474700927734375, -1.492706298828125, -1.4379425048828125, -1.3831787109375, -1.3284149169921875, -1.273651123046875, -1.2188873291015625, -1.16412353515625, -1.1093597412109375, -1.054595947265625, -0.9998321533203125, -0.945068359375, -0.8903045654296875, -0.835540771484375, -0.7807769775390625, -0.72601318359375, -0.6712493896484375, -0.616485595703125, -0.5617218017578125, -0.5069580078125, -0.4521942138671875, -0.397430419921875, -0.3426666259765625, -0.28790283203125, -0.2331390380859375, -0.178375244140625, -0.1236114501953125, -0.06884765625, -0.0140838623046875, 0.040679931640625, 0.0954437255859375, 0.15020751953125, 0.2049713134765625, 0.259735107421875, 0.3144989013671875, 0.3692626953125, 0.4240264892578125, 0.478790283203125, 0.5335540771484375, 0.58831787109375, 0.6430816650390625, 0.697845458984375, 0.7526092529296875, 0.807373046875, 0.8621368408203125, 0.916900634765625, 0.9716644287109375, 1.02642822265625, 1.0811920166015625, 1.135955810546875, 1.1907196044921875, 1.2454833984375, 1.3002471923828125, 1.355010986328125, 1.4097747802734375, 1.46453857421875, 1.5193023681640625, 1.574066162109375, 1.6288299560546875, 1.68359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 7.0, 10.0, 3.0, 2.0, 7.0, 10.0, 11.0, 14.0, 27.0, 28.0, 28.0, 31.0, 35.0, 36.0, 37.0, 55.0, 53.0, 68.0, 60.0, 55.0, 42.0, 47.0, 42.0, 43.0, 40.0, 38.0, 33.0, 26.0, 20.0, 21.0, 8.0, 9.0, 18.0, 7.0, 8.0, 2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.08203125, -1.0514602661132812, -1.0208892822265625, -0.9903182983398438, -0.959747314453125, -0.9291763305664062, -0.8986053466796875, -0.8680343627929688, -0.83746337890625, -0.8068923950195312, -0.7763214111328125, -0.7457504272460938, -0.715179443359375, -0.6846084594726562, -0.6540374755859375, -0.6234664916992188, -0.5928955078125, -0.5623245239257812, -0.5317535400390625, -0.5011825561523438, -0.470611572265625, -0.44004058837890625, -0.4094696044921875, -0.37889862060546875, -0.34832763671875, -0.31775665283203125, -0.2871856689453125, -0.25661468505859375, -0.226043701171875, -0.19547271728515625, -0.1649017333984375, -0.13433074951171875, -0.103759765625, -0.07318878173828125, -0.0426177978515625, -0.01204681396484375, 0.018524169921875, 0.04909515380859375, 0.0796661376953125, 0.11023712158203125, 0.14080810546875, 0.17137908935546875, 0.2019500732421875, 0.23252105712890625, 0.263092041015625, 0.29366302490234375, 0.3242340087890625, 0.35480499267578125, 0.3853759765625, 0.41594696044921875, 0.4465179443359375, 0.47708892822265625, 0.507659912109375, 0.5382308959960938, 0.5688018798828125, 0.5993728637695312, 0.62994384765625, 0.6605148315429688, 0.6910858154296875, 0.7216567993164062, 0.752227783203125, 0.7827987670898438, 0.8133697509765625, 0.8439407348632812, 0.87451171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 7.0, 29.0, 36.0, 62.0, 87.0, 230.0, 573.0, 2181.0, 14151.0, 266774.0, 728353.0, 30891.0, 3696.0, 851.0, 329.0, 126.0, 55.0, 43.0, 24.0, 14.0, 10.0, 7.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2216796875, -0.21167755126953125, -0.2016754150390625, -0.19167327880859375, -0.181671142578125, -0.17166900634765625, -0.1616668701171875, -0.15166473388671875, -0.14166259765625, -0.13166046142578125, -0.1216583251953125, -0.11165618896484375, -0.101654052734375, -0.09165191650390625, -0.0816497802734375, -0.07164764404296875, -0.0616455078125, -0.05164337158203125, -0.0416412353515625, -0.03163909912109375, -0.021636962890625, -0.01163482666015625, -0.0016326904296875, 0.00836944580078125, 0.01837158203125, 0.02837371826171875, 0.0383758544921875, 0.04837799072265625, 0.058380126953125, 0.06838226318359375, 0.0783843994140625, 0.08838653564453125, 0.098388671875, 0.10839080810546875, 0.1183929443359375, 0.12839508056640625, 0.138397216796875, 0.14839935302734375, 0.1584014892578125, 0.16840362548828125, 0.17840576171875, 0.18840789794921875, 0.1984100341796875, 0.20841217041015625, 0.218414306640625, 0.22841644287109375, 0.2384185791015625, 0.24842071533203125, 0.2584228515625, 0.26842498779296875, 0.2784271240234375, 0.28842926025390625, 0.298431396484375, 0.30843353271484375, 0.3184356689453125, 0.32843780517578125, 0.33843994140625, 0.34844207763671875, 0.3584442138671875, 0.36844635009765625, 0.378448486328125, 0.38845062255859375, 0.3984527587890625, 0.40845489501953125, 0.41845703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 13.0, 17.0, 24.0, 41.0, 49.0, 88.0, 152.0, 198.0, 146.0, 85.0, 65.0, 35.0, 25.0, 14.0, 7.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9921531677246094e-05, -2.8461217880249023e-05, -2.7000904083251953e-05, -2.5540590286254883e-05, -2.4080276489257812e-05, -2.2619962692260742e-05, -2.1159648895263672e-05, -1.96993350982666e-05, -1.823902130126953e-05, -1.677870750427246e-05, -1.531839370727539e-05, -1.385807991027832e-05, -1.239776611328125e-05, -1.093745231628418e-05, -9.47713851928711e-06, -8.016824722290039e-06, -6.556510925292969e-06, -5.0961971282958984e-06, -3.635883331298828e-06, -2.175569534301758e-06, -7.152557373046875e-07, 7.450580596923828e-07, 2.205371856689453e-06, 3.6656856536865234e-06, 5.125999450683594e-06, 6.586313247680664e-06, 8.046627044677734e-06, 9.506940841674805e-06, 1.0967254638671875e-05, 1.2427568435668945e-05, 1.3887882232666016e-05, 1.5348196029663086e-05, 1.6808509826660156e-05, 1.8268823623657227e-05, 1.9729137420654297e-05, 2.1189451217651367e-05, 2.2649765014648438e-05, 2.4110078811645508e-05, 2.5570392608642578e-05, 2.703070640563965e-05, 2.849102020263672e-05, 2.995133399963379e-05, 3.141164779663086e-05, 3.287196159362793e-05, 3.4332275390625e-05, 3.579258918762207e-05, 3.725290298461914e-05, 3.871321678161621e-05, 4.017353057861328e-05, 4.163384437561035e-05, 4.309415817260742e-05, 4.455447196960449e-05, 4.601478576660156e-05, 4.747509956359863e-05, 4.89354133605957e-05, 5.0395727157592773e-05, 5.1856040954589844e-05, 5.3316354751586914e-05, 5.4776668548583984e-05, 5.6236982345581055e-05, 5.7697296142578125e-05, 5.9157609939575195e-05, 6.0617923736572266e-05, 6.207823753356934e-05, 6.35385513305664e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 12.0, 23.0, 49.0, 81.0, 197.0, 444.0, 1326.0, 8145.0, 181141.0, 827390.0, 25739.0, 2778.0, 727.0, 258.0, 99.0, 57.0, 38.0, 21.0, 14.0, 6.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57421875, -0.5606193542480469, -0.5470199584960938, -0.5334205627441406, -0.5198211669921875, -0.5062217712402344, -0.49262237548828125, -0.4790229797363281, -0.465423583984375, -0.4518241882324219, -0.43822479248046875, -0.4246253967285156, -0.4110260009765625, -0.3974266052246094, -0.38382720947265625, -0.3702278137207031, -0.35662841796875, -0.3430290222167969, -0.32942962646484375, -0.3158302307128906, -0.3022308349609375, -0.2886314392089844, -0.27503204345703125, -0.2614326477050781, -0.247833251953125, -0.23423385620117188, -0.22063446044921875, -0.20703506469726562, -0.1934356689453125, -0.17983627319335938, -0.16623687744140625, -0.15263748168945312, -0.1390380859375, -0.12543869018554688, -0.11183929443359375, -0.09823989868164062, -0.0846405029296875, -0.07104110717773438, -0.05744171142578125, -0.043842315673828125, -0.030242919921875, -0.016643524169921875, -0.00304412841796875, 0.010555267333984375, 0.0241546630859375, 0.037754058837890625, 0.05135345458984375, 0.06495285034179688, 0.07855224609375, 0.09215164184570312, 0.10575103759765625, 0.11935043334960938, 0.1329498291015625, 0.14654922485351562, 0.16014862060546875, 0.17374801635742188, 0.187347412109375, 0.20094680786132812, 0.21454620361328125, 0.22814559936523438, 0.2417449951171875, 0.2553443908691406, 0.26894378662109375, 0.2825431823730469, 0.296142578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 12.0, 10.0, 25.0, 38.0, 93.0, 134.0, 256.0, 189.0, 101.0, 50.0, 30.0, 22.0, 14.0, 13.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07476806640625, -0.06971073150634766, -0.06465339660644531, -0.05959606170654297, -0.054538726806640625, -0.04948139190673828, -0.04442405700683594, -0.039366722106933594, -0.03430938720703125, -0.029252052307128906, -0.024194717407226562, -0.01913738250732422, -0.014080047607421875, -0.009022712707519531, -0.0039653778076171875, 0.0010919570922851562, 0.0061492919921875, 0.011206626892089844, 0.016263961791992188, 0.02132129669189453, 0.026378631591796875, 0.03143596649169922, 0.03649330139160156, 0.041550636291503906, 0.04660797119140625, 0.051665306091308594, 0.05672264099121094, 0.06177997589111328, 0.06683731079101562, 0.07189464569091797, 0.07695198059082031, 0.08200931549072266, 0.087066650390625, 0.09212398529052734, 0.09718132019042969, 0.10223865509033203, 0.10729598999023438, 0.11235332489013672, 0.11741065979003906, 0.1224679946899414, 0.12752532958984375, 0.1325826644897461, 0.13763999938964844, 0.14269733428955078, 0.14775466918945312, 0.15281200408935547, 0.1578693389892578, 0.16292667388916016, 0.1679840087890625, 0.17304134368896484, 0.1780986785888672, 0.18315601348876953, 0.18821334838867188, 0.19327068328857422, 0.19832801818847656, 0.2033853530883789, 0.20844268798828125, 0.2135000228881836, 0.21855735778808594, 0.22361469268798828, 0.22867202758789062, 0.23372936248779297, 0.2387866973876953, 0.24384403228759766, 0.2489013671875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 34.0, 60.0, 112.0, 102.0, 151.0, 149.0, 151.0, 100.0, 63.0, 34.0, 20.0, 10.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2313326597213745, -1.1596059799194336, -1.0878793001174927, -1.0161526203155518, -0.9444258809089661, -0.8726992011070251, -0.8009724617004395, -0.7292457818984985, -0.6575191020965576, -0.5857924222946167, -0.5140657424926758, -0.4423390030860901, -0.37061232328414917, -0.29888564348220825, -0.22715893387794495, -0.15543222427368164, -0.08370554447174072, -0.01197884976863861, 0.0597478449344635, 0.1314745396375656, 0.20320123434066772, 0.27492791414260864, 0.34665462374687195, 0.41838133335113525, 0.49010801315307617, 0.5618346929550171, 0.633561372756958, 0.7052881121635437, 0.7770147919654846, 0.8487414717674255, 0.9204682111740112, 0.9921948909759521, 1.0639216899871826, 1.1356483697891235, 1.2073750495910645, 1.2791017293930054, 1.3508284091949463, 1.4225552082061768, 1.4942818880081177, 1.5660085678100586, 1.6377352476119995, 1.7094619274139404, 1.7811886072158813, 1.8529152870178223, 1.9246420860290527, 1.996368646621704, 2.0680954456329346, 2.139822006225586, 2.2115488052368164, 2.283275604248047, 2.3550021648406982, 2.4267289638519287, 2.49845552444458, 2.5701823234558105, 2.641908884048462, 2.7136356830596924, 2.7853622436523438, 2.857089042663574, 2.9288156032562256, 3.000542402267456, 3.0722689628601074, 3.143995761871338, 3.2157223224639893, 3.2874491214752197, 3.35917592048645]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 2.0, 10.0, 3.0, 8.0, 4.0, 10.0, 17.0, 16.0, 16.0, 13.0, 28.0, 34.0, 26.0, 30.0, 27.0, 35.0, 32.0, 41.0, 41.0, 39.0, 40.0, 52.0, 41.0, 35.0, 36.0, 41.0, 34.0, 37.0, 29.0, 38.0, 29.0, 33.0, 21.0, 19.0, 18.0, 17.0, 10.0, 11.0, 11.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3773609399795532, -1.333045482635498, -1.2887301445007324, -1.2444146871566772, -1.200099229812622, -1.155783772468567, -1.1114684343338013, -1.067152976989746, -1.022837519645691, -0.9785221219062805, -0.9342066645622253, -0.8898912668228149, -0.8455758094787598, -0.8012604117393494, -0.756945013999939, -0.7126295566558838, -0.6683141589164734, -0.623998761177063, -0.5796833038330078, -0.5353679060935974, -0.49105244874954224, -0.44673705101013184, -0.40242162346839905, -0.35810619592666626, -0.31379076838493347, -0.2694753408432007, -0.2251599133014679, -0.1808445006608963, -0.1365290731191635, -0.09221364557743073, -0.04789823293685913, -0.0035828053951263428, 0.040732622146606445, 0.08504804968833923, 0.12936347723007202, 0.17367888987064362, 0.2179943174123764, 0.262309730052948, 0.3066251575946808, 0.3509405851364136, 0.39525601267814636, 0.43957144021987915, 0.48388686776161194, 0.5282022953033447, 0.5725176930427551, 0.6168331503868103, 0.6611485481262207, 0.7054640054702759, 0.7497794032096863, 0.7940948009490967, 0.8384102582931519, 0.8827256560325623, 0.9270411133766174, 0.9713565111160278, 1.015671968460083, 1.0599873065948486, 1.1043027639389038, 1.148618221282959, 1.1929335594177246, 1.2372490167617798, 1.281564474105835, 1.3258799314498901, 1.3701952695846558, 1.414510726928711, 1.4588261842727661]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 9.0, 15.0, 20.0, 25.0, 37.0, 30.0, 50.0, 82.0, 93.0, 143.0, 230.0, 407.0, 1022.0, 2493.0, 7809.0, 37971.0, 452097.0, 2827779.0, 791634.0, 55959.0, 10313.0, 3233.0, 1320.0, 592.0, 335.0, 168.0, 105.0, 87.0, 49.0, 37.0, 32.0, 18.0, 22.0, 13.0, 11.0, 4.0, 7.0, 4.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.97021484375, -0.93951416015625, -0.9088134765625, -0.87811279296875, -0.847412109375, -0.81671142578125, -0.7860107421875, -0.75531005859375, -0.724609375, -0.69390869140625, -0.6632080078125, -0.63250732421875, -0.601806640625, -0.57110595703125, -0.5404052734375, -0.50970458984375, -0.47900390625, -0.44830322265625, -0.4176025390625, -0.38690185546875, -0.356201171875, -0.32550048828125, -0.2947998046875, -0.26409912109375, -0.2333984375, -0.20269775390625, -0.1719970703125, -0.14129638671875, -0.110595703125, -0.07989501953125, -0.0491943359375, -0.01849365234375, 0.01220703125, 0.04290771484375, 0.0736083984375, 0.10430908203125, 0.135009765625, 0.16571044921875, 0.1964111328125, 0.22711181640625, 0.2578125, 0.28851318359375, 0.3192138671875, 0.34991455078125, 0.380615234375, 0.41131591796875, 0.4420166015625, 0.47271728515625, 0.50341796875, 0.53411865234375, 0.5648193359375, 0.59552001953125, 0.626220703125, 0.65692138671875, 0.6876220703125, 0.71832275390625, 0.7490234375, 0.77972412109375, 0.8104248046875, 0.84112548828125, 0.871826171875, 0.90252685546875, 0.9332275390625, 0.96392822265625, 0.99462890625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 6.0, 12.0, 10.0, 12.0, 16.0, 14.0, 23.0, 30.0, 27.0, 23.0, 38.0, 51.0, 31.0, 35.0, 61.0, 35.0, 50.0, 44.0, 46.0, 49.0, 32.0, 46.0, 47.0, 37.0, 35.0, 23.0, 14.0, 28.0, 23.0, 15.0, 18.0, 17.0, 12.0, 11.0, 8.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41455078125, -0.39963531494140625, -0.3847198486328125, -0.36980438232421875, -0.354888916015625, -0.33997344970703125, -0.3250579833984375, -0.31014251708984375, -0.29522705078125, -0.28031158447265625, -0.2653961181640625, -0.25048065185546875, -0.235565185546875, -0.22064971923828125, -0.2057342529296875, -0.19081878662109375, -0.1759033203125, -0.16098785400390625, -0.1460723876953125, -0.13115692138671875, -0.116241455078125, -0.10132598876953125, -0.0864105224609375, -0.07149505615234375, -0.05657958984375, -0.04166412353515625, -0.0267486572265625, -0.01183319091796875, 0.003082275390625, 0.01799774169921875, 0.0329132080078125, 0.04782867431640625, 0.062744140625, 0.07765960693359375, 0.0925750732421875, 0.10749053955078125, 0.122406005859375, 0.13732147216796875, 0.1522369384765625, 0.16715240478515625, 0.18206787109375, 0.19698333740234375, 0.2118988037109375, 0.22681427001953125, 0.241729736328125, 0.25664520263671875, 0.2715606689453125, 0.28647613525390625, 0.3013916015625, 0.31630706787109375, 0.3312225341796875, 0.34613800048828125, 0.361053466796875, 0.37596893310546875, 0.3908843994140625, 0.40579986572265625, 0.42071533203125, 0.43563079833984375, 0.4505462646484375, 0.46546173095703125, 0.480377197265625, 0.49529266357421875, 0.5102081298828125, 0.5251235961914062, 0.5400390625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 5.0, 15.0, 14.0, 22.0, 26.0, 54.0, 80.0, 115.0, 241.0, 528.0, 1256.0, 3823.0, 16930.0, 156813.0, 3529445.0, 447215.0, 29258.0, 5427.0, 1724.0, 622.0, 279.0, 160.0, 84.0, 40.0, 26.0, 27.0, 11.0, 8.0, 8.0, 5.0, 3.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5810546875, -1.5390625, -1.4970703125, -1.455078125, -1.4130859375, -1.37109375, -1.3291015625, -1.287109375, -1.2451171875, -1.203125, -1.1611328125, -1.119140625, -1.0771484375, -1.03515625, -0.9931640625, -0.951171875, -0.9091796875, -0.8671875, -0.8251953125, -0.783203125, -0.7412109375, -0.69921875, -0.6572265625, -0.615234375, -0.5732421875, -0.53125, -0.4892578125, -0.447265625, -0.4052734375, -0.36328125, -0.3212890625, -0.279296875, -0.2373046875, -0.1953125, -0.1533203125, -0.111328125, -0.0693359375, -0.02734375, 0.0146484375, 0.056640625, 0.0986328125, 0.140625, 0.1826171875, 0.224609375, 0.2666015625, 0.30859375, 0.3505859375, 0.392578125, 0.4345703125, 0.4765625, 0.5185546875, 0.560546875, 0.6025390625, 0.64453125, 0.6865234375, 0.728515625, 0.7705078125, 0.8125, 0.8544921875, 0.896484375, 0.9384765625, 0.98046875, 1.0224609375, 1.064453125, 1.1064453125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 6.0, 9.0, 10.0, 16.0, 28.0, 29.0, 41.0, 68.0, 93.0, 137.0, 186.0, 268.0, 372.0, 467.0, 482.0, 489.0, 377.0, 287.0, 194.0, 152.0, 95.0, 58.0, 50.0, 26.0, 21.0, 23.0, 18.0, 12.0, 7.0, 10.0, 6.0, 5.0, 5.0, 3.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.249267578125, -0.2411346435546875, -0.233001708984375, -0.2248687744140625, -0.21673583984375, -0.2086029052734375, -0.200469970703125, -0.1923370361328125, -0.1842041015625, -0.1760711669921875, -0.167938232421875, -0.1598052978515625, -0.15167236328125, -0.1435394287109375, -0.135406494140625, -0.1272735595703125, -0.119140625, -0.1110076904296875, -0.102874755859375, -0.0947418212890625, -0.08660888671875, -0.0784759521484375, -0.070343017578125, -0.0622100830078125, -0.0540771484375, -0.0459442138671875, -0.037811279296875, -0.0296783447265625, -0.02154541015625, -0.0134124755859375, -0.005279541015625, 0.0028533935546875, 0.010986328125, 0.0191192626953125, 0.027252197265625, 0.0353851318359375, 0.04351806640625, 0.0516510009765625, 0.059783935546875, 0.0679168701171875, 0.0760498046875, 0.0841827392578125, 0.092315673828125, 0.1004486083984375, 0.10858154296875, 0.1167144775390625, 0.124847412109375, 0.1329803466796875, 0.14111328125, 0.1492462158203125, 0.157379150390625, 0.1655120849609375, 0.17364501953125, 0.1817779541015625, 0.189910888671875, 0.1980438232421875, 0.2061767578125, 0.2143096923828125, 0.222442626953125, 0.2305755615234375, 0.23870849609375, 0.2468414306640625, 0.254974365234375, 0.2631072998046875, 0.271240234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 8.0, 5.0, 7.0, 15.0, 13.0, 14.0, 29.0, 36.0, 52.0, 52.0, 65.0, 77.0, 68.0, 80.0, 80.0, 72.0, 49.0, 71.0, 64.0, 34.0, 32.0, 30.0, 11.0, 13.0, 9.0, 5.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0232040882110596, -0.994565486907959, -0.9659268260002136, -0.937288224697113, -0.9086496233940125, -0.8800109624862671, -0.8513723611831665, -0.8227337598800659, -0.7940950989723206, -0.76545649766922, -0.7368178367614746, -0.708179235458374, -0.6795406341552734, -0.6509019732475281, -0.6222633719444275, -0.5936247110366821, -0.5649861097335815, -0.536347508430481, -0.5077088475227356, -0.479070246219635, -0.45043161511421204, -0.42179298400878906, -0.3931543827056885, -0.3645157516002655, -0.3358771800994873, -0.30723854899406433, -0.27859994769096375, -0.24996131658554077, -0.2213226854801178, -0.19268406927585602, -0.16404545307159424, -0.13540682196617126, -0.10676819086074829, -0.07812956720590591, -0.049490947276353836, -0.020852327346801758, 0.007786296308040619, 0.036424919962882996, 0.06506353616714478, 0.09370216727256775, 0.12234078347682953, 0.1509793996810913, 0.17961803078651428, 0.20825664699077606, 0.23689526319503784, 0.2655338943004608, 0.2941725254058838, 0.3228111267089844, 0.35144975781440735, 0.3800883889198303, 0.4087269902229309, 0.4373656213283539, 0.46600425243377686, 0.49464285373687744, 0.523281455039978, 0.5519201159477234, 0.580558717250824, 0.6091973185539246, 0.6378359794616699, 0.6664745807647705, 0.6951131820678711, 0.7237518429756165, 0.752390444278717, 0.7810291051864624, 0.809667706489563]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 3.0, 3.0, 5.0, 9.0, 9.0, 8.0, 17.0, 10.0, 14.0, 15.0, 27.0, 19.0, 33.0, 32.0, 31.0, 24.0, 29.0, 35.0, 37.0, 38.0, 43.0, 34.0, 46.0, 49.0, 36.0, 33.0, 35.0, 30.0, 32.0, 29.0, 24.0, 21.0, 22.0, 22.0, 17.0, 18.0, 18.0, 11.0, 17.0, 13.0, 11.0, 13.0, 11.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5270301699638367, -0.5106033682823181, -0.49417659640312195, -0.4777498245239258, -0.4613230228424072, -0.44489622116088867, -0.4284694492816925, -0.41204267740249634, -0.3956158757209778, -0.37918907403945923, -0.36276230216026306, -0.3463355302810669, -0.32990872859954834, -0.3134819269180298, -0.2970551550388336, -0.28062838315963745, -0.2642015814781189, -0.24777479469776154, -0.23134800791740417, -0.21492122113704681, -0.19849443435668945, -0.1820676475763321, -0.16564086079597473, -0.14921407401561737, -0.13278728723526, -0.11636050045490265, -0.09993371367454529, -0.08350692689418793, -0.06708014011383057, -0.050653353333473206, -0.034226566553115845, -0.017799779772758484, -0.0013729333877563477, 0.015053853392601013, 0.031480640172958374, 0.047907426953315735, 0.0643342137336731, 0.08076100051403046, 0.09718778729438782, 0.11361457407474518, 0.13004136085510254, 0.1464681476354599, 0.16289493441581726, 0.17932172119617462, 0.19574850797653198, 0.21217529475688934, 0.2286020815372467, 0.24502886831760406, 0.2614556550979614, 0.27788245677948, 0.29430922865867615, 0.3107360005378723, 0.32716280221939087, 0.3435896039009094, 0.3600163757801056, 0.37644314765930176, 0.3928699493408203, 0.40929675102233887, 0.42572352290153503, 0.4421502947807312, 0.45857709646224976, 0.4750038981437683, 0.4914306700229645, 0.5078574419021606, 0.5242842435836792]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 16.0, 25.0, 25.0, 61.0, 114.0, 212.0, 435.0, 919.0, 2425.0, 7231.0, 25352.0, 125125.0, 600014.0, 231190.0, 39428.0, 10274.0, 3329.0, 1199.0, 561.0, 268.0, 144.0, 81.0, 45.0, 32.0, 19.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24790573120117188, -0.23824310302734375, -0.22858047485351562, -0.2189178466796875, -0.20925521850585938, -0.19959259033203125, -0.18992996215820312, -0.180267333984375, -0.17060470581054688, -0.16094207763671875, -0.15127944946289062, -0.1416168212890625, -0.13195419311523438, -0.12229156494140625, -0.11262893676757812, -0.10296630859375, -0.09330368041992188, -0.08364105224609375, -0.07397842407226562, -0.0643157958984375, -0.054653167724609375, -0.04499053955078125, -0.035327911376953125, -0.025665283203125, -0.016002655029296875, -0.00634002685546875, 0.003322601318359375, 0.0129852294921875, 0.022647857666015625, 0.03231048583984375, 0.041973114013671875, 0.0516357421875, 0.061298370361328125, 0.07096099853515625, 0.08062362670898438, 0.0902862548828125, 0.09994888305664062, 0.10961151123046875, 0.11927413940429688, 0.128936767578125, 0.13859939575195312, 0.14826202392578125, 0.15792465209960938, 0.1675872802734375, 0.17724990844726562, 0.18691253662109375, 0.19657516479492188, 0.20623779296875, 0.21590042114257812, 0.22556304931640625, 0.23522567749023438, 0.2448883056640625, 0.2545509338378906, 0.26421356201171875, 0.2738761901855469, 0.283538818359375, 0.2932014465332031, 0.30286407470703125, 0.3125267028808594, 0.3221893310546875, 0.3318519592285156, 0.34151458740234375, 0.3511772155761719, 0.36083984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 8.0, 8.0, 7.0, 16.0, 18.0, 21.0, 18.0, 42.0, 39.0, 46.0, 29.0, 49.0, 48.0, 54.0, 52.0, 54.0, 53.0, 61.0, 57.0, 40.0, 34.0, 36.0, 29.0, 35.0, 24.0, 21.0, 16.0, 16.0, 16.0, 11.0, 14.0, 11.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.441162109375, -0.42810821533203125, -0.4150543212890625, -0.40200042724609375, -0.388946533203125, -0.37589263916015625, -0.3628387451171875, -0.34978485107421875, -0.33673095703125, -0.32367706298828125, -0.3106231689453125, -0.29756927490234375, -0.284515380859375, -0.27146148681640625, -0.2584075927734375, -0.24535369873046875, -0.2322998046875, -0.21924591064453125, -0.2061920166015625, -0.19313812255859375, -0.180084228515625, -0.16703033447265625, -0.1539764404296875, -0.14092254638671875, -0.12786865234375, -0.11481475830078125, -0.1017608642578125, -0.08870697021484375, -0.075653076171875, -0.06259918212890625, -0.0495452880859375, -0.03649139404296875, -0.0234375, -0.01038360595703125, 0.0026702880859375, 0.01572418212890625, 0.028778076171875, 0.04183197021484375, 0.0548858642578125, 0.06793975830078125, 0.08099365234375, 0.09404754638671875, 0.1071014404296875, 0.12015533447265625, 0.133209228515625, 0.14626312255859375, 0.1593170166015625, 0.17237091064453125, 0.1854248046875, 0.19847869873046875, 0.2115325927734375, 0.22458648681640625, 0.237640380859375, 0.25069427490234375, 0.2637481689453125, 0.27680206298828125, 0.28985595703125, 0.30290985107421875, 0.3159637451171875, 0.32901763916015625, 0.342071533203125, 0.35512542724609375, 0.3681793212890625, 0.38123321533203125, 0.394287109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 8.0, 11.0, 7.0, 9.0, 17.0, 25.0, 32.0, 40.0, 69.0, 97.0, 109.0, 164.0, 243.0, 383.0, 608.0, 1077.0, 1986.0, 3961.0, 8346.0, 18845.0, 46699.0, 124843.0, 301668.0, 315857.0, 135346.0, 49904.0, 20033.0, 8885.0, 4142.0, 2112.0, 1124.0, 645.0, 395.0, 263.0, 174.0, 115.0, 91.0, 60.0, 35.0, 32.0, 26.0, 12.0, 15.0, 12.0, 5.0, 4.0, 10.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.124267578125, -0.12026405334472656, -0.11626052856445312, -0.11225700378417969, -0.10825347900390625, -0.10424995422363281, -0.10024642944335938, -0.09624290466308594, -0.0922393798828125, -0.08823585510253906, -0.08423233032226562, -0.08022880554199219, -0.07622528076171875, -0.07222175598144531, -0.06821823120117188, -0.06421470642089844, -0.060211181640625, -0.05620765686035156, -0.052204132080078125, -0.04820060729980469, -0.04419708251953125, -0.04019355773925781, -0.036190032958984375, -0.03218650817871094, -0.0281829833984375, -0.024179458618164062, -0.020175933837890625, -0.016172409057617188, -0.01216888427734375, -0.008165359497070312, -0.004161834716796875, -0.0001583099365234375, 0.00384521484375, 0.007848739624023438, 0.011852264404296875, 0.015855789184570312, 0.01985931396484375, 0.023862838745117188, 0.027866363525390625, 0.03186988830566406, 0.0358734130859375, 0.03987693786621094, 0.043880462646484375, 0.04788398742675781, 0.05188751220703125, 0.05589103698730469, 0.059894561767578125, 0.06389808654785156, 0.067901611328125, 0.07190513610839844, 0.07590866088867188, 0.07991218566894531, 0.08391571044921875, 0.08791923522949219, 0.09192276000976562, 0.09592628479003906, 0.0999298095703125, 0.10393333435058594, 0.10793685913085938, 0.11194038391113281, 0.11594390869140625, 0.11994743347167969, 0.12395095825195312, 0.12795448303222656, 0.1319580078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 6.0, 4.0, 7.0, 4.0, 8.0, 5.0, 8.0, 9.0, 11.0, 16.0, 17.0, 16.0, 24.0, 24.0, 36.0, 32.0, 27.0, 43.0, 36.0, 65.0, 54.0, 68.0, 54.0, 48.0, 37.0, 52.0, 29.0, 33.0, 39.0, 27.0, 28.0, 30.0, 16.0, 14.0, 14.0, 12.0, 7.0, 8.0, 7.0, 5.0, 9.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.67236328125, -0.6480178833007812, -0.6236724853515625, -0.5993270874023438, -0.574981689453125, -0.5506362915039062, -0.5262908935546875, -0.5019454956054688, -0.47760009765625, -0.45325469970703125, -0.4289093017578125, -0.40456390380859375, -0.380218505859375, -0.35587310791015625, -0.3315277099609375, -0.30718231201171875, -0.2828369140625, -0.25849151611328125, -0.2341461181640625, -0.20980072021484375, -0.185455322265625, -0.16110992431640625, -0.1367645263671875, -0.11241912841796875, -0.08807373046875, -0.06372833251953125, -0.0393829345703125, -0.01503753662109375, 0.009307861328125, 0.03365325927734375, 0.0579986572265625, 0.08234405517578125, 0.106689453125, 0.13103485107421875, 0.1553802490234375, 0.17972564697265625, 0.204071044921875, 0.22841644287109375, 0.2527618408203125, 0.27710723876953125, 0.30145263671875, 0.32579803466796875, 0.3501434326171875, 0.37448883056640625, 0.398834228515625, 0.42317962646484375, 0.4475250244140625, 0.47187042236328125, 0.4962158203125, 0.5205612182617188, 0.5449066162109375, 0.5692520141601562, 0.593597412109375, 0.6179428100585938, 0.6422882080078125, 0.6666336059570312, 0.69097900390625, 0.7153244018554688, 0.7396697998046875, 0.7640151977539062, 0.788360595703125, 0.8127059936523438, 0.8370513916015625, 0.8613967895507812, 0.8857421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 1.0, 8.0, 17.0, 23.0, 32.0, 53.0, 67.0, 100.0, 144.0, 233.0, 347.0, 660.0, 1260.0, 2459.0, 5870.0, 14900.0, 44175.0, 183686.0, 532939.0, 189499.0, 45390.0, 15281.0, 5773.0, 2525.0, 1303.0, 678.0, 400.0, 237.0, 171.0, 100.0, 49.0, 47.0, 24.0, 26.0, 25.0, 15.0, 9.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10968017578125, -0.10640716552734375, -0.1031341552734375, -0.09986114501953125, -0.096588134765625, -0.09331512451171875, -0.0900421142578125, -0.08676910400390625, -0.08349609375, -0.08022308349609375, -0.0769500732421875, -0.07367706298828125, -0.070404052734375, -0.06713104248046875, -0.0638580322265625, -0.06058502197265625, -0.05731201171875, -0.05403900146484375, -0.0507659912109375, -0.04749298095703125, -0.044219970703125, -0.04094696044921875, -0.0376739501953125, -0.03440093994140625, -0.0311279296875, -0.02785491943359375, -0.0245819091796875, -0.02130889892578125, -0.018035888671875, -0.01476287841796875, -0.0114898681640625, -0.00821685791015625, -0.00494384765625, -0.00167083740234375, 0.0016021728515625, 0.00487518310546875, 0.008148193359375, 0.01142120361328125, 0.0146942138671875, 0.01796722412109375, 0.021240234375, 0.02451324462890625, 0.0277862548828125, 0.03105926513671875, 0.034332275390625, 0.03760528564453125, 0.0408782958984375, 0.04415130615234375, 0.04742431640625, 0.05069732666015625, 0.0539703369140625, 0.05724334716796875, 0.060516357421875, 0.06378936767578125, 0.0670623779296875, 0.07033538818359375, 0.0736083984375, 0.07688140869140625, 0.0801544189453125, 0.08342742919921875, 0.086700439453125, 0.08997344970703125, 0.0932464599609375, 0.09651947021484375, 0.09979248046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 10.0, 11.0, 8.0, 10.0, 11.0, 23.0, 23.0, 34.0, 51.0, 63.0, 70.0, 92.0, 97.0, 94.0, 88.0, 74.0, 56.0, 40.0, 29.0, 29.0, 20.0, 19.0, 6.0, 7.0, 11.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.337860107421875e-05, -3.2220035791397095e-05, -3.106147050857544e-05, -2.9902905225753784e-05, -2.874433994293213e-05, -2.7585774660110474e-05, -2.642720937728882e-05, -2.5268644094467163e-05, -2.4110078811645508e-05, -2.2951513528823853e-05, -2.1792948246002197e-05, -2.0634382963180542e-05, -1.9475817680358887e-05, -1.831725239753723e-05, -1.7158687114715576e-05, -1.600012183189392e-05, -1.4841556549072266e-05, -1.368299126625061e-05, -1.2524425983428955e-05, -1.13658607006073e-05, -1.0207295417785645e-05, -9.04873013496399e-06, -7.890164852142334e-06, -6.731599569320679e-06, -5.5730342864990234e-06, -4.414469003677368e-06, -3.255903720855713e-06, -2.0973384380340576e-06, -9.387731552124023e-07, 2.1979212760925293e-07, 1.3783574104309082e-06, 2.5369226932525635e-06, 3.6954879760742188e-06, 4.854053258895874e-06, 6.012618541717529e-06, 7.1711838245391846e-06, 8.32974910736084e-06, 9.488314390182495e-06, 1.064687967300415e-05, 1.1805444955825806e-05, 1.2964010238647461e-05, 1.4122575521469116e-05, 1.528114080429077e-05, 1.6439706087112427e-05, 1.7598271369934082e-05, 1.8756836652755737e-05, 1.9915401935577393e-05, 2.1073967218399048e-05, 2.2232532501220703e-05, 2.339109778404236e-05, 2.4549663066864014e-05, 2.570822834968567e-05, 2.6866793632507324e-05, 2.802535891532898e-05, 2.9183924198150635e-05, 3.034248948097229e-05, 3.1501054763793945e-05, 3.26596200466156e-05, 3.3818185329437256e-05, 3.497675061225891e-05, 3.6135315895080566e-05, 3.729388117790222e-05, 3.845244646072388e-05, 3.961101174354553e-05, 4.076957702636719e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 12.0, 20.0, 14.0, 32.0, 42.0, 70.0, 152.0, 258.0, 616.0, 1599.0, 4868.0, 18216.0, 91957.0, 610388.0, 267415.0, 39205.0, 9148.0, 2686.0, 983.0, 410.0, 196.0, 101.0, 56.0, 36.0, 26.0, 10.0, 10.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23583984375, -0.23005294799804688, -0.22426605224609375, -0.21847915649414062, -0.2126922607421875, -0.20690536499023438, -0.20111846923828125, -0.19533157348632812, -0.189544677734375, -0.18375778198242188, -0.17797088623046875, -0.17218399047851562, -0.1663970947265625, -0.16061019897460938, -0.15482330322265625, -0.14903640747070312, -0.14324951171875, -0.13746261596679688, -0.13167572021484375, -0.12588882446289062, -0.1201019287109375, -0.11431503295898438, -0.10852813720703125, -0.10274124145507812, -0.096954345703125, -0.09116744995117188, -0.08538055419921875, -0.07959365844726562, -0.0738067626953125, -0.06801986694335938, -0.06223297119140625, -0.056446075439453125, -0.0506591796875, -0.044872283935546875, -0.03908538818359375, -0.033298492431640625, -0.0275115966796875, -0.021724700927734375, -0.01593780517578125, -0.010150909423828125, -0.004364013671875, 0.001422882080078125, 0.00720977783203125, 0.012996673583984375, 0.0187835693359375, 0.024570465087890625, 0.03035736083984375, 0.036144256591796875, 0.04193115234375, 0.047718048095703125, 0.05350494384765625, 0.059291839599609375, 0.0650787353515625, 0.07086563110351562, 0.07665252685546875, 0.08243942260742188, 0.088226318359375, 0.09401321411132812, 0.09980010986328125, 0.10558700561523438, 0.1113739013671875, 0.11716079711914062, 0.12294769287109375, 0.12873458862304688, 0.134521484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 11.0, 7.0, 11.0, 12.0, 15.0, 18.0, 35.0, 23.0, 38.0, 57.0, 65.0, 79.0, 96.0, 113.0, 98.0, 58.0, 60.0, 37.0, 35.0, 27.0, 20.0, 20.0, 19.0, 12.0, 6.0, 4.0, 6.0, 0.0, 1.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02777099609375, -0.026614665985107422, -0.025458335876464844, -0.024302005767822266, -0.023145675659179688, -0.02198934555053711, -0.02083301544189453, -0.019676685333251953, -0.018520355224609375, -0.017364025115966797, -0.01620769500732422, -0.01505136489868164, -0.013895034790039062, -0.012738704681396484, -0.011582374572753906, -0.010426044464111328, -0.00926971435546875, -0.008113384246826172, -0.006957054138183594, -0.005800724029541016, -0.0046443939208984375, -0.0034880638122558594, -0.0023317337036132812, -0.0011754035949707031, -1.9073486328125e-05, 0.0011372566223144531, 0.0022935867309570312, 0.0034499168395996094, 0.0046062469482421875, 0.005762577056884766, 0.006918907165527344, 0.008075237274169922, 0.0092315673828125, 0.010387897491455078, 0.011544227600097656, 0.012700557708740234, 0.013856887817382812, 0.01501321792602539, 0.01616954803466797, 0.017325878143310547, 0.018482208251953125, 0.019638538360595703, 0.02079486846923828, 0.02195119857788086, 0.023107528686523438, 0.024263858795166016, 0.025420188903808594, 0.026576519012451172, 0.02773284912109375, 0.028889179229736328, 0.030045509338378906, 0.031201839447021484, 0.03235816955566406, 0.03351449966430664, 0.03467082977294922, 0.0358271598815918, 0.036983489990234375, 0.03813982009887695, 0.03929615020751953, 0.04045248031616211, 0.04160881042480469, 0.042765140533447266, 0.043921470642089844, 0.04507780075073242, 0.046234130859375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 11.0, 7.0, 16.0, 19.0, 38.0, 45.0, 63.0, 83.0, 95.0, 104.0, 95.0, 108.0, 85.0, 69.0, 50.0, 32.0, 32.0, 18.0, 15.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6906836628913879, -0.6698765158653259, -0.6490693092346191, -0.6282621622085571, -0.6074550151824951, -0.5866478681564331, -0.5658407211303711, -0.5450335144996643, -0.5242263674736023, -0.5034192204475403, -0.4826120436191559, -0.4618048667907715, -0.4409977197647095, -0.42019057273864746, -0.39938339591026306, -0.37857621908187866, -0.35776907205581665, -0.33696192502975464, -0.31615474820137024, -0.29534757137298584, -0.27454042434692383, -0.2537332773208618, -0.23292610049247742, -0.2121189385652542, -0.191311776638031, -0.1705046147108078, -0.1496974527835846, -0.1288902908563614, -0.10808312892913818, -0.08727596700191498, -0.06646880507469177, -0.04566164314746857, -0.024854540824890137, -0.004047378897666931, 0.016759783029556274, 0.03756694495677948, 0.058374106884002686, 0.07918126881122589, 0.0999884307384491, 0.1207955926656723, 0.1416027545928955, 0.1624099165201187, 0.18321707844734192, 0.20402424037456512, 0.22483140230178833, 0.24563856422901154, 0.26644572615623474, 0.28725290298461914, 0.30806005001068115, 0.32886719703674316, 0.34967437386512756, 0.37048155069351196, 0.391288697719574, 0.412095844745636, 0.4329030215740204, 0.4537101984024048, 0.4745173454284668, 0.4953244924545288, 0.5161316394805908, 0.5369388461112976, 0.5577459931373596, 0.5785531401634216, 0.5993603467941284, 0.6201674938201904, 0.6409746408462524]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 9.0, 10.0, 13.0, 14.0, 19.0, 17.0, 29.0, 30.0, 24.0, 32.0, 35.0, 45.0, 47.0, 49.0, 43.0, 49.0, 48.0, 66.0, 46.0, 47.0, 39.0, 31.0, 30.0, 31.0, 36.0, 21.0, 25.0, 28.0, 14.0, 19.0, 12.0, 12.0, 9.0, 9.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43076878786087036, -0.4190334975719452, -0.40729817748069763, -0.39556288719177246, -0.3838275671005249, -0.37209227681159973, -0.36035698652267456, -0.348621666431427, -0.33688637614250183, -0.32515108585357666, -0.3134157657623291, -0.30168047547340393, -0.28994518518447876, -0.2782098650932312, -0.26647457480430603, -0.25473928451538086, -0.2430039644241333, -0.23126865923404694, -0.21953335404396057, -0.2077980637550354, -0.19606275856494904, -0.18432745337486267, -0.1725921630859375, -0.16085685789585114, -0.14912155270576477, -0.1373862475156784, -0.12565094232559204, -0.11391565203666687, -0.1021803468465805, -0.09044504165649414, -0.07870974391698837, -0.0669744461774826, -0.05523917078971863, -0.04350386932492256, -0.031768567860126495, -0.02003326639533043, -0.008297964930534363, 0.0034373365342617035, 0.01517263799905777, 0.026907935738563538, 0.0386432409286499, 0.05037854239344597, 0.062113843858242035, 0.0738491415977478, 0.08558444678783417, 0.09731975197792053, 0.1090550497174263, 0.12079034745693207, 0.13252565264701843, 0.1442609578371048, 0.15599626302719116, 0.16773155331611633, 0.1794668585062027, 0.19120216369628906, 0.20293745398521423, 0.2146727591753006, 0.22640806436538696, 0.23814336955547333, 0.2498786747455597, 0.26161396503448486, 0.2733492851257324, 0.2850845754146576, 0.29681986570358276, 0.3085551857948303, 0.3202904760837555]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 1.0, 7.0, 10.0, 19.0, 18.0, 50.0, 89.0, 227.0, 425.0, 975.0, 2231.0, 5805.0, 17618.0, 79869.0, 556619.0, 318694.0, 46689.0, 11956.0, 4196.0, 1621.0, 736.0, 342.0, 169.0, 81.0, 41.0, 22.0, 13.0, 8.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8271484375, -0.802703857421875, -0.77825927734375, -0.753814697265625, -0.7293701171875, -0.704925537109375, -0.68048095703125, -0.656036376953125, -0.631591796875, -0.607147216796875, -0.58270263671875, -0.558258056640625, -0.5338134765625, -0.509368896484375, -0.48492431640625, -0.460479736328125, -0.43603515625, -0.411590576171875, -0.38714599609375, -0.362701416015625, -0.3382568359375, -0.313812255859375, -0.28936767578125, -0.264923095703125, -0.240478515625, -0.216033935546875, -0.19158935546875, -0.167144775390625, -0.1427001953125, -0.118255615234375, -0.09381103515625, -0.069366455078125, -0.044921875, -0.020477294921875, 0.00396728515625, 0.028411865234375, 0.0528564453125, 0.077301025390625, 0.10174560546875, 0.126190185546875, 0.150634765625, 0.175079345703125, 0.19952392578125, 0.223968505859375, 0.2484130859375, 0.272857666015625, 0.29730224609375, 0.321746826171875, 0.34619140625, 0.370635986328125, 0.39508056640625, 0.419525146484375, 0.4439697265625, 0.468414306640625, 0.49285888671875, 0.517303466796875, 0.541748046875, 0.566192626953125, 0.59063720703125, 0.615081787109375, 0.6395263671875, 0.663970947265625, 0.68841552734375, 0.712860107421875, 0.7373046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 8.0, 5.0, 12.0, 14.0, 21.0, 13.0, 20.0, 24.0, 30.0, 35.0, 42.0, 30.0, 32.0, 45.0, 45.0, 47.0, 41.0, 59.0, 48.0, 47.0, 42.0, 39.0, 35.0, 36.0, 30.0, 23.0, 30.0, 14.0, 27.0, 16.0, 20.0, 16.0, 18.0, 7.0, 10.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.68212890625, -0.6590347290039062, -0.6359405517578125, -0.6128463745117188, -0.589752197265625, -0.5666580200195312, -0.5435638427734375, -0.5204696655273438, -0.49737548828125, -0.47428131103515625, -0.4511871337890625, -0.42809295654296875, -0.404998779296875, -0.38190460205078125, -0.3588104248046875, -0.33571624755859375, -0.3126220703125, -0.28952789306640625, -0.2664337158203125, -0.24333953857421875, -0.220245361328125, -0.19715118408203125, -0.1740570068359375, -0.15096282958984375, -0.12786865234375, -0.10477447509765625, -0.0816802978515625, -0.05858612060546875, -0.035491943359375, -0.01239776611328125, 0.0106964111328125, 0.03379058837890625, 0.056884765625, 0.07997894287109375, 0.1030731201171875, 0.12616729736328125, 0.149261474609375, 0.17235565185546875, 0.1954498291015625, 0.21854400634765625, 0.24163818359375, 0.26473236083984375, 0.2878265380859375, 0.31092071533203125, 0.334014892578125, 0.35710906982421875, 0.3802032470703125, 0.40329742431640625, 0.4263916015625, 0.44948577880859375, 0.4725799560546875, 0.49567413330078125, 0.518768310546875, 0.5418624877929688, 0.5649566650390625, 0.5880508422851562, 0.61114501953125, 0.6342391967773438, 0.6573333740234375, 0.6804275512695312, 0.703521728515625, 0.7266159057617188, 0.7497100830078125, 0.7728042602539062, 0.7958984375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 10.0, 15.0, 14.0, 26.0, 35.0, 49.0, 88.0, 130.0, 260.0, 546.0, 1195.0, 3859.0, 17716.0, 204095.0, 752363.0, 56152.0, 8094.0, 2230.0, 800.0, 381.0, 199.0, 98.0, 57.0, 53.0, 23.0, 20.0, 18.0, 7.0, 6.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.51953125, -1.4817962646484375, -1.444061279296875, -1.4063262939453125, -1.36859130859375, -1.3308563232421875, -1.293121337890625, -1.2553863525390625, -1.2176513671875, -1.1799163818359375, -1.142181396484375, -1.1044464111328125, -1.06671142578125, -1.0289764404296875, -0.991241455078125, -0.9535064697265625, -0.915771484375, -0.8780364990234375, -0.840301513671875, -0.8025665283203125, -0.76483154296875, -0.7270965576171875, -0.689361572265625, -0.6516265869140625, -0.6138916015625, -0.5761566162109375, -0.538421630859375, -0.5006866455078125, -0.46295166015625, -0.4252166748046875, -0.387481689453125, -0.3497467041015625, -0.31201171875, -0.2742767333984375, -0.236541748046875, -0.1988067626953125, -0.16107177734375, -0.1233367919921875, -0.085601806640625, -0.0478668212890625, -0.0101318359375, 0.0276031494140625, 0.065338134765625, 0.1030731201171875, 0.14080810546875, 0.1785430908203125, 0.216278076171875, 0.2540130615234375, 0.291748046875, 0.3294830322265625, 0.367218017578125, 0.4049530029296875, 0.44268798828125, 0.4804229736328125, 0.518157958984375, 0.5558929443359375, 0.5936279296875, 0.6313629150390625, 0.669097900390625, 0.7068328857421875, 0.74456787109375, 0.7823028564453125, 0.820037841796875, 0.8577728271484375, 0.8955078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 8.0, 5.0, 5.0, 4.0, 8.0, 4.0, 10.0, 11.0, 13.0, 26.0, 18.0, 37.0, 43.0, 52.0, 55.0, 56.0, 50.0, 53.0, 81.0, 59.0, 57.0, 49.0, 56.0, 43.0, 41.0, 29.0, 21.0, 18.0, 22.0, 17.0, 8.0, 11.0, 9.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.11328125, -1.080780029296875, -1.04827880859375, -1.015777587890625, -0.9832763671875, -0.950775146484375, -0.91827392578125, -0.885772705078125, -0.853271484375, -0.820770263671875, -0.78826904296875, -0.755767822265625, -0.7232666015625, -0.690765380859375, -0.65826416015625, -0.625762939453125, -0.59326171875, -0.560760498046875, -0.52825927734375, -0.495758056640625, -0.4632568359375, -0.430755615234375, -0.39825439453125, -0.365753173828125, -0.333251953125, -0.300750732421875, -0.26824951171875, -0.235748291015625, -0.2032470703125, -0.170745849609375, -0.13824462890625, -0.105743408203125, -0.0732421875, -0.040740966796875, -0.00823974609375, 0.024261474609375, 0.0567626953125, 0.089263916015625, 0.12176513671875, 0.154266357421875, 0.186767578125, 0.219268798828125, 0.25177001953125, 0.284271240234375, 0.3167724609375, 0.349273681640625, 0.38177490234375, 0.414276123046875, 0.44677734375, 0.479278564453125, 0.51177978515625, 0.544281005859375, 0.5767822265625, 0.609283447265625, 0.64178466796875, 0.674285888671875, 0.706787109375, 0.739288330078125, 0.77178955078125, 0.804290771484375, 0.8367919921875, 0.869293212890625, 0.90179443359375, 0.934295654296875, 0.966796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 9.0, 12.0, 15.0, 35.0, 64.0, 130.0, 244.0, 733.0, 2712.0, 14242.0, 139338.0, 781119.0, 95711.0, 10872.0, 2235.0, 620.0, 233.0, 109.0, 46.0, 23.0, 11.0, 11.0, 7.0, 10.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.292236328125, -0.2837486267089844, -0.27526092529296875, -0.2667732238769531, -0.2582855224609375, -0.24979782104492188, -0.24131011962890625, -0.23282241821289062, -0.224334716796875, -0.21584701538085938, -0.20735931396484375, -0.19887161254882812, -0.1903839111328125, -0.18189620971679688, -0.17340850830078125, -0.16492080688476562, -0.15643310546875, -0.14794540405273438, -0.13945770263671875, -0.13097000122070312, -0.1224822998046875, -0.11399459838867188, -0.10550689697265625, -0.09701919555664062, -0.088531494140625, -0.08004379272460938, -0.07155609130859375, -0.06306838989257812, -0.0545806884765625, -0.046092987060546875, -0.03760528564453125, -0.029117584228515625, -0.0206298828125, -0.012142181396484375, -0.00365447998046875, 0.004833221435546875, 0.0133209228515625, 0.021808624267578125, 0.03029632568359375, 0.038784027099609375, 0.047271728515625, 0.055759429931640625, 0.06424713134765625, 0.07273483276367188, 0.0812225341796875, 0.08971023559570312, 0.09819793701171875, 0.10668563842773438, 0.11517333984375, 0.12366104125976562, 0.13214874267578125, 0.14063644409179688, 0.1491241455078125, 0.15761184692382812, 0.16609954833984375, 0.17458724975585938, 0.183074951171875, 0.19156265258789062, 0.20005035400390625, 0.20853805541992188, 0.2170257568359375, 0.22551345825195312, 0.23400115966796875, 0.24248886108398438, 0.2509765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 6.0, 13.0, 14.0, 17.0, 39.0, 58.0, 85.0, 118.0, 147.0, 130.0, 115.0, 86.0, 50.0, 41.0, 29.0, 16.0, 7.0, 6.0, 4.0, 4.0, 0.0, 6.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.661083221435547e-05, -4.550628364086151e-05, -4.4401735067367554e-05, -4.3297186493873596e-05, -4.219263792037964e-05, -4.108808934688568e-05, -3.9983540773391724e-05, -3.8878992199897766e-05, -3.777444362640381e-05, -3.666989505290985e-05, -3.5565346479415894e-05, -3.4460797905921936e-05, -3.335624933242798e-05, -3.225170075893402e-05, -3.1147152185440063e-05, -3.0042603611946106e-05, -2.893805503845215e-05, -2.783350646495819e-05, -2.6728957891464233e-05, -2.5624409317970276e-05, -2.451986074447632e-05, -2.341531217098236e-05, -2.2310763597488403e-05, -2.1206215023994446e-05, -2.0101666450500488e-05, -1.899711787700653e-05, -1.7892569303512573e-05, -1.6788020730018616e-05, -1.5683472156524658e-05, -1.45789235830307e-05, -1.3474375009536743e-05, -1.2369826436042786e-05, -1.1265277862548828e-05, -1.016072928905487e-05, -9.056180715560913e-06, -7.951632142066956e-06, -6.847083568572998e-06, -5.7425349950790405e-06, -4.637986421585083e-06, -3.5334378480911255e-06, -2.428889274597168e-06, -1.3243407011032104e-06, -2.1979212760925293e-07, 8.847564458847046e-07, 1.989305019378662e-06, 3.0938535928726196e-06, 4.198402166366577e-06, 5.302950739860535e-06, 6.407499313354492e-06, 7.51204788684845e-06, 8.616596460342407e-06, 9.721145033836365e-06, 1.0825693607330322e-05, 1.193024218082428e-05, 1.3034790754318237e-05, 1.4139339327812195e-05, 1.5243887901306152e-05, 1.634843647480011e-05, 1.7452985048294067e-05, 1.8557533621788025e-05, 1.9662082195281982e-05, 2.076663076877594e-05, 2.1871179342269897e-05, 2.2975727915763855e-05, 2.4080276489257812e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 8.0, 19.0, 19.0, 45.0, 70.0, 180.0, 653.0, 2405.0, 13944.0, 252277.0, 737485.0, 35432.0, 4406.0, 1041.0, 290.0, 123.0, 65.0, 25.0, 22.0, 13.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.5068359375, -0.49390411376953125, -0.4809722900390625, -0.46804046630859375, -0.455108642578125, -0.44217681884765625, -0.4292449951171875, -0.41631317138671875, -0.40338134765625, -0.39044952392578125, -0.3775177001953125, -0.36458587646484375, -0.351654052734375, -0.33872222900390625, -0.3257904052734375, -0.31285858154296875, -0.2999267578125, -0.28699493408203125, -0.2740631103515625, -0.26113128662109375, -0.248199462890625, -0.23526763916015625, -0.2223358154296875, -0.20940399169921875, -0.19647216796875, -0.18354034423828125, -0.1706085205078125, -0.15767669677734375, -0.144744873046875, -0.13181304931640625, -0.1188812255859375, -0.10594940185546875, -0.093017578125, -0.08008575439453125, -0.0671539306640625, -0.05422210693359375, -0.041290283203125, -0.02835845947265625, -0.0154266357421875, -0.00249481201171875, 0.01043701171875, 0.02336883544921875, 0.0363006591796875, 0.04923248291015625, 0.062164306640625, 0.07509613037109375, 0.0880279541015625, 0.10095977783203125, 0.1138916015625, 0.12682342529296875, 0.1397552490234375, 0.15268707275390625, 0.165618896484375, 0.17855072021484375, 0.1914825439453125, 0.20441436767578125, 0.21734619140625, 0.23027801513671875, 0.2432098388671875, 0.25614166259765625, 0.269073486328125, 0.28200531005859375, 0.2949371337890625, 0.30786895751953125, 0.32080078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 10.0, 19.0, 28.0, 42.0, 73.0, 91.0, 114.0, 175.0, 151.0, 97.0, 85.0, 39.0, 27.0, 12.0, 9.0, 3.0, 5.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1116943359375, -0.107177734375, -0.1026611328125, -0.09814453125, -0.0936279296875, -0.089111328125, -0.0845947265625, -0.080078125, -0.0755615234375, -0.071044921875, -0.0665283203125, -0.06201171875, -0.0574951171875, -0.052978515625, -0.0484619140625, -0.0439453125, -0.0394287109375, -0.034912109375, -0.0303955078125, -0.02587890625, -0.0213623046875, -0.016845703125, -0.0123291015625, -0.0078125, -0.0032958984375, 0.001220703125, 0.0057373046875, 0.01025390625, 0.0147705078125, 0.019287109375, 0.0238037109375, 0.0283203125, 0.0328369140625, 0.037353515625, 0.0418701171875, 0.04638671875, 0.0509033203125, 0.055419921875, 0.0599365234375, 0.064453125, 0.0689697265625, 0.073486328125, 0.0780029296875, 0.08251953125, 0.0870361328125, 0.091552734375, 0.0960693359375, 0.1005859375, 0.1051025390625, 0.109619140625, 0.1141357421875, 0.11865234375, 0.1231689453125, 0.127685546875, 0.1322021484375, 0.13671875, 0.1412353515625, 0.145751953125, 0.1502685546875, 0.15478515625, 0.1593017578125, 0.163818359375, 0.1683349609375, 0.1728515625, 0.1773681640625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 11.0, 27.0, 44.0, 123.0, 185.0, 191.0, 178.0, 134.0, 65.0, 34.0, 13.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.579605221748352, -1.4899643659591675, -1.4003233909606934, -1.3106825351715088, -1.2210416793823242, -1.1314008235931396, -1.041759967803955, -0.952118992805481, -0.8624781370162964, -0.7728372812271118, -0.6831963658332825, -0.5935554504394531, -0.5039145946502686, -0.4142737090587616, -0.32463282346725464, -0.2349919080734253, -0.14535105228424072, -0.055710166692733765, 0.03393071889877319, 0.12357160449028015, 0.2132124900817871, 0.30285337567329407, 0.392494261264801, 0.48213517665863037, 0.5717760324478149, 0.6614168882369995, 0.7510578036308289, 0.8406987190246582, 0.9303395748138428, 1.0199804306030273, 1.109621286392212, 1.199262261390686, 1.2889032363891602, 1.3785440921783447, 1.4681849479675293, 1.5578259229660034, 1.647466778755188, 1.7371076345443726, 1.8267486095428467, 1.9163894653320312, 2.006030321121216, 2.0956711769104004, 2.185312032699585, 2.2749528884887695, 2.364593982696533, 2.4542348384857178, 2.5438756942749023, 2.633516550064087, 2.7231574058532715, 2.812798261642456, 2.9024391174316406, 2.992079973220825, 3.0817208290100098, 3.1713619232177734, 3.261002779006958, 3.3506436347961426, 3.440284490585327, 3.5299253463745117, 3.6195662021636963, 3.709207057952881, 3.7988481521606445, 3.888489007949829, 3.9781298637390137, 4.067770957946777, 4.157411575317383]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 8.0, 4.0, 2.0, 12.0, 15.0, 10.0, 21.0, 10.0, 19.0, 14.0, 24.0, 16.0, 26.0, 24.0, 37.0, 35.0, 31.0, 41.0, 43.0, 56.0, 49.0, 43.0, 47.0, 35.0, 41.0, 46.0, 37.0, 35.0, 30.0, 33.0, 20.0, 26.0, 14.0, 19.0, 17.0, 9.0, 7.0, 10.0, 15.0, 7.0, 9.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2883727550506592, -1.2457438707351685, -1.2031149864196777, -1.1604862213134766, -1.1178573369979858, -1.0752284526824951, -1.0325995683670044, -0.9899707436561584, -0.9473419189453125, -0.9047130346298218, -0.8620842099189758, -0.8194553256034851, -0.7768265008926392, -0.7341976165771484, -0.6915687322616577, -0.6489399075508118, -0.606311023235321, -0.5636821389198303, -0.5210533142089844, -0.47842442989349365, -0.4357956051826477, -0.393166720867157, -0.35053786635398865, -0.3079090118408203, -0.265280157327652, -0.22265130281448364, -0.1800224483013153, -0.13739357888698578, -0.09476472437381744, -0.05213586986064911, -0.00950700044631958, 0.033121854066848755, 0.07575070858001709, 0.11837956309318542, 0.16100841760635376, 0.2036372870206833, 0.24626614153385162, 0.28889501094818115, 0.3315238654613495, 0.3741527199745178, 0.41678157448768616, 0.4594104290008545, 0.5020393133163452, 0.5446681380271912, 0.5872970223426819, 0.6299258470535278, 0.6725547313690186, 0.7151836156845093, 0.7578124403953552, 0.800441324710846, 0.8430701494216919, 0.8856990337371826, 0.9283278584480286, 0.9709567427635193, 1.0135855674743652, 1.056214451789856, 1.0988433361053467, 1.1414722204208374, 1.1841011047363281, 1.2267298698425293, 1.26935875415802, 1.3119876384735107, 1.3546165227890015, 1.3972454071044922, 1.4398741722106934]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 7.0, 10.0, 12.0, 15.0, 18.0, 24.0, 35.0, 40.0, 51.0, 85.0, 149.0, 241.0, 466.0, 1014.0, 2397.0, 7093.0, 30366.0, 355066.0, 2993356.0, 741667.0, 46951.0, 9446.0, 3146.0, 1228.0, 569.0, 281.0, 189.0, 107.0, 51.0, 51.0, 23.0, 25.0, 15.0, 13.0, 14.0, 12.0, 10.0, 7.0, 5.0, 7.0, 1.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.99609375, -0.96356201171875, -0.9310302734375, -0.89849853515625, -0.865966796875, -0.83343505859375, -0.8009033203125, -0.76837158203125, -0.73583984375, -0.70330810546875, -0.6707763671875, -0.63824462890625, -0.605712890625, -0.57318115234375, -0.5406494140625, -0.50811767578125, -0.4755859375, -0.44305419921875, -0.4105224609375, -0.37799072265625, -0.345458984375, -0.31292724609375, -0.2803955078125, -0.24786376953125, -0.21533203125, -0.18280029296875, -0.1502685546875, -0.11773681640625, -0.085205078125, -0.05267333984375, -0.0201416015625, 0.01239013671875, 0.044921875, 0.07745361328125, 0.1099853515625, 0.14251708984375, 0.175048828125, 0.20758056640625, 0.2401123046875, 0.27264404296875, 0.30517578125, 0.33770751953125, 0.3702392578125, 0.40277099609375, 0.435302734375, 0.46783447265625, 0.5003662109375, 0.53289794921875, 0.5654296875, 0.59796142578125, 0.6304931640625, 0.66302490234375, 0.695556640625, 0.72808837890625, 0.7606201171875, 0.79315185546875, 0.82568359375, 0.85821533203125, 0.8907470703125, 0.92327880859375, 0.955810546875, 0.98834228515625, 1.0208740234375, 1.05340576171875, 1.0859375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 9.0, 8.0, 2.0, 13.0, 13.0, 14.0, 24.0, 22.0, 17.0, 21.0, 38.0, 28.0, 40.0, 41.0, 38.0, 36.0, 44.0, 43.0, 43.0, 38.0, 47.0, 40.0, 41.0, 37.0, 40.0, 36.0, 33.0, 24.0, 26.0, 26.0, 26.0, 11.0, 14.0, 8.0, 11.0, 6.0, 8.0, 3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3603630065917969, -0.34792327880859375, -0.3354835510253906, -0.3230438232421875, -0.3106040954589844, -0.29816436767578125, -0.2857246398925781, -0.273284912109375, -0.2608451843261719, -0.24840545654296875, -0.23596572875976562, -0.2235260009765625, -0.21108627319335938, -0.19864654541015625, -0.18620681762695312, -0.17376708984375, -0.16132736206054688, -0.14888763427734375, -0.13644790649414062, -0.1240081787109375, -0.11156845092773438, -0.09912872314453125, -0.08668899536132812, -0.074249267578125, -0.061809539794921875, -0.04936981201171875, -0.036930084228515625, -0.0244903564453125, -0.012050628662109375, 0.00038909912109375, 0.012828826904296875, 0.0252685546875, 0.037708282470703125, 0.05014801025390625, 0.06258773803710938, 0.0750274658203125, 0.08746719360351562, 0.09990692138671875, 0.11234664916992188, 0.124786376953125, 0.13722610473632812, 0.14966583251953125, 0.16210556030273438, 0.1745452880859375, 0.18698501586914062, 0.19942474365234375, 0.21186447143554688, 0.22430419921875, 0.23674392700195312, 0.24918365478515625, 0.2616233825683594, 0.2740631103515625, 0.2865028381347656, 0.29894256591796875, 0.3113822937011719, 0.323822021484375, 0.3362617492675781, 0.34870147705078125, 0.3611412048339844, 0.3735809326171875, 0.3860206604003906, 0.39846038818359375, 0.4109001159667969, 0.42333984375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 14.0, 14.0, 20.0, 41.0, 98.0, 201.0, 701.0, 2785.0, 19486.0, 1660781.0, 2482533.0, 23300.0, 3121.0, 702.0, 239.0, 95.0, 50.0, 31.0, 13.0, 15.0, 12.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.3198699951171875, -2.258880615234375, -2.1978912353515625, -2.13690185546875, -2.0759124755859375, -2.014923095703125, -1.9539337158203125, -1.8929443359375, -1.8319549560546875, -1.770965576171875, -1.7099761962890625, -1.64898681640625, -1.5879974365234375, -1.527008056640625, -1.4660186767578125, -1.405029296875, -1.3440399169921875, -1.283050537109375, -1.2220611572265625, -1.16107177734375, -1.1000823974609375, -1.039093017578125, -0.9781036376953125, -0.9171142578125, -0.8561248779296875, -0.795135498046875, -0.7341461181640625, -0.67315673828125, -0.6121673583984375, -0.551177978515625, -0.4901885986328125, -0.42919921875, -0.3682098388671875, -0.307220458984375, -0.2462310791015625, -0.18524169921875, -0.1242523193359375, -0.063262939453125, -0.0022735595703125, 0.0587158203125, 0.1197052001953125, 0.180694580078125, 0.2416839599609375, 0.30267333984375, 0.3636627197265625, 0.424652099609375, 0.4856414794921875, 0.546630859375, 0.6076202392578125, 0.668609619140625, 0.7295989990234375, 0.79058837890625, 0.8515777587890625, 0.912567138671875, 0.9735565185546875, 1.0345458984375, 1.0955352783203125, 1.156524658203125, 1.2175140380859375, 1.27850341796875, 1.3394927978515625, 1.400482177734375, 1.4614715576171875, 1.5224609375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 9.0, 13.0, 24.0, 37.0, 63.0, 128.0, 223.0, 451.0, 745.0, 865.0, 641.0, 388.0, 216.0, 100.0, 59.0, 42.0, 21.0, 12.0, 14.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.2987518310546875, -0.285980224609375, -0.2732086181640625, -0.26043701171875, -0.2476654052734375, -0.234893798828125, -0.2221221923828125, -0.2093505859375, -0.1965789794921875, -0.183807373046875, -0.1710357666015625, -0.15826416015625, -0.1454925537109375, -0.132720947265625, -0.1199493408203125, -0.107177734375, -0.0944061279296875, -0.081634521484375, -0.0688629150390625, -0.05609130859375, -0.0433197021484375, -0.030548095703125, -0.0177764892578125, -0.0050048828125, 0.0077667236328125, 0.020538330078125, 0.0333099365234375, 0.04608154296875, 0.0588531494140625, 0.071624755859375, 0.0843963623046875, 0.09716796875, 0.1099395751953125, 0.122711181640625, 0.1354827880859375, 0.14825439453125, 0.1610260009765625, 0.173797607421875, 0.1865692138671875, 0.1993408203125, 0.2121124267578125, 0.224884033203125, 0.2376556396484375, 0.25042724609375, 0.2631988525390625, 0.275970458984375, 0.2887420654296875, 0.301513671875, 0.3142852783203125, 0.327056884765625, 0.3398284912109375, 0.35260009765625, 0.3653717041015625, 0.378143310546875, 0.3909149169921875, 0.4036865234375, 0.4164581298828125, 0.429229736328125, 0.4420013427734375, 0.45477294921875, 0.4675445556640625, 0.480316162109375, 0.4930877685546875, 0.505859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 3.0, 4.0, 6.0, 8.0, 20.0, 11.0, 19.0, 21.0, 29.0, 30.0, 30.0, 38.0, 48.0, 48.0, 36.0, 55.0, 55.0, 66.0, 63.0, 55.0, 62.0, 46.0, 33.0, 46.0, 40.0, 35.0, 16.0, 21.0, 15.0, 9.0, 6.0, 9.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.711143970489502, -0.6911450028419495, -0.6711459755897522, -0.6511470079421997, -0.6311479806900024, -0.61114901304245, -0.5911499857902527, -0.5711510181427002, -0.5511519908905029, -0.5311530232429504, -0.5111539959907532, -0.4911549985408783, -0.4711560010910034, -0.4511570334434509, -0.43115803599357605, -0.41115903854370117, -0.3911600708961487, -0.3711610734462738, -0.3511620759963989, -0.33116307854652405, -0.31116408109664917, -0.2911651134490967, -0.2711661159992218, -0.2511671185493469, -0.23116812109947205, -0.21116912364959717, -0.1911701261997223, -0.1711711436510086, -0.15117214620113373, -0.13117314875125885, -0.11117415875196457, -0.09117516875267029, -0.07117623090744019, -0.051177237182855606, -0.031178243458271027, -0.011179249733686447, 0.008819743990898132, 0.02881874144077301, 0.04881773144006729, 0.06881672143936157, 0.08881571888923645, 0.10881471633911133, 0.1288137137889862, 0.1488126963376999, 0.16881169378757477, 0.18881069123744965, 0.20880967378616333, 0.2288086712360382, 0.24880766868591309, 0.26880666613578796, 0.28880566358566284, 0.3088046610355377, 0.3288036584854126, 0.3488026261329651, 0.36880162358283997, 0.38880062103271484, 0.4087996184825897, 0.4287986159324646, 0.4487976133823395, 0.46879661083221436, 0.48879557847976685, 0.5087946057319641, 0.5287935733795166, 0.5487926006317139, 0.5687915682792664]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 4.0, 7.0, 7.0, 14.0, 23.0, 13.0, 14.0, 23.0, 22.0, 33.0, 30.0, 33.0, 32.0, 38.0, 48.0, 55.0, 51.0, 52.0, 51.0, 43.0, 39.0, 35.0, 51.0, 43.0, 30.0, 22.0, 26.0, 33.0, 23.0, 14.0, 23.0, 16.0, 5.0, 8.0, 6.0, 7.0, 5.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.5663232207298279, -0.549354076385498, -0.5323849320411682, -0.5154157876968384, -0.49844664335250854, -0.4814774990081787, -0.4645083248615265, -0.44753918051719666, -0.4305700361728668, -0.413600891828537, -0.39663174748420715, -0.3796626031398773, -0.3626934289932251, -0.34572428464889526, -0.32875514030456543, -0.3117859959602356, -0.29481685161590576, -0.2778477072715759, -0.2608785629272461, -0.24390940368175507, -0.22694025933742523, -0.2099711149930954, -0.19300195574760437, -0.17603281140327454, -0.1590636670589447, -0.14209452271461487, -0.12512537837028503, -0.108156219124794, -0.09118707478046417, -0.07421793043613434, -0.05724877864122391, -0.04027962684631348, -0.023310542106628418, -0.0063413940370082855, 0.010627754032611847, 0.02759690210223198, 0.04456605017185211, 0.061535194516181946, 0.07850434631109238, 0.09547349810600281, 0.11244264245033264, 0.12941178679466248, 0.1463809311389923, 0.16335009038448334, 0.18031923472881317, 0.197288379073143, 0.21425753831863403, 0.23122668266296387, 0.2481958270072937, 0.26516497135162354, 0.28213411569595337, 0.2991032600402832, 0.31607240438461304, 0.33304154872894287, 0.3500107228755951, 0.3669798672199249, 0.38394901156425476, 0.4009181559085846, 0.41788730025291443, 0.43485644459724426, 0.4518256187438965, 0.4687947630882263, 0.48576390743255615, 0.502733051776886, 0.5197021961212158]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 5.0, 7.0, 8.0, 12.0, 13.0, 15.0, 26.0, 30.0, 36.0, 39.0, 74.0, 81.0, 136.0, 167.0, 334.0, 537.0, 918.0, 1466.0, 2610.0, 4912.0, 12233.0, 65680.0, 532870.0, 366607.0, 40356.0, 9404.0, 4337.0, 2280.0, 1260.0, 737.0, 431.0, 263.0, 193.0, 134.0, 84.0, 74.0, 51.0, 31.0, 20.0, 20.0, 17.0, 19.0, 10.0, 4.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1939697265625, -0.18768882751464844, -0.18140792846679688, -0.1751270294189453, -0.16884613037109375, -0.1625652313232422, -0.15628433227539062, -0.15000343322753906, -0.1437225341796875, -0.13744163513183594, -0.13116073608398438, -0.12487983703613281, -0.11859893798828125, -0.11231803894042969, -0.10603713989257812, -0.09975624084472656, -0.093475341796875, -0.08719444274902344, -0.08091354370117188, -0.07463264465332031, -0.06835174560546875, -0.06207084655761719, -0.055789947509765625, -0.04950904846191406, -0.0432281494140625, -0.03694725036621094, -0.030666351318359375, -0.024385452270507812, -0.01810455322265625, -0.011823654174804688, -0.005542755126953125, 0.0007381439208984375, 0.00701904296875, 0.013299942016601562, 0.019580841064453125, 0.025861740112304688, 0.03214263916015625, 0.03842353820800781, 0.044704437255859375, 0.05098533630371094, 0.0572662353515625, 0.06354713439941406, 0.06982803344726562, 0.07610893249511719, 0.08238983154296875, 0.08867073059082031, 0.09495162963867188, 0.10123252868652344, 0.107513427734375, 0.11379432678222656, 0.12007522583007812, 0.1263561248779297, 0.13263702392578125, 0.1389179229736328, 0.14519882202148438, 0.15147972106933594, 0.1577606201171875, 0.16404151916503906, 0.17032241821289062, 0.1766033172607422, 0.18288421630859375, 0.1891651153564453, 0.19544601440429688, 0.20172691345214844, 0.2080078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 11.0, 8.0, 5.0, 8.0, 12.0, 14.0, 15.0, 14.0, 19.0, 22.0, 28.0, 27.0, 34.0, 28.0, 32.0, 37.0, 43.0, 41.0, 41.0, 35.0, 54.0, 38.0, 38.0, 45.0, 41.0, 43.0, 35.0, 35.0, 26.0, 24.0, 18.0, 18.0, 27.0, 14.0, 16.0, 14.0, 5.0, 6.0, 4.0, 2.0, 4.0, 5.0, 2.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.3271484375, -0.3172607421875, -0.307373046875, -0.2974853515625, -0.28759765625, -0.2777099609375, -0.267822265625, -0.2579345703125, -0.248046875, -0.2381591796875, -0.228271484375, -0.2183837890625, -0.20849609375, -0.1986083984375, -0.188720703125, -0.1788330078125, -0.1689453125, -0.1590576171875, -0.149169921875, -0.1392822265625, -0.12939453125, -0.1195068359375, -0.109619140625, -0.0997314453125, -0.08984375, -0.0799560546875, -0.070068359375, -0.0601806640625, -0.05029296875, -0.0404052734375, -0.030517578125, -0.0206298828125, -0.0107421875, -0.0008544921875, 0.009033203125, 0.0189208984375, 0.02880859375, 0.0386962890625, 0.048583984375, 0.0584716796875, 0.068359375, 0.0782470703125, 0.088134765625, 0.0980224609375, 0.10791015625, 0.1177978515625, 0.127685546875, 0.1375732421875, 0.1474609375, 0.1573486328125, 0.167236328125, 0.1771240234375, 0.18701171875, 0.1968994140625, 0.206787109375, 0.2166748046875, 0.2265625, 0.2364501953125, 0.246337890625, 0.2562255859375, 0.26611328125, 0.2760009765625, 0.285888671875, 0.2957763671875, 0.3056640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 16.0, 25.0, 42.0, 61.0, 102.0, 224.0, 392.0, 818.0, 1873.0, 4851.0, 19584.0, 226327.0, 698008.0, 79718.0, 10418.0, 3403.0, 1291.0, 631.0, 309.0, 169.0, 108.0, 60.0, 34.0, 31.0, 14.0, 3.0, 6.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.215576171875, -0.208221435546875, -0.20086669921875, -0.193511962890625, -0.1861572265625, -0.178802490234375, -0.17144775390625, -0.164093017578125, -0.15673828125, -0.149383544921875, -0.14202880859375, -0.134674072265625, -0.1273193359375, -0.119964599609375, -0.11260986328125, -0.105255126953125, -0.097900390625, -0.090545654296875, -0.08319091796875, -0.075836181640625, -0.0684814453125, -0.061126708984375, -0.05377197265625, -0.046417236328125, -0.0390625, -0.031707763671875, -0.02435302734375, -0.016998291015625, -0.0096435546875, -0.002288818359375, 0.00506591796875, 0.012420654296875, 0.019775390625, 0.027130126953125, 0.03448486328125, 0.041839599609375, 0.0491943359375, 0.056549072265625, 0.06390380859375, 0.071258544921875, 0.07861328125, 0.085968017578125, 0.09332275390625, 0.100677490234375, 0.1080322265625, 0.115386962890625, 0.12274169921875, 0.130096435546875, 0.137451171875, 0.144805908203125, 0.15216064453125, 0.159515380859375, 0.1668701171875, 0.174224853515625, 0.18157958984375, 0.188934326171875, 0.1962890625, 0.203643798828125, 0.21099853515625, 0.218353271484375, 0.2257080078125, 0.233062744140625, 0.24041748046875, 0.247772216796875, 0.255126953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 1.0, 7.0, 13.0, 7.0, 9.0, 11.0, 12.0, 10.0, 19.0, 26.0, 30.0, 26.0, 36.0, 30.0, 28.0, 41.0, 42.0, 39.0, 42.0, 47.0, 47.0, 54.0, 54.0, 56.0, 39.0, 30.0, 28.0, 28.0, 27.0, 21.0, 19.0, 22.0, 19.0, 11.0, 14.0, 16.0, 6.0, 3.0, 10.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8349609375, -0.8071136474609375, -0.779266357421875, -0.7514190673828125, -0.72357177734375, -0.6957244873046875, -0.667877197265625, -0.6400299072265625, -0.6121826171875, -0.5843353271484375, -0.556488037109375, -0.5286407470703125, -0.50079345703125, -0.4729461669921875, -0.445098876953125, -0.4172515869140625, -0.389404296875, -0.3615570068359375, -0.333709716796875, -0.3058624267578125, -0.27801513671875, -0.2501678466796875, -0.222320556640625, -0.1944732666015625, -0.1666259765625, -0.1387786865234375, -0.110931396484375, -0.0830841064453125, -0.05523681640625, -0.0273895263671875, 0.000457763671875, 0.0283050537109375, 0.05615234375, 0.0839996337890625, 0.111846923828125, 0.1396942138671875, 0.16754150390625, 0.1953887939453125, 0.223236083984375, 0.2510833740234375, 0.2789306640625, 0.3067779541015625, 0.334625244140625, 0.3624725341796875, 0.39031982421875, 0.4181671142578125, 0.446014404296875, 0.4738616943359375, 0.501708984375, 0.5295562744140625, 0.557403564453125, 0.5852508544921875, 0.61309814453125, 0.6409454345703125, 0.668792724609375, 0.6966400146484375, 0.7244873046875, 0.7523345947265625, 0.780181884765625, 0.8080291748046875, 0.83587646484375, 0.8637237548828125, 0.891571044921875, 0.9194183349609375, 0.947265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 11.0, 14.0, 14.0, 17.0, 28.0, 38.0, 47.0, 86.0, 121.0, 178.0, 342.0, 498.0, 957.0, 1963.0, 4458.0, 11812.0, 49729.0, 466734.0, 444244.0, 47132.0, 11520.0, 4412.0, 1907.0, 942.0, 490.0, 293.0, 190.0, 127.0, 61.0, 57.0, 35.0, 19.0, 21.0, 17.0, 7.0, 10.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1080322265625, -0.10454559326171875, -0.1010589599609375, -0.09757232666015625, -0.094085693359375, -0.09059906005859375, -0.0871124267578125, -0.08362579345703125, -0.08013916015625, -0.07665252685546875, -0.0731658935546875, -0.06967926025390625, -0.066192626953125, -0.06270599365234375, -0.0592193603515625, -0.05573272705078125, -0.05224609375, -0.04875946044921875, -0.0452728271484375, -0.04178619384765625, -0.038299560546875, -0.03481292724609375, -0.0313262939453125, -0.02783966064453125, -0.02435302734375, -0.02086639404296875, -0.0173797607421875, -0.01389312744140625, -0.010406494140625, -0.00691986083984375, -0.0034332275390625, 5.340576171875e-05, 0.0035400390625, 0.00702667236328125, 0.0105133056640625, 0.01399993896484375, 0.017486572265625, 0.02097320556640625, 0.0244598388671875, 0.02794647216796875, 0.03143310546875, 0.03491973876953125, 0.0384063720703125, 0.04189300537109375, 0.045379638671875, 0.04886627197265625, 0.0523529052734375, 0.05583953857421875, 0.059326171875, 0.06281280517578125, 0.0662994384765625, 0.06978607177734375, 0.073272705078125, 0.07675933837890625, 0.0802459716796875, 0.08373260498046875, 0.08721923828125, 0.09070587158203125, 0.0941925048828125, 0.09767913818359375, 0.101165771484375, 0.10465240478515625, 0.1081390380859375, 0.11162567138671875, 0.1151123046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 11.0, 4.0, 10.0, 7.0, 12.0, 33.0, 55.0, 75.0, 92.0, 150.0, 124.0, 131.0, 97.0, 62.0, 39.0, 17.0, 19.0, 13.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.510713577270508e-05, -3.381911665201187e-05, -3.2531097531318665e-05, -3.124307841062546e-05, -2.995505928993225e-05, -2.8667040169239044e-05, -2.7379021048545837e-05, -2.609100192785263e-05, -2.4802982807159424e-05, -2.3514963686466217e-05, -2.222694456577301e-05, -2.0938925445079803e-05, -1.9650906324386597e-05, -1.836288720369339e-05, -1.7074868083000183e-05, -1.5786848962306976e-05, -1.449882984161377e-05, -1.3210810720920563e-05, -1.1922791600227356e-05, -1.063477247953415e-05, -9.346753358840942e-06, -8.058734238147736e-06, -6.770715117454529e-06, -5.482695996761322e-06, -4.194676876068115e-06, -2.9066577553749084e-06, -1.6186386346817017e-06, -3.3061951398849487e-07, 9.57399606704712e-07, 2.2454187273979187e-06, 3.5334378480911255e-06, 4.821456968784332e-06, 6.109476089477539e-06, 7.397495210170746e-06, 8.685514330863953e-06, 9.97353345155716e-06, 1.1261552572250366e-05, 1.2549571692943573e-05, 1.383759081363678e-05, 1.5125609934329987e-05, 1.6413629055023193e-05, 1.77016481757164e-05, 1.8989667296409607e-05, 2.0277686417102814e-05, 2.156570553779602e-05, 2.2853724658489227e-05, 2.4141743779182434e-05, 2.542976289987564e-05, 2.6717782020568848e-05, 2.8005801141262054e-05, 2.929382026195526e-05, 3.058183938264847e-05, 3.1869858503341675e-05, 3.315787762403488e-05, 3.444589674472809e-05, 3.5733915865421295e-05, 3.70219349861145e-05, 3.830995410680771e-05, 3.9597973227500916e-05, 4.088599234819412e-05, 4.217401146888733e-05, 4.3462030589580536e-05, 4.475004971027374e-05, 4.603806883096695e-05, 4.7326087951660156e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 5.0, 5.0, 11.0, 13.0, 15.0, 32.0, 34.0, 49.0, 85.0, 158.0, 252.0, 463.0, 825.0, 1501.0, 2757.0, 5378.0, 11221.0, 28845.0, 108549.0, 406893.0, 350647.0, 85844.0, 24694.0, 9802.0, 4649.0, 2492.0, 1410.0, 768.0, 446.0, 287.0, 157.0, 91.0, 57.0, 35.0, 22.0, 13.0, 7.0, 15.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07275390625, -0.07060909271240234, -0.06846427917480469, -0.06631946563720703, -0.06417465209960938, -0.06202983856201172, -0.05988502502441406, -0.057740211486816406, -0.05559539794921875, -0.053450584411621094, -0.05130577087402344, -0.04916095733642578, -0.047016143798828125, -0.04487133026123047, -0.04272651672363281, -0.040581703186035156, -0.0384368896484375, -0.036292076110839844, -0.03414726257324219, -0.03200244903564453, -0.029857635498046875, -0.02771282196044922, -0.025568008422851562, -0.023423194885253906, -0.02127838134765625, -0.019133567810058594, -0.016988754272460938, -0.014843940734863281, -0.012699127197265625, -0.010554313659667969, -0.008409500122070312, -0.006264686584472656, -0.004119873046875, -0.0019750595092773438, 0.0001697540283203125, 0.0023145675659179688, 0.004459381103515625, 0.006604194641113281, 0.008749008178710938, 0.010893821716308594, 0.01303863525390625, 0.015183448791503906, 0.017328262329101562, 0.01947307586669922, 0.021617889404296875, 0.02376270294189453, 0.025907516479492188, 0.028052330017089844, 0.0301971435546875, 0.032341957092285156, 0.03448677062988281, 0.03663158416748047, 0.038776397705078125, 0.04092121124267578, 0.04306602478027344, 0.045210838317871094, 0.04735565185546875, 0.049500465393066406, 0.05164527893066406, 0.05379009246826172, 0.055934906005859375, 0.05807971954345703, 0.06022453308105469, 0.062369346618652344, 0.06451416015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 1.0, 4.0, 1.0, 3.0, 9.0, 6.0, 9.0, 11.0, 10.0, 21.0, 21.0, 29.0, 67.0, 84.0, 114.0, 135.0, 120.0, 104.0, 75.0, 45.0, 37.0, 27.0, 14.0, 5.0, 17.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0295562744140625, -0.0285952091217041, -0.027634143829345703, -0.026673078536987305, -0.025712013244628906, -0.024750947952270508, -0.02378988265991211, -0.02282881736755371, -0.021867752075195312, -0.020906686782836914, -0.019945621490478516, -0.018984556198120117, -0.01802349090576172, -0.01706242561340332, -0.016101360321044922, -0.015140295028686523, -0.014179229736328125, -0.013218164443969727, -0.012257099151611328, -0.01129603385925293, -0.010334968566894531, -0.009373903274536133, -0.008412837982177734, -0.007451772689819336, -0.0064907073974609375, -0.005529642105102539, -0.004568576812744141, -0.003607511520385742, -0.0026464462280273438, -0.0016853809356689453, -0.0007243156433105469, 0.00023674964904785156, 0.00119781494140625, 0.0021588802337646484, 0.003119945526123047, 0.004081010818481445, 0.005042076110839844, 0.006003141403198242, 0.006964206695556641, 0.007925271987915039, 0.008886337280273438, 0.009847402572631836, 0.010808467864990234, 0.011769533157348633, 0.012730598449707031, 0.01369166374206543, 0.014652729034423828, 0.015613794326782227, 0.016574859619140625, 0.017535924911499023, 0.018496990203857422, 0.01945805549621582, 0.02041912078857422, 0.021380186080932617, 0.022341251373291016, 0.023302316665649414, 0.024263381958007812, 0.02522444725036621, 0.02618551254272461, 0.027146577835083008, 0.028107643127441406, 0.029068708419799805, 0.030029773712158203, 0.0309908390045166, 0.031951904296875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 8.0, 4.0, 5.0, 9.0, 11.0, 22.0, 24.0, 30.0, 27.0, 58.0, 44.0, 58.0, 58.0, 60.0, 79.0, 83.0, 64.0, 68.0, 55.0, 63.0, 40.0, 31.0, 39.0, 20.0, 15.0, 7.0, 11.0, 7.0, 2.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49564194679260254, -0.4810281991958618, -0.4664144515991211, -0.45180070400238037, -0.43718698620796204, -0.4225732386112213, -0.4079594910144806, -0.39334574341773987, -0.37873199582099915, -0.3641182482242584, -0.3495045006275177, -0.33489078283309937, -0.32027703523635864, -0.3056632876396179, -0.2910495400428772, -0.2764357924461365, -0.26182204484939575, -0.24720829725265503, -0.2325945645570755, -0.21798081696033478, -0.20336706936359406, -0.18875333666801453, -0.1741395890712738, -0.15952584147453308, -0.14491212368011475, -0.13029837608337402, -0.1156846359372139, -0.10107089579105377, -0.08645714819431305, -0.07184340804815292, -0.0572296679019928, -0.042615920305252075, -0.028002172708511353, -0.013388429768383503, 0.0012253131717443466, 0.01583905518054962, 0.030452799052000046, 0.04506654292345047, 0.059680283069610596, 0.07429403066635132, 0.08890777081251144, 0.10352151095867157, 0.11813525855541229, 0.13274899125099182, 0.14736273884773254, 0.16197648644447327, 0.176590234041214, 0.1912039816379547, 0.20581771433353424, 0.22043146193027496, 0.2350451946258545, 0.24965894222259521, 0.26427268981933594, 0.27888643741607666, 0.2935001850128174, 0.3081139326095581, 0.32272765040397644, 0.33734139800071716, 0.3519551455974579, 0.3665688633918762, 0.38118261098861694, 0.39579635858535767, 0.4104101061820984, 0.4250238537788391, 0.43963760137557983]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 9.0, 5.0, 8.0, 10.0, 10.0, 11.0, 18.0, 13.0, 21.0, 33.0, 27.0, 30.0, 41.0, 26.0, 46.0, 45.0, 48.0, 54.0, 53.0, 54.0, 50.0, 50.0, 35.0, 36.0, 38.0, 33.0, 25.0, 32.0, 16.0, 20.0, 29.0, 10.0, 11.0, 9.0, 10.0, 10.0, 3.0, 2.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.3357851505279541, -0.32553255558013916, -0.3152799606323242, -0.30502739548683167, -0.2947748005390167, -0.2845222055912018, -0.27426961064338684, -0.2640170156955719, -0.25376445055007935, -0.2435118556022644, -0.23325927555561066, -0.22300668060779572, -0.21275410056114197, -0.20250150561332703, -0.19224891066551208, -0.18199631571769714, -0.1717437207698822, -0.16149112582206726, -0.1512385457754135, -0.14098595082759857, -0.13073337078094482, -0.12048077583312988, -0.11022818088531494, -0.0999755933880806, -0.08972300589084625, -0.07947041839361191, -0.06921783089637756, -0.05896523594856262, -0.04871264845132828, -0.03846006095409393, -0.02820746973156929, -0.017954878509044647, -0.007702291011810303, 0.002550298348069191, 0.012802887707948685, 0.02305547706782818, 0.03330806642770767, 0.04356065392494202, 0.05381324514746666, 0.0640658363699913, 0.07431842386722565, 0.08457101136445999, 0.09482359886169434, 0.10507619380950928, 0.11532878130674362, 0.12558136880397797, 0.1358339637517929, 0.14608654379844666, 0.1563391387462616, 0.16659173369407654, 0.17684431374073029, 0.18709690868854523, 0.19734948873519897, 0.20760208368301392, 0.21785467863082886, 0.2281072735786438, 0.23835985362529755, 0.2486124485731125, 0.25886502861976624, 0.2691176235675812, 0.2793702185153961, 0.28962278366088867, 0.2998753786087036, 0.31012797355651855, 0.3203805685043335]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 5.0, 10.0, 29.0, 30.0, 51.0, 87.0, 104.0, 156.0, 355.0, 559.0, 1073.0, 2070.0, 4422.0, 9875.0, 22534.0, 54019.0, 153354.0, 424413.0, 242136.0, 77249.0, 31026.0, 13118.0, 5911.0, 2846.0, 1427.0, 676.0, 412.0, 226.0, 144.0, 94.0, 58.0, 35.0, 14.0, 7.0, 9.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5390625, -0.51959228515625, -0.5001220703125, -0.48065185546875, -0.461181640625, -0.44171142578125, -0.4222412109375, -0.40277099609375, -0.38330078125, -0.36383056640625, -0.3443603515625, -0.32489013671875, -0.305419921875, -0.28594970703125, -0.2664794921875, -0.24700927734375, -0.2275390625, -0.20806884765625, -0.1885986328125, -0.16912841796875, -0.149658203125, -0.13018798828125, -0.1107177734375, -0.09124755859375, -0.07177734375, -0.05230712890625, -0.0328369140625, -0.01336669921875, 0.006103515625, 0.02557373046875, 0.0450439453125, 0.06451416015625, 0.083984375, 0.10345458984375, 0.1229248046875, 0.14239501953125, 0.161865234375, 0.18133544921875, 0.2008056640625, 0.22027587890625, 0.23974609375, 0.25921630859375, 0.2786865234375, 0.29815673828125, 0.317626953125, 0.33709716796875, 0.3565673828125, 0.37603759765625, 0.3955078125, 0.41497802734375, 0.4344482421875, 0.45391845703125, 0.473388671875, 0.49285888671875, 0.5123291015625, 0.53179931640625, 0.55126953125, 0.57073974609375, 0.5902099609375, 0.60968017578125, 0.629150390625, 0.64862060546875, 0.6680908203125, 0.68756103515625, 0.70703125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 5.0, 4.0, 6.0, 5.0, 6.0, 7.0, 14.0, 19.0, 17.0, 15.0, 20.0, 31.0, 35.0, 29.0, 25.0, 52.0, 41.0, 42.0, 53.0, 52.0, 54.0, 45.0, 57.0, 47.0, 31.0, 35.0, 24.0, 35.0, 22.0, 18.0, 21.0, 19.0, 25.0, 13.0, 19.0, 8.0, 8.0, 4.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.51416015625, -0.49764251708984375, -0.4811248779296875, -0.46460723876953125, -0.448089599609375, -0.43157196044921875, -0.4150543212890625, -0.39853668212890625, -0.38201904296875, -0.36550140380859375, -0.3489837646484375, -0.33246612548828125, -0.315948486328125, -0.29943084716796875, -0.2829132080078125, -0.26639556884765625, -0.2498779296875, -0.23336029052734375, -0.2168426513671875, -0.20032501220703125, -0.183807373046875, -0.16728973388671875, -0.1507720947265625, -0.13425445556640625, -0.11773681640625, -0.10121917724609375, -0.0847015380859375, -0.06818389892578125, -0.051666259765625, -0.03514862060546875, -0.0186309814453125, -0.00211334228515625, 0.014404296875, 0.03092193603515625, 0.0474395751953125, 0.06395721435546875, 0.080474853515625, 0.09699249267578125, 0.1135101318359375, 0.13002777099609375, 0.14654541015625, 0.16306304931640625, 0.1795806884765625, 0.19609832763671875, 0.212615966796875, 0.22913360595703125, 0.2456512451171875, 0.26216888427734375, 0.2786865234375, 0.29520416259765625, 0.3117218017578125, 0.32823944091796875, 0.344757080078125, 0.36127471923828125, 0.3777923583984375, 0.39430999755859375, 0.41082763671875, 0.42734527587890625, 0.4438629150390625, 0.46038055419921875, 0.476898193359375, 0.49341583251953125, 0.5099334716796875, 0.5264511108398438, 0.54296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 2.0, 5.0, 6.0, 9.0, 14.0, 17.0, 23.0, 43.0, 46.0, 72.0, 106.0, 133.0, 152.0, 261.0, 403.0, 607.0, 1085.0, 2103.0, 4222.0, 9244.0, 22099.0, 54137.0, 158423.0, 429438.0, 237535.0, 75421.0, 29060.0, 12339.0, 5484.0, 2541.0, 1318.0, 765.0, 460.0, 263.0, 212.0, 143.0, 103.0, 68.0, 55.0, 37.0, 26.0, 16.0, 24.0, 14.0, 8.0, 4.0, 3.0, 8.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.69775390625, -0.6763916015625, -0.655029296875, -0.6336669921875, -0.6123046875, -0.5909423828125, -0.569580078125, -0.5482177734375, -0.52685546875, -0.5054931640625, -0.484130859375, -0.4627685546875, -0.44140625, -0.4200439453125, -0.398681640625, -0.3773193359375, -0.35595703125, -0.3345947265625, -0.313232421875, -0.2918701171875, -0.2705078125, -0.2491455078125, -0.227783203125, -0.2064208984375, -0.18505859375, -0.1636962890625, -0.142333984375, -0.1209716796875, -0.099609375, -0.0782470703125, -0.056884765625, -0.0355224609375, -0.01416015625, 0.0072021484375, 0.028564453125, 0.0499267578125, 0.0712890625, 0.0926513671875, 0.114013671875, 0.1353759765625, 0.15673828125, 0.1781005859375, 0.199462890625, 0.2208251953125, 0.2421875, 0.2635498046875, 0.284912109375, 0.3062744140625, 0.32763671875, 0.3489990234375, 0.370361328125, 0.3917236328125, 0.4130859375, 0.4344482421875, 0.455810546875, 0.4771728515625, 0.49853515625, 0.5198974609375, 0.541259765625, 0.5626220703125, 0.583984375, 0.6053466796875, 0.626708984375, 0.6480712890625, 0.66943359375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 7.0, 7.0, 12.0, 12.0, 16.0, 17.0, 19.0, 21.0, 36.0, 42.0, 25.0, 34.0, 53.0, 50.0, 57.0, 43.0, 56.0, 57.0, 41.0, 55.0, 49.0, 35.0, 35.0, 33.0, 28.0, 23.0, 20.0, 20.0, 12.0, 9.0, 18.0, 9.0, 13.0, 6.0, 5.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5658340454101562, -0.5462188720703125, -0.5266036987304688, -0.506988525390625, -0.48737335205078125, -0.4677581787109375, -0.44814300537109375, -0.42852783203125, -0.40891265869140625, -0.3892974853515625, -0.36968231201171875, -0.350067138671875, -0.33045196533203125, -0.3108367919921875, -0.29122161865234375, -0.2716064453125, -0.25199127197265625, -0.2323760986328125, -0.21276092529296875, -0.193145751953125, -0.17353057861328125, -0.1539154052734375, -0.13430023193359375, -0.11468505859375, -0.09506988525390625, -0.0754547119140625, -0.05583953857421875, -0.036224365234375, -0.01660919189453125, 0.0030059814453125, 0.02262115478515625, 0.042236328125, 0.06185150146484375, 0.0814666748046875, 0.10108184814453125, 0.120697021484375, 0.14031219482421875, 0.1599273681640625, 0.17954254150390625, 0.19915771484375, 0.21877288818359375, 0.2383880615234375, 0.25800323486328125, 0.277618408203125, 0.29723358154296875, 0.3168487548828125, 0.33646392822265625, 0.3560791015625, 0.37569427490234375, 0.3953094482421875, 0.41492462158203125, 0.434539794921875, 0.45415496826171875, 0.4737701416015625, 0.49338531494140625, 0.51300048828125, 0.5326156616210938, 0.5522308349609375, 0.5718460083007812, 0.591461181640625, 0.6110763549804688, 0.6306915283203125, 0.6503067016601562, 0.669921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 13.0, 11.0, 15.0, 29.0, 50.0, 81.0, 140.0, 249.0, 427.0, 824.0, 1544.0, 3109.0, 6988.0, 18253.0, 65122.0, 325906.0, 491880.0, 94222.0, 23606.0, 8499.0, 3699.0, 1740.0, 895.0, 492.0, 299.0, 172.0, 116.0, 55.0, 35.0, 22.0, 22.0, 10.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165771484375, -0.1600780487060547, -0.15438461303710938, -0.14869117736816406, -0.14299774169921875, -0.13730430603027344, -0.13161087036132812, -0.1259174346923828, -0.1202239990234375, -0.11453056335449219, -0.10883712768554688, -0.10314369201660156, -0.09745025634765625, -0.09175682067871094, -0.08606338500976562, -0.08036994934082031, -0.074676513671875, -0.06898307800292969, -0.06328964233398438, -0.05759620666503906, -0.05190277099609375, -0.04620933532714844, -0.040515899658203125, -0.03482246398925781, -0.0291290283203125, -0.023435592651367188, -0.017742156982421875, -0.012048721313476562, -0.00635528564453125, -0.0006618499755859375, 0.005031585693359375, 0.010725021362304688, 0.01641845703125, 0.022111892700195312, 0.027805328369140625, 0.03349876403808594, 0.03919219970703125, 0.04488563537597656, 0.050579071044921875, 0.05627250671386719, 0.0619659423828125, 0.06765937805175781, 0.07335281372070312, 0.07904624938964844, 0.08473968505859375, 0.09043312072753906, 0.09612655639648438, 0.10181999206542969, 0.107513427734375, 0.11320686340332031, 0.11890029907226562, 0.12459373474121094, 0.13028717041015625, 0.13598060607910156, 0.14167404174804688, 0.1473674774169922, 0.1530609130859375, 0.1587543487548828, 0.16444778442382812, 0.17014122009277344, 0.17583465576171875, 0.18152809143066406, 0.18722152709960938, 0.1929149627685547, 0.1986083984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 5.0, 12.0, 13.0, 22.0, 30.0, 21.0, 35.0, 35.0, 57.0, 64.0, 73.0, 139.0, 76.0, 77.0, 73.0, 52.0, 34.0, 29.0, 25.0, 25.0, 21.0, 14.0, 8.0, 6.0, 9.0, 3.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9490718841552734e-05, -1.8673017621040344e-05, -1.7855316400527954e-05, -1.7037615180015564e-05, -1.6219913959503174e-05, -1.5402212738990784e-05, -1.4584511518478394e-05, -1.3766810297966003e-05, -1.2949109077453613e-05, -1.2131407856941223e-05, -1.1313706636428833e-05, -1.0496005415916443e-05, -9.678304195404053e-06, -8.860602974891663e-06, -8.042901754379272e-06, -7.225200533866882e-06, -6.407499313354492e-06, -5.589798092842102e-06, -4.772096872329712e-06, -3.954395651817322e-06, -3.1366944313049316e-06, -2.3189932107925415e-06, -1.5012919902801514e-06, -6.835907697677612e-07, 1.341104507446289e-07, 9.51811671257019e-07, 1.7695128917694092e-06, 2.5872141122817993e-06, 3.4049153327941895e-06, 4.22261655330658e-06, 5.04031777381897e-06, 5.85801899433136e-06, 6.67572021484375e-06, 7.49342143535614e-06, 8.31112265586853e-06, 9.12882387638092e-06, 9.94652509689331e-06, 1.07642263174057e-05, 1.158192753791809e-05, 1.2399628758430481e-05, 1.3217329978942871e-05, 1.4035031199455261e-05, 1.4852732419967651e-05, 1.567043364048004e-05, 1.648813486099243e-05, 1.7305836081504822e-05, 1.8123537302017212e-05, 1.8941238522529602e-05, 1.9758939743041992e-05, 2.0576640963554382e-05, 2.1394342184066772e-05, 2.2212043404579163e-05, 2.3029744625091553e-05, 2.3847445845603943e-05, 2.4665147066116333e-05, 2.5482848286628723e-05, 2.6300549507141113e-05, 2.7118250727653503e-05, 2.7935951948165894e-05, 2.8753653168678284e-05, 2.9571354389190674e-05, 3.0389055609703064e-05, 3.1206756830215454e-05, 3.2024458050727844e-05, 3.2842159271240234e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 10.0, 17.0, 33.0, 38.0, 40.0, 83.0, 100.0, 156.0, 248.0, 320.0, 540.0, 1006.0, 1767.0, 3365.0, 7130.0, 18128.0, 73148.0, 535458.0, 329890.0, 50254.0, 14193.0, 5845.0, 2928.0, 1493.0, 864.0, 514.0, 294.0, 206.0, 150.0, 109.0, 51.0, 49.0, 38.0, 25.0, 16.0, 11.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263916015625, -0.25537109375, -0.246826171875, -0.23828125, -0.229736328125, -0.22119140625, -0.212646484375, -0.2041015625, -0.195556640625, -0.18701171875, -0.178466796875, -0.169921875, -0.161376953125, -0.15283203125, -0.144287109375, -0.1357421875, -0.127197265625, -0.11865234375, -0.110107421875, -0.1015625, -0.093017578125, -0.08447265625, -0.075927734375, -0.0673828125, -0.058837890625, -0.05029296875, -0.041748046875, -0.033203125, -0.024658203125, -0.01611328125, -0.007568359375, 0.0009765625, 0.009521484375, 0.01806640625, 0.026611328125, 0.03515625, 0.043701171875, 0.05224609375, 0.060791015625, 0.0693359375, 0.077880859375, 0.08642578125, 0.094970703125, 0.103515625, 0.112060546875, 0.12060546875, 0.129150390625, 0.1376953125, 0.146240234375, 0.15478515625, 0.163330078125, 0.171875, 0.180419921875, 0.18896484375, 0.197509765625, 0.2060546875, 0.214599609375, 0.22314453125, 0.231689453125, 0.240234375, 0.248779296875, 0.25732421875, 0.265869140625, 0.2744140625, 0.282958984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 8.0, 7.0, 20.0, 29.0, 26.0, 64.0, 62.0, 117.0, 208.0, 120.0, 102.0, 74.0, 50.0, 29.0, 22.0, 11.0, 7.0, 6.0, 8.0, 1.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1729736328125, -0.1682720184326172, -0.16357040405273438, -0.15886878967285156, -0.15416717529296875, -0.14946556091308594, -0.14476394653320312, -0.1400623321533203, -0.1353607177734375, -0.1306591033935547, -0.12595748901367188, -0.12125587463378906, -0.11655426025390625, -0.11185264587402344, -0.10715103149414062, -0.10244941711425781, -0.097747802734375, -0.09304618835449219, -0.08834457397460938, -0.08364295959472656, -0.07894134521484375, -0.07423973083496094, -0.06953811645507812, -0.06483650207519531, -0.0601348876953125, -0.05543327331542969, -0.050731658935546875, -0.04603004455566406, -0.04132843017578125, -0.03662681579589844, -0.031925201416015625, -0.027223587036132812, -0.02252197265625, -0.017820358276367188, -0.013118743896484375, -0.008417129516601562, -0.00371551513671875, 0.0009860992431640625, 0.005687713623046875, 0.010389328002929688, 0.0150909423828125, 0.019792556762695312, 0.024494171142578125, 0.029195785522460938, 0.03389739990234375, 0.03859901428222656, 0.043300628662109375, 0.04800224304199219, 0.052703857421875, 0.05740547180175781, 0.062107086181640625, 0.06680870056152344, 0.07151031494140625, 0.07621192932128906, 0.08091354370117188, 0.08561515808105469, 0.0903167724609375, 0.09501838684082031, 0.09972000122070312, 0.10442161560058594, 0.10912322998046875, 0.11382484436035156, 0.11852645874023438, 0.12322807312011719, 0.1279296875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 16.0, 28.0, 116.0, 166.0, 237.0, 200.0, 128.0, 68.0, 22.0, 8.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.209085941314697, -4.1206746101379395, -4.032263278961182, -3.943851947784424, -3.855440855026245, -3.7670295238494873, -3.6786181926727295, -3.5902068614959717, -3.501795530319214, -3.413384199142456, -3.3249728679656982, -3.2365617752075195, -3.1481504440307617, -3.059739112854004, -2.971327781677246, -2.8829164505004883, -2.7945051193237305, -2.7060937881469727, -2.617682456970215, -2.529271125793457, -2.4408600330352783, -2.3524487018585205, -2.2640373706817627, -2.175626039505005, -2.087214946746826, -1.9988036155700684, -1.9103924036026, -1.8219810724258423, -1.7335697412490845, -1.6451585292816162, -1.5567471981048584, -1.4683358669281006, -1.3799244165420532, -1.2915130853652954, -1.2031018733978271, -1.1146905422210693, -1.0262792110443115, -0.9378679394721985, -0.8494566679000854, -0.7610453367233276, -0.6726340651512146, -0.5842227935791016, -0.49581146240234375, -0.4074001908302307, -0.3189888894557953, -0.23057758808135986, -0.14216631650924683, -0.053754985332489014, 0.03465628623962402, 0.12306758016347885, 0.21147887408733368, 0.2998901605606079, 0.38830146193504333, 0.47671276330947876, 0.5651240348815918, 0.6535353660583496, 0.7419466376304626, 0.8303579092025757, 0.9187692403793335, 1.0071804523468018, 1.0955917835235596, 1.1840031147003174, 1.2724144458770752, 1.360825777053833, 1.4492369890213013]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 15.0, 9.0, 12.0, 15.0, 14.0, 12.0, 12.0, 17.0, 20.0, 30.0, 27.0, 30.0, 36.0, 38.0, 52.0, 54.0, 37.0, 32.0, 46.0, 54.0, 39.0, 47.0, 40.0, 41.0, 32.0, 36.0, 32.0, 27.0, 17.0, 18.0, 17.0, 13.0, 15.0, 13.0, 6.0, 9.0, 5.0, 6.0, 2.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0428986549377441, -1.0138063430786133, -0.9847139716148376, -0.9556216597557068, -0.9265292882919312, -0.8974369764328003, -0.8683446645736694, -0.8392523527145386, -0.8101599812507629, -0.7810676693916321, -0.7519752979278564, -0.7228829860687256, -0.6937906742095947, -0.6646983027458191, -0.6356059908866882, -0.6065136194229126, -0.5774213075637817, -0.5483289957046509, -0.5192366242408752, -0.4901443123817444, -0.46105197072029114, -0.4319596290588379, -0.40286731719970703, -0.3737749755382538, -0.34468263387680054, -0.3155902922153473, -0.28649795055389404, -0.2574056386947632, -0.22831329703330994, -0.1992209553718567, -0.17012862861156464, -0.14103630185127258, -0.11194390058517456, -0.08285156637430191, -0.05375923216342926, -0.02466689795255661, 0.00442543625831604, 0.03351777791976929, 0.06261010468006134, 0.0917024314403534, 0.12079477310180664, 0.1498871147632599, 0.17897944152355194, 0.208071768283844, 0.23716410994529724, 0.2662564516067505, 0.29534876346588135, 0.3244411051273346, 0.35353344678878784, 0.3826257884502411, 0.41171813011169434, 0.4408104419708252, 0.46990278363227844, 0.4989951252937317, 0.5280874371528625, 0.5571798086166382, 0.586272120475769, 0.6153644323348999, 0.6444568037986755, 0.6735491156578064, 0.702641487121582, 0.7317337989807129, 0.7608261108398438, 0.7899184226989746, 0.8190107941627502]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 2.0, 7.0, 6.0, 12.0, 27.0, 32.0, 32.0, 36.0, 54.0, 101.0, 107.0, 186.0, 271.0, 361.0, 537.0, 790.0, 1211.0, 1682.0, 2235.0, 2804.0, 1029642.0, 2783.0, 2241.0, 1670.0, 1151.0, 813.0, 553.0, 372.0, 239.0, 190.0, 128.0, 98.0, 69.0, 49.0, 32.0, 33.0, 11.0, 15.0, 7.0, 6.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.102470874786377, -1.0650981664657593, -1.0277254581451416, -0.9903526902198792, -0.9529799818992615, -0.9156072735786438, -0.8782345056533813, -0.8408617973327637, -0.803489089012146, -0.7661163806915283, -0.7287436723709106, -0.6913709044456482, -0.6539981961250305, -0.6166254878044128, -0.5792527198791504, -0.5418800115585327, -0.504507303237915, -0.46713459491729736, -0.4297618567943573, -0.39238911867141724, -0.35501641035079956, -0.3176437020301819, -0.2802709639072418, -0.24289822578430176, -0.20552551746368408, -0.1681527942419052, -0.13078007102012634, -0.09340734779834747, -0.056034624576568604, -0.018661901354789734, 0.018710821866989136, 0.0560835599899292, 0.09345626831054688, 0.13082899153232574, 0.16820171475410461, 0.20557443797588348, 0.24294716119766235, 0.28031986951828003, 0.3176926076412201, 0.35506534576416016, 0.39243805408477783, 0.4298107624053955, 0.46718350052833557, 0.5045562386512756, 0.5419289469718933, 0.579301655292511, 0.6166744232177734, 0.6540471315383911, 0.6914198398590088, 0.7287925481796265, 0.7661652565002441, 0.8035380244255066, 0.8409107327461243, 0.8782834410667419, 0.9156562089920044, 0.9530289173126221, 0.9904016256332397, 1.0277743339538574, 1.065147042274475, 1.1025197505950928, 1.139892578125, 1.1772652864456177, 1.2146379947662354, 1.252010703086853, 1.2893834114074707]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 9.0, 18.0, 37.0, 35.0, 31.0, 53.0, 83.0, 174.0, 331.0, 750.0, 1650.0, 3636.0, 8640.0, 26235.0, 51376248.0, 32427.0, 11523.0, 5236.0, 2226.0, 1023.0, 457.0, 244.0, 130.0, 55.0, 38.0, 22.0, 18.0, 10.0, 5.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4312098026275635, -2.3461198806762695, -2.2610301971435547, -2.1759402751922607, -2.090850353240967, -2.005760669708252, -1.920670747756958, -1.8355809450149536, -1.7504911422729492, -1.6654013395309448, -1.5803115367889404, -1.4952216148376465, -1.410131812095642, -1.3250420093536377, -1.2399520874023438, -1.1548622846603394, -1.069772481918335, -0.9846826791763306, -0.8995928168296814, -0.8145029544830322, -0.7294131517410278, -0.6443233489990234, -0.5592334866523743, -0.4741436243057251, -0.3890538215637207, -0.3039639890193939, -0.21887415647506714, -0.13378432393074036, -0.048694491386413574, 0.03639534115791321, 0.12148517370223999, 0.20657503604888916, 0.29166460037231445, 0.37675443291664124, 0.461844265460968, 0.5469341278076172, 0.6320239305496216, 0.717113733291626, 0.8022035956382751, 0.8872934579849243, 0.9723832607269287, 1.057473063468933, 1.1425628662109375, 1.2276527881622314, 1.3127425909042358, 1.3978323936462402, 1.4829223155975342, 1.5680121183395386, 1.653101921081543, 1.7381917238235474, 1.8232815265655518, 1.9083714485168457, 1.99346125125885, 2.0785510540008545, 2.1636409759521484, 2.2487306594848633, 2.3338205814361572, 2.418910503387451, 2.504000186920166, 2.58909010887146, 2.674180030822754, 2.7592697143554688, 2.8443596363067627, 2.9294495582580566, 3.0145392417907715]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 9.0, 10.0, 10.0, 27.0, 16.0, 47.0, 61.0, 114.0, 177.0, 259.0, 405.0, 635.0, 1043.0, 1717.0, 2746.0, 4578.0, 7771.0, 13473.0, 23609.0, 41709.0, 72761.0, 125100.0, 201762.0, 303046.0, 443251.0, 2658529.0, 1316024.0, 384994.0, 267931.0, 174106.0, 103459.0, 60633.0, 34104.0, 19394.0, 11166.0, 6532.0, 3866.0, 2358.0, 1492.0, 916.0, 582.0, 366.0, 229.0, 168.0, 72.0, 73.0, 37.0, 25.0, 21.0, 14.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.471923828125, -0.4566230773925781, -0.44132232666015625, -0.4260215759277344, -0.4107208251953125, -0.3954200744628906, -0.38011932373046875, -0.3648185729980469, -0.349517822265625, -0.3342170715332031, -0.31891632080078125, -0.3036155700683594, -0.2883148193359375, -0.2730140686035156, -0.25771331787109375, -0.24241256713867188, -0.22711181640625, -0.21181106567382812, -0.19651031494140625, -0.18120956420898438, -0.1659088134765625, -0.15060806274414062, -0.13530731201171875, -0.12000656127929688, -0.104705810546875, -0.08940505981445312, -0.07410430908203125, -0.058803558349609375, -0.0435028076171875, -0.028202056884765625, -0.01290130615234375, 0.002399444580078125, 0.0177001953125, 0.033000946044921875, 0.04830169677734375, 0.06360244750976562, 0.0789031982421875, 0.09420394897460938, 0.10950469970703125, 0.12480545043945312, 0.140106201171875, 0.15540695190429688, 0.17070770263671875, 0.18600845336914062, 0.2013092041015625, 0.21660995483398438, 0.23191070556640625, 0.24721145629882812, 0.26251220703125, 0.2778129577636719, 0.29311370849609375, 0.3084144592285156, 0.3237152099609375, 0.3390159606933594, 0.35431671142578125, 0.3696174621582031, 0.384918212890625, 0.4002189636230469, 0.41551971435546875, 0.4308204650878906, 0.4461212158203125, 0.4614219665527344, 0.47672271728515625, 0.4920234680175781, 0.50732421875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 4.0, 7.0, 6.0, 13.0, 9.0, 12.0, 13.0, 19.0, 28.0, 26.0, 26.0, 27.0, 34.0, 42.0, 36.0, 41.0, 40.0, 56.0, 235.0, 820.0, 82.0, 44.0, 38.0, 43.0, 45.0, 37.0, 27.0, 29.0, 29.0, 28.0, 11.0, 24.0, 15.0, 16.0, 15.0, 6.0, 11.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.482086181640625, -2.38409423828125, -2.286102294921875, -2.1881103515625, -2.090118408203125, -1.99212646484375, -1.894134521484375, -1.796142578125, -1.698150634765625, -1.60015869140625, -1.502166748046875, -1.4041748046875, -1.306182861328125, -1.20819091796875, -1.110198974609375, -1.01220703125, -0.914215087890625, -0.81622314453125, -0.718231201171875, -0.6202392578125, -0.522247314453125, -0.42425537109375, -0.326263427734375, -0.228271484375, -0.130279541015625, -0.03228759765625, 0.065704345703125, 0.1636962890625, 0.261688232421875, 0.35968017578125, 0.457672119140625, 0.5556640625, 0.653656005859375, 0.75164794921875, 0.849639892578125, 0.9476318359375, 1.045623779296875, 1.14361572265625, 1.241607666015625, 1.339599609375, 1.437591552734375, 1.53558349609375, 1.633575439453125, 1.7315673828125, 1.829559326171875, 1.92755126953125, 2.025543212890625, 2.12353515625, 2.221527099609375, 2.31951904296875, 2.417510986328125, 2.5155029296875, 2.613494873046875, 2.71148681640625, 2.809478759765625, 2.907470703125, 3.005462646484375, 3.10345458984375, 3.201446533203125, 3.2994384765625, 3.397430419921875, 3.49542236328125, 3.593414306640625, 3.69140625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 6.0, 13.0, 14.0, 17.0, 31.0, 57.0, 124.0, 197.0, 325.0, 507.0, 830.0, 1290.0, 2212.0, 3645.0, 5770.0, 9100.0, 14405.0, 21905.0, 32916.0, 48375.0, 69495.0, 96311.0, 129889.0, 166330.0, 204097.0, 243352.0, 386362.0, 1940707.0, 1571495.0, 332352.0, 236844.0, 198838.0, 160050.0, 123157.0, 91572.0, 66020.0, 45797.0, 31339.0, 20358.0, 13061.0, 8485.0, 5399.0, 3255.0, 2009.0, 1212.0, 789.0, 443.0, 274.0, 160.0, 100.0, 60.0, 47.0, 23.0, 11.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.2449951171875, -0.2373199462890625, -0.229644775390625, -0.2219696044921875, -0.21429443359375, -0.2066192626953125, -0.198944091796875, -0.1912689208984375, -0.18359375, -0.1759185791015625, -0.168243408203125, -0.1605682373046875, -0.15289306640625, -0.1452178955078125, -0.137542724609375, -0.1298675537109375, -0.1221923828125, -0.1145172119140625, -0.106842041015625, -0.0991668701171875, -0.09149169921875, -0.0838165283203125, -0.076141357421875, -0.0684661865234375, -0.060791015625, -0.0531158447265625, -0.045440673828125, -0.0377655029296875, -0.03009033203125, -0.0224151611328125, -0.014739990234375, -0.0070648193359375, 0.0006103515625, 0.0082855224609375, 0.015960693359375, 0.0236358642578125, 0.03131103515625, 0.0389862060546875, 0.046661376953125, 0.0543365478515625, 0.06201171875, 0.0696868896484375, 0.077362060546875, 0.0850372314453125, 0.09271240234375, 0.1003875732421875, 0.108062744140625, 0.1157379150390625, 0.1234130859375, 0.1310882568359375, 0.138763427734375, 0.1464385986328125, 0.15411376953125, 0.1617889404296875, 0.169464111328125, 0.1771392822265625, 0.184814453125, 0.1924896240234375, 0.200164794921875, 0.2078399658203125, 0.21551513671875, 0.2231903076171875, 0.230865478515625, 0.2385406494140625, 0.2462158203125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 9.0, 9.0, 6.0, 8.0, 13.0, 13.0, 25.0, 25.0, 16.0, 34.0, 24.0, 28.0, 23.0, 29.0, 43.0, 34.0, 39.0, 45.0, 79.0, 479.0, 548.0, 62.0, 43.0, 46.0, 46.0, 29.0, 35.0, 30.0, 21.0, 27.0, 18.0, 28.0, 19.0, 8.0, 11.0, 13.0, 13.0, 11.0, 7.0, 3.0, 8.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9287109375, -1.8644561767578125, -1.800201416015625, -1.7359466552734375, -1.67169189453125, -1.6074371337890625, -1.543182373046875, -1.4789276123046875, -1.4146728515625, -1.3504180908203125, -1.286163330078125, -1.2219085693359375, -1.15765380859375, -1.0933990478515625, -1.029144287109375, -0.9648895263671875, -0.900634765625, -0.8363800048828125, -0.772125244140625, -0.7078704833984375, -0.64361572265625, -0.5793609619140625, -0.515106201171875, -0.4508514404296875, -0.3865966796875, -0.3223419189453125, -0.258087158203125, -0.1938323974609375, -0.12957763671875, -0.0653228759765625, -0.001068115234375, 0.0631866455078125, 0.12744140625, 0.1916961669921875, 0.255950927734375, 0.3202056884765625, 0.38446044921875, 0.4487152099609375, 0.512969970703125, 0.5772247314453125, 0.6414794921875, 0.7057342529296875, 0.769989013671875, 0.8342437744140625, 0.89849853515625, 0.9627532958984375, 1.027008056640625, 1.0912628173828125, 1.155517578125, 1.2197723388671875, 1.284027099609375, 1.3482818603515625, 1.41253662109375, 1.4767913818359375, 1.541046142578125, 1.6053009033203125, 1.6695556640625, 1.7338104248046875, 1.798065185546875, 1.8623199462890625, 1.92657470703125, 1.9908294677734375, 2.055084228515625, 2.1193389892578125, 2.18359375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 9.0, 6.0, 12.0, 8.0, 31.0, 36.0, 66.0, 79.0, 116.0, 153.0, 200.0, 305.0, 414.0, 608.0, 901.0, 1426.0, 2448.0, 4925.0, 12407.0, 37849.0, 120746.0, 342806.0, 753404.0, 3981437.0, 622313.0, 270037.0, 90345.0, 28460.0, 9984.0, 4006.0, 2036.0, 1274.0, 819.0, 559.0, 351.0, 255.0, 199.0, 105.0, 87.0, 53.0, 53.0, 38.0, 24.0, 17.0, 8.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.67529296875, -0.6544342041015625, -0.633575439453125, -0.6127166748046875, -0.59185791015625, -0.5709991455078125, -0.550140380859375, -0.5292816162109375, -0.5084228515625, -0.4875640869140625, -0.466705322265625, -0.4458465576171875, -0.42498779296875, -0.4041290283203125, -0.383270263671875, -0.3624114990234375, -0.341552734375, -0.3206939697265625, -0.299835205078125, -0.2789764404296875, -0.25811767578125, -0.2372589111328125, -0.216400146484375, -0.1955413818359375, -0.1746826171875, -0.1538238525390625, -0.132965087890625, -0.1121063232421875, -0.09124755859375, -0.0703887939453125, -0.049530029296875, -0.0286712646484375, -0.0078125, 0.0130462646484375, 0.033905029296875, 0.0547637939453125, 0.07562255859375, 0.0964813232421875, 0.117340087890625, 0.1381988525390625, 0.1590576171875, 0.1799163818359375, 0.200775146484375, 0.2216339111328125, 0.24249267578125, 0.2633514404296875, 0.284210205078125, 0.3050689697265625, 0.325927734375, 0.3467864990234375, 0.367645263671875, 0.3885040283203125, 0.40936279296875, 0.4302215576171875, 0.451080322265625, 0.4719390869140625, 0.4927978515625, 0.5136566162109375, 0.534515380859375, 0.5553741455078125, 0.57623291015625, 0.5970916748046875, 0.617950439453125, 0.6388092041015625, 0.65966796875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 8.0, 10.0, 6.0, 11.0, 14.0, 16.0, 14.0, 18.0, 29.0, 35.0, 35.0, 25.0, 32.0, 46.0, 29.0, 40.0, 46.0, 83.0, 561.0, 495.0, 60.0, 47.0, 29.0, 29.0, 35.0, 42.0, 31.0, 35.0, 31.0, 19.0, 22.0, 17.0, 13.0, 9.0, 9.0, 12.0, 7.0, 6.0, 2.0, 7.0, 1.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.716796875, -1.6647491455078125, -1.612701416015625, -1.5606536865234375, -1.50860595703125, -1.4565582275390625, -1.404510498046875, -1.3524627685546875, -1.3004150390625, -1.2483673095703125, -1.196319580078125, -1.1442718505859375, -1.09222412109375, -1.0401763916015625, -0.988128662109375, -0.9360809326171875, -0.884033203125, -0.8319854736328125, -0.779937744140625, -0.7278900146484375, -0.67584228515625, -0.6237945556640625, -0.571746826171875, -0.5196990966796875, -0.4676513671875, -0.4156036376953125, -0.363555908203125, -0.3115081787109375, -0.25946044921875, -0.2074127197265625, -0.155364990234375, -0.1033172607421875, -0.05126953125, 0.0007781982421875, 0.052825927734375, 0.1048736572265625, 0.15692138671875, 0.2089691162109375, 0.261016845703125, 0.3130645751953125, 0.3651123046875, 0.4171600341796875, 0.469207763671875, 0.5212554931640625, 0.57330322265625, 0.6253509521484375, 0.677398681640625, 0.7294464111328125, 0.781494140625, 0.8335418701171875, 0.885589599609375, 0.9376373291015625, 0.98968505859375, 1.0417327880859375, 1.093780517578125, 1.1458282470703125, 1.1978759765625, 1.2499237060546875, 1.301971435546875, 1.3540191650390625, 1.40606689453125, 1.4581146240234375, 1.510162353515625, 1.5622100830078125, 1.6142578125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 10.0, 49.0, 268.0, 488.0, 157.0, 28.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.158155918121338, -3.7573583126068115, -3.356560468673706, -2.9557628631591797, -2.554965019226074, -2.154167413711548, -1.7533698081970215, -1.352571964263916, -0.9517743587493896, -0.5509766340255737, -0.1501789689064026, 0.25061869621276855, 0.6514164209365845, 1.0522141456604004, 1.4530117511749268, 1.8538095951080322, 2.2546072006225586, 2.655404806137085, 3.0562026500701904, 3.457000255584717, 3.8577980995178223, 4.2585954666137695, 4.659393310546875, 5.0601911544799805, 5.460988998413086, 5.861786842346191, 6.262584209442139, 6.663382053375244, 7.06417989730835, 7.464977264404297, 7.865775108337402, 8.266572952270508, 8.667370796203613, 9.068168640136719, 9.468966484069824, 9.86976432800293, 10.270561218261719, 10.671359062194824, 11.07215690612793, 11.472954750061035, 11.87375259399414, 12.274550437927246, 12.675348281860352, 13.07614517211914, 13.476943016052246, 13.877740859985352, 14.278538703918457, 14.679336547851562, 15.080133438110352, 15.480931282043457, 15.881729125976562, 16.28252601623535, 16.683324813842773, 17.084121704101562, 17.484920501708984, 17.885717391967773, 18.286516189575195, 18.687313079833984, 19.088111877441406, 19.488908767700195, 19.889707565307617, 20.290504455566406, 20.691303253173828, 21.092100143432617, 21.492897033691406]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 4.0, 6.0, 12.0, 5.0, 10.0, 8.0, 12.0, 24.0, 23.0, 28.0, 29.0, 34.0, 30.0, 31.0, 33.0, 38.0, 27.0, 35.0, 48.0, 30.0, 41.0, 50.0, 36.0, 30.0, 30.0, 29.0, 39.0, 28.0, 29.0, 30.0, 23.0, 24.0, 19.0, 15.0, 17.0, 12.0, 15.0, 7.0, 13.0, 4.0, 7.0, 8.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.381347894668579, -2.302940845489502, -2.224534034729004, -2.146127223968506, -2.0677201747894287, -1.9893132448196411, -1.9109063148498535, -1.832499384880066, -1.7540924549102783, -1.6756855249404907, -1.5972785949707031, -1.5188716650009155, -1.440464735031128, -1.3620578050613403, -1.2836508750915527, -1.2052439451217651, -1.1268370151519775, -1.04843008518219, -0.9700231552124023, -0.8916162252426147, -0.8132092952728271, -0.7348023653030396, -0.656395435333252, -0.5779885053634644, -0.49958157539367676, -0.42117464542388916, -0.34276771545410156, -0.26436078548431396, -0.18595385551452637, -0.10754692554473877, -0.029139995574951172, 0.049266934394836426, 0.12767410278320312, 0.20608103275299072, 0.2844879627227783, 0.3628948926925659, 0.4413018226623535, 0.5197087526321411, 0.5981156826019287, 0.6765226125717163, 0.7549295425415039, 0.8333364725112915, 0.9117434024810791, 0.9901503324508667, 1.0685572624206543, 1.146964192390442, 1.2253711223602295, 1.303778052330017, 1.3821849822998047, 1.4605919122695923, 1.5389988422393799, 1.6174057722091675, 1.695812702178955, 1.7742196321487427, 1.8526265621185303, 1.9310334920883179, 2.0094404220581055, 2.0878472328186035, 2.1662542819976807, 2.244661331176758, 2.323068141937256, 2.401474952697754, 2.479882001876831, 2.558289051055908, 2.6366958618164062]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 9.0, 10.0, 11.0, 16.0, 17.0, 45.0, 54.0, 87.0, 135.0, 284.0, 512.0, 1022.0, 2208.0, 4768.0, 11201.0, 29802.0, 122478.0, 1739321.0, 2061914.0, 164351.0, 33323.0, 12494.0, 5451.0, 2473.0, 1069.0, 532.0, 270.0, 164.0, 93.0, 43.0, 34.0, 21.0, 14.0, 15.0, 7.0, 6.0, 10.0, 3.0, 1.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1236572265625, -0.12022686004638672, -0.11679649353027344, -0.11336612701416016, -0.10993576049804688, -0.1065053939819336, -0.10307502746582031, -0.09964466094970703, -0.09621429443359375, -0.09278392791748047, -0.08935356140136719, -0.0859231948852539, -0.08249282836914062, -0.07906246185302734, -0.07563209533691406, -0.07220172882080078, -0.0687713623046875, -0.06534099578857422, -0.06191062927246094, -0.058480262756347656, -0.055049896240234375, -0.051619529724121094, -0.04818916320800781, -0.04475879669189453, -0.04132843017578125, -0.03789806365966797, -0.03446769714355469, -0.031037330627441406, -0.027606964111328125, -0.024176597595214844, -0.020746231079101562, -0.01731586456298828, -0.013885498046875, -0.010455131530761719, -0.0070247650146484375, -0.0035943984985351562, -0.000164031982421875, 0.0032663345336914062, 0.0066967010498046875, 0.010127067565917969, 0.01355743408203125, 0.01698780059814453, 0.020418167114257812, 0.023848533630371094, 0.027278900146484375, 0.030709266662597656, 0.03413963317871094, 0.03756999969482422, 0.0410003662109375, 0.04443073272705078, 0.04786109924316406, 0.051291465759277344, 0.054721832275390625, 0.058152198791503906, 0.06158256530761719, 0.06501293182373047, 0.06844329833984375, 0.07187366485595703, 0.07530403137207031, 0.0787343978881836, 0.08216476440429688, 0.08559513092041016, 0.08902549743652344, 0.09245586395263672, 0.09588623046875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 5.0, 5.0, 2.0, 7.0, 6.0, 6.0, 8.0, 11.0, 16.0, 21.0, 10.0, 22.0, 25.0, 33.0, 47.0, 36.0, 49.0, 46.0, 64.0, 44.0, 54.0, 60.0, 47.0, 53.0, 50.0, 42.0, 38.0, 27.0, 26.0, 32.0, 26.0, 17.0, 21.0, 8.0, 10.0, 8.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04217529296875, -0.04074430465698242, -0.039313316345214844, -0.037882328033447266, -0.03645133972167969, -0.03502035140991211, -0.03358936309814453, -0.03215837478637695, -0.030727386474609375, -0.029296398162841797, -0.02786540985107422, -0.02643442153930664, -0.025003433227539062, -0.023572444915771484, -0.022141456604003906, -0.020710468292236328, -0.01927947998046875, -0.017848491668701172, -0.016417503356933594, -0.014986515045166016, -0.013555526733398438, -0.01212453842163086, -0.010693550109863281, -0.009262561798095703, -0.007831573486328125, -0.006400585174560547, -0.004969596862792969, -0.0035386085510253906, -0.0021076202392578125, -0.0006766319274902344, 0.0007543563842773438, 0.002185344696044922, 0.0036163330078125, 0.005047321319580078, 0.006478309631347656, 0.007909297943115234, 0.009340286254882812, 0.01077127456665039, 0.012202262878417969, 0.013633251190185547, 0.015064239501953125, 0.016495227813720703, 0.01792621612548828, 0.01935720443725586, 0.020788192749023438, 0.022219181060791016, 0.023650169372558594, 0.025081157684326172, 0.02651214599609375, 0.027943134307861328, 0.029374122619628906, 0.030805110931396484, 0.03223609924316406, 0.03366708755493164, 0.03509807586669922, 0.0365290641784668, 0.037960052490234375, 0.03939104080200195, 0.04082202911376953, 0.04225301742553711, 0.04368400573730469, 0.045114994049072266, 0.046545982360839844, 0.04797697067260742, 0.049407958984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 10.0, 3.0, 7.0, 8.0, 5.0, 9.0, 13.0, 18.0, 25.0, 31.0, 50.0, 67.0, 177.0, 588.0, 3074.0, 30865.0, 1265365.0, 2818255.0, 69248.0, 5159.0, 820.0, 253.0, 85.0, 41.0, 27.0, 21.0, 19.0, 4.0, 10.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.154296875, -0.15014171600341797, -0.14598655700683594, -0.1418313980102539, -0.13767623901367188, -0.13352108001708984, -0.1293659210205078, -0.12521076202392578, -0.12105560302734375, -0.11690044403076172, -0.11274528503417969, -0.10859012603759766, -0.10443496704101562, -0.1002798080444336, -0.09612464904785156, -0.09196949005126953, -0.0878143310546875, -0.08365917205810547, -0.07950401306152344, -0.0753488540649414, -0.07119369506835938, -0.06703853607177734, -0.06288337707519531, -0.05872821807861328, -0.05457305908203125, -0.05041790008544922, -0.04626274108886719, -0.042107582092285156, -0.037952423095703125, -0.033797264099121094, -0.029642105102539062, -0.02548694610595703, -0.021331787109375, -0.01717662811279297, -0.013021469116210938, -0.008866310119628906, -0.004711151123046875, -0.0005559921264648438, 0.0035991668701171875, 0.007754325866699219, 0.01190948486328125, 0.01606464385986328, 0.020219802856445312, 0.024374961853027344, 0.028530120849609375, 0.032685279846191406, 0.03684043884277344, 0.04099559783935547, 0.0451507568359375, 0.04930591583251953, 0.05346107482910156, 0.057616233825683594, 0.061771392822265625, 0.06592655181884766, 0.07008171081542969, 0.07423686981201172, 0.07839202880859375, 0.08254718780517578, 0.08670234680175781, 0.09085750579833984, 0.09501266479492188, 0.0991678237915039, 0.10332298278808594, 0.10747814178466797, 0.11163330078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 13.0, 12.0, 19.0, 15.0, 36.0, 42.0, 65.0, 82.0, 124.0, 164.0, 259.0, 356.0, 470.0, 516.0, 518.0, 381.0, 286.0, 208.0, 124.0, 93.0, 72.0, 61.0, 28.0, 19.0, 17.0, 12.0, 12.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.048919677734375, -0.04736757278442383, -0.045815467834472656, -0.044263362884521484, -0.04271125793457031, -0.04115915298461914, -0.03960704803466797, -0.0380549430847168, -0.036502838134765625, -0.03495073318481445, -0.03339862823486328, -0.03184652328491211, -0.030294418334960938, -0.028742313385009766, -0.027190208435058594, -0.025638103485107422, -0.02408599853515625, -0.022533893585205078, -0.020981788635253906, -0.019429683685302734, -0.017877578735351562, -0.01632547378540039, -0.014773368835449219, -0.013221263885498047, -0.011669158935546875, -0.010117053985595703, -0.008564949035644531, -0.007012844085693359, -0.0054607391357421875, -0.003908634185791016, -0.0023565292358398438, -0.0008044242858886719, 0.0007476806640625, 0.002299785614013672, 0.0038518905639648438, 0.005403995513916016, 0.0069561004638671875, 0.00850820541381836, 0.010060310363769531, 0.011612415313720703, 0.013164520263671875, 0.014716625213623047, 0.01626873016357422, 0.01782083511352539, 0.019372940063476562, 0.020925045013427734, 0.022477149963378906, 0.024029254913330078, 0.02558135986328125, 0.027133464813232422, 0.028685569763183594, 0.030237674713134766, 0.03178977966308594, 0.03334188461303711, 0.03489398956298828, 0.03644609451293945, 0.037998199462890625, 0.0395503044128418, 0.04110240936279297, 0.04265451431274414, 0.04420661926269531, 0.045758724212646484, 0.047310829162597656, 0.04886293411254883, 0.0504150390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 9.0, 103.0, 584.0, 289.0, 23.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17688630521297455, -0.13938170671463013, -0.1018771082162857, -0.06437250971794128, -0.026867911219596863, 0.010636687278747559, 0.04814128577709198, 0.08564586937427521, 0.12315048277378082, 0.16065508127212524, 0.19815967977046967, 0.2356642782688141, 0.2731688618659973, 0.31067347526550293, 0.34817808866500854, 0.3856826424598694, 0.423187255859375, 0.4606918692588806, 0.49819645285606384, 0.5357010364532471, 0.5732056498527527, 0.6107102632522583, 0.6482148170471191, 0.6857194304466248, 0.7232240438461304, 0.760728657245636, 0.7982332706451416, 0.8357378244400024, 0.8732424378395081, 0.9107470512390137, 0.9482516050338745, 0.9857562184333801, 1.0232608318328857, 1.0607653856277466, 1.098270058631897, 1.1357746124267578, 1.1732792854309082, 1.210783839225769, 1.2482883930206299, 1.2857930660247803, 1.3232976198196411, 1.360802173614502, 1.3983068466186523, 1.4358114004135132, 1.473315954208374, 1.5108206272125244, 1.5483251810073853, 1.585829734802246, 1.6233344078063965, 1.6608389616012573, 1.6983436346054077, 1.7358481884002686, 1.773352861404419, 1.8108574151992798, 1.8483619689941406, 1.885866641998291, 1.9233711957931519, 1.9608757495880127, 1.998380422592163, 2.0358850955963135, 2.0733895301818848, 2.110894203186035, 2.1483988761901855, 2.185903310775757, 2.2234079837799072]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 7.0, 7.0, 10.0, 11.0, 23.0, 30.0, 25.0, 26.0, 34.0, 54.0, 43.0, 47.0, 52.0, 51.0, 47.0, 50.0, 60.0, 52.0, 52.0, 57.0, 37.0, 36.0, 31.0, 22.0, 23.0, 24.0, 22.0, 13.0, 10.0, 8.0, 9.0, 5.0, 2.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18044090270996094, -0.17483706772327423, -0.16923323273658752, -0.16362939774990082, -0.1580255627632141, -0.1524217128753662, -0.1468178778886795, -0.1412140429019928, -0.1356102079153061, -0.13000637292861938, -0.12440253794193268, -0.11879869550466537, -0.11319486051797867, -0.10759102553129196, -0.10198718309402466, -0.09638334810733795, -0.09077951312065125, -0.08517567813396454, -0.07957184314727783, -0.07396800071001053, -0.06836416572332382, -0.06276033073663712, -0.05715649202466011, -0.051552653312683105, -0.0459488183259964, -0.04034498333930969, -0.03474114462733269, -0.02913730777800083, -0.023533470928668976, -0.01792963407933712, -0.012325797230005264, -0.006721958518028259, -0.0011181235313415527, 0.004485713317990303, 0.010089550167322159, 0.015693387016654015, 0.02129722386598587, 0.026901060715317726, 0.03250489756464958, 0.03810873627662659, 0.04371257126331329, 0.04931640625, 0.054920244961977005, 0.06052408367395401, 0.06612791866064072, 0.07173175364732742, 0.07733559608459473, 0.08293943107128143, 0.08854326605796814, 0.09414710104465485, 0.09975093603134155, 0.10535477846860886, 0.11095861345529556, 0.11656244844198227, 0.12216629087924957, 0.12777012586593628, 0.13337396085262299, 0.1389777958393097, 0.1445816308259964, 0.1501854658126831, 0.155789315700531, 0.1613931506872177, 0.16699698567390442, 0.17260082066059113, 0.17820465564727783]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 9.0, 11.0, 16.0, 19.0, 23.0, 44.0, 45.0, 60.0, 83.0, 122.0, 195.0, 297.0, 454.0, 656.0, 1090.0, 1957.0, 3563.0, 7942.0, 22141.0, 95390.0, 475330.0, 345522.0, 63344.0, 16469.0, 6324.0, 2996.0, 1648.0, 998.0, 563.0, 377.0, 235.0, 178.0, 114.0, 100.0, 49.0, 52.0, 25.0, 28.0, 13.0, 11.0, 11.0, 9.0, 7.0, 4.0, 3.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.09619140625, -0.09307575225830078, -0.08996009826660156, -0.08684444427490234, -0.08372879028320312, -0.0806131362915039, -0.07749748229980469, -0.07438182830810547, -0.07126617431640625, -0.06815052032470703, -0.06503486633300781, -0.061919212341308594, -0.058803558349609375, -0.055687904357910156, -0.05257225036621094, -0.04945659637451172, -0.0463409423828125, -0.04322528839111328, -0.04010963439941406, -0.036993980407714844, -0.033878326416015625, -0.030762672424316406, -0.027647018432617188, -0.02453136444091797, -0.02141571044921875, -0.01830005645751953, -0.015184402465820312, -0.012068748474121094, -0.008953094482421875, -0.005837440490722656, -0.0027217864990234375, 0.00039386749267578125, 0.003509521484375, 0.006625175476074219, 0.009740829467773438, 0.012856483459472656, 0.015972137451171875, 0.019087791442871094, 0.022203445434570312, 0.02531909942626953, 0.02843475341796875, 0.03155040740966797, 0.03466606140136719, 0.037781715393066406, 0.040897369384765625, 0.044013023376464844, 0.04712867736816406, 0.05024433135986328, 0.0533599853515625, 0.05647563934326172, 0.05959129333496094, 0.06270694732666016, 0.06582260131835938, 0.0689382553100586, 0.07205390930175781, 0.07516956329345703, 0.07828521728515625, 0.08140087127685547, 0.08451652526855469, 0.0876321792602539, 0.09074783325195312, 0.09386348724365234, 0.09697914123535156, 0.10009479522705078, 0.10321044921875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 7.0, 8.0, 11.0, 19.0, 16.0, 16.0, 29.0, 35.0, 42.0, 42.0, 58.0, 63.0, 58.0, 49.0, 75.0, 55.0, 74.0, 50.0, 60.0, 38.0, 32.0, 30.0, 30.0, 27.0, 12.0, 13.0, 14.0, 9.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045684814453125, -0.04401063919067383, -0.042336463928222656, -0.040662288665771484, -0.03898811340332031, -0.03731393814086914, -0.03563976287841797, -0.0339655876159668, -0.032291412353515625, -0.030617237091064453, -0.02894306182861328, -0.02726888656616211, -0.025594711303710938, -0.023920536041259766, -0.022246360778808594, -0.020572185516357422, -0.01889801025390625, -0.017223834991455078, -0.015549659729003906, -0.013875484466552734, -0.012201309204101562, -0.01052713394165039, -0.008852958679199219, -0.007178783416748047, -0.005504608154296875, -0.003830432891845703, -0.0021562576293945312, -0.0004820823669433594, 0.0011920928955078125, 0.0028662681579589844, 0.004540443420410156, 0.006214618682861328, 0.0078887939453125, 0.009562969207763672, 0.011237144470214844, 0.012911319732666016, 0.014585494995117188, 0.01625967025756836, 0.01793384552001953, 0.019608020782470703, 0.021282196044921875, 0.022956371307373047, 0.02463054656982422, 0.02630472183227539, 0.027978897094726562, 0.029653072357177734, 0.031327247619628906, 0.03300142288208008, 0.03467559814453125, 0.03634977340698242, 0.038023948669433594, 0.039698123931884766, 0.04137229919433594, 0.04304647445678711, 0.04472064971923828, 0.04639482498168945, 0.048069000244140625, 0.0497431755065918, 0.05141735076904297, 0.05309152603149414, 0.05476570129394531, 0.056439876556396484, 0.058114051818847656, 0.05978822708129883, 0.06146240234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 4.0, 7.0, 8.0, 10.0, 13.0, 21.0, 32.0, 28.0, 72.0, 111.0, 230.0, 514.0, 1075.0, 2683.0, 7195.0, 19758.0, 56288.0, 148455.0, 294363.0, 290025.0, 143298.0, 53343.0, 19305.0, 6906.0, 2635.0, 1114.0, 517.0, 218.0, 131.0, 76.0, 34.0, 24.0, 17.0, 10.0, 11.0, 7.0, 4.0, 6.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.054962158203125, -0.05329561233520508, -0.051629066467285156, -0.049962520599365234, -0.04829597473144531, -0.04662942886352539, -0.04496288299560547, -0.04329633712768555, -0.041629791259765625, -0.0399632453918457, -0.03829669952392578, -0.03663015365600586, -0.03496360778808594, -0.033297061920166016, -0.031630516052246094, -0.029963970184326172, -0.02829742431640625, -0.026630878448486328, -0.024964332580566406, -0.023297786712646484, -0.021631240844726562, -0.01996469497680664, -0.01829814910888672, -0.016631603240966797, -0.014965057373046875, -0.013298511505126953, -0.011631965637207031, -0.00996541976928711, -0.008298873901367188, -0.006632328033447266, -0.004965782165527344, -0.003299236297607422, -0.0016326904296875, 3.3855438232421875e-05, 0.0017004013061523438, 0.0033669471740722656, 0.0050334930419921875, 0.006700038909912109, 0.008366584777832031, 0.010033130645751953, 0.011699676513671875, 0.013366222381591797, 0.015032768249511719, 0.01669931411743164, 0.018365859985351562, 0.020032405853271484, 0.021698951721191406, 0.023365497589111328, 0.02503204345703125, 0.026698589324951172, 0.028365135192871094, 0.030031681060791016, 0.03169822692871094, 0.03336477279663086, 0.03503131866455078, 0.0366978645324707, 0.038364410400390625, 0.04003095626831055, 0.04169750213623047, 0.04336404800415039, 0.04503059387207031, 0.046697139739990234, 0.048363685607910156, 0.05003023147583008, 0.05169677734375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 15.0, 8.0, 8.0, 18.0, 15.0, 14.0, 34.0, 22.0, 20.0, 28.0, 36.0, 39.0, 41.0, 42.0, 43.0, 52.0, 39.0, 45.0, 48.0, 39.0, 47.0, 29.0, 41.0, 32.0, 29.0, 31.0, 23.0, 23.0, 28.0, 18.0, 14.0, 13.0, 13.0, 5.0, 14.0, 6.0, 7.0, 6.0, 4.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0938720703125, -0.09053516387939453, -0.08719825744628906, -0.0838613510131836, -0.08052444458007812, -0.07718753814697266, -0.07385063171386719, -0.07051372528076172, -0.06717681884765625, -0.06383991241455078, -0.06050300598144531, -0.057166099548339844, -0.053829193115234375, -0.050492286682128906, -0.04715538024902344, -0.04381847381591797, -0.0404815673828125, -0.03714466094970703, -0.03380775451660156, -0.030470848083496094, -0.027133941650390625, -0.023797035217285156, -0.020460128784179688, -0.01712322235107422, -0.01378631591796875, -0.010449409484863281, -0.0071125030517578125, -0.0037755966186523438, -0.000438690185546875, 0.0028982162475585938, 0.0062351226806640625, 0.009572029113769531, 0.012908935546875, 0.01624584197998047, 0.019582748413085938, 0.022919654846191406, 0.026256561279296875, 0.029593467712402344, 0.03293037414550781, 0.03626728057861328, 0.03960418701171875, 0.04294109344482422, 0.04627799987792969, 0.049614906311035156, 0.052951812744140625, 0.056288719177246094, 0.05962562561035156, 0.06296253204345703, 0.0662994384765625, 0.06963634490966797, 0.07297325134277344, 0.0763101577758789, 0.07964706420898438, 0.08298397064208984, 0.08632087707519531, 0.08965778350830078, 0.09299468994140625, 0.09633159637451172, 0.09966850280761719, 0.10300540924072266, 0.10634231567382812, 0.1096792221069336, 0.11301612854003906, 0.11635303497314453, 0.11968994140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 6.0, 4.0, 16.0, 17.0, 41.0, 57.0, 97.0, 184.0, 642.0, 4212.0, 137676.0, 881934.0, 21257.0, 1707.0, 356.0, 144.0, 89.0, 52.0, 29.0, 15.0, 12.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10040283203125, -0.09738636016845703, -0.09436988830566406, -0.0913534164428711, -0.08833694458007812, -0.08532047271728516, -0.08230400085449219, -0.07928752899169922, -0.07627105712890625, -0.07325458526611328, -0.07023811340332031, -0.06722164154052734, -0.06420516967773438, -0.061188697814941406, -0.05817222595214844, -0.05515575408935547, -0.0521392822265625, -0.04912281036376953, -0.04610633850097656, -0.043089866638183594, -0.040073394775390625, -0.037056922912597656, -0.03404045104980469, -0.03102397918701172, -0.02800750732421875, -0.02499103546142578, -0.021974563598632812, -0.018958091735839844, -0.015941619873046875, -0.012925148010253906, -0.009908676147460938, -0.006892204284667969, -0.003875732421875, -0.0008592605590820312, 0.0021572113037109375, 0.005173683166503906, 0.008190155029296875, 0.011206626892089844, 0.014223098754882812, 0.01723957061767578, 0.02025604248046875, 0.02327251434326172, 0.026288986206054688, 0.029305458068847656, 0.032321929931640625, 0.035338401794433594, 0.03835487365722656, 0.04137134552001953, 0.0443878173828125, 0.04740428924560547, 0.05042076110839844, 0.053437232971191406, 0.056453704833984375, 0.059470176696777344, 0.06248664855957031, 0.06550312042236328, 0.06851959228515625, 0.07153606414794922, 0.07455253601074219, 0.07756900787353516, 0.08058547973632812, 0.0836019515991211, 0.08661842346191406, 0.08963489532470703, 0.0926513671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 7.0, 12.0, 7.0, 13.0, 25.0, 29.0, 45.0, 47.0, 61.0, 66.0, 76.0, 83.0, 67.0, 79.0, 74.0, 56.0, 45.0, 49.0, 36.0, 26.0, 29.0, 17.0, 17.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.225440979003906e-06, -7.935799658298492e-06, -7.646158337593079e-06, -7.356517016887665e-06, -7.066875696182251e-06, -6.777234375476837e-06, -6.487593054771423e-06, -6.1979517340660095e-06, -5.908310413360596e-06, -5.618669092655182e-06, -5.329027771949768e-06, -5.039386451244354e-06, -4.7497451305389404e-06, -4.460103809833527e-06, -4.170462489128113e-06, -3.880821168422699e-06, -3.591179847717285e-06, -3.3015385270118713e-06, -3.0118972063064575e-06, -2.7222558856010437e-06, -2.43261456489563e-06, -2.142973244190216e-06, -1.8533319234848022e-06, -1.5636906027793884e-06, -1.2740492820739746e-06, -9.844079613685608e-07, -6.94766640663147e-07, -4.0512531995773315e-07, -1.1548399925231934e-07, 1.7415732145309448e-07, 4.637986421585083e-07, 7.534399628639221e-07, 1.043081283569336e-06, 1.3327226042747498e-06, 1.6223639249801636e-06, 1.9120052456855774e-06, 2.201646566390991e-06, 2.491287887096405e-06, 2.780929207801819e-06, 3.0705705285072327e-06, 3.3602118492126465e-06, 3.6498531699180603e-06, 3.939494490623474e-06, 4.229135811328888e-06, 4.518777132034302e-06, 4.8084184527397156e-06, 5.098059773445129e-06, 5.387701094150543e-06, 5.677342414855957e-06, 5.966983735561371e-06, 6.256625056266785e-06, 6.5462663769721985e-06, 6.835907697677612e-06, 7.125549018383026e-06, 7.41519033908844e-06, 7.704831659793854e-06, 7.994472980499268e-06, 8.284114301204681e-06, 8.573755621910095e-06, 8.863396942615509e-06, 9.153038263320923e-06, 9.442679584026337e-06, 9.73232090473175e-06, 1.0021962225437164e-05, 1.0311603546142578e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 12.0, 17.0, 24.0, 35.0, 41.0, 69.0, 160.0, 243.0, 440.0, 783.0, 1443.0, 3369.0, 9552.0, 37552.0, 201600.0, 553671.0, 188860.0, 35200.0, 9062.0, 3173.0, 1440.0, 752.0, 413.0, 260.0, 135.0, 79.0, 51.0, 38.0, 24.0, 14.0, 6.0, 10.0, 1.0, 9.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034881591796875, -0.0337371826171875, -0.0325927734375, -0.0314483642578125, -0.030303955078125, -0.0291595458984375, -0.02801513671875, -0.0268707275390625, -0.025726318359375, -0.0245819091796875, -0.0234375, -0.0222930908203125, -0.021148681640625, -0.0200042724609375, -0.01885986328125, -0.0177154541015625, -0.016571044921875, -0.0154266357421875, -0.0142822265625, -0.0131378173828125, -0.011993408203125, -0.0108489990234375, -0.00970458984375, -0.0085601806640625, -0.007415771484375, -0.0062713623046875, -0.005126953125, -0.0039825439453125, -0.002838134765625, -0.0016937255859375, -0.00054931640625, 0.0005950927734375, 0.001739501953125, 0.0028839111328125, 0.0040283203125, 0.0051727294921875, 0.006317138671875, 0.0074615478515625, 0.00860595703125, 0.0097503662109375, 0.010894775390625, 0.0120391845703125, 0.01318359375, 0.0143280029296875, 0.015472412109375, 0.0166168212890625, 0.01776123046875, 0.0189056396484375, 0.020050048828125, 0.0211944580078125, 0.0223388671875, 0.0234832763671875, 0.024627685546875, 0.0257720947265625, 0.02691650390625, 0.0280609130859375, 0.029205322265625, 0.0303497314453125, 0.031494140625, 0.0326385498046875, 0.033782958984375, 0.0349273681640625, 0.03607177734375, 0.0372161865234375, 0.038360595703125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0, 3.0, 10.0, 5.0, 15.0, 13.0, 23.0, 42.0, 50.0, 95.0, 124.0, 163.0, 145.0, 110.0, 76.0, 42.0, 27.0, 24.0, 10.0, 5.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06121826171875, -0.05950212478637695, -0.057785987854003906, -0.05606985092163086, -0.05435371398925781, -0.052637577056884766, -0.05092144012451172, -0.04920530319213867, -0.047489166259765625, -0.04577302932739258, -0.04405689239501953, -0.042340755462646484, -0.04062461853027344, -0.03890848159790039, -0.037192344665527344, -0.0354762077331543, -0.03376007080078125, -0.0320439338684082, -0.030327796936035156, -0.02861166000366211, -0.026895523071289062, -0.025179386138916016, -0.02346324920654297, -0.021747112274169922, -0.020030975341796875, -0.018314838409423828, -0.01659870147705078, -0.014882564544677734, -0.013166427612304688, -0.01145029067993164, -0.009734153747558594, -0.008018016815185547, -0.0063018798828125, -0.004585742950439453, -0.0028696060180664062, -0.0011534690856933594, 0.0005626678466796875, 0.0022788047790527344, 0.003994941711425781, 0.005711078643798828, 0.007427215576171875, 0.009143352508544922, 0.010859489440917969, 0.012575626373291016, 0.014291763305664062, 0.01600790023803711, 0.017724037170410156, 0.019440174102783203, 0.02115631103515625, 0.022872447967529297, 0.024588584899902344, 0.02630472183227539, 0.028020858764648438, 0.029736995697021484, 0.03145313262939453, 0.03316926956176758, 0.034885406494140625, 0.03660154342651367, 0.03831768035888672, 0.040033817291259766, 0.04174995422363281, 0.04346609115600586, 0.045182228088378906, 0.04689836502075195, 0.048614501953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 6.0, 10.0, 23.0, 36.0, 47.0, 70.0, 82.0, 103.0, 124.0, 128.0, 113.0, 78.0, 58.0, 33.0, 30.0, 20.0, 10.0, 11.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5258496999740601, -0.5134339928627014, -0.5010183453559875, -0.4886026382446289, -0.47618696093559265, -0.4637712836265564, -0.45135560631752014, -0.4389399290084839, -0.42652422189712524, -0.414108544588089, -0.40169286727905273, -0.3892771601676941, -0.37686148285865784, -0.3644458055496216, -0.3520301282405853, -0.3396144509315491, -0.3271987736225128, -0.31478309631347656, -0.3023674190044403, -0.28995174169540405, -0.2775360345840454, -0.26512035727500916, -0.2527046799659729, -0.24028900265693665, -0.2278733104467392, -0.21545763313770294, -0.2030419409275055, -0.19062626361846924, -0.17821058630943298, -0.16579489409923553, -0.15337921679019928, -0.14096352458000183, -0.12854784727096558, -0.11613216251134872, -0.10371647775173187, -0.09130080044269562, -0.07888511568307877, -0.06646943092346191, -0.05405375361442566, -0.04163806885480881, -0.029222384095191956, -0.016806701198220253, -0.00439101830124855, 0.008024662733078003, 0.020440347492694855, 0.03285603225231171, 0.04527170956134796, 0.05768739432096481, 0.07010307908058167, 0.08251876384019852, 0.09493444859981537, 0.10735012590885162, 0.11976581066846848, 0.13218149542808533, 0.14459717273712158, 0.15701285004615784, 0.16942854225635529, 0.18184421956539154, 0.194259911775589, 0.20667558908462524, 0.2190912663936615, 0.23150695860385895, 0.2439226359128952, 0.25633832812309265, 0.2687540054321289]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 9.0, 8.0, 20.0, 15.0, 20.0, 25.0, 22.0, 34.0, 33.0, 34.0, 40.0, 45.0, 34.0, 41.0, 49.0, 55.0, 41.0, 56.0, 45.0, 42.0, 33.0, 45.0, 29.0, 35.0, 25.0, 26.0, 22.0, 17.0, 11.0, 15.0, 9.0, 10.0, 9.0, 6.0, 8.0, 2.0, 1.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6307061314582825, -0.6127724051475525, -0.5948386192321777, -0.5769048929214478, -0.5589711666107178, -0.541037380695343, -0.523103654384613, -0.5051698684692383, -0.4872361421585083, -0.46930238604545593, -0.45136862993240356, -0.4334349036216736, -0.4155011475086212, -0.39756739139556885, -0.37963366508483887, -0.3616999089717865, -0.34376615285873413, -0.32583239674568176, -0.3078986406326294, -0.2899649143218994, -0.27203115820884705, -0.2540974020957947, -0.2361636608839035, -0.21822991967201233, -0.20029616355895996, -0.1823624074459076, -0.16442866623401642, -0.14649492502212524, -0.12856116890907288, -0.1106274202466011, -0.09269367158412933, -0.07475993037223816, -0.056826114654541016, -0.038892365992069244, -0.020958617329597473, -0.003024868667125702, 0.01490887999534607, 0.03284262865781784, 0.05077637732028961, 0.06871011853218079, 0.08664387464523315, 0.10457762330770493, 0.1225113719701767, 0.14044511318206787, 0.15837886929512024, 0.1763126254081726, 0.19424636662006378, 0.21218010783195496, 0.23011386394500732, 0.2480476200580597, 0.26598137617111206, 0.28391510248184204, 0.3018488585948944, 0.3197826147079468, 0.33771634101867676, 0.3556500971317291, 0.3735838532447815, 0.39151760935783386, 0.40945136547088623, 0.4273850917816162, 0.4453188478946686, 0.46325260400772095, 0.4811863303184509, 0.4991200864315033, 0.5170538425445557]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 6.0, 6.0, 10.0, 10.0, 13.0, 8.0, 30.0, 41.0, 61.0, 94.0, 157.0, 326.0, 741.0, 2133.0, 8663.0, 68068.0, 3184723.0, 890319.0, 31575.0, 4998.0, 1260.0, 471.0, 210.0, 102.0, 62.0, 52.0, 31.0, 20.0, 18.0, 16.0, 7.0, 13.0, 2.0, 11.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.302001953125, -0.2944221496582031, -0.28684234619140625, -0.2792625427246094, -0.2716827392578125, -0.2641029357910156, -0.25652313232421875, -0.24894332885742188, -0.241363525390625, -0.23378372192382812, -0.22620391845703125, -0.21862411499023438, -0.2110443115234375, -0.20346450805664062, -0.19588470458984375, -0.18830490112304688, -0.18072509765625, -0.17314529418945312, -0.16556549072265625, -0.15798568725585938, -0.1504058837890625, -0.14282608032226562, -0.13524627685546875, -0.12766647338867188, -0.120086669921875, -0.11250686645507812, -0.10492706298828125, -0.09734725952148438, -0.0897674560546875, -0.08218765258789062, -0.07460784912109375, -0.06702804565429688, -0.0594482421875, -0.051868438720703125, -0.04428863525390625, -0.036708831787109375, -0.0291290283203125, -0.021549224853515625, -0.01396942138671875, -0.006389617919921875, 0.001190185546875, 0.008769989013671875, 0.01634979248046875, 0.023929595947265625, 0.0315093994140625, 0.039089202880859375, 0.04666900634765625, 0.054248809814453125, 0.06182861328125, 0.06940841674804688, 0.07698822021484375, 0.08456802368164062, 0.0921478271484375, 0.09972763061523438, 0.10730743408203125, 0.11488723754882812, 0.122467041015625, 0.13004684448242188, 0.13762664794921875, 0.14520645141601562, 0.1527862548828125, 0.16036605834960938, 0.16794586181640625, 0.17552566528320312, 0.18310546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 6.0, 5.0, 8.0, 9.0, 14.0, 13.0, 11.0, 28.0, 19.0, 27.0, 41.0, 49.0, 53.0, 54.0, 60.0, 70.0, 72.0, 64.0, 47.0, 64.0, 51.0, 38.0, 38.0, 16.0, 29.0, 28.0, 21.0, 15.0, 13.0, 14.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062164306640625, -0.06045818328857422, -0.05875205993652344, -0.057045936584472656, -0.055339813232421875, -0.053633689880371094, -0.05192756652832031, -0.05022144317626953, -0.04851531982421875, -0.04680919647216797, -0.04510307312011719, -0.043396949768066406, -0.041690826416015625, -0.039984703063964844, -0.03827857971191406, -0.03657245635986328, -0.0348663330078125, -0.03316020965576172, -0.03145408630371094, -0.029747962951660156, -0.028041839599609375, -0.026335716247558594, -0.024629592895507812, -0.02292346954345703, -0.02121734619140625, -0.01951122283935547, -0.017805099487304688, -0.016098976135253906, -0.014392852783203125, -0.012686729431152344, -0.010980606079101562, -0.009274482727050781, -0.007568359375, -0.005862236022949219, -0.0041561126708984375, -0.0024499893188476562, -0.000743865966796875, 0.0009622573852539062, 0.0026683807373046875, 0.004374504089355469, 0.00608062744140625, 0.007786750793457031, 0.009492874145507812, 0.011198997497558594, 0.012905120849609375, 0.014611244201660156, 0.016317367553710938, 0.01802349090576172, 0.0197296142578125, 0.02143573760986328, 0.023141860961914062, 0.024847984313964844, 0.026554107666015625, 0.028260231018066406, 0.029966354370117188, 0.03167247772216797, 0.03337860107421875, 0.03508472442626953, 0.03679084777832031, 0.038496971130371094, 0.040203094482421875, 0.041909217834472656, 0.04361534118652344, 0.04532146453857422, 0.047027587890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 5.0, 1.0, 16.0, 20.0, 32.0, 32.0, 61.0, 87.0, 125.0, 219.0, 347.0, 619.0, 1189.0, 2378.0, 4607.0, 9824.0, 21931.0, 54311.0, 147117.0, 446497.0, 1409155.0, 1404466.0, 447513.0, 147810.0, 54063.0, 22373.0, 9742.0, 4533.0, 2350.0, 1247.0, 658.0, 352.0, 208.0, 148.0, 80.0, 54.0, 27.0, 27.0, 18.0, 4.0, 6.0, 7.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.07586669921875, -0.07349586486816406, -0.07112503051757812, -0.06875419616699219, -0.06638336181640625, -0.06401252746582031, -0.061641693115234375, -0.05927085876464844, -0.0569000244140625, -0.05452919006347656, -0.052158355712890625, -0.04978752136230469, -0.04741668701171875, -0.04504585266113281, -0.042675018310546875, -0.04030418395996094, -0.037933349609375, -0.03556251525878906, -0.033191680908203125, -0.030820846557617188, -0.02845001220703125, -0.026079177856445312, -0.023708343505859375, -0.021337509155273438, -0.0189666748046875, -0.016595840454101562, -0.014225006103515625, -0.011854171752929688, -0.00948333740234375, -0.0071125030517578125, -0.004741668701171875, -0.0023708343505859375, 0.0, 0.0023708343505859375, 0.004741668701171875, 0.0071125030517578125, 0.00948333740234375, 0.011854171752929688, 0.014225006103515625, 0.016595840454101562, 0.0189666748046875, 0.021337509155273438, 0.023708343505859375, 0.026079177856445312, 0.02845001220703125, 0.030820846557617188, 0.033191680908203125, 0.03556251525878906, 0.037933349609375, 0.04030418395996094, 0.042675018310546875, 0.04504585266113281, 0.04741668701171875, 0.04978752136230469, 0.052158355712890625, 0.05452919006347656, 0.0569000244140625, 0.05927085876464844, 0.061641693115234375, 0.06401252746582031, 0.06638336181640625, 0.06875419616699219, 0.07112503051757812, 0.07349586486816406, 0.07586669921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 5.0, 9.0, 10.0, 8.0, 12.0, 25.0, 39.0, 49.0, 52.0, 85.0, 128.0, 199.0, 270.0, 372.0, 554.0, 643.0, 536.0, 344.0, 235.0, 144.0, 86.0, 76.0, 57.0, 37.0, 20.0, 25.0, 9.0, 15.0, 8.0, 7.0, 10.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07611083984375, -0.07394933700561523, -0.07178783416748047, -0.0696263313293457, -0.06746482849121094, -0.06530332565307617, -0.0631418228149414, -0.06098031997680664, -0.058818817138671875, -0.05665731430053711, -0.054495811462402344, -0.05233430862426758, -0.05017280578613281, -0.04801130294799805, -0.04584980010986328, -0.043688297271728516, -0.04152679443359375, -0.039365291595458984, -0.03720378875732422, -0.03504228591918945, -0.03288078308105469, -0.030719280242919922, -0.028557777404785156, -0.02639627456665039, -0.024234771728515625, -0.02207326889038086, -0.019911766052246094, -0.017750263214111328, -0.015588760375976562, -0.013427257537841797, -0.011265754699707031, -0.009104251861572266, -0.0069427490234375, -0.004781246185302734, -0.0026197433471679688, -0.0004582405090332031, 0.0017032623291015625, 0.003864765167236328, 0.006026268005371094, 0.00818777084350586, 0.010349273681640625, 0.01251077651977539, 0.014672279357910156, 0.016833782196044922, 0.018995285034179688, 0.021156787872314453, 0.02331829071044922, 0.025479793548583984, 0.02764129638671875, 0.029802799224853516, 0.03196430206298828, 0.03412580490112305, 0.03628730773925781, 0.03844881057739258, 0.040610313415527344, 0.04277181625366211, 0.044933319091796875, 0.04709482192993164, 0.049256324768066406, 0.05141782760620117, 0.05357933044433594, 0.0557408332824707, 0.05790233612060547, 0.060063838958740234, 0.062225341796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 1.0, 7.0, 12.0, 18.0, 16.0, 25.0, 30.0, 37.0, 41.0, 57.0, 67.0, 72.0, 72.0, 74.0, 85.0, 81.0, 62.0, 66.0, 40.0, 37.0, 32.0, 15.0, 10.0, 11.0, 6.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2082008570432663, -0.20202209055423737, -0.19584332406520844, -0.1896645724773407, -0.18348580598831177, -0.17730703949928284, -0.1711282730102539, -0.16494950652122498, -0.15877074003219604, -0.15259197354316711, -0.14641320705413818, -0.14023444056510925, -0.13405568897724152, -0.12787692248821259, -0.12169815599918365, -0.11551938951015472, -0.10934063792228699, -0.10316187143325806, -0.09698311239480972, -0.09080434590578079, -0.08462558686733246, -0.07844682037830353, -0.0722680538892746, -0.06608928740024567, -0.05991052836179733, -0.0537317655980587, -0.04755300283432007, -0.04137423634529114, -0.035195473581552505, -0.029016710817813873, -0.022837944328784943, -0.01665918156504631, -0.010480418801307678, -0.004301655106246471, 0.0018771085888147354, 0.008055873215198517, 0.014234635978937149, 0.02041339874267578, 0.026592165231704712, 0.032770927995443344, 0.038949690759181976, 0.04512845352292061, 0.05130721628665924, 0.05748598277568817, 0.0636647492647171, 0.06984350830316544, 0.07602227479219437, 0.0822010338306427, 0.08837980031967163, 0.09455856680870056, 0.1007373258471489, 0.10691609233617783, 0.11309485137462616, 0.11927361786365509, 0.12545238435268402, 0.13163115084171295, 0.1378099024295807, 0.14398866891860962, 0.15016743540763855, 0.15634620189666748, 0.16252495348453522, 0.16870371997356415, 0.17488248646259308, 0.181061252951622, 0.18724001944065094]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 6.0, 4.0, 11.0, 12.0, 7.0, 10.0, 14.0, 8.0, 17.0, 26.0, 37.0, 27.0, 33.0, 36.0, 46.0, 43.0, 44.0, 43.0, 42.0, 42.0, 44.0, 47.0, 45.0, 42.0, 43.0, 40.0, 36.0, 34.0, 26.0, 25.0, 19.0, 17.0, 14.0, 9.0, 10.0, 11.0, 4.0, 8.0, 1.0, 2.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1924980878829956, -0.18635408580303192, -0.18021009862422943, -0.17406609654426575, -0.16792210936546326, -0.16177810728549957, -0.1556341052055359, -0.1494901180267334, -0.14334611594676971, -0.13720211386680603, -0.13105812668800354, -0.12491412460803986, -0.11877012997865677, -0.11262613534927368, -0.10648213326931, -0.10033813863992691, -0.09419414401054382, -0.08805014938116074, -0.08190615475177765, -0.07576215267181396, -0.06961815804243088, -0.06347416341304779, -0.057330165058374405, -0.05118616670370102, -0.04504217207431793, -0.038898177444934845, -0.03275417909026146, -0.026610182598233223, -0.020466186106204987, -0.01432218961417675, -0.008178193122148514, -0.002034194767475128, 0.004109799861907959, 0.010253796353936195, 0.016397792845964432, 0.022541789337992668, 0.028685785830020905, 0.03482978045940399, 0.04097377881407738, 0.04711777716875076, 0.05326177179813385, 0.05940576642751694, 0.06554976105690002, 0.07169376313686371, 0.0778377577662468, 0.08398175239562988, 0.09012575447559357, 0.09626974910497665, 0.10241374373435974, 0.10855773836374283, 0.11470173299312592, 0.1208457350730896, 0.1269897222518921, 0.13313372433185577, 0.13927772641181946, 0.14542171359062195, 0.15156571567058563, 0.15770971775054932, 0.1638537049293518, 0.1699977070093155, 0.17614170908927917, 0.18228569626808167, 0.18842969834804535, 0.19457370042800903, 0.20071768760681152]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 7.0, 10.0, 17.0, 19.0, 10.0, 23.0, 31.0, 55.0, 74.0, 91.0, 145.0, 216.0, 361.0, 535.0, 797.0, 1304.0, 2139.0, 3710.0, 6796.0, 12588.0, 24994.0, 50833.0, 104519.0, 201313.0, 269186.0, 182640.0, 92756.0, 44879.0, 22442.0, 11373.0, 5891.0, 3359.0, 1984.0, 1287.0, 753.0, 421.0, 311.0, 196.0, 122.0, 102.0, 66.0, 57.0, 35.0, 27.0, 24.0, 14.0, 10.0, 5.0, 8.0, 3.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.062346458435058594, -0.06036186218261719, -0.05837726593017578, -0.056392669677734375, -0.05440807342529297, -0.05242347717285156, -0.050438880920410156, -0.04845428466796875, -0.046469688415527344, -0.04448509216308594, -0.04250049591064453, -0.040515899658203125, -0.03853130340576172, -0.03654670715332031, -0.034562110900878906, -0.0325775146484375, -0.030592918395996094, -0.028608322143554688, -0.02662372589111328, -0.024639129638671875, -0.02265453338623047, -0.020669937133789062, -0.018685340881347656, -0.01670074462890625, -0.014716148376464844, -0.012731552124023438, -0.010746955871582031, -0.008762359619140625, -0.006777763366699219, -0.0047931671142578125, -0.0028085708618164062, -0.000823974609375, 0.0011606216430664062, 0.0031452178955078125, 0.005129814147949219, 0.007114410400390625, 0.009099006652832031, 0.011083602905273438, 0.013068199157714844, 0.01505279541015625, 0.017037391662597656, 0.019021987915039062, 0.02100658416748047, 0.022991180419921875, 0.02497577667236328, 0.026960372924804688, 0.028944969177246094, 0.0309295654296875, 0.032914161682128906, 0.03489875793457031, 0.03688335418701172, 0.038867950439453125, 0.04085254669189453, 0.04283714294433594, 0.044821739196777344, 0.04680633544921875, 0.048790931701660156, 0.05077552795410156, 0.05276012420654297, 0.054744720458984375, 0.05672931671142578, 0.05871391296386719, 0.060698509216308594, 0.06268310546875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 4.0, 7.0, 6.0, 15.0, 12.0, 12.0, 15.0, 24.0, 18.0, 30.0, 41.0, 52.0, 41.0, 51.0, 38.0, 47.0, 56.0, 53.0, 53.0, 53.0, 44.0, 46.0, 36.0, 42.0, 31.0, 27.0, 29.0, 17.0, 23.0, 21.0, 17.0, 6.0, 6.0, 8.0, 3.0, 1.0, 3.0, 3.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0487060546875, -0.04729318618774414, -0.04588031768798828, -0.04446744918823242, -0.04305458068847656, -0.0416417121887207, -0.040228843688964844, -0.038815975189208984, -0.037403106689453125, -0.035990238189697266, -0.034577369689941406, -0.03316450119018555, -0.03175163269042969, -0.030338764190673828, -0.02892589569091797, -0.02751302719116211, -0.02610015869140625, -0.02468729019165039, -0.02327442169189453, -0.021861553192138672, -0.020448684692382812, -0.019035816192626953, -0.017622947692871094, -0.016210079193115234, -0.014797210693359375, -0.013384342193603516, -0.011971473693847656, -0.010558605194091797, -0.009145736694335938, -0.007732868194580078, -0.006319999694824219, -0.004907131195068359, -0.0034942626953125, -0.0020813941955566406, -0.0006685256958007812, 0.0007443428039550781, 0.0021572113037109375, 0.003570079803466797, 0.004982948303222656, 0.006395816802978516, 0.007808685302734375, 0.009221553802490234, 0.010634422302246094, 0.012047290802001953, 0.013460159301757812, 0.014873027801513672, 0.01628589630126953, 0.01769876480102539, 0.01911163330078125, 0.02052450180053711, 0.02193737030029297, 0.023350238800048828, 0.024763107299804688, 0.026175975799560547, 0.027588844299316406, 0.029001712799072266, 0.030414581298828125, 0.031827449798583984, 0.033240318298339844, 0.0346531867980957, 0.03606605529785156, 0.03747892379760742, 0.03889179229736328, 0.04030466079711914, 0.041717529296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 3.0, 7.0, 7.0, 4.0, 14.0, 9.0, 14.0, 17.0, 15.0, 21.0, 19.0, 23.0, 37.0, 37.0, 52.0, 86.0, 142.0, 488.0, 3538.0, 80208.0, 888355.0, 71191.0, 3287.0, 473.0, 130.0, 72.0, 55.0, 25.0, 31.0, 28.0, 18.0, 31.0, 21.0, 13.0, 15.0, 11.0, 13.0, 3.0, 8.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 4.0, 2.0], "bins": [-0.450927734375, -0.438568115234375, -0.42620849609375, -0.413848876953125, -0.4014892578125, -0.389129638671875, -0.37677001953125, -0.364410400390625, -0.35205078125, -0.339691162109375, -0.32733154296875, -0.314971923828125, -0.3026123046875, -0.290252685546875, -0.27789306640625, -0.265533447265625, -0.253173828125, -0.240814208984375, -0.22845458984375, -0.216094970703125, -0.2037353515625, -0.191375732421875, -0.17901611328125, -0.166656494140625, -0.154296875, -0.141937255859375, -0.12957763671875, -0.117218017578125, -0.1048583984375, -0.092498779296875, -0.08013916015625, -0.067779541015625, -0.055419921875, -0.043060302734375, -0.03070068359375, -0.018341064453125, -0.0059814453125, 0.006378173828125, 0.01873779296875, 0.031097412109375, 0.04345703125, 0.055816650390625, 0.06817626953125, 0.080535888671875, 0.0928955078125, 0.105255126953125, 0.11761474609375, 0.129974365234375, 0.142333984375, 0.154693603515625, 0.16705322265625, 0.179412841796875, 0.1917724609375, 0.204132080078125, 0.21649169921875, 0.228851318359375, 0.2412109375, 0.253570556640625, 0.26593017578125, 0.278289794921875, 0.2906494140625, 0.303009033203125, 0.31536865234375, 0.327728271484375, 0.340087890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 4.0, 6.0, 5.0, 10.0, 3.0, 13.0, 8.0, 14.0, 17.0, 20.0, 19.0, 26.0, 30.0, 29.0, 26.0, 51.0, 40.0, 42.0, 40.0, 51.0, 50.0, 42.0, 49.0, 53.0, 35.0, 36.0, 34.0, 35.0, 27.0, 25.0, 16.0, 32.0, 19.0, 22.0, 13.0, 12.0, 9.0, 6.0, 8.0, 7.0, 4.0, 7.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.10223388671875, -0.09938716888427734, -0.09654045104980469, -0.09369373321533203, -0.09084701538085938, -0.08800029754638672, -0.08515357971191406, -0.0823068618774414, -0.07946014404296875, -0.0766134262084961, -0.07376670837402344, -0.07091999053955078, -0.06807327270507812, -0.06522655487060547, -0.06237983703613281, -0.059533119201660156, -0.0566864013671875, -0.053839683532714844, -0.05099296569824219, -0.04814624786376953, -0.045299530029296875, -0.04245281219482422, -0.03960609436035156, -0.036759376525878906, -0.03391265869140625, -0.031065940856933594, -0.028219223022460938, -0.02537250518798828, -0.022525787353515625, -0.01967906951904297, -0.016832351684570312, -0.013985633850097656, -0.011138916015625, -0.008292198181152344, -0.0054454803466796875, -0.0025987625122070312, 0.000247955322265625, 0.0030946731567382812, 0.0059413909912109375, 0.008788108825683594, 0.01163482666015625, 0.014481544494628906, 0.017328262329101562, 0.02017498016357422, 0.023021697998046875, 0.02586841583251953, 0.028715133666992188, 0.031561851501464844, 0.0344085693359375, 0.037255287170410156, 0.04010200500488281, 0.04294872283935547, 0.045795440673828125, 0.04864215850830078, 0.05148887634277344, 0.054335594177246094, 0.05718231201171875, 0.060029029846191406, 0.06287574768066406, 0.06572246551513672, 0.06856918334960938, 0.07141590118408203, 0.07426261901855469, 0.07710933685302734, 0.0799560546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 8.0, 11.0, 19.0, 26.0, 23.0, 46.0, 68.0, 125.0, 200.0, 350.0, 592.0, 1001.0, 1720.0, 3227.0, 6409.0, 13858.0, 34515.0, 99021.0, 303045.0, 369103.0, 136317.0, 44878.0, 17431.0, 7766.0, 3846.0, 2076.0, 1159.0, 651.0, 389.0, 230.0, 149.0, 84.0, 68.0, 44.0, 29.0, 21.0, 17.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0577392578125, -0.05614137649536133, -0.054543495178222656, -0.052945613861083984, -0.05134773254394531, -0.04974985122680664, -0.04815196990966797, -0.0465540885925293, -0.044956207275390625, -0.04335832595825195, -0.04176044464111328, -0.04016256332397461, -0.03856468200683594, -0.036966800689697266, -0.035368919372558594, -0.03377103805541992, -0.03217315673828125, -0.030575275421142578, -0.028977394104003906, -0.027379512786865234, -0.025781631469726562, -0.02418375015258789, -0.02258586883544922, -0.020987987518310547, -0.019390106201171875, -0.017792224884033203, -0.01619434356689453, -0.01459646224975586, -0.012998580932617188, -0.011400699615478516, -0.009802818298339844, -0.008204936981201172, -0.0066070556640625, -0.005009174346923828, -0.0034112930297851562, -0.0018134117126464844, -0.0002155303955078125, 0.0013823509216308594, 0.0029802322387695312, 0.004578113555908203, 0.006175994873046875, 0.007773876190185547, 0.009371757507324219, 0.01096963882446289, 0.012567520141601562, 0.014165401458740234, 0.015763282775878906, 0.017361164093017578, 0.01895904541015625, 0.020556926727294922, 0.022154808044433594, 0.023752689361572266, 0.025350570678710938, 0.02694845199584961, 0.02854633331298828, 0.030144214630126953, 0.031742095947265625, 0.0333399772644043, 0.03493785858154297, 0.03653573989868164, 0.03813362121582031, 0.039731502532958984, 0.041329383850097656, 0.04292726516723633, 0.044525146484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 6.0, 3.0, 3.0, 5.0, 3.0, 10.0, 8.0, 9.0, 15.0, 40.0, 46.0, 61.0, 92.0, 127.0, 111.0, 128.0, 88.0, 74.0, 41.0, 38.0, 13.0, 19.0, 6.0, 4.0, 7.0, 7.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.4437904357910156e-05, -2.370774745941162e-05, -2.2977590560913086e-05, -2.224743366241455e-05, -2.1517276763916016e-05, -2.078711986541748e-05, -2.0056962966918945e-05, -1.932680606842041e-05, -1.8596649169921875e-05, -1.786649227142334e-05, -1.7136335372924805e-05, -1.640617847442627e-05, -1.5676021575927734e-05, -1.49458646774292e-05, -1.4215707778930664e-05, -1.3485550880432129e-05, -1.2755393981933594e-05, -1.2025237083435059e-05, -1.1295080184936523e-05, -1.0564923286437988e-05, -9.834766387939453e-06, -9.104609489440918e-06, -8.374452590942383e-06, -7.644295692443848e-06, -6.9141387939453125e-06, -6.183981895446777e-06, -5.453824996948242e-06, -4.723668098449707e-06, -3.993511199951172e-06, -3.2633543014526367e-06, -2.5331974029541016e-06, -1.8030405044555664e-06, -1.0728836059570312e-06, -3.427267074584961e-07, 3.8743019104003906e-07, 1.1175870895385742e-06, 1.8477439880371094e-06, 2.5779008865356445e-06, 3.3080577850341797e-06, 4.038214683532715e-06, 4.76837158203125e-06, 5.498528480529785e-06, 6.22868537902832e-06, 6.9588422775268555e-06, 7.68899917602539e-06, 8.419156074523926e-06, 9.149312973022461e-06, 9.879469871520996e-06, 1.0609626770019531e-05, 1.1339783668518066e-05, 1.2069940567016602e-05, 1.2800097465515137e-05, 1.3530254364013672e-05, 1.4260411262512207e-05, 1.4990568161010742e-05, 1.5720725059509277e-05, 1.6450881958007812e-05, 1.7181038856506348e-05, 1.7911195755004883e-05, 1.8641352653503418e-05, 1.9371509552001953e-05, 2.0101666450500488e-05, 2.0831823348999023e-05, 2.156198024749756e-05, 2.2292137145996094e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 3.0, 4.0, 6.0, 6.0, 8.0, 7.0, 12.0, 12.0, 17.0, 15.0, 27.0, 31.0, 40.0, 67.0, 224.0, 1032.0, 10482.0, 248551.0, 743757.0, 40547.0, 2912.0, 433.0, 111.0, 54.0, 40.0, 32.0, 19.0, 19.0, 18.0, 12.0, 9.0, 7.0, 10.0, 4.0, 6.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10491943359375, -0.10144901275634766, -0.09797859191894531, -0.09450817108154297, -0.09103775024414062, -0.08756732940673828, -0.08409690856933594, -0.0806264877319336, -0.07715606689453125, -0.0736856460571289, -0.07021522521972656, -0.06674480438232422, -0.06327438354492188, -0.05980396270751953, -0.05633354187011719, -0.052863121032714844, -0.0493927001953125, -0.045922279357910156, -0.04245185852050781, -0.03898143768310547, -0.035511016845703125, -0.03204059600830078, -0.028570175170898438, -0.025099754333496094, -0.02162933349609375, -0.018158912658691406, -0.014688491821289062, -0.011218070983886719, -0.007747650146484375, -0.004277229309082031, -0.0008068084716796875, 0.0026636123657226562, 0.006134033203125, 0.009604454040527344, 0.013074874877929688, 0.01654529571533203, 0.020015716552734375, 0.02348613739013672, 0.026956558227539062, 0.030426979064941406, 0.03389739990234375, 0.037367820739746094, 0.04083824157714844, 0.04430866241455078, 0.047779083251953125, 0.05124950408935547, 0.05471992492675781, 0.058190345764160156, 0.0616607666015625, 0.06513118743896484, 0.06860160827636719, 0.07207202911376953, 0.07554244995117188, 0.07901287078857422, 0.08248329162597656, 0.0859537124633789, 0.08942413330078125, 0.0928945541381836, 0.09636497497558594, 0.09983539581298828, 0.10330581665039062, 0.10677623748779297, 0.11024665832519531, 0.11371707916259766, 0.1171875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 9.0, 3.0, 3.0, 4.0, 5.0, 11.0, 2.0, 15.0, 7.0, 14.0, 19.0, 16.0, 25.0, 30.0, 45.0, 40.0, 52.0, 50.0, 76.0, 92.0, 62.0, 66.0, 57.0, 50.0, 47.0, 40.0, 28.0, 30.0, 23.0, 17.0, 12.0, 15.0, 6.0, 11.0, 6.0, 7.0, 2.0, 0.0, 4.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0235595703125, -0.022821903228759766, -0.02208423614501953, -0.021346569061279297, -0.020608901977539062, -0.019871234893798828, -0.019133567810058594, -0.01839590072631836, -0.017658233642578125, -0.01692056655883789, -0.016182899475097656, -0.015445232391357422, -0.014707565307617188, -0.013969898223876953, -0.013232231140136719, -0.012494564056396484, -0.01175689697265625, -0.011019229888916016, -0.010281562805175781, -0.009543895721435547, -0.008806228637695312, -0.008068561553955078, -0.007330894470214844, -0.006593227386474609, -0.005855560302734375, -0.005117893218994141, -0.004380226135253906, -0.003642559051513672, -0.0029048919677734375, -0.002167224884033203, -0.0014295578002929688, -0.0006918907165527344, 4.57763671875e-05, 0.0007834434509277344, 0.0015211105346679688, 0.002258777618408203, 0.0029964447021484375, 0.003734111785888672, 0.004471778869628906, 0.005209445953369141, 0.005947113037109375, 0.006684780120849609, 0.007422447204589844, 0.008160114288330078, 0.008897781372070312, 0.009635448455810547, 0.010373115539550781, 0.011110782623291016, 0.01184844970703125, 0.012586116790771484, 0.013323783874511719, 0.014061450958251953, 0.014799118041992188, 0.015536785125732422, 0.016274452209472656, 0.01701211929321289, 0.017749786376953125, 0.01848745346069336, 0.019225120544433594, 0.019962787628173828, 0.020700454711914062, 0.021438121795654297, 0.02217578887939453, 0.022913455963134766, 0.023651123046875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 9.0, 17.0, 63.0, 184.0, 344.0, 257.0, 94.0, 27.0, 17.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4072701930999756, -1.3795124292373657, -1.3517545461654663, -1.3239967823028564, -1.296238899230957, -1.2684811353683472, -1.2407233715057373, -1.212965488433838, -1.185207724571228, -1.1574499607086182, -1.1296920776367188, -1.1019343137741089, -1.074176549911499, -1.0464186668395996, -1.0186609029769897, -0.9909030795097351, -0.9631452560424805, -0.9353874325752258, -0.9076296091079712, -0.8798718452453613, -0.8521140217781067, -0.824356198310852, -0.7965984344482422, -0.7688406109809875, -0.7410827875137329, -0.7133249640464783, -0.6855671405792236, -0.6578093767166138, -0.6300515532493591, -0.6022937297821045, -0.5745359659194946, -0.54677814245224, -0.5190203785896301, -0.4912625551223755, -0.46350476145744324, -0.435746967792511, -0.40798914432525635, -0.3802313208580017, -0.35247352719306946, -0.3247157335281372, -0.29695791006088257, -0.26920008659362793, -0.24144229292869568, -0.21368448436260223, -0.1859266757965088, -0.15816886723041534, -0.1304110586643219, -0.10265325009822845, -0.07489544153213501, -0.047137632966041565, -0.01937982439994812, 0.008377984166145325, 0.03613579273223877, 0.06389360129833221, 0.09165140986442566, 0.1194092184305191, 0.14716702699661255, 0.174924835562706, 0.20268264412879944, 0.23044045269489288, 0.25819826126098633, 0.28595608472824097, 0.3137138783931732, 0.34147167205810547, 0.3692294955253601]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 13.0, 8.0, 4.0, 9.0, 14.0, 15.0, 16.0, 19.0, 22.0, 32.0, 38.0, 31.0, 35.0, 49.0, 44.0, 53.0, 53.0, 55.0, 48.0, 36.0, 53.0, 35.0, 52.0, 32.0, 39.0, 32.0, 31.0, 14.0, 14.0, 19.0, 23.0, 16.0, 12.0, 10.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34522736072540283, -0.3336951732635498, -0.3221629559993744, -0.31063076853752136, -0.29909858107566833, -0.2875663638114929, -0.2760341763496399, -0.26450198888778687, -0.25296980142593384, -0.24143759906291962, -0.2299054116010666, -0.21837320923805237, -0.20684102177619934, -0.19530881941318512, -0.1837766170501709, -0.17224442958831787, -0.16071221232414246, -0.14918000996112823, -0.1376478224992752, -0.126115620136261, -0.11458342522382736, -0.10305123031139374, -0.09151902794837952, -0.07998683303594589, -0.06845463812351227, -0.056922443211078644, -0.04539024457335472, -0.0338580459356308, -0.022325851023197174, -0.01079365611076355, 0.0007385462522506714, 0.012270741164684296, 0.02380293607711792, 0.035335130989551544, 0.04686732962727547, 0.05839952826499939, 0.06993172317743301, 0.08146391808986664, 0.09299612045288086, 0.10452831536531448, 0.11606051027774811, 0.12759271264076233, 0.13912490010261536, 0.15065710246562958, 0.1621893048286438, 0.17372149229049683, 0.18525369465351105, 0.19678589701652527, 0.2083180844783783, 0.21985028684139252, 0.23138247430324554, 0.24291467666625977, 0.2544468641281128, 0.2659790515899658, 0.27751126885414124, 0.28904345631599426, 0.3005756735801697, 0.3121078610420227, 0.3236400783061981, 0.33517226576805115, 0.3467044532299042, 0.3582366704940796, 0.3697688579559326, 0.38130104541778564, 0.39283323287963867]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 8.0, 10.0, 13.0, 21.0, 28.0, 32.0, 61.0, 71.0, 122.0, 183.0, 274.0, 504.0, 811.0, 1651.0, 3306.0, 7321.0, 18232.0, 54066.0, 210263.0, 1411231.0, 2082652.0, 297392.0, 68966.0, 21884.0, 8069.0, 3427.0, 1639.0, 809.0, 449.0, 275.0, 167.0, 104.0, 69.0, 45.0, 39.0, 20.0, 11.0, 15.0, 13.0, 6.0, 1.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.12384033203125, -0.12050247192382812, -0.11716461181640625, -0.11382675170898438, -0.1104888916015625, -0.10715103149414062, -0.10381317138671875, -0.10047531127929688, -0.097137451171875, -0.09379959106445312, -0.09046173095703125, -0.08712387084960938, -0.0837860107421875, -0.08044815063476562, -0.07711029052734375, -0.07377243041992188, -0.0704345703125, -0.06709671020507812, -0.06375885009765625, -0.060420989990234375, -0.0570831298828125, -0.053745269775390625, -0.05040740966796875, -0.047069549560546875, -0.043731689453125, -0.040393829345703125, -0.03705596923828125, -0.033718109130859375, -0.0303802490234375, -0.027042388916015625, -0.02370452880859375, -0.020366668701171875, -0.01702880859375, -0.013690948486328125, -0.01035308837890625, -0.007015228271484375, -0.0036773681640625, -0.000339508056640625, 0.00299835205078125, 0.006336212158203125, 0.009674072265625, 0.013011932373046875, 0.01634979248046875, 0.019687652587890625, 0.0230255126953125, 0.026363372802734375, 0.02970123291015625, 0.033039093017578125, 0.036376953125, 0.039714813232421875, 0.04305267333984375, 0.046390533447265625, 0.0497283935546875, 0.053066253662109375, 0.05640411376953125, 0.059741973876953125, 0.063079833984375, 0.06641769409179688, 0.06975555419921875, 0.07309341430664062, 0.0764312744140625, 0.07976913452148438, 0.08310699462890625, 0.08644485473632812, 0.08978271484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 4.0, 13.0, 6.0, 9.0, 11.0, 18.0, 13.0, 23.0, 20.0, 26.0, 27.0, 40.0, 38.0, 53.0, 39.0, 50.0, 64.0, 57.0, 55.0, 42.0, 44.0, 43.0, 41.0, 32.0, 40.0, 27.0, 26.0, 19.0, 16.0, 21.0, 21.0, 12.0, 8.0, 8.0, 3.0, 4.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.05084228515625, -0.04945516586303711, -0.04806804656982422, -0.04668092727661133, -0.04529380798339844, -0.04390668869018555, -0.042519569396972656, -0.041132450103759766, -0.039745330810546875, -0.038358211517333984, -0.036971092224121094, -0.0355839729309082, -0.03419685363769531, -0.03280973434448242, -0.03142261505126953, -0.03003549575805664, -0.02864837646484375, -0.02726125717163086, -0.02587413787841797, -0.024487018585205078, -0.023099899291992188, -0.021712779998779297, -0.020325660705566406, -0.018938541412353516, -0.017551422119140625, -0.016164302825927734, -0.014777183532714844, -0.013390064239501953, -0.012002944946289062, -0.010615825653076172, -0.009228706359863281, -0.00784158706665039, -0.0064544677734375, -0.005067348480224609, -0.0036802291870117188, -0.002293109893798828, -0.0009059906005859375, 0.0004811286926269531, 0.0018682479858398438, 0.0032553672790527344, 0.004642486572265625, 0.006029605865478516, 0.007416725158691406, 0.008803844451904297, 0.010190963745117188, 0.011578083038330078, 0.012965202331542969, 0.01435232162475586, 0.01573944091796875, 0.01712656021118164, 0.01851367950439453, 0.019900798797607422, 0.021287918090820312, 0.022675037384033203, 0.024062156677246094, 0.025449275970458984, 0.026836395263671875, 0.028223514556884766, 0.029610633850097656, 0.030997753143310547, 0.03238487243652344, 0.03377199172973633, 0.03515911102294922, 0.03654623031616211, 0.037933349609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 5.0, 8.0, 9.0, 9.0, 18.0, 31.0, 41.0, 61.0, 107.0, 160.0, 334.0, 603.0, 1513.0, 3646.0, 10227.0, 31997.0, 108981.0, 405240.0, 1567906.0, 1515862.0, 394262.0, 105690.0, 31001.0, 10102.0, 3698.0, 1409.0, 573.0, 349.0, 174.0, 95.0, 44.0, 36.0, 34.0, 17.0, 12.0, 8.0, 4.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11212158203125, -0.10850334167480469, -0.10488510131835938, -0.10126686096191406, -0.09764862060546875, -0.09403038024902344, -0.09041213989257812, -0.08679389953613281, -0.0831756591796875, -0.07955741882324219, -0.07593917846679688, -0.07232093811035156, -0.06870269775390625, -0.06508445739746094, -0.061466217041015625, -0.05784797668457031, -0.054229736328125, -0.05061149597167969, -0.046993255615234375, -0.04337501525878906, -0.03975677490234375, -0.03613853454589844, -0.032520294189453125, -0.028902053833007812, -0.0252838134765625, -0.021665573120117188, -0.018047332763671875, -0.014429092407226562, -0.01081085205078125, -0.0071926116943359375, -0.003574371337890625, 4.38690185546875e-05, 0.003662109375, 0.0072803497314453125, 0.010898590087890625, 0.014516830444335938, 0.01813507080078125, 0.021753311157226562, 0.025371551513671875, 0.028989791870117188, 0.0326080322265625, 0.03622627258300781, 0.039844512939453125, 0.04346275329589844, 0.04708099365234375, 0.05069923400878906, 0.054317474365234375, 0.05793571472167969, 0.061553955078125, 0.06517219543457031, 0.06879043579101562, 0.07240867614746094, 0.07602691650390625, 0.07964515686035156, 0.08326339721679688, 0.08688163757324219, 0.0904998779296875, 0.09411811828613281, 0.09773635864257812, 0.10135459899902344, 0.10497283935546875, 0.10859107971191406, 0.11220932006835938, 0.11582756042480469, 0.11944580078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 13.0, 11.0, 25.0, 29.0, 37.0, 54.0, 91.0, 110.0, 148.0, 222.0, 335.0, 474.0, 630.0, 555.0, 380.0, 284.0, 199.0, 145.0, 99.0, 68.0, 56.0, 27.0, 13.0, 26.0, 15.0, 10.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08203125, -0.0791788101196289, -0.07632637023925781, -0.07347393035888672, -0.07062149047851562, -0.06776905059814453, -0.06491661071777344, -0.062064170837402344, -0.05921173095703125, -0.056359291076660156, -0.05350685119628906, -0.05065441131591797, -0.047801971435546875, -0.04494953155517578, -0.04209709167480469, -0.039244651794433594, -0.0363922119140625, -0.033539772033691406, -0.030687332153320312, -0.02783489227294922, -0.024982452392578125, -0.02213001251220703, -0.019277572631835938, -0.016425132751464844, -0.01357269287109375, -0.010720252990722656, -0.007867813110351562, -0.005015373229980469, -0.002162933349609375, 0.0006895065307617188, 0.0035419464111328125, 0.006394386291503906, 0.009246826171875, 0.012099266052246094, 0.014951705932617188, 0.01780414581298828, 0.020656585693359375, 0.02350902557373047, 0.026361465454101562, 0.029213905334472656, 0.03206634521484375, 0.034918785095214844, 0.03777122497558594, 0.04062366485595703, 0.043476104736328125, 0.04632854461669922, 0.04918098449707031, 0.052033424377441406, 0.0548858642578125, 0.057738304138183594, 0.06059074401855469, 0.06344318389892578, 0.06629562377929688, 0.06914806365966797, 0.07200050354003906, 0.07485294342041016, 0.07770538330078125, 0.08055782318115234, 0.08341026306152344, 0.08626270294189453, 0.08911514282226562, 0.09196758270263672, 0.09482002258300781, 0.0976724624633789, 0.10052490234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 18.0, 45.0, 96.0, 220.0, 259.0, 196.0, 104.0, 45.0, 10.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33952879905700684, -0.3144300580024719, -0.2893312871456146, -0.2642325162887573, -0.2391337752342224, -0.2140350192785263, -0.1889362633228302, -0.1638375073671341, -0.138738751411438, -0.11363999545574188, -0.08854123950004578, -0.06344248354434967, -0.038343727588653564, -0.013244971632957458, 0.011853784322738647, 0.03695254027843475, 0.06205129623413086, 0.08715005218982697, 0.11224880814552307, 0.13734756410121918, 0.16244632005691528, 0.1875450760126114, 0.2126438319683075, 0.2377425879240036, 0.2628413438796997, 0.2879400849342346, 0.3130388557910919, 0.3381376266479492, 0.36323636770248413, 0.38833510875701904, 0.41343387961387634, 0.43853265047073364, 0.46363139152526855, 0.48873013257980347, 0.5138288736343384, 0.5389276742935181, 0.564026415348053, 0.5891251564025879, 0.6142239570617676, 0.6393226981163025, 0.6644214391708374, 0.6895201802253723, 0.7146189212799072, 0.7397177219390869, 0.7648164629936218, 0.7899152040481567, 0.8150140047073364, 0.8401127457618713, 0.8652114868164062, 0.8903102278709412, 0.9154089689254761, 0.9405077695846558, 0.9656065106391907, 0.9907052516937256, 1.0158040523529053, 1.0409027338027954, 1.066001534461975, 1.0911003351211548, 1.116199016571045, 1.1412978172302246, 1.1663966178894043, 1.1914952993392944, 1.2165940999984741, 1.2416927814483643, 1.266791582107544]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 8.0, 8.0, 10.0, 6.0, 10.0, 9.0, 6.0, 16.0, 15.0, 22.0, 20.0, 23.0, 24.0, 29.0, 26.0, 36.0, 30.0, 41.0, 40.0, 42.0, 35.0, 34.0, 31.0, 56.0, 39.0, 44.0, 33.0, 31.0, 32.0, 34.0, 33.0, 22.0, 14.0, 14.0, 19.0, 16.0, 14.0, 12.0, 10.0, 13.0, 8.0, 10.0, 5.0, 4.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.20630133152008057, -0.19990728795528412, -0.19351324439048767, -0.18711921572685242, -0.18072517216205597, -0.17433112859725952, -0.16793709993362427, -0.16154305636882782, -0.15514901280403137, -0.14875496923923492, -0.14236092567443848, -0.13596689701080322, -0.12957285344600677, -0.12317880988121033, -0.11678477376699448, -0.11039073765277863, -0.10399669408798218, -0.09760265052318573, -0.09120861440896988, -0.08481457829475403, -0.07842053472995758, -0.07202649116516113, -0.06563245505094528, -0.05923841521143913, -0.05284437537193298, -0.046450335532426834, -0.040056295692920685, -0.033662255853414536, -0.027268216013908386, -0.020874176174402237, -0.014480136334896088, -0.008086096495389938, -0.001692056655883789, 0.00470198318362236, 0.01109602302312851, 0.01749006286263466, 0.023884102702140808, 0.030278142541646957, 0.03667218238115311, 0.043066222220659256, 0.049460262060165405, 0.055854301899671555, 0.062248341739177704, 0.06864237785339355, 0.07503642141819, 0.08143046498298645, 0.0878245010972023, 0.09421853721141815, 0.1006125807762146, 0.10700662434101105, 0.1134006604552269, 0.11979469656944275, 0.1261887401342392, 0.13258278369903564, 0.1389768123626709, 0.14537085592746735, 0.1517648994922638, 0.15815894305706024, 0.1645529866218567, 0.17094701528549194, 0.1773410588502884, 0.18373510241508484, 0.1901291310787201, 0.19652317464351654, 0.202917218208313]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 14.0, 18.0, 18.0, 29.0, 35.0, 73.0, 103.0, 149.0, 289.0, 490.0, 844.0, 1400.0, 2477.0, 4513.0, 8561.0, 18199.0, 45336.0, 128168.0, 316820.0, 314264.0, 125534.0, 44238.0, 17987.0, 8471.0, 4592.0, 2541.0, 1378.0, 826.0, 470.0, 282.0, 156.0, 105.0, 57.0, 41.0, 26.0, 18.0, 9.0, 5.0, 6.0, 3.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.128173828125, -0.1245107650756836, -0.12084770202636719, -0.11718463897705078, -0.11352157592773438, -0.10985851287841797, -0.10619544982910156, -0.10253238677978516, -0.09886932373046875, -0.09520626068115234, -0.09154319763183594, -0.08788013458251953, -0.08421707153320312, -0.08055400848388672, -0.07689094543457031, -0.0732278823852539, -0.0695648193359375, -0.0659017562866211, -0.06223869323730469, -0.05857563018798828, -0.054912567138671875, -0.05124950408935547, -0.04758644104003906, -0.043923377990722656, -0.04026031494140625, -0.036597251892089844, -0.03293418884277344, -0.02927112579345703, -0.025608062744140625, -0.02194499969482422, -0.018281936645507812, -0.014618873596191406, -0.010955810546875, -0.007292747497558594, -0.0036296844482421875, 3.337860107421875e-05, 0.003696441650390625, 0.007359504699707031, 0.011022567749023438, 0.014685630798339844, 0.01834869384765625, 0.022011756896972656, 0.025674819946289062, 0.02933788299560547, 0.033000946044921875, 0.03666400909423828, 0.04032707214355469, 0.043990135192871094, 0.0476531982421875, 0.051316261291503906, 0.05497932434082031, 0.05864238739013672, 0.062305450439453125, 0.06596851348876953, 0.06963157653808594, 0.07329463958740234, 0.07695770263671875, 0.08062076568603516, 0.08428382873535156, 0.08794689178466797, 0.09160995483398438, 0.09527301788330078, 0.09893608093261719, 0.1025991439819336, 0.10626220703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 11.0, 8.0, 10.0, 13.0, 13.0, 16.0, 14.0, 24.0, 24.0, 29.0, 40.0, 38.0, 48.0, 44.0, 44.0, 53.0, 50.0, 55.0, 46.0, 51.0, 43.0, 33.0, 40.0, 35.0, 26.0, 35.0, 22.0, 26.0, 12.0, 18.0, 8.0, 13.0, 15.0, 5.0, 10.0, 6.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.044708251953125, -0.04349851608276367, -0.042288780212402344, -0.041079044342041016, -0.03986930847167969, -0.03865957260131836, -0.03744983673095703, -0.0362401008605957, -0.035030364990234375, -0.03382062911987305, -0.03261089324951172, -0.03140115737915039, -0.030191421508789062, -0.028981685638427734, -0.027771949768066406, -0.026562213897705078, -0.02535247802734375, -0.024142742156982422, -0.022933006286621094, -0.021723270416259766, -0.020513534545898438, -0.01930379867553711, -0.01809406280517578, -0.016884326934814453, -0.015674591064453125, -0.014464855194091797, -0.013255119323730469, -0.01204538345336914, -0.010835647583007812, -0.009625911712646484, -0.008416175842285156, -0.007206439971923828, -0.0059967041015625, -0.004786968231201172, -0.0035772323608398438, -0.0023674964904785156, -0.0011577606201171875, 5.1975250244140625e-05, 0.0012617111206054688, 0.002471446990966797, 0.003681182861328125, 0.004890918731689453, 0.006100654602050781, 0.007310390472412109, 0.008520126342773438, 0.009729862213134766, 0.010939598083496094, 0.012149333953857422, 0.01335906982421875, 0.014568805694580078, 0.015778541564941406, 0.016988277435302734, 0.018198013305664062, 0.01940774917602539, 0.02061748504638672, 0.021827220916748047, 0.023036956787109375, 0.024246692657470703, 0.02545642852783203, 0.02666616439819336, 0.027875900268554688, 0.029085636138916016, 0.030295372009277344, 0.03150510787963867, 0.03271484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 11.0, 32.0, 37.0, 51.0, 72.0, 94.0, 197.0, 319.0, 655.0, 1376.0, 3172.0, 8050.0, 22677.0, 78568.0, 327299.0, 434600.0, 120960.0, 31765.0, 10922.0, 4181.0, 1742.0, 769.0, 391.0, 217.0, 140.0, 75.0, 59.0, 34.0, 32.0, 20.0, 12.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1876220703125, -0.1825714111328125, -0.177520751953125, -0.1724700927734375, -0.16741943359375, -0.1623687744140625, -0.157318115234375, -0.1522674560546875, -0.147216796875, -0.1421661376953125, -0.137115478515625, -0.1320648193359375, -0.12701416015625, -0.1219635009765625, -0.116912841796875, -0.1118621826171875, -0.1068115234375, -0.1017608642578125, -0.096710205078125, -0.0916595458984375, -0.08660888671875, -0.0815582275390625, -0.076507568359375, -0.0714569091796875, -0.06640625, -0.0613555908203125, -0.056304931640625, -0.0512542724609375, -0.04620361328125, -0.0411529541015625, -0.036102294921875, -0.0310516357421875, -0.0260009765625, -0.0209503173828125, -0.015899658203125, -0.0108489990234375, -0.00579833984375, -0.0007476806640625, 0.004302978515625, 0.0093536376953125, 0.014404296875, 0.0194549560546875, 0.024505615234375, 0.0295562744140625, 0.03460693359375, 0.0396575927734375, 0.044708251953125, 0.0497589111328125, 0.0548095703125, 0.0598602294921875, 0.064910888671875, 0.0699615478515625, 0.07501220703125, 0.0800628662109375, 0.085113525390625, 0.0901641845703125, 0.09521484375, 0.1002655029296875, 0.105316162109375, 0.1103668212890625, 0.11541748046875, 0.1204681396484375, 0.125518798828125, 0.1305694580078125, 0.1356201171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 10.0, 4.0, 11.0, 11.0, 11.0, 22.0, 26.0, 16.0, 35.0, 54.0, 45.0, 44.0, 48.0, 55.0, 51.0, 62.0, 55.0, 61.0, 49.0, 58.0, 48.0, 49.0, 34.0, 35.0, 17.0, 16.0, 18.0, 16.0, 12.0, 4.0, 7.0, 5.0, 9.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.127197265625, -0.12374687194824219, -0.12029647827148438, -0.11684608459472656, -0.11339569091796875, -0.10994529724121094, -0.10649490356445312, -0.10304450988769531, -0.0995941162109375, -0.09614372253417969, -0.09269332885742188, -0.08924293518066406, -0.08579254150390625, -0.08234214782714844, -0.07889175415039062, -0.07544136047363281, -0.071990966796875, -0.06854057312011719, -0.06509017944335938, -0.06163978576660156, -0.05818939208984375, -0.05473899841308594, -0.051288604736328125, -0.04783821105957031, -0.0443878173828125, -0.04093742370605469, -0.037487030029296875, -0.03403663635253906, -0.03058624267578125, -0.027135848999023438, -0.023685455322265625, -0.020235061645507812, -0.01678466796875, -0.013334274291992188, -0.009883880615234375, -0.0064334869384765625, -0.00298309326171875, 0.0004673004150390625, 0.003917694091796875, 0.0073680877685546875, 0.0108184814453125, 0.014268875122070312, 0.017719268798828125, 0.021169662475585938, 0.02462005615234375, 0.028070449829101562, 0.031520843505859375, 0.03497123718261719, 0.038421630859375, 0.04187202453613281, 0.045322418212890625, 0.04877281188964844, 0.05222320556640625, 0.05567359924316406, 0.059123992919921875, 0.06257438659667969, 0.0660247802734375, 0.06947517395019531, 0.07292556762695312, 0.07637596130371094, 0.07982635498046875, 0.08327674865722656, 0.08672714233398438, 0.09017753601074219, 0.0936279296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 16.0, 7.0, 17.0, 34.0, 40.0, 54.0, 68.0, 125.0, 165.0, 204.0, 368.0, 482.0, 777.0, 1147.0, 2080.0, 4843.0, 14228.0, 60108.0, 438473.0, 440532.0, 59931.0, 14427.0, 4876.0, 2093.0, 1129.0, 698.0, 437.0, 307.0, 253.0, 155.0, 126.0, 101.0, 72.0, 43.0, 36.0, 31.0, 17.0, 14.0, 7.0, 6.0, 10.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10711669921875, -0.1034231185913086, -0.09972953796386719, -0.09603595733642578, -0.09234237670898438, -0.08864879608154297, -0.08495521545410156, -0.08126163482666016, -0.07756805419921875, -0.07387447357177734, -0.07018089294433594, -0.06648731231689453, -0.06279373168945312, -0.05910015106201172, -0.05540657043457031, -0.051712989807128906, -0.0480194091796875, -0.044325828552246094, -0.04063224792480469, -0.03693866729736328, -0.033245086669921875, -0.02955150604248047, -0.025857925415039062, -0.022164344787597656, -0.01847076416015625, -0.014777183532714844, -0.011083602905273438, -0.007390022277832031, -0.003696441650390625, -2.86102294921875e-06, 0.0036907196044921875, 0.007384300231933594, 0.011077880859375, 0.014771461486816406, 0.018465042114257812, 0.02215862274169922, 0.025852203369140625, 0.02954578399658203, 0.03323936462402344, 0.036932945251464844, 0.04062652587890625, 0.044320106506347656, 0.04801368713378906, 0.05170726776123047, 0.055400848388671875, 0.05909442901611328, 0.06278800964355469, 0.0664815902709961, 0.0701751708984375, 0.0738687515258789, 0.07756233215332031, 0.08125591278076172, 0.08494949340820312, 0.08864307403564453, 0.09233665466308594, 0.09603023529052734, 0.09972381591796875, 0.10341739654541016, 0.10711097717285156, 0.11080455780029297, 0.11449813842773438, 0.11819171905517578, 0.12188529968261719, 0.1255788803100586, 0.1292724609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 4.0, 5.0, 11.0, 29.0, 90.0, 164.0, 258.0, 213.0, 117.0, 44.0, 18.0, 14.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8252601623535156e-05, -2.6946887373924255e-05, -2.5641173124313354e-05, -2.4335458874702454e-05, -2.3029744625091553e-05, -2.1724030375480652e-05, -2.041831612586975e-05, -1.911260187625885e-05, -1.780688762664795e-05, -1.650117337703705e-05, -1.5195459127426147e-05, -1.3889744877815247e-05, -1.2584030628204346e-05, -1.1278316378593445e-05, -9.972602128982544e-06, -8.666887879371643e-06, -7.361173629760742e-06, -6.055459380149841e-06, -4.7497451305389404e-06, -3.4440308809280396e-06, -2.1383166313171387e-06, -8.326023817062378e-07, 4.731118679046631e-07, 1.778826117515564e-06, 3.084540367126465e-06, 4.390254616737366e-06, 5.695968866348267e-06, 7.0016831159591675e-06, 8.307397365570068e-06, 9.61311161518097e-06, 1.091882586479187e-05, 1.2224540114402771e-05, 1.3530254364013672e-05, 1.4835968613624573e-05, 1.6141682863235474e-05, 1.7447397112846375e-05, 1.8753111362457275e-05, 2.0058825612068176e-05, 2.1364539861679077e-05, 2.2670254111289978e-05, 2.397596836090088e-05, 2.528168261051178e-05, 2.658739686012268e-05, 2.789311110973358e-05, 2.9198825359344482e-05, 3.0504539608955383e-05, 3.1810253858566284e-05, 3.3115968108177185e-05, 3.4421682357788086e-05, 3.572739660739899e-05, 3.703311085700989e-05, 3.833882510662079e-05, 3.964453935623169e-05, 4.095025360584259e-05, 4.225596785545349e-05, 4.356168210506439e-05, 4.486739635467529e-05, 4.6173110604286194e-05, 4.7478824853897095e-05, 4.8784539103507996e-05, 5.0090253353118896e-05, 5.13959676027298e-05, 5.27016818523407e-05, 5.40073961019516e-05, 5.53131103515625e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 10.0, 18.0, 21.0, 27.0, 47.0, 70.0, 92.0, 152.0, 277.0, 375.0, 662.0, 1087.0, 2081.0, 3879.0, 7337.0, 15135.0, 34104.0, 89681.0, 230091.0, 334898.0, 197561.0, 74384.0, 29148.0, 12933.0, 6500.0, 3409.0, 1883.0, 1043.0, 612.0, 340.0, 223.0, 143.0, 96.0, 73.0, 46.0, 33.0, 18.0, 16.0, 9.0, 4.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.044647216796875, -0.04312896728515625, -0.0416107177734375, -0.04009246826171875, -0.03857421875, -0.03705596923828125, -0.0355377197265625, -0.03401947021484375, -0.032501220703125, -0.03098297119140625, -0.0294647216796875, -0.02794647216796875, -0.02642822265625, -0.02490997314453125, -0.0233917236328125, -0.02187347412109375, -0.020355224609375, -0.01883697509765625, -0.0173187255859375, -0.01580047607421875, -0.0142822265625, -0.01276397705078125, -0.0112457275390625, -0.00972747802734375, -0.008209228515625, -0.00669097900390625, -0.0051727294921875, -0.00365447998046875, -0.00213623046875, -0.00061798095703125, 0.0009002685546875, 0.00241851806640625, 0.003936767578125, 0.00545501708984375, 0.0069732666015625, 0.00849151611328125, 0.010009765625, 0.01152801513671875, 0.0130462646484375, 0.01456451416015625, 0.016082763671875, 0.01760101318359375, 0.0191192626953125, 0.02063751220703125, 0.02215576171875, 0.02367401123046875, 0.0251922607421875, 0.02671051025390625, 0.028228759765625, 0.02974700927734375, 0.0312652587890625, 0.03278350830078125, 0.0343017578125, 0.03582000732421875, 0.0373382568359375, 0.03885650634765625, 0.040374755859375, 0.04189300537109375, 0.0434112548828125, 0.04492950439453125, 0.04644775390625, 0.04796600341796875, 0.0494842529296875, 0.05100250244140625, 0.052520751953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 8.0, 7.0, 9.0, 10.0, 6.0, 12.0, 18.0, 19.0, 16.0, 23.0, 34.0, 46.0, 47.0, 58.0, 68.0, 67.0, 68.0, 58.0, 81.0, 69.0, 48.0, 42.0, 41.0, 36.0, 31.0, 18.0, 16.0, 9.0, 11.0, 8.0, 2.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0284881591796875, -0.02749323844909668, -0.02649831771850586, -0.02550339698791504, -0.02450847625732422, -0.0235135555267334, -0.022518634796142578, -0.021523714065551758, -0.020528793334960938, -0.019533872604370117, -0.018538951873779297, -0.017544031143188477, -0.016549110412597656, -0.015554189682006836, -0.014559268951416016, -0.013564348220825195, -0.012569427490234375, -0.011574506759643555, -0.010579586029052734, -0.009584665298461914, -0.008589744567871094, -0.0075948238372802734, -0.006599903106689453, -0.005604982376098633, -0.0046100616455078125, -0.003615140914916992, -0.002620220184326172, -0.0016252994537353516, -0.0006303787231445312, 0.00036454200744628906, 0.0013594627380371094, 0.0023543834686279297, 0.00334930419921875, 0.00434422492980957, 0.005339145660400391, 0.006334066390991211, 0.007328987121582031, 0.008323907852172852, 0.009318828582763672, 0.010313749313354492, 0.011308670043945312, 0.012303590774536133, 0.013298511505126953, 0.014293432235717773, 0.015288352966308594, 0.016283273696899414, 0.017278194427490234, 0.018273115158081055, 0.019268035888671875, 0.020262956619262695, 0.021257877349853516, 0.022252798080444336, 0.023247718811035156, 0.024242639541625977, 0.025237560272216797, 0.026232481002807617, 0.027227401733398438, 0.028222322463989258, 0.029217243194580078, 0.0302121639251709, 0.03120708465576172, 0.03220200538635254, 0.03319692611694336, 0.03419184684753418, 0.035186767578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 10.0, 31.0, 37.0, 71.0, 90.0, 128.0, 155.0, 152.0, 137.0, 75.0, 48.0, 25.0, 14.0, 9.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4316258728504181, -0.4184246063232422, -0.4052233397960663, -0.3920220732688904, -0.37882083654403687, -0.3656195402145386, -0.35241830348968506, -0.33921703696250916, -0.32601577043533325, -0.31281450390815735, -0.29961323738098145, -0.28641197085380554, -0.27321070432662964, -0.2600094676017761, -0.24680820107460022, -0.23360693454742432, -0.2204056680202484, -0.2072044014930725, -0.1940031349658966, -0.1808018833398819, -0.167600616812706, -0.1543993502855301, -0.14119809865951538, -0.12799683213233948, -0.11479556560516357, -0.10159429907798767, -0.08839304000139236, -0.07519178092479706, -0.061990514397621155, -0.04878924787044525, -0.035587988793849945, -0.02238672971725464, -0.009185463190078735, 0.0040157996118068695, 0.017217062413692474, 0.03041832521557808, 0.043619588017463684, 0.05682085454463959, 0.0700221136212349, 0.0832233726978302, 0.0964246392250061, 0.109625905752182, 0.12282716482877731, 0.13602842390537262, 0.14922969043254852, 0.16243095695972443, 0.17563220858573914, 0.18883347511291504, 0.20203474164009094, 0.21523600816726685, 0.22843727469444275, 0.24163852632045746, 0.25483977794647217, 0.26804107427597046, 0.281242311000824, 0.2944435775279999, 0.3076448440551758, 0.3208461105823517, 0.3340473771095276, 0.3472486436367035, 0.3604499101638794, 0.3736511468887329, 0.3868524134159088, 0.4000536799430847, 0.4132549464702606]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 5.0, 7.0, 7.0, 9.0, 8.0, 8.0, 12.0, 16.0, 19.0, 26.0, 22.0, 24.0, 28.0, 30.0, 37.0, 46.0, 28.0, 38.0, 38.0, 37.0, 35.0, 22.0, 41.0, 45.0, 23.0, 44.0, 31.0, 33.0, 34.0, 27.0, 31.0, 22.0, 25.0, 23.0, 23.0, 17.0, 7.0, 8.0, 10.0, 11.0, 7.0, 5.0, 4.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.20474779605865479, -0.19832244515419006, -0.19189709424972534, -0.18547174334526062, -0.1790463924407959, -0.17262104153633118, -0.16619569063186646, -0.15977033972740173, -0.153344988822937, -0.1469196379184723, -0.14049428701400757, -0.13406893610954285, -0.12764358520507812, -0.1212182343006134, -0.11479289084672928, -0.10836753994226456, -0.10194219648838043, -0.09551684558391571, -0.08909149467945099, -0.08266614377498627, -0.07624079287052155, -0.06981544196605682, -0.0633900985121727, -0.05696474760770798, -0.050539396703243256, -0.044114045798778534, -0.03768869489431381, -0.03126334771513939, -0.024837996810674667, -0.018412645906209946, -0.011987298727035522, -0.005561947822570801, 0.0008634030818939209, 0.007288753055036068, 0.013714103028178215, 0.020139452069997787, 0.02656480297446251, 0.03299015387892723, 0.039415501058101654, 0.045840851962566376, 0.0522662028670311, 0.05869155377149582, 0.06511690467596054, 0.07154224812984467, 0.07796759903430939, 0.08439294993877411, 0.09081830084323883, 0.09724365174770355, 0.10366900265216827, 0.110094353556633, 0.11651970446109772, 0.12294505536556244, 0.12937040627002716, 0.13579575717449188, 0.1422210931777954, 0.14864644408226013, 0.15507179498672485, 0.16149714589118958, 0.1679224967956543, 0.17434784770011902, 0.18077319860458374, 0.18719854950904846, 0.19362390041351318, 0.2000492513179779, 0.20647460222244263]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 9.0, 15.0, 16.0, 26.0, 29.0, 79.0, 111.0, 211.0, 383.0, 752.0, 1493.0, 3115.0, 7764.0, 21374.0, 68605.0, 278434.0, 1339936.0, 1836931.0, 479453.0, 107693.0, 30455.0, 10188.0, 3922.0, 1698.0, 752.0, 365.0, 211.0, 94.0, 71.0, 47.0, 14.0, 10.0, 6.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08074951171875, -0.07815837860107422, -0.07556724548339844, -0.07297611236572266, -0.07038497924804688, -0.0677938461303711, -0.06520271301269531, -0.06261157989501953, -0.06002044677734375, -0.05742931365966797, -0.05483818054199219, -0.052247047424316406, -0.049655914306640625, -0.047064781188964844, -0.04447364807128906, -0.04188251495361328, -0.0392913818359375, -0.03670024871826172, -0.03410911560058594, -0.031517982482910156, -0.028926849365234375, -0.026335716247558594, -0.023744583129882812, -0.02115345001220703, -0.01856231689453125, -0.01597118377685547, -0.013380050659179688, -0.010788917541503906, -0.008197784423828125, -0.005606651306152344, -0.0030155181884765625, -0.00042438507080078125, 0.002166748046875, 0.004757881164550781, 0.0073490142822265625, 0.009940147399902344, 0.012531280517578125, 0.015122413635253906, 0.017713546752929688, 0.02030467987060547, 0.02289581298828125, 0.02548694610595703, 0.028078079223632812, 0.030669212341308594, 0.033260345458984375, 0.035851478576660156, 0.03844261169433594, 0.04103374481201172, 0.0436248779296875, 0.04621601104736328, 0.04880714416503906, 0.051398277282714844, 0.053989410400390625, 0.056580543518066406, 0.05917167663574219, 0.06176280975341797, 0.06435394287109375, 0.06694507598876953, 0.06953620910644531, 0.0721273422241211, 0.07471847534179688, 0.07730960845947266, 0.07990074157714844, 0.08249187469482422, 0.0850830078125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 6.0, 4.0, 2.0, 5.0, 8.0, 10.0, 9.0, 10.0, 23.0, 14.0, 14.0, 28.0, 31.0, 32.0, 33.0, 42.0, 39.0, 46.0, 61.0, 42.0, 54.0, 35.0, 53.0, 59.0, 45.0, 40.0, 29.0, 32.0, 26.0, 26.0, 24.0, 18.0, 20.0, 20.0, 12.0, 10.0, 7.0, 12.0, 8.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.044525146484375, -0.04327392578125, -0.042022705078125, -0.040771484375, -0.039520263671875, -0.03826904296875, -0.037017822265625, -0.0357666015625, -0.034515380859375, -0.03326416015625, -0.032012939453125, -0.03076171875, -0.029510498046875, -0.02825927734375, -0.027008056640625, -0.0257568359375, -0.024505615234375, -0.02325439453125, -0.022003173828125, -0.020751953125, -0.019500732421875, -0.01824951171875, -0.016998291015625, -0.0157470703125, -0.014495849609375, -0.01324462890625, -0.011993408203125, -0.0107421875, -0.009490966796875, -0.00823974609375, -0.006988525390625, -0.0057373046875, -0.004486083984375, -0.00323486328125, -0.001983642578125, -0.000732421875, 0.000518798828125, 0.00177001953125, 0.003021240234375, 0.0042724609375, 0.005523681640625, 0.00677490234375, 0.008026123046875, 0.00927734375, 0.010528564453125, 0.01177978515625, 0.013031005859375, 0.0142822265625, 0.015533447265625, 0.01678466796875, 0.018035888671875, 0.019287109375, 0.020538330078125, 0.02178955078125, 0.023040771484375, 0.0242919921875, 0.025543212890625, 0.02679443359375, 0.028045654296875, 0.029296875, 0.030548095703125, 0.03179931640625, 0.033050537109375, 0.0343017578125, 0.035552978515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 12.0, 13.0, 18.0, 21.0, 38.0, 47.0, 81.0, 113.0, 177.0, 243.0, 401.0, 703.0, 1554.0, 3410.0, 8394.0, 23308.0, 69637.0, 215409.0, 643214.0, 1414415.0, 1153033.0, 440886.0, 144087.0, 47406.0, 16237.0, 6043.0, 2529.0, 1196.0, 599.0, 359.0, 210.0, 136.0, 88.0, 69.0, 44.0, 35.0, 25.0, 19.0, 17.0, 14.0, 7.0, 9.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.08203125, -0.0794534683227539, -0.07687568664550781, -0.07429790496826172, -0.07172012329101562, -0.06914234161376953, -0.06656455993652344, -0.06398677825927734, -0.06140899658203125, -0.058831214904785156, -0.05625343322753906, -0.05367565155029297, -0.051097869873046875, -0.04852008819580078, -0.04594230651855469, -0.043364524841308594, -0.0407867431640625, -0.038208961486816406, -0.03563117980957031, -0.03305339813232422, -0.030475616455078125, -0.02789783477783203, -0.025320053100585938, -0.022742271423339844, -0.02016448974609375, -0.017586708068847656, -0.015008926391601562, -0.012431144714355469, -0.009853363037109375, -0.007275581359863281, -0.0046977996826171875, -0.0021200180053710938, 0.000457763671875, 0.0030355453491210938, 0.0056133270263671875, 0.008191108703613281, 0.010768890380859375, 0.013346672058105469, 0.015924453735351562, 0.018502235412597656, 0.02108001708984375, 0.023657798767089844, 0.026235580444335938, 0.02881336212158203, 0.031391143798828125, 0.03396892547607422, 0.03654670715332031, 0.039124488830566406, 0.0417022705078125, 0.044280052185058594, 0.04685783386230469, 0.04943561553955078, 0.052013397216796875, 0.05459117889404297, 0.05716896057128906, 0.059746742248535156, 0.06232452392578125, 0.06490230560302734, 0.06748008728027344, 0.07005786895751953, 0.07263565063476562, 0.07521343231201172, 0.07779121398925781, 0.0803689956665039, 0.08294677734375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 10.0, 10.0, 11.0, 16.0, 12.0, 13.0, 13.0, 29.0, 34.0, 57.0, 84.0, 77.0, 96.0, 136.0, 163.0, 188.0, 230.0, 292.0, 325.0, 337.0, 327.0, 296.0, 225.0, 211.0, 179.0, 156.0, 119.0, 100.0, 80.0, 54.0, 53.0, 28.0, 26.0, 16.0, 20.0, 16.0, 8.0, 9.0, 8.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0760498046875, -0.0739140510559082, -0.0717782974243164, -0.06964254379272461, -0.06750679016113281, -0.06537103652954102, -0.06323528289794922, -0.06109952926635742, -0.058963775634765625, -0.05682802200317383, -0.05469226837158203, -0.052556514739990234, -0.05042076110839844, -0.04828500747680664, -0.046149253845214844, -0.04401350021362305, -0.04187774658203125, -0.03974199295043945, -0.037606239318847656, -0.03547048568725586, -0.03333473205566406, -0.031198978424072266, -0.02906322479248047, -0.026927471160888672, -0.024791717529296875, -0.022655963897705078, -0.02052021026611328, -0.018384456634521484, -0.016248703002929688, -0.01411294937133789, -0.011977195739746094, -0.009841442108154297, -0.0077056884765625, -0.005569934844970703, -0.0034341812133789062, -0.0012984275817871094, 0.0008373260498046875, 0.0029730796813964844, 0.005108833312988281, 0.007244586944580078, 0.009380340576171875, 0.011516094207763672, 0.013651847839355469, 0.015787601470947266, 0.017923355102539062, 0.02005910873413086, 0.022194862365722656, 0.024330615997314453, 0.02646636962890625, 0.028602123260498047, 0.030737876892089844, 0.03287363052368164, 0.03500938415527344, 0.037145137786865234, 0.03928089141845703, 0.04141664505004883, 0.043552398681640625, 0.04568815231323242, 0.04782390594482422, 0.049959659576416016, 0.05209541320800781, 0.05423116683959961, 0.056366920471191406, 0.0585026741027832, 0.060638427734375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 14.0, 22.0, 55.0, 69.0, 107.0, 133.0, 142.0, 142.0, 116.0, 76.0, 39.0, 34.0, 17.0, 9.0, 6.0, 8.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5496717095375061, -0.5310545563697815, -0.5124374628067017, -0.49382030963897705, -0.47520315647125244, -0.4565860331058502, -0.437968909740448, -0.4193517565727234, -0.40073463320732117, -0.38211750984191895, -0.36350035667419434, -0.3448832333087921, -0.3262661099433899, -0.3076489567756653, -0.28903183341026306, -0.27041471004486084, -0.25179755687713623, -0.23318041861057281, -0.2145632803440094, -0.19594615697860718, -0.17732901871204376, -0.15871188044548035, -0.14009475708007812, -0.12147761881351471, -0.1028604805469513, -0.08424334228038788, -0.06562621146440506, -0.04700907692313194, -0.028391942381858826, -0.00977480411529541, 0.008842326700687408, 0.027459457516670227, 0.04607665538787842, 0.06469379365444183, 0.08331092447042465, 0.10192805528640747, 0.12054519355297089, 0.1391623318195343, 0.15777945518493652, 0.17639659345149994, 0.19501373171806335, 0.21363086998462677, 0.23224800825119019, 0.2508651316165924, 0.26948225498199463, 0.28809940814971924, 0.30671653151512146, 0.3253336548805237, 0.3439508080482483, 0.3625679314136505, 0.3811850845813751, 0.39980220794677734, 0.41841936111450195, 0.4370364844799042, 0.4556536078453064, 0.474270761013031, 0.4928878843784332, 0.5115050077438354, 0.5301221609115601, 0.5487393140792847, 0.5673564076423645, 0.5859735608100891, 0.6045907139778137, 0.6232078075408936, 0.6418249607086182]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 7.0, 5.0, 7.0, 7.0, 7.0, 13.0, 6.0, 10.0, 13.0, 18.0, 11.0, 16.0, 18.0, 24.0, 18.0, 30.0, 21.0, 31.0, 29.0, 25.0, 30.0, 35.0, 34.0, 31.0, 41.0, 29.0, 29.0, 51.0, 28.0, 35.0, 33.0, 27.0, 34.0, 29.0, 23.0, 24.0, 17.0, 23.0, 21.0, 13.0, 14.0, 16.0, 18.0, 12.0, 9.0, 11.0, 3.0, 5.0, 5.0, 2.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.24280864000320435, -0.23558522760868073, -0.2283618003129959, -0.2211383879184723, -0.21391497552394867, -0.20669156312942505, -0.19946813583374023, -0.1922447234392166, -0.185021311044693, -0.17779789865016937, -0.17057447135448456, -0.16335105895996094, -0.15612764656543732, -0.1489042341709137, -0.14168080687522888, -0.13445739448070526, -0.12723396718502045, -0.12001054733991623, -0.11278713494539261, -0.10556371510028839, -0.09834030270576477, -0.09111688286066055, -0.08389346301555634, -0.07667005062103271, -0.0694466307759285, -0.06222321465611458, -0.05499979853630066, -0.04777637869119644, -0.04055296257138252, -0.033329546451568604, -0.026106126606464386, -0.018882710486650467, -0.011659294366836548, -0.004435877315700054, 0.0027875397354364395, 0.010010957717895508, 0.017234373837709427, 0.024457789957523346, 0.031681209802627563, 0.03890462592244148, 0.0461280420422554, 0.05335145816206932, 0.06057487428188324, 0.06779829412698746, 0.07502171397209167, 0.0822451263666153, 0.08946854621171951, 0.09669196605682373, 0.10391537845134735, 0.11113879829645157, 0.11836221069097519, 0.1255856305360794, 0.13280904293060303, 0.14003247022628784, 0.14725588262081146, 0.15447929501533508, 0.1617027223110199, 0.16892613470554352, 0.17614956200122833, 0.18337297439575195, 0.19059638679027557, 0.1978197991847992, 0.205043226480484, 0.21226663887500763, 0.21949005126953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 7.0, 14.0, 12.0, 18.0, 27.0, 46.0, 61.0, 83.0, 143.0, 205.0, 353.0, 619.0, 1051.0, 1837.0, 3140.0, 5760.0, 10514.0, 19188.0, 35001.0, 62607.0, 107882.0, 163502.0, 196616.0, 170720.0, 115306.0, 68468.0, 38153.0, 21049.0, 11543.0, 6270.0, 3542.0, 1915.0, 1132.0, 657.0, 401.0, 245.0, 150.0, 91.0, 66.0, 55.0, 33.0, 25.0, 18.0, 8.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07476806640625, -0.07240009307861328, -0.07003211975097656, -0.06766414642333984, -0.06529617309570312, -0.0629281997680664, -0.06056022644042969, -0.05819225311279297, -0.05582427978515625, -0.05345630645751953, -0.05108833312988281, -0.048720359802246094, -0.046352386474609375, -0.043984413146972656, -0.04161643981933594, -0.03924846649169922, -0.0368804931640625, -0.03451251983642578, -0.03214454650878906, -0.029776573181152344, -0.027408599853515625, -0.025040626525878906, -0.022672653198242188, -0.02030467987060547, -0.01793670654296875, -0.015568733215332031, -0.013200759887695312, -0.010832786560058594, -0.008464813232421875, -0.006096839904785156, -0.0037288665771484375, -0.0013608932495117188, 0.001007080078125, 0.0033750534057617188, 0.0057430267333984375, 0.008111000061035156, 0.010478973388671875, 0.012846946716308594, 0.015214920043945312, 0.01758289337158203, 0.01995086669921875, 0.02231884002685547, 0.024686813354492188, 0.027054786682128906, 0.029422760009765625, 0.031790733337402344, 0.03415870666503906, 0.03652667999267578, 0.0388946533203125, 0.04126262664794922, 0.04363059997558594, 0.045998573303222656, 0.048366546630859375, 0.050734519958496094, 0.05310249328613281, 0.05547046661376953, 0.05783843994140625, 0.06020641326904297, 0.06257438659667969, 0.0649423599243164, 0.06731033325195312, 0.06967830657958984, 0.07204627990722656, 0.07441425323486328, 0.0767822265625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 4.0, 12.0, 10.0, 13.0, 15.0, 17.0, 16.0, 10.0, 23.0, 28.0, 38.0, 37.0, 33.0, 46.0, 55.0, 54.0, 59.0, 40.0, 50.0, 55.0, 47.0, 44.0, 46.0, 45.0, 30.0, 22.0, 31.0, 17.0, 19.0, 16.0, 9.0, 9.0, 13.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.046875, -0.045644283294677734, -0.04441356658935547, -0.0431828498840332, -0.04195213317871094, -0.04072141647338867, -0.039490699768066406, -0.03825998306274414, -0.037029266357421875, -0.03579854965209961, -0.034567832946777344, -0.03333711624145508, -0.03210639953613281, -0.030875682830810547, -0.02964496612548828, -0.028414249420166016, -0.02718353271484375, -0.025952816009521484, -0.02472209930419922, -0.023491382598876953, -0.022260665893554688, -0.021029949188232422, -0.019799232482910156, -0.01856851577758789, -0.017337799072265625, -0.01610708236694336, -0.014876365661621094, -0.013645648956298828, -0.012414932250976562, -0.011184215545654297, -0.009953498840332031, -0.008722782135009766, -0.0074920654296875, -0.006261348724365234, -0.005030632019042969, -0.003799915313720703, -0.0025691986083984375, -0.0013384819030761719, -0.00010776519775390625, 0.0011229515075683594, 0.002353668212890625, 0.0035843849182128906, 0.004815101623535156, 0.006045818328857422, 0.0072765350341796875, 0.008507251739501953, 0.009737968444824219, 0.010968685150146484, 0.01219940185546875, 0.013430118560791016, 0.014660835266113281, 0.015891551971435547, 0.017122268676757812, 0.018352985382080078, 0.019583702087402344, 0.02081441879272461, 0.022045135498046875, 0.02327585220336914, 0.024506568908691406, 0.025737285614013672, 0.026968002319335938, 0.028198719024658203, 0.02942943572998047, 0.030660152435302734, 0.031890869140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 11.0, 6.0, 8.0, 10.0, 21.0, 28.0, 47.0, 55.0, 70.0, 132.0, 146.0, 213.0, 399.0, 593.0, 1002.0, 1817.0, 3277.0, 6537.0, 12724.0, 24356.0, 46703.0, 87353.0, 153298.0, 217110.0, 202733.0, 132638.0, 74276.0, 39328.0, 20592.0, 10528.0, 5423.0, 3000.0, 1609.0, 925.0, 570.0, 335.0, 227.0, 130.0, 96.0, 62.0, 43.0, 43.0, 21.0, 16.0, 13.0, 7.0, 4.0, 8.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.099853515625, -0.09681415557861328, -0.09377479553222656, -0.09073543548583984, -0.08769607543945312, -0.0846567153930664, -0.08161735534667969, -0.07857799530029297, -0.07553863525390625, -0.07249927520751953, -0.06945991516113281, -0.0664205551147461, -0.06338119506835938, -0.060341835021972656, -0.05730247497558594, -0.05426311492919922, -0.0512237548828125, -0.04818439483642578, -0.04514503479003906, -0.042105674743652344, -0.039066314697265625, -0.036026954650878906, -0.03298759460449219, -0.02994823455810547, -0.02690887451171875, -0.02386951446533203, -0.020830154418945312, -0.017790794372558594, -0.014751434326171875, -0.011712074279785156, -0.008672714233398438, -0.005633354187011719, -0.002593994140625, 0.00044536590576171875, 0.0034847259521484375, 0.006524085998535156, 0.009563446044921875, 0.012602806091308594, 0.015642166137695312, 0.01868152618408203, 0.02172088623046875, 0.02476024627685547, 0.027799606323242188, 0.030838966369628906, 0.033878326416015625, 0.036917686462402344, 0.03995704650878906, 0.04299640655517578, 0.0460357666015625, 0.04907512664794922, 0.05211448669433594, 0.055153846740722656, 0.058193206787109375, 0.061232566833496094, 0.06427192687988281, 0.06731128692626953, 0.07035064697265625, 0.07339000701904297, 0.07642936706542969, 0.0794687271118164, 0.08250808715820312, 0.08554744720458984, 0.08858680725097656, 0.09162616729736328, 0.09466552734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 12.0, 7.0, 12.0, 9.0, 14.0, 14.0, 23.0, 16.0, 17.0, 15.0, 28.0, 30.0, 35.0, 26.0, 40.0, 38.0, 33.0, 34.0, 37.0, 49.0, 35.0, 39.0, 48.0, 34.0, 35.0, 32.0, 34.0, 38.0, 24.0, 31.0, 24.0, 18.0, 18.0, 11.0, 14.0, 14.0, 10.0, 9.0, 13.0, 4.0, 3.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0], "bins": [-0.093017578125, -0.09022998809814453, -0.08744239807128906, -0.0846548080444336, -0.08186721801757812, -0.07907962799072266, -0.07629203796386719, -0.07350444793701172, -0.07071685791015625, -0.06792926788330078, -0.06514167785644531, -0.062354087829589844, -0.059566497802734375, -0.056778907775878906, -0.05399131774902344, -0.05120372772216797, -0.0484161376953125, -0.04562854766845703, -0.04284095764160156, -0.040053367614746094, -0.037265777587890625, -0.034478187561035156, -0.03169059753417969, -0.02890300750732422, -0.02611541748046875, -0.02332782745361328, -0.020540237426757812, -0.017752647399902344, -0.014965057373046875, -0.012177467346191406, -0.009389877319335938, -0.006602287292480469, -0.003814697265625, -0.0010271072387695312, 0.0017604827880859375, 0.004548072814941406, 0.007335662841796875, 0.010123252868652344, 0.012910842895507812, 0.01569843292236328, 0.01848602294921875, 0.02127361297607422, 0.024061203002929688, 0.026848793029785156, 0.029636383056640625, 0.032423973083496094, 0.03521156311035156, 0.03799915313720703, 0.0407867431640625, 0.04357433319091797, 0.04636192321777344, 0.049149513244628906, 0.051937103271484375, 0.054724693298339844, 0.05751228332519531, 0.06029987335205078, 0.06308746337890625, 0.06587505340576172, 0.06866264343261719, 0.07145023345947266, 0.07423782348632812, 0.0770254135131836, 0.07981300354003906, 0.08260059356689453, 0.08538818359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 14.0, 9.0, 6.0, 14.0, 26.0, 34.0, 33.0, 61.0, 69.0, 105.0, 145.0, 193.0, 277.0, 431.0, 617.0, 1034.0, 1761.0, 3183.0, 8269.0, 182342.0, 795908.0, 42398.0, 5075.0, 2474.0, 1429.0, 861.0, 559.0, 355.0, 254.0, 166.0, 110.0, 85.0, 63.0, 49.0, 26.0, 27.0, 19.0, 13.0, 12.0, 13.0, 5.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.211181640625, -0.20484161376953125, -0.1985015869140625, -0.19216156005859375, -0.185821533203125, -0.17948150634765625, -0.1731414794921875, -0.16680145263671875, -0.16046142578125, -0.15412139892578125, -0.1477813720703125, -0.14144134521484375, -0.135101318359375, -0.12876129150390625, -0.1224212646484375, -0.11608123779296875, -0.1097412109375, -0.10340118408203125, -0.0970611572265625, -0.09072113037109375, -0.084381103515625, -0.07804107666015625, -0.0717010498046875, -0.06536102294921875, -0.05902099609375, -0.05268096923828125, -0.0463409423828125, -0.04000091552734375, -0.033660888671875, -0.02732086181640625, -0.0209808349609375, -0.01464080810546875, -0.00830078125, -0.00196075439453125, 0.0043792724609375, 0.01071929931640625, 0.017059326171875, 0.02339935302734375, 0.0297393798828125, 0.03607940673828125, 0.04241943359375, 0.04875946044921875, 0.0550994873046875, 0.06143951416015625, 0.067779541015625, 0.07411956787109375, 0.0804595947265625, 0.08679962158203125, 0.0931396484375, 0.09947967529296875, 0.1058197021484375, 0.11215972900390625, 0.118499755859375, 0.12483978271484375, 0.1311798095703125, 0.13751983642578125, 0.14385986328125, 0.15019989013671875, 0.1565399169921875, 0.16287994384765625, 0.169219970703125, 0.17555999755859375, 0.1819000244140625, 0.18824005126953125, 0.194580078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 23.0, 128.0, 445.0, 320.0, 56.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001342296600341797, -0.00013036932796239853, -0.00012650899589061737, -0.0001226486638188362, -0.00011878833174705505, -0.0001149279996752739, -0.00011106766760349274, -0.00010720733553171158, -0.00010334700345993042, -9.948667138814926e-05, -9.56263393163681e-05, -9.176600724458694e-05, -8.790567517280579e-05, -8.404534310102463e-05, -8.018501102924347e-05, -7.632467895746231e-05, -7.246434688568115e-05, -6.86040148139e-05, -6.474368274211884e-05, -6.088335067033768e-05, -5.702301859855652e-05, -5.316268652677536e-05, -4.93023544549942e-05, -4.544202238321304e-05, -4.1581690311431885e-05, -3.7721358239650726e-05, -3.386102616786957e-05, -3.000069409608841e-05, -2.614036202430725e-05, -2.2280029952526093e-05, -1.8419697880744934e-05, -1.4559365808963776e-05, -1.0699033737182617e-05, -6.838701665401459e-06, -2.9783695936203003e-06, 8.819624781608582e-07, 4.742294549942017e-06, 8.602626621723175e-06, 1.2462958693504333e-05, 1.6323290765285492e-05, 2.018362283706665e-05, 2.404395490884781e-05, 2.7904286980628967e-05, 3.1764619052410126e-05, 3.5624951124191284e-05, 3.948528319597244e-05, 4.33456152677536e-05, 4.720594733953476e-05, 5.106627941131592e-05, 5.4926611483097076e-05, 5.8786943554878235e-05, 6.26472756266594e-05, 6.650760769844055e-05, 7.036793977022171e-05, 7.422827184200287e-05, 7.808860391378403e-05, 8.194893598556519e-05, 8.580926805734634e-05, 8.96696001291275e-05, 9.352993220090866e-05, 9.739026427268982e-05, 0.00010125059634447098, 0.00010511092841625214, 0.0001089712604880333, 0.00011283159255981445]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 5.0, 9.0, 11.0, 25.0, 32.0, 38.0, 58.0, 97.0, 126.0, 229.0, 364.0, 650.0, 1100.0, 2076.0, 4444.0, 9199.0, 19643.0, 41248.0, 83458.0, 148945.0, 208755.0, 209934.0, 150858.0, 85517.0, 42625.0, 20053.0, 9434.0, 4503.0, 2287.0, 1161.0, 659.0, 379.0, 218.0, 129.0, 93.0, 50.0, 45.0, 29.0, 22.0, 14.0, 15.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.034027099609375, -0.033026695251464844, -0.03202629089355469, -0.03102588653564453, -0.030025482177734375, -0.02902507781982422, -0.028024673461914062, -0.027024269104003906, -0.02602386474609375, -0.025023460388183594, -0.024023056030273438, -0.02302265167236328, -0.022022247314453125, -0.02102184295654297, -0.020021438598632812, -0.019021034240722656, -0.0180206298828125, -0.017020225524902344, -0.016019821166992188, -0.015019416809082031, -0.014019012451171875, -0.013018608093261719, -0.012018203735351562, -0.011017799377441406, -0.01001739501953125, -0.009016990661621094, -0.008016586303710938, -0.007016181945800781, -0.006015777587890625, -0.005015373229980469, -0.0040149688720703125, -0.0030145645141601562, -0.00201416015625, -0.0010137557983398438, -1.33514404296875e-05, 0.0009870529174804688, 0.001987457275390625, 0.0029878616333007812, 0.0039882659912109375, 0.004988670349121094, 0.00598907470703125, 0.006989479064941406, 0.007989883422851562, 0.008990287780761719, 0.009990692138671875, 0.010991096496582031, 0.011991500854492188, 0.012991905212402344, 0.0139923095703125, 0.014992713928222656, 0.015993118286132812, 0.01699352264404297, 0.017993927001953125, 0.01899433135986328, 0.019994735717773438, 0.020995140075683594, 0.02199554443359375, 0.022995948791503906, 0.023996353149414062, 0.02499675750732422, 0.025997161865234375, 0.02699756622314453, 0.027997970581054688, 0.028998374938964844, 0.029998779296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 11.0, 9.0, 7.0, 16.0, 22.0, 22.0, 19.0, 21.0, 27.0, 34.0, 40.0, 55.0, 43.0, 54.0, 49.0, 64.0, 51.0, 47.0, 56.0, 53.0, 42.0, 45.0, 38.0, 26.0, 35.0, 24.0, 10.0, 13.0, 18.0, 13.0, 6.0, 8.0, 2.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02764892578125, -0.026840686798095703, -0.026032447814941406, -0.02522420883178711, -0.024415969848632812, -0.023607730865478516, -0.02279949188232422, -0.021991252899169922, -0.021183013916015625, -0.020374774932861328, -0.01956653594970703, -0.018758296966552734, -0.017950057983398438, -0.01714181900024414, -0.016333580017089844, -0.015525341033935547, -0.01471710205078125, -0.013908863067626953, -0.013100624084472656, -0.01229238510131836, -0.011484146118164062, -0.010675907135009766, -0.009867668151855469, -0.009059429168701172, -0.008251190185546875, -0.007442951202392578, -0.006634712219238281, -0.005826473236083984, -0.0050182342529296875, -0.004209995269775391, -0.0034017562866210938, -0.002593517303466797, -0.0017852783203125, -0.0009770393371582031, -0.00016880035400390625, 0.0006394386291503906, 0.0014476776123046875, 0.0022559165954589844, 0.0030641555786132812, 0.003872394561767578, 0.004680633544921875, 0.005488872528076172, 0.006297111511230469, 0.007105350494384766, 0.007913589477539062, 0.00872182846069336, 0.009530067443847656, 0.010338306427001953, 0.01114654541015625, 0.011954784393310547, 0.012763023376464844, 0.01357126235961914, 0.014379501342773438, 0.015187740325927734, 0.01599597930908203, 0.016804218292236328, 0.017612457275390625, 0.018420696258544922, 0.01922893524169922, 0.020037174224853516, 0.020845413208007812, 0.02165365219116211, 0.022461891174316406, 0.023270130157470703, 0.024078369140625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 8.0, 12.0, 10.0, 13.0, 24.0, 38.0, 45.0, 52.0, 60.0, 82.0, 82.0, 74.0, 86.0, 75.0, 68.0, 59.0, 36.0, 41.0, 30.0, 23.0, 17.0, 15.0, 8.0, 3.0, 6.0, 5.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25172969698905945, -0.24300813674926758, -0.2342865765094757, -0.22556501626968384, -0.21684345602989197, -0.2081218957901001, -0.19940032064914703, -0.19067876040935516, -0.1819572001695633, -0.17323563992977142, -0.16451407968997955, -0.15579251945018768, -0.14707094430923462, -0.13834938406944275, -0.12962782382965088, -0.12090626358985901, -0.11218470335006714, -0.10346314311027527, -0.0947415828704834, -0.08602001518011093, -0.07729845494031906, -0.06857689470052719, -0.05985533073544502, -0.051133766770362854, -0.042412206530570984, -0.033690646290779114, -0.024969082325696945, -0.016247520223259926, -0.0075259581208229065, 0.0011956021189689636, 0.009917166084051132, 0.0186387300491333, 0.02736032009124756, 0.03608188033103943, 0.0448034442961216, 0.053525008261203766, 0.062246568500995636, 0.0709681287407875, 0.07968969643115997, 0.08841125667095184, 0.09713281691074371, 0.10585437715053558, 0.11457593739032745, 0.12329750508069992, 0.1320190727710724, 0.14074063301086426, 0.14946219325065613, 0.158183753490448, 0.16690531373023987, 0.17562687397003174, 0.1843484342098236, 0.19306999444961548, 0.20179155468940735, 0.21051311492919922, 0.21923469007015228, 0.22795625030994415, 0.23667781054973602, 0.2453993707895279, 0.25412094593048096, 0.2628425061702728, 0.2715640664100647, 0.28028562664985657, 0.28900718688964844, 0.2977287471294403, 0.3064503073692322]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 6.0, 8.0, 17.0, 16.0, 34.0, 28.0, 31.0, 37.0, 45.0, 46.0, 51.0, 58.0, 44.0, 53.0, 60.0, 59.0, 48.0, 46.0, 40.0, 46.0, 31.0, 39.0, 22.0, 17.0, 19.0, 23.0, 12.0, 16.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.43676120042800903, -0.4260993003845215, -0.41543740034103394, -0.4047755002975464, -0.39411357045173645, -0.3834516704082489, -0.37278977036476135, -0.3621278703212738, -0.35146597027778625, -0.3408040702342987, -0.33014217019081116, -0.3194802403450012, -0.30881834030151367, -0.2981564402580261, -0.2874945402145386, -0.276832640171051, -0.2661707401275635, -0.2555088400840759, -0.24484692513942719, -0.23418502509593964, -0.2235231250524521, -0.21286121010780334, -0.2021993100643158, -0.19153741002082825, -0.1808754801750183, -0.17021358013153076, -0.15955166518688202, -0.14888976514339447, -0.13822786509990692, -0.12756595015525818, -0.11690405011177063, -0.10624215006828308, -0.09558025002479553, -0.08491834253072739, -0.07425644248723984, -0.06359453499317169, -0.052932631224393845, -0.042270727455616, -0.03160881996154785, -0.020946919918060303, -0.010285012423992157, 0.0003768922761082649, 0.011038796976208687, 0.021700702607631683, 0.03236260637640953, 0.04302451014518738, 0.053686417639255524, 0.06434831768274307, 0.07501022517681122, 0.08567213267087936, 0.09633403271436691, 0.10699594020843506, 0.11765784025192261, 0.12831974029541016, 0.1389816552400589, 0.14964355528354645, 0.1603054702281952, 0.17096737027168274, 0.18162928521633148, 0.19229118525981903, 0.20295308530330658, 0.21361500024795532, 0.22427690029144287, 0.23493880033493042, 0.24560070037841797]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 7.0, 8.0, 15.0, 16.0, 23.0, 29.0, 48.0, 55.0, 108.0, 185.0, 374.0, 843.0, 1986.0, 6021.0, 22634.0, 114769.0, 1026546.0, 2518813.0, 423278.0, 59209.0, 13124.0, 3712.0, 1254.0, 550.0, 243.0, 125.0, 81.0, 60.0, 36.0, 25.0, 16.0, 15.0, 14.0, 11.0, 5.0, 10.0, 4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1138916015625, -0.11057186126708984, -0.10725212097167969, -0.10393238067626953, -0.10061264038085938, -0.09729290008544922, -0.09397315979003906, -0.0906534194946289, -0.08733367919921875, -0.0840139389038086, -0.08069419860839844, -0.07737445831298828, -0.07405471801757812, -0.07073497772216797, -0.06741523742675781, -0.06409549713134766, -0.0607757568359375, -0.057456016540527344, -0.05413627624511719, -0.05081653594970703, -0.047496795654296875, -0.04417705535888672, -0.04085731506347656, -0.037537574768066406, -0.03421783447265625, -0.030898094177246094, -0.027578353881835938, -0.02425861358642578, -0.020938873291015625, -0.01761913299560547, -0.014299392700195312, -0.010979652404785156, -0.007659912109375, -0.004340171813964844, -0.0010204315185546875, 0.0022993087768554688, 0.005619049072265625, 0.008938789367675781, 0.012258529663085938, 0.015578269958496094, 0.01889801025390625, 0.022217750549316406, 0.025537490844726562, 0.02885723114013672, 0.032176971435546875, 0.03549671173095703, 0.03881645202636719, 0.042136192321777344, 0.0454559326171875, 0.048775672912597656, 0.05209541320800781, 0.05541515350341797, 0.058734893798828125, 0.06205463409423828, 0.06537437438964844, 0.0686941146850586, 0.07201385498046875, 0.0753335952758789, 0.07865333557128906, 0.08197307586669922, 0.08529281616210938, 0.08861255645751953, 0.09193229675292969, 0.09525203704833984, 0.09857177734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 1.0, 5.0, 6.0, 6.0, 10.0, 6.0, 15.0, 19.0, 15.0, 28.0, 22.0, 24.0, 34.0, 35.0, 40.0, 53.0, 47.0, 46.0, 52.0, 45.0, 52.0, 56.0, 42.0, 42.0, 49.0, 45.0, 30.0, 30.0, 26.0, 17.0, 20.0, 16.0, 18.0, 11.0, 10.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.04681396484375, -0.045493125915527344, -0.04417228698730469, -0.04285144805908203, -0.041530609130859375, -0.04020977020263672, -0.03888893127441406, -0.037568092346191406, -0.03624725341796875, -0.034926414489746094, -0.03360557556152344, -0.03228473663330078, -0.030963897705078125, -0.02964305877685547, -0.028322219848632812, -0.027001380920410156, -0.0256805419921875, -0.024359703063964844, -0.023038864135742188, -0.02171802520751953, -0.020397186279296875, -0.01907634735107422, -0.017755508422851562, -0.016434669494628906, -0.01511383056640625, -0.013792991638183594, -0.012472152709960938, -0.011151313781738281, -0.009830474853515625, -0.008509635925292969, -0.0071887969970703125, -0.005867958068847656, -0.004547119140625, -0.0032262802124023438, -0.0019054412841796875, -0.0005846023559570312, 0.000736236572265625, 0.0020570755004882812, 0.0033779144287109375, 0.004698753356933594, 0.00601959228515625, 0.007340431213378906, 0.008661270141601562, 0.009982109069824219, 0.011302947998046875, 0.012623786926269531, 0.013944625854492188, 0.015265464782714844, 0.0165863037109375, 0.017907142639160156, 0.019227981567382812, 0.02054882049560547, 0.021869659423828125, 0.02319049835205078, 0.024511337280273438, 0.025832176208496094, 0.02715301513671875, 0.028473854064941406, 0.029794692993164062, 0.03111553192138672, 0.032436370849609375, 0.03375720977783203, 0.03507804870605469, 0.036398887634277344, 0.0377197265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 10.0, 14.0, 17.0, 44.0, 52.0, 106.0, 175.0, 329.0, 742.0, 2094.0, 7148.0, 31566.0, 160958.0, 894114.0, 2233615.0, 702367.0, 126765.0, 25190.0, 5865.0, 1771.0, 673.0, 294.0, 155.0, 79.0, 48.0, 30.0, 19.0, 11.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1368408203125, -0.13327980041503906, -0.12971878051757812, -0.1261577606201172, -0.12259674072265625, -0.11903572082519531, -0.11547470092773438, -0.11191368103027344, -0.1083526611328125, -0.10479164123535156, -0.10123062133789062, -0.09766960144042969, -0.09410858154296875, -0.09054756164550781, -0.08698654174804688, -0.08342552185058594, -0.079864501953125, -0.07630348205566406, -0.07274246215820312, -0.06918144226074219, -0.06562042236328125, -0.06205940246582031, -0.058498382568359375, -0.05493736267089844, -0.0513763427734375, -0.04781532287597656, -0.044254302978515625, -0.04069328308105469, -0.03713226318359375, -0.03357124328613281, -0.030010223388671875, -0.026449203491210938, -0.02288818359375, -0.019327163696289062, -0.015766143798828125, -0.012205123901367188, -0.00864410400390625, -0.0050830841064453125, -0.001522064208984375, 0.0020389556884765625, 0.0055999755859375, 0.009160995483398438, 0.012722015380859375, 0.016283035278320312, 0.01984405517578125, 0.023405075073242188, 0.026966094970703125, 0.030527114868164062, 0.034088134765625, 0.03764915466308594, 0.041210174560546875, 0.04477119445800781, 0.04833221435546875, 0.05189323425292969, 0.055454254150390625, 0.05901527404785156, 0.0625762939453125, 0.06613731384277344, 0.06969833374023438, 0.07325935363769531, 0.07682037353515625, 0.08038139343261719, 0.08394241333007812, 0.08750343322753906, 0.091064453125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 1.0, 6.0, 5.0, 17.0, 17.0, 27.0, 34.0, 50.0, 62.0, 73.0, 114.0, 179.0, 223.0, 295.0, 360.0, 476.0, 497.0, 411.0, 335.0, 220.0, 186.0, 121.0, 80.0, 75.0, 53.0, 39.0, 42.0, 28.0, 16.0, 12.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10357666015625, -0.1009521484375, -0.09832763671875, -0.095703125, -0.09307861328125, -0.0904541015625, -0.08782958984375, -0.085205078125, -0.08258056640625, -0.0799560546875, -0.07733154296875, -0.07470703125, -0.07208251953125, -0.0694580078125, -0.06683349609375, -0.064208984375, -0.06158447265625, -0.0589599609375, -0.05633544921875, -0.0537109375, -0.05108642578125, -0.0484619140625, -0.04583740234375, -0.043212890625, -0.04058837890625, -0.0379638671875, -0.03533935546875, -0.03271484375, -0.03009033203125, -0.0274658203125, -0.02484130859375, -0.022216796875, -0.01959228515625, -0.0169677734375, -0.01434326171875, -0.01171875, -0.00909423828125, -0.0064697265625, -0.00384521484375, -0.001220703125, 0.00140380859375, 0.0040283203125, 0.00665283203125, 0.00927734375, 0.01190185546875, 0.0145263671875, 0.01715087890625, 0.019775390625, 0.02239990234375, 0.0250244140625, 0.02764892578125, 0.0302734375, 0.03289794921875, 0.0355224609375, 0.03814697265625, 0.040771484375, 0.04339599609375, 0.0460205078125, 0.04864501953125, 0.05126953125, 0.05389404296875, 0.0565185546875, 0.05914306640625, 0.061767578125, 0.06439208984375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 14.0, 20.0, 44.0, 68.0, 78.0, 115.0, 111.0, 105.0, 115.0, 93.0, 67.0, 50.0, 45.0, 27.0, 18.0, 12.0, 3.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31187447905540466, -0.2980983853340149, -0.2843222916126251, -0.27054619789123535, -0.25677013397216797, -0.2429940402507782, -0.22921794652938843, -0.21544185280799866, -0.20166577398777008, -0.1878896802663803, -0.17411360144615173, -0.16033750772476196, -0.1465614140033722, -0.13278533518314362, -0.11900924146175385, -0.10523315519094467, -0.0914570689201355, -0.07768098264932632, -0.06390489637851715, -0.05012880265712738, -0.03635271638631821, -0.022576630115509033, -0.008800536394119263, 0.004975549876689911, 0.018751636147499084, 0.03252772241830826, 0.04630381241440773, 0.0600799024105072, 0.07385598868131638, 0.08763207495212555, 0.10140816867351532, 0.1151842549443245, 0.12896037101745605, 0.14273646473884583, 0.1565125435590744, 0.17028863728046417, 0.18406471610069275, 0.19784080982208252, 0.2116169035434723, 0.22539299726486206, 0.23916907608509064, 0.2529451549053192, 0.266721248626709, 0.28049734234809875, 0.2942734360694885, 0.3080494999885559, 0.32182562351226807, 0.33560168743133545, 0.3493777811527252, 0.363153874874115, 0.37692996859550476, 0.39070606231689453, 0.4044821262359619, 0.4182582199573517, 0.43203431367874146, 0.4458104074001312, 0.459586501121521, 0.47336259484291077, 0.48713868856430054, 0.5009147524833679, 0.5146908760070801, 0.5284669399261475, 0.5422430038452148, 0.556019127368927, 0.5697951912879944]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 10.0, 7.0, 9.0, 11.0, 12.0, 16.0, 21.0, 19.0, 26.0, 26.0, 17.0, 29.0, 39.0, 33.0, 31.0, 42.0, 35.0, 33.0, 40.0, 44.0, 34.0, 39.0, 44.0, 41.0, 39.0, 32.0, 34.0, 42.0, 27.0, 32.0, 19.0, 17.0, 23.0, 13.0, 16.0, 15.0, 14.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.24989545345306396, -0.24242407083511353, -0.23495268821716309, -0.22748130559921265, -0.2200099378824234, -0.21253855526447296, -0.20506717264652252, -0.19759579002857208, -0.19012442231178284, -0.1826530396938324, -0.17518165707588196, -0.16771027445793152, -0.16023890674114227, -0.15276752412319183, -0.1452961415052414, -0.13782475888729095, -0.13035337626934052, -0.12288199365139008, -0.11541061848402023, -0.1079392358660698, -0.10046786069869995, -0.09299647808074951, -0.08552509546279907, -0.07805371284484863, -0.07058233767747879, -0.06311095505952835, -0.05563957989215851, -0.04816819727420807, -0.04069681838154793, -0.03322543948888779, -0.025754056870937347, -0.018282677978277206, -0.010811299085617065, -0.00333991926163435, 0.004131460562348366, 0.011602841317653656, 0.019074220210313797, 0.026545599102973938, 0.03401698172092438, 0.04148836061358452, 0.04895973950624466, 0.0564311183989048, 0.06390249729156494, 0.07137387990951538, 0.07884526252746582, 0.08631663769483566, 0.0937880203127861, 0.10125939548015594, 0.10873077809810638, 0.11620216071605682, 0.12367353588342667, 0.1311449110507965, 0.13861629366874695, 0.1460876762866974, 0.15355905890464783, 0.16103044152259827, 0.1685018241405487, 0.17597320675849915, 0.18344458937644958, 0.19091597199440002, 0.19838733971118927, 0.2058587223291397, 0.21333010494709015, 0.2208014875650406, 0.22827285528182983]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 8.0, 10.0, 22.0, 35.0, 45.0, 68.0, 91.0, 154.0, 253.0, 438.0, 732.0, 1278.0, 2189.0, 3805.0, 6846.0, 12401.0, 22156.0, 41314.0, 77375.0, 133179.0, 193843.0, 203862.0, 150526.0, 89909.0, 49080.0, 25884.0, 14427.0, 8021.0, 4464.0, 2567.0, 1417.0, 837.0, 515.0, 290.0, 174.0, 114.0, 73.0, 46.0, 33.0, 26.0, 11.0, 18.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.08837890625, -0.08571147918701172, -0.08304405212402344, -0.08037662506103516, -0.07770919799804688, -0.0750417709350586, -0.07237434387207031, -0.06970691680908203, -0.06703948974609375, -0.06437206268310547, -0.06170463562011719, -0.059037208557128906, -0.056369781494140625, -0.053702354431152344, -0.05103492736816406, -0.04836750030517578, -0.0457000732421875, -0.04303264617919922, -0.04036521911621094, -0.037697792053222656, -0.035030364990234375, -0.032362937927246094, -0.029695510864257812, -0.02702808380126953, -0.02436065673828125, -0.02169322967529297, -0.019025802612304688, -0.016358375549316406, -0.013690948486328125, -0.011023521423339844, -0.008356094360351562, -0.005688667297363281, -0.003021240234375, -0.00035381317138671875, 0.0023136138916015625, 0.004981040954589844, 0.007648468017578125, 0.010315895080566406, 0.012983322143554688, 0.01565074920654297, 0.01831817626953125, 0.02098560333251953, 0.023653030395507812, 0.026320457458496094, 0.028987884521484375, 0.031655311584472656, 0.03432273864746094, 0.03699016571044922, 0.0396575927734375, 0.04232501983642578, 0.04499244689941406, 0.047659873962402344, 0.050327301025390625, 0.052994728088378906, 0.05566215515136719, 0.05832958221435547, 0.06099700927734375, 0.06366443634033203, 0.06633186340332031, 0.0689992904663086, 0.07166671752929688, 0.07433414459228516, 0.07700157165527344, 0.07966899871826172, 0.08233642578125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 4.0, 4.0, 7.0, 13.0, 14.0, 18.0, 20.0, 21.0, 34.0, 26.0, 24.0, 37.0, 56.0, 48.0, 36.0, 70.0, 51.0, 37.0, 58.0, 52.0, 49.0, 37.0, 37.0, 38.0, 29.0, 28.0, 31.0, 15.0, 20.0, 14.0, 11.0, 10.0, 13.0, 7.0, 4.0, 1.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043731689453125, -0.04251241683959961, -0.04129314422607422, -0.04007387161254883, -0.03885459899902344, -0.03763532638549805, -0.036416053771972656, -0.035196781158447266, -0.033977508544921875, -0.032758235931396484, -0.031538963317871094, -0.030319690704345703, -0.029100418090820312, -0.027881145477294922, -0.02666187286376953, -0.02544260025024414, -0.02422332763671875, -0.02300405502319336, -0.02178478240966797, -0.020565509796142578, -0.019346237182617188, -0.018126964569091797, -0.016907691955566406, -0.015688419342041016, -0.014469146728515625, -0.013249874114990234, -0.012030601501464844, -0.010811328887939453, -0.009592056274414062, -0.008372783660888672, -0.007153511047363281, -0.005934238433837891, -0.0047149658203125, -0.0034956932067871094, -0.0022764205932617188, -0.0010571479797363281, 0.0001621246337890625, 0.0013813972473144531, 0.0026006698608398438, 0.0038199424743652344, 0.005039215087890625, 0.006258487701416016, 0.007477760314941406, 0.008697032928466797, 0.009916305541992188, 0.011135578155517578, 0.012354850769042969, 0.01357412338256836, 0.01479339599609375, 0.01601266860961914, 0.01723194122314453, 0.018451213836669922, 0.019670486450195312, 0.020889759063720703, 0.022109031677246094, 0.023328304290771484, 0.024547576904296875, 0.025766849517822266, 0.026986122131347656, 0.028205394744873047, 0.029424667358398438, 0.030643939971923828, 0.03186321258544922, 0.03308248519897461, 0.0343017578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 9.0, 14.0, 11.0, 15.0, 25.0, 35.0, 42.0, 59.0, 92.0, 118.0, 180.0, 236.0, 384.0, 570.0, 918.0, 1758.0, 3578.0, 8263.0, 19130.0, 45782.0, 101179.0, 195412.0, 268607.0, 205057.0, 109275.0, 49423.0, 20917.0, 8786.0, 3966.0, 1856.0, 1009.0, 576.0, 395.0, 242.0, 184.0, 129.0, 110.0, 46.0, 59.0, 32.0, 23.0, 14.0, 12.0, 9.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10272216796875, -0.09935951232910156, -0.09599685668945312, -0.09263420104980469, -0.08927154541015625, -0.08590888977050781, -0.08254623413085938, -0.07918357849121094, -0.0758209228515625, -0.07245826721191406, -0.06909561157226562, -0.06573295593261719, -0.06237030029296875, -0.05900764465332031, -0.055644989013671875, -0.05228233337402344, -0.048919677734375, -0.04555702209472656, -0.042194366455078125, -0.03883171081542969, -0.03546905517578125, -0.03210639953613281, -0.028743743896484375, -0.025381088256835938, -0.0220184326171875, -0.018655776977539062, -0.015293121337890625, -0.011930465698242188, -0.00856781005859375, -0.0052051544189453125, -0.001842498779296875, 0.0015201568603515625, 0.0048828125, 0.008245468139648438, 0.011608123779296875, 0.014970779418945312, 0.01833343505859375, 0.021696090698242188, 0.025058746337890625, 0.028421401977539062, 0.0317840576171875, 0.03514671325683594, 0.038509368896484375, 0.04187202453613281, 0.04523468017578125, 0.04859733581542969, 0.051959991455078125, 0.05532264709472656, 0.058685302734375, 0.06204795837402344, 0.06541061401367188, 0.06877326965332031, 0.07213592529296875, 0.07549858093261719, 0.07886123657226562, 0.08222389221191406, 0.0855865478515625, 0.08894920349121094, 0.09231185913085938, 0.09567451477050781, 0.09903717041015625, 0.10239982604980469, 0.10576248168945312, 0.10912513732910156, 0.11248779296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 13.0, 13.0, 6.0, 12.0, 7.0, 15.0, 15.0, 24.0, 15.0, 23.0, 25.0, 34.0, 33.0, 32.0, 39.0, 37.0, 38.0, 35.0, 37.0, 37.0, 35.0, 50.0, 38.0, 44.0, 38.0, 26.0, 33.0, 31.0, 24.0, 29.0, 26.0, 13.0, 9.0, 20.0, 12.0, 14.0, 13.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.09173583984375, -0.08884143829345703, -0.08594703674316406, -0.0830526351928711, -0.08015823364257812, -0.07726383209228516, -0.07436943054199219, -0.07147502899169922, -0.06858062744140625, -0.06568622589111328, -0.06279182434082031, -0.059897422790527344, -0.057003021240234375, -0.054108619689941406, -0.05121421813964844, -0.04831981658935547, -0.0454254150390625, -0.04253101348876953, -0.03963661193847656, -0.036742210388183594, -0.033847808837890625, -0.030953407287597656, -0.028059005737304688, -0.02516460418701172, -0.02227020263671875, -0.01937580108642578, -0.016481399536132812, -0.013586997985839844, -0.010692596435546875, -0.007798194885253906, -0.0049037933349609375, -0.0020093917846679688, 0.000885009765625, 0.0037794113159179688, 0.0066738128662109375, 0.009568214416503906, 0.012462615966796875, 0.015357017517089844, 0.018251419067382812, 0.02114582061767578, 0.02404022216796875, 0.02693462371826172, 0.029829025268554688, 0.032723426818847656, 0.035617828369140625, 0.038512229919433594, 0.04140663146972656, 0.04430103302001953, 0.0471954345703125, 0.05008983612060547, 0.05298423767089844, 0.055878639221191406, 0.058773040771484375, 0.061667442321777344, 0.06456184387207031, 0.06745624542236328, 0.07035064697265625, 0.07324504852294922, 0.07613945007324219, 0.07903385162353516, 0.08192825317382812, 0.0848226547241211, 0.08771705627441406, 0.09061145782470703, 0.093505859375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 12.0, 15.0, 24.0, 45.0, 68.0, 127.0, 228.0, 394.0, 738.0, 1460.0, 3302.0, 8187.0, 22199.0, 63755.0, 174713.0, 327843.0, 268751.0, 113107.0, 39102.0, 14210.0, 5545.0, 2378.0, 1070.0, 569.0, 279.0, 150.0, 100.0, 64.0, 36.0, 26.0, 18.0, 7.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04669189453125, -0.04538679122924805, -0.044081687927246094, -0.04277658462524414, -0.04147148132324219, -0.040166378021240234, -0.03886127471923828, -0.03755617141723633, -0.036251068115234375, -0.03494596481323242, -0.03364086151123047, -0.032335758209228516, -0.031030654907226562, -0.02972555160522461, -0.028420448303222656, -0.027115345001220703, -0.02581024169921875, -0.024505138397216797, -0.023200035095214844, -0.02189493179321289, -0.020589828491210938, -0.019284725189208984, -0.01797962188720703, -0.016674518585205078, -0.015369415283203125, -0.014064311981201172, -0.012759208679199219, -0.011454105377197266, -0.010149002075195312, -0.00884389877319336, -0.007538795471191406, -0.006233692169189453, -0.0049285888671875, -0.003623485565185547, -0.0023183822631835938, -0.0010132789611816406, 0.0002918243408203125, 0.0015969276428222656, 0.0029020309448242188, 0.004207134246826172, 0.005512237548828125, 0.006817340850830078, 0.008122444152832031, 0.009427547454833984, 0.010732650756835938, 0.01203775405883789, 0.013342857360839844, 0.014647960662841797, 0.01595306396484375, 0.017258167266845703, 0.018563270568847656, 0.01986837387084961, 0.021173477172851562, 0.022478580474853516, 0.02378368377685547, 0.025088787078857422, 0.026393890380859375, 0.027698993682861328, 0.02900409698486328, 0.030309200286865234, 0.03161430358886719, 0.03291940689086914, 0.034224510192871094, 0.03552961349487305, 0.036834716796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 7.0, 3.0, 5.0, 8.0, 7.0, 13.0, 13.0, 13.0, 12.0, 23.0, 20.0, 30.0, 24.0, 34.0, 41.0, 43.0, 60.0, 44.0, 62.0, 61.0, 65.0, 48.0, 40.0, 60.0, 36.0, 45.0, 31.0, 27.0, 21.0, 16.0, 17.0, 16.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1801719665527344e-05, -1.1411495506763458e-05, -1.1021271347999573e-05, -1.0631047189235687e-05, -1.0240823030471802e-05, -9.850598871707916e-06, -9.46037471294403e-06, -9.070150554180145e-06, -8.67992639541626e-06, -8.289702236652374e-06, -7.899478077888489e-06, -7.509253919124603e-06, -7.119029760360718e-06, -6.728805601596832e-06, -6.338581442832947e-06, -5.948357284069061e-06, -5.558133125305176e-06, -5.16790896654129e-06, -4.777684807777405e-06, -4.387460649013519e-06, -3.997236490249634e-06, -3.6070123314857483e-06, -3.216788172721863e-06, -2.8265640139579773e-06, -2.436339855194092e-06, -2.0461156964302063e-06, -1.6558915376663208e-06, -1.2656673789024353e-06, -8.754432201385498e-07, -4.852190613746643e-07, -9.499490261077881e-08, 2.952292561531067e-07, 6.854534149169922e-07, 1.0756775736808777e-06, 1.4659017324447632e-06, 1.8561258912086487e-06, 2.246350049972534e-06, 2.6365742087364197e-06, 3.026798367500305e-06, 3.4170225262641907e-06, 3.807246685028076e-06, 4.197470843791962e-06, 4.587695002555847e-06, 4.977919161319733e-06, 5.368143320083618e-06, 5.758367478847504e-06, 6.148591637611389e-06, 6.538815796375275e-06, 6.92903995513916e-06, 7.319264113903046e-06, 7.709488272666931e-06, 8.099712431430817e-06, 8.489936590194702e-06, 8.880160748958588e-06, 9.270384907722473e-06, 9.660609066486359e-06, 1.0050833225250244e-05, 1.044105738401413e-05, 1.0831281542778015e-05, 1.12215057015419e-05, 1.1611729860305786e-05, 1.2001954019069672e-05, 1.2392178177833557e-05, 1.2782402336597443e-05, 1.3172626495361328e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 7.0, 5.0, 7.0, 9.0, 18.0, 21.0, 33.0, 58.0, 58.0, 79.0, 126.0, 231.0, 372.0, 769.0, 1359.0, 2972.0, 7128.0, 17455.0, 47734.0, 132935.0, 293345.0, 308245.0, 148234.0, 53425.0, 19585.0, 7728.0, 3262.0, 1461.0, 755.0, 408.0, 266.0, 165.0, 102.0, 59.0, 53.0, 26.0, 17.0, 20.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.04840087890625, -0.04716157913208008, -0.045922279357910156, -0.044682979583740234, -0.04344367980957031, -0.04220438003540039, -0.04096508026123047, -0.03972578048706055, -0.038486480712890625, -0.0372471809387207, -0.03600788116455078, -0.03476858139038086, -0.03352928161621094, -0.032289981842041016, -0.031050682067871094, -0.029811382293701172, -0.02857208251953125, -0.027332782745361328, -0.026093482971191406, -0.024854183197021484, -0.023614883422851562, -0.02237558364868164, -0.02113628387451172, -0.019896984100341797, -0.018657684326171875, -0.017418384552001953, -0.01617908477783203, -0.01493978500366211, -0.013700485229492188, -0.012461185455322266, -0.011221885681152344, -0.009982585906982422, -0.0087432861328125, -0.007503986358642578, -0.006264686584472656, -0.005025386810302734, -0.0037860870361328125, -0.0025467872619628906, -0.0013074874877929688, -6.818771362304688e-05, 0.001171112060546875, 0.002410411834716797, 0.0036497116088867188, 0.004889011383056641, 0.0061283111572265625, 0.007367610931396484, 0.008606910705566406, 0.009846210479736328, 0.01108551025390625, 0.012324810028076172, 0.013564109802246094, 0.014803409576416016, 0.016042709350585938, 0.01728200912475586, 0.01852130889892578, 0.019760608673095703, 0.020999908447265625, 0.022239208221435547, 0.02347850799560547, 0.02471780776977539, 0.025957107543945312, 0.027196407318115234, 0.028435707092285156, 0.029675006866455078, 0.030914306640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 7.0, 8.0, 9.0, 8.0, 12.0, 20.0, 31.0, 28.0, 27.0, 32.0, 39.0, 47.0, 47.0, 45.0, 55.0, 61.0, 58.0, 62.0, 57.0, 53.0, 40.0, 45.0, 41.0, 23.0, 19.0, 23.0, 29.0, 14.0, 8.0, 11.0, 8.0, 7.0, 2.0, 3.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0205535888671875, -0.019805431365966797, -0.019057273864746094, -0.01830911636352539, -0.017560958862304688, -0.016812801361083984, -0.01606464385986328, -0.015316486358642578, -0.014568328857421875, -0.013820171356201172, -0.013072013854980469, -0.012323856353759766, -0.011575698852539062, -0.01082754135131836, -0.010079383850097656, -0.009331226348876953, -0.00858306884765625, -0.007834911346435547, -0.007086753845214844, -0.006338596343994141, -0.0055904388427734375, -0.004842281341552734, -0.004094123840332031, -0.003345966339111328, -0.002597808837890625, -0.0018496513366699219, -0.0011014938354492188, -0.0003533363342285156, 0.0003948211669921875, 0.0011429786682128906, 0.0018911361694335938, 0.002639293670654297, 0.003387451171875, 0.004135608673095703, 0.004883766174316406, 0.005631923675537109, 0.0063800811767578125, 0.007128238677978516, 0.007876396179199219, 0.008624553680419922, 0.009372711181640625, 0.010120868682861328, 0.010869026184082031, 0.011617183685302734, 0.012365341186523438, 0.01311349868774414, 0.013861656188964844, 0.014609813690185547, 0.01535797119140625, 0.016106128692626953, 0.016854286193847656, 0.01760244369506836, 0.018350601196289062, 0.019098758697509766, 0.01984691619873047, 0.020595073699951172, 0.021343231201171875, 0.022091388702392578, 0.02283954620361328, 0.023587703704833984, 0.024335861206054688, 0.02508401870727539, 0.025832176208496094, 0.026580333709716797, 0.0273284912109375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 9.0, 24.0, 50.0, 101.0, 157.0, 196.0, 185.0, 128.0, 75.0, 40.0, 17.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8653367161750793, -0.8430077433586121, -0.8206787109375, -0.7983497381210327, -0.7760207653045654, -0.7536917924880981, -0.7313628196716309, -0.7090337872505188, -0.6867048144340515, -0.6643758416175842, -0.6420468091964722, -0.6197178363800049, -0.5973888635635376, -0.5750598907470703, -0.552730917930603, -0.530401885509491, -0.5080729126930237, -0.4857439398765564, -0.4634149372577667, -0.44108593463897705, -0.41875696182250977, -0.3964279890060425, -0.3740989863872528, -0.35176998376846313, -0.32944101095199585, -0.30711203813552856, -0.2847830355167389, -0.2624540328979492, -0.24012506008148193, -0.21779607236385345, -0.19546708464622498, -0.1731380969285965, -0.1508091688156128, -0.12848018109798431, -0.10615119338035583, -0.08382220566272736, -0.06149321794509888, -0.0391642302274704, -0.01683524250984192, 0.00549374520778656, 0.02782273292541504, 0.05015172064304352, 0.072480708360672, 0.09480969607830048, 0.11713868379592896, 0.13946767151355743, 0.1617966592311859, 0.1841256469488144, 0.20645463466644287, 0.22878362238407135, 0.25111261010169983, 0.2734416127204895, 0.2957705855369568, 0.3180995583534241, 0.34042856097221375, 0.3627575635910034, 0.3850865364074707, 0.407415509223938, 0.42974451184272766, 0.45207351446151733, 0.4744024872779846, 0.4967314600944519, 0.519060492515564, 0.5413894653320312, 0.5637184381484985]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 9.0, 9.0, 11.0, 11.0, 18.0, 16.0, 25.0, 24.0, 25.0, 23.0, 37.0, 45.0, 40.0, 33.0, 34.0, 41.0, 56.0, 46.0, 45.0, 43.0, 46.0, 41.0, 43.0, 28.0, 34.0, 24.0, 21.0, 30.0, 23.0, 16.0, 10.0, 13.0, 16.0, 20.0, 9.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.33001846075057983, -0.3204707205295563, -0.3109229803085327, -0.30137524008750916, -0.2918274998664856, -0.28227975964546204, -0.2727320194244385, -0.26318424940109253, -0.25363653898239136, -0.2440887987613678, -0.23454105854034424, -0.22499331831932068, -0.21544557809829712, -0.20589783787727356, -0.1963500827550888, -0.18680234253406525, -0.1772545874118805, -0.16770684719085693, -0.15815910696983337, -0.14861136674880981, -0.13906362652778625, -0.1295158863067627, -0.11996813118457794, -0.11042039096355438, -0.10087265074253082, -0.09132491052150726, -0.0817771703004837, -0.07222942262887955, -0.06268168240785599, -0.05313394218683243, -0.04358619824051857, -0.03403845429420471, -0.024490714073181152, -0.014942971989512444, -0.005395229905843735, 0.004152512177824974, 0.013700254261493683, 0.023247994482517242, 0.0327957384288311, 0.04234348237514496, 0.05189122259616852, 0.06143896281719208, 0.07098670303821564, 0.0805344507098198, 0.09008219093084335, 0.09962993115186691, 0.10917767882347107, 0.11872541904449463, 0.1282731592655182, 0.13782089948654175, 0.1473686397075653, 0.15691637992858887, 0.16646412014961243, 0.176011860370636, 0.18555961549282074, 0.1951073557138443, 0.20465509593486786, 0.21420283615589142, 0.22375057637691498, 0.23329831659793854, 0.2428460717201233, 0.25239381194114685, 0.2619415521621704, 0.27148929238319397, 0.28103703260421753]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 11.0, 11.0, 11.0, 14.0, 17.0, 19.0, 35.0, 48.0, 78.0, 133.0, 150.0, 253.0, 383.0, 569.0, 994.0, 1682.0, 3007.0, 5685.0, 11397.0, 24499.0, 56268.0, 147742.0, 492049.0, 1398125.0, 1349762.0, 456210.0, 142611.0, 54724.0, 24038.0, 11148.0, 5567.0, 2942.0, 1683.0, 943.0, 515.0, 339.0, 225.0, 153.0, 84.0, 49.0, 40.0, 17.0, 14.0, 12.0, 5.0, 5.0, 7.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.06341552734375, -0.06170034408569336, -0.05998516082763672, -0.05826997756958008, -0.05655479431152344, -0.0548396110534668, -0.053124427795410156, -0.051409244537353516, -0.049694061279296875, -0.047978878021240234, -0.046263694763183594, -0.04454851150512695, -0.04283332824707031, -0.04111814498901367, -0.03940296173095703, -0.03768777847290039, -0.03597259521484375, -0.03425741195678711, -0.03254222869873047, -0.030827045440673828, -0.029111862182617188, -0.027396678924560547, -0.025681495666503906, -0.023966312408447266, -0.022251129150390625, -0.020535945892333984, -0.018820762634277344, -0.017105579376220703, -0.015390396118164062, -0.013675212860107422, -0.011960029602050781, -0.01024484634399414, -0.0085296630859375, -0.006814479827880859, -0.005099296569824219, -0.003384113311767578, -0.0016689300537109375, 4.6253204345703125e-05, 0.0017614364624023438, 0.0034766197204589844, 0.005191802978515625, 0.006906986236572266, 0.008622169494628906, 0.010337352752685547, 0.012052536010742188, 0.013767719268798828, 0.015482902526855469, 0.01719808578491211, 0.01891326904296875, 0.02062845230102539, 0.02234363555908203, 0.024058818817138672, 0.025774002075195312, 0.027489185333251953, 0.029204368591308594, 0.030919551849365234, 0.032634735107421875, 0.034349918365478516, 0.036065101623535156, 0.0377802848815918, 0.03949546813964844, 0.04121065139770508, 0.04292583465576172, 0.04464101791381836, 0.046356201171875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 7.0, 7.0, 7.0, 16.0, 9.0, 15.0, 18.0, 32.0, 30.0, 36.0, 35.0, 49.0, 41.0, 57.0, 44.0, 56.0, 49.0, 58.0, 39.0, 50.0, 49.0, 45.0, 38.0, 29.0, 38.0, 29.0, 19.0, 16.0, 12.0, 10.0, 14.0, 10.0, 12.0, 11.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.05072021484375, -0.049408912658691406, -0.04809761047363281, -0.04678630828857422, -0.045475006103515625, -0.04416370391845703, -0.04285240173339844, -0.041541099548339844, -0.04022979736328125, -0.038918495178222656, -0.03760719299316406, -0.03629589080810547, -0.034984588623046875, -0.03367328643798828, -0.03236198425292969, -0.031050682067871094, -0.0297393798828125, -0.028428077697753906, -0.027116775512695312, -0.02580547332763672, -0.024494171142578125, -0.02318286895751953, -0.021871566772460938, -0.020560264587402344, -0.01924896240234375, -0.017937660217285156, -0.016626358032226562, -0.015315055847167969, -0.014003753662109375, -0.012692451477050781, -0.011381149291992188, -0.010069847106933594, -0.008758544921875, -0.007447242736816406, -0.0061359405517578125, -0.004824638366699219, -0.003513336181640625, -0.0022020339965820312, -0.0008907318115234375, 0.00042057037353515625, 0.00173187255859375, 0.0030431747436523438, 0.0043544769287109375, 0.005665779113769531, 0.006977081298828125, 0.008288383483886719, 0.009599685668945312, 0.010910987854003906, 0.0122222900390625, 0.013533592224121094, 0.014844894409179688, 0.01615619659423828, 0.017467498779296875, 0.01877880096435547, 0.020090103149414062, 0.021401405334472656, 0.02271270751953125, 0.024024009704589844, 0.025335311889648438, 0.02664661407470703, 0.027957916259765625, 0.02926921844482422, 0.030580520629882812, 0.031891822814941406, 0.033203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 10.0, 10.0, 18.0, 27.0, 40.0, 52.0, 105.0, 178.0, 366.0, 776.0, 2188.0, 8325.0, 45144.0, 313791.0, 2123281.0, 1468622.0, 193623.0, 29037.0, 5702.0, 1679.0, 650.0, 266.0, 151.0, 95.0, 45.0, 35.0, 24.0, 14.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.11793994903564453, -0.11399269104003906, -0.1100454330444336, -0.10609817504882812, -0.10215091705322266, -0.09820365905761719, -0.09425640106201172, -0.09030914306640625, -0.08636188507080078, -0.08241462707519531, -0.07846736907958984, -0.07452011108398438, -0.0705728530883789, -0.06662559509277344, -0.06267833709716797, -0.0587310791015625, -0.05478382110595703, -0.05083656311035156, -0.046889305114746094, -0.042942047119140625, -0.038994789123535156, -0.03504753112792969, -0.03110027313232422, -0.02715301513671875, -0.02320575714111328, -0.019258499145507812, -0.015311241149902344, -0.011363983154296875, -0.007416725158691406, -0.0034694671630859375, 0.00047779083251953125, 0.004425048828125, 0.008372306823730469, 0.012319564819335938, 0.016266822814941406, 0.020214080810546875, 0.024161338806152344, 0.028108596801757812, 0.03205585479736328, 0.03600311279296875, 0.03995037078857422, 0.04389762878417969, 0.047844886779785156, 0.051792144775390625, 0.055739402770996094, 0.05968666076660156, 0.06363391876220703, 0.0675811767578125, 0.07152843475341797, 0.07547569274902344, 0.0794229507446289, 0.08337020874023438, 0.08731746673583984, 0.09126472473144531, 0.09521198272705078, 0.09915924072265625, 0.10310649871826172, 0.10705375671386719, 0.11100101470947266, 0.11494827270507812, 0.1188955307006836, 0.12284278869628906, 0.12679004669189453, 0.1307373046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 10.0, 10.0, 8.0, 16.0, 24.0, 27.0, 38.0, 65.0, 99.0, 92.0, 153.0, 215.0, 289.0, 402.0, 495.0, 470.0, 465.0, 337.0, 238.0, 163.0, 135.0, 103.0, 57.0, 43.0, 29.0, 31.0, 15.0, 11.0, 9.0, 11.0, 8.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.081298828125, -0.0786886215209961, -0.07607841491699219, -0.07346820831298828, -0.07085800170898438, -0.06824779510498047, -0.06563758850097656, -0.06302738189697266, -0.06041717529296875, -0.057806968688964844, -0.05519676208496094, -0.05258655548095703, -0.049976348876953125, -0.04736614227294922, -0.04475593566894531, -0.042145729064941406, -0.0395355224609375, -0.036925315856933594, -0.03431510925292969, -0.03170490264892578, -0.029094696044921875, -0.02648448944091797, -0.023874282836914062, -0.021264076232910156, -0.01865386962890625, -0.016043663024902344, -0.013433456420898438, -0.010823249816894531, -0.008213043212890625, -0.005602836608886719, -0.0029926300048828125, -0.00038242340087890625, 0.002227783203125, 0.004837989807128906, 0.0074481964111328125, 0.010058403015136719, 0.012668609619140625, 0.015278816223144531, 0.017889022827148438, 0.020499229431152344, 0.02310943603515625, 0.025719642639160156, 0.028329849243164062, 0.03094005584716797, 0.033550262451171875, 0.03616046905517578, 0.03877067565917969, 0.041380882263183594, 0.0439910888671875, 0.046601295471191406, 0.04921150207519531, 0.05182170867919922, 0.054431915283203125, 0.05704212188720703, 0.05965232849121094, 0.062262535095214844, 0.06487274169921875, 0.06748294830322266, 0.07009315490722656, 0.07270336151123047, 0.07531356811523438, 0.07792377471923828, 0.08053398132324219, 0.0831441879272461, 0.08575439453125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 4.0, 24.0, 19.0, 44.0, 61.0, 86.0, 104.0, 99.0, 112.0, 123.0, 87.0, 83.0, 58.0, 34.0, 23.0, 20.0, 5.0, 1.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.5702563524246216, -0.5564194321632385, -0.5425825119018555, -0.5287455320358276, -0.5149086117744446, -0.5010716915130615, -0.48723477125167847, -0.4733978509902954, -0.45956093072891235, -0.4457240104675293, -0.43188706040382385, -0.4180501401424408, -0.40421321988105774, -0.3903762698173523, -0.37653934955596924, -0.3627024292945862, -0.34886547923088074, -0.3350285589694977, -0.32119160890579224, -0.3073546886444092, -0.2935177683830261, -0.27968084812164307, -0.2658438980579376, -0.25200697779655457, -0.23817004263401031, -0.22433310747146606, -0.210496187210083, -0.19665925204753876, -0.1828223168849945, -0.16898539662361145, -0.1551484614610672, -0.14131152629852295, -0.1274745762348175, -0.11363764852285385, -0.0998007208108902, -0.08596378564834595, -0.0721268579363823, -0.05828993022441864, -0.04445299506187439, -0.030616067349910736, -0.016779139637947083, -0.0029422100633382797, 0.010894719511270523, 0.024731650948524475, 0.03856857866048813, 0.05240550637245178, 0.06624244153499603, 0.08007936924695969, 0.09391629695892334, 0.107753224670887, 0.12159015238285065, 0.1354270875453949, 0.14926400780677795, 0.1631009429693222, 0.17693787813186646, 0.1907747983932495, 0.20461173355579376, 0.218448668718338, 0.23228558897972107, 0.24612252414226532, 0.25995945930480957, 0.2737963795661926, 0.2876332998275757, 0.30147024989128113, 0.3153071701526642]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 7.0, 8.0, 7.0, 11.0, 17.0, 17.0, 15.0, 19.0, 34.0, 29.0, 26.0, 45.0, 34.0, 33.0, 39.0, 38.0, 43.0, 53.0, 38.0, 41.0, 42.0, 41.0, 41.0, 38.0, 28.0, 28.0, 30.0, 29.0, 21.0, 27.0, 20.0, 19.0, 22.0, 10.0, 11.0, 10.0, 6.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.27998483180999756, -0.2722688615322113, -0.26455286145210266, -0.2568368911743164, -0.24912090599536896, -0.2414049208164215, -0.23368893563747406, -0.2259729504585266, -0.21825698018074036, -0.2105409950017929, -0.20282500982284546, -0.1951090395450592, -0.18739305436611176, -0.1796770691871643, -0.17196108400821686, -0.1642450988292694, -0.15652911365032196, -0.1488131284713745, -0.14109714329242706, -0.13338115811347961, -0.12566518783569336, -0.11794920265674591, -0.11023321747779846, -0.10251723229885101, -0.09480125457048416, -0.08708526939153671, -0.07936929166316986, -0.07165330648422241, -0.06393732130527496, -0.05622134357690811, -0.04850535839796066, -0.04078937694430351, -0.03307339549064636, -0.025357414036989212, -0.017641430720686913, -0.009925447404384613, -0.0022094659507274628, 0.0055065155029296875, 0.013222500681877136, 0.020938482135534286, 0.028654463589191437, 0.03637044504284859, 0.04408642649650574, 0.051802411675453186, 0.059518393129110336, 0.06723437458276749, 0.07495035976171494, 0.08266633749008179, 0.09038232266902924, 0.09809830784797668, 0.10581428557634354, 0.11353027075529099, 0.12124624848365784, 0.12896223366260529, 0.13667821884155273, 0.14439420402050018, 0.15211018919944763, 0.15982617437839508, 0.16754215955734253, 0.17525812983512878, 0.18297411501407623, 0.19069010019302368, 0.19840608537197113, 0.20612207055091858, 0.21383804082870483]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 7.0, 3.0, 10.0, 12.0, 20.0, 37.0, 35.0, 50.0, 69.0, 135.0, 195.0, 320.0, 510.0, 829.0, 1380.0, 2557.0, 4573.0, 8223.0, 14979.0, 27473.0, 49324.0, 85547.0, 137722.0, 189006.0, 188602.0, 138572.0, 86715.0, 49381.0, 27885.0, 15006.0, 8508.0, 4527.0, 2662.0, 1428.0, 865.0, 489.0, 319.0, 192.0, 142.0, 76.0, 57.0, 42.0, 33.0, 14.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.075439453125, -0.07322120666503906, -0.07100296020507812, -0.06878471374511719, -0.06656646728515625, -0.06434822082519531, -0.062129974365234375, -0.05991172790527344, -0.0576934814453125, -0.05547523498535156, -0.053256988525390625, -0.05103874206542969, -0.04882049560546875, -0.04660224914550781, -0.044384002685546875, -0.04216575622558594, -0.039947509765625, -0.03772926330566406, -0.035511016845703125, -0.03329277038574219, -0.03107452392578125, -0.028856277465820312, -0.026638031005859375, -0.024419784545898438, -0.0222015380859375, -0.019983291625976562, -0.017765045166015625, -0.015546798706054688, -0.01332855224609375, -0.011110305786132812, -0.008892059326171875, -0.0066738128662109375, -0.00445556640625, -0.0022373199462890625, -1.9073486328125e-05, 0.0021991729736328125, 0.00441741943359375, 0.0066356658935546875, 0.008853912353515625, 0.011072158813476562, 0.0132904052734375, 0.015508651733398438, 0.017726898193359375, 0.019945144653320312, 0.02216339111328125, 0.024381637573242188, 0.026599884033203125, 0.028818130493164062, 0.031036376953125, 0.03325462341308594, 0.035472869873046875, 0.03769111633300781, 0.03990936279296875, 0.04212760925292969, 0.044345855712890625, 0.04656410217285156, 0.0487823486328125, 0.05100059509277344, 0.053218841552734375, 0.05543708801269531, 0.05765533447265625, 0.05987358093261719, 0.062091827392578125, 0.06431007385253906, 0.0665283203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 9.0, 7.0, 15.0, 14.0, 14.0, 12.0, 19.0, 39.0, 25.0, 30.0, 35.0, 34.0, 42.0, 41.0, 42.0, 52.0, 58.0, 51.0, 47.0, 44.0, 44.0, 36.0, 42.0, 40.0, 27.0, 26.0, 27.0, 18.0, 18.0, 18.0, 15.0, 9.0, 10.0, 10.0, 6.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0], "bins": [-0.04632568359375, -0.04516935348510742, -0.044013023376464844, -0.042856693267822266, -0.04170036315917969, -0.04054403305053711, -0.03938770294189453, -0.03823137283325195, -0.037075042724609375, -0.0359187126159668, -0.03476238250732422, -0.03360605239868164, -0.03244972229003906, -0.031293392181396484, -0.030137062072753906, -0.028980731964111328, -0.02782440185546875, -0.026668071746826172, -0.025511741638183594, -0.024355411529541016, -0.023199081420898438, -0.02204275131225586, -0.02088642120361328, -0.019730091094970703, -0.018573760986328125, -0.017417430877685547, -0.01626110076904297, -0.01510477066040039, -0.013948440551757812, -0.012792110443115234, -0.011635780334472656, -0.010479450225830078, -0.0093231201171875, -0.008166790008544922, -0.007010459899902344, -0.005854129791259766, -0.0046977996826171875, -0.0035414695739746094, -0.0023851394653320312, -0.0012288093566894531, -7.2479248046875e-05, 0.0010838508605957031, 0.0022401809692382812, 0.0033965110778808594, 0.0045528411865234375, 0.005709171295166016, 0.006865501403808594, 0.008021831512451172, 0.00917816162109375, 0.010334491729736328, 0.011490821838378906, 0.012647151947021484, 0.013803482055664062, 0.01495981216430664, 0.01611614227294922, 0.017272472381591797, 0.018428802490234375, 0.019585132598876953, 0.02074146270751953, 0.02189779281616211, 0.023054122924804688, 0.024210453033447266, 0.025366783142089844, 0.026523113250732422, 0.027679443359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 10.0, 11.0, 20.0, 14.0, 40.0, 46.0, 76.0, 126.0, 199.0, 395.0, 774.0, 1663.0, 3706.0, 8710.0, 20909.0, 47577.0, 103344.0, 196096.0, 262832.0, 203557.0, 108853.0, 50479.0, 21955.0, 9462.0, 4117.0, 1742.0, 816.0, 417.0, 216.0, 149.0, 102.0, 39.0, 34.0, 17.0, 17.0, 13.0, 10.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09100341796875, -0.0878143310546875, -0.084625244140625, -0.0814361572265625, -0.0782470703125, -0.0750579833984375, -0.071868896484375, -0.0686798095703125, -0.06549072265625, -0.0623016357421875, -0.059112548828125, -0.0559234619140625, -0.052734375, -0.0495452880859375, -0.046356201171875, -0.0431671142578125, -0.03997802734375, -0.0367889404296875, -0.033599853515625, -0.0304107666015625, -0.0272216796875, -0.0240325927734375, -0.020843505859375, -0.0176544189453125, -0.01446533203125, -0.0112762451171875, -0.008087158203125, -0.0048980712890625, -0.001708984375, 0.0014801025390625, 0.004669189453125, 0.0078582763671875, 0.01104736328125, 0.0142364501953125, 0.017425537109375, 0.0206146240234375, 0.0238037109375, 0.0269927978515625, 0.030181884765625, 0.0333709716796875, 0.03656005859375, 0.0397491455078125, 0.042938232421875, 0.0461273193359375, 0.04931640625, 0.0525054931640625, 0.055694580078125, 0.0588836669921875, 0.06207275390625, 0.0652618408203125, 0.068450927734375, 0.0716400146484375, 0.0748291015625, 0.0780181884765625, 0.081207275390625, 0.0843963623046875, 0.08758544921875, 0.0907745361328125, 0.093963623046875, 0.0971527099609375, 0.100341796875, 0.1035308837890625, 0.106719970703125, 0.1099090576171875, 0.11309814453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 9.0, 6.0, 6.0, 12.0, 12.0, 16.0, 17.0, 18.0, 33.0, 34.0, 30.0, 34.0, 36.0, 33.0, 52.0, 58.0, 56.0, 53.0, 49.0, 50.0, 49.0, 48.0, 38.0, 43.0, 36.0, 30.0, 36.0, 22.0, 25.0, 14.0, 8.0, 7.0, 8.0, 6.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13037109375, -0.12659263610839844, -0.12281417846679688, -0.11903572082519531, -0.11525726318359375, -0.11147880554199219, -0.10770034790039062, -0.10392189025878906, -0.1001434326171875, -0.09636497497558594, -0.09258651733398438, -0.08880805969238281, -0.08502960205078125, -0.08125114440917969, -0.07747268676757812, -0.07369422912597656, -0.069915771484375, -0.06613731384277344, -0.062358856201171875, -0.05858039855957031, -0.05480194091796875, -0.05102348327636719, -0.047245025634765625, -0.04346656799316406, -0.0396881103515625, -0.03590965270996094, -0.032131195068359375, -0.028352737426757812, -0.02457427978515625, -0.020795822143554688, -0.017017364501953125, -0.013238906860351562, -0.00946044921875, -0.0056819915771484375, -0.001903533935546875, 0.0018749237060546875, 0.00565338134765625, 0.009431838989257812, 0.013210296630859375, 0.016988754272460938, 0.0207672119140625, 0.024545669555664062, 0.028324127197265625, 0.03210258483886719, 0.03588104248046875, 0.03965950012207031, 0.043437957763671875, 0.04721641540527344, 0.050994873046875, 0.05477333068847656, 0.058551788330078125, 0.06233024597167969, 0.06610870361328125, 0.06988716125488281, 0.07366561889648438, 0.07744407653808594, 0.0812225341796875, 0.08500099182128906, 0.08877944946289062, 0.09255790710449219, 0.09633636474609375, 0.10011482238769531, 0.10389328002929688, 0.10767173767089844, 0.1114501953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 14.0, 9.0, 12.0, 28.0, 59.0, 108.0, 186.0, 375.0, 770.0, 1869.0, 4690.0, 12608.0, 36239.0, 98933.0, 219045.0, 301225.0, 217600.0, 98587.0, 35570.0, 12605.0, 4644.0, 1805.0, 806.0, 342.0, 194.0, 86.0, 48.0, 30.0, 19.0, 8.0, 11.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.034271240234375, -0.03318309783935547, -0.03209495544433594, -0.031006813049316406, -0.029918670654296875, -0.028830528259277344, -0.027742385864257812, -0.02665424346923828, -0.02556610107421875, -0.02447795867919922, -0.023389816284179688, -0.022301673889160156, -0.021213531494140625, -0.020125389099121094, -0.019037246704101562, -0.01794910430908203, -0.0168609619140625, -0.01577281951904297, -0.014684677124023438, -0.013596534729003906, -0.012508392333984375, -0.011420249938964844, -0.010332107543945312, -0.009243965148925781, -0.00815582275390625, -0.007067680358886719, -0.0059795379638671875, -0.004891395568847656, -0.003803253173828125, -0.0027151107788085938, -0.0016269683837890625, -0.0005388259887695312, 0.00054931640625, 0.0016374588012695312, 0.0027256011962890625, 0.0038137435913085938, 0.004901885986328125, 0.005990028381347656, 0.0070781707763671875, 0.008166313171386719, 0.00925445556640625, 0.010342597961425781, 0.011430740356445312, 0.012518882751464844, 0.013607025146484375, 0.014695167541503906, 0.015783309936523438, 0.01687145233154297, 0.0179595947265625, 0.01904773712158203, 0.020135879516601562, 0.021224021911621094, 0.022312164306640625, 0.023400306701660156, 0.024488449096679688, 0.02557659149169922, 0.02666473388671875, 0.02775287628173828, 0.028841018676757812, 0.029929161071777344, 0.031017303466796875, 0.032105445861816406, 0.03319358825683594, 0.03428173065185547, 0.035369873046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 7.0, 4.0, 12.0, 10.0, 11.0, 13.0, 24.0, 19.0, 27.0, 33.0, 34.0, 64.0, 48.0, 64.0, 65.0, 57.0, 70.0, 48.0, 63.0, 40.0, 46.0, 40.0, 18.0, 38.0, 26.0, 20.0, 13.0, 14.0, 8.0, 5.0, 9.0, 5.0, 5.0, 2.0, 5.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.3530254364013672e-05, -1.3130716979503632e-05, -1.2731179594993591e-05, -1.2331642210483551e-05, -1.193210482597351e-05, -1.153256744146347e-05, -1.113303005695343e-05, -1.073349267244339e-05, -1.033395528793335e-05, -9.93441790342331e-06, -9.534880518913269e-06, -9.135343134403229e-06, -8.735805749893188e-06, -8.336268365383148e-06, -7.936730980873108e-06, -7.537193596363068e-06, -7.137656211853027e-06, -6.738118827342987e-06, -6.338581442832947e-06, -5.9390440583229065e-06, -5.539506673812866e-06, -5.139969289302826e-06, -4.740431904792786e-06, -4.340894520282745e-06, -3.941357135772705e-06, -3.541819751262665e-06, -3.1422823667526245e-06, -2.7427449822425842e-06, -2.343207597732544e-06, -1.9436702132225037e-06, -1.5441328287124634e-06, -1.144595444202423e-06, -7.450580596923828e-07, -3.4552067518234253e-07, 5.4016709327697754e-08, 4.5355409383773804e-07, 8.530914783477783e-07, 1.2526288628578186e-06, 1.6521662473678589e-06, 2.051703631877899e-06, 2.4512410163879395e-06, 2.8507784008979797e-06, 3.25031578540802e-06, 3.6498531699180603e-06, 4.049390554428101e-06, 4.448927938938141e-06, 4.848465323448181e-06, 5.2480027079582214e-06, 5.647540092468262e-06, 6.047077476978302e-06, 6.446614861488342e-06, 6.8461522459983826e-06, 7.245689630508423e-06, 7.645227015018463e-06, 8.044764399528503e-06, 8.444301784038544e-06, 8.843839168548584e-06, 9.243376553058624e-06, 9.642913937568665e-06, 1.0042451322078705e-05, 1.0441988706588745e-05, 1.0841526091098785e-05, 1.1241063475608826e-05, 1.1640600860118866e-05, 1.2040138244628906e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 9.0, 9.0, 16.0, 15.0, 19.0, 31.0, 57.0, 109.0, 138.0, 252.0, 435.0, 774.0, 1307.0, 2493.0, 4708.0, 9779.0, 20147.0, 42099.0, 82541.0, 144786.0, 204090.0, 207898.0, 151064.0, 87676.0, 44880.0, 21816.0, 10489.0, 5029.0, 2611.0, 1385.0, 767.0, 449.0, 295.0, 142.0, 84.0, 58.0, 38.0, 17.0, 14.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.02630615234375, -0.02561473846435547, -0.024923324584960938, -0.024231910705566406, -0.023540496826171875, -0.022849082946777344, -0.022157669067382812, -0.02146625518798828, -0.02077484130859375, -0.02008342742919922, -0.019392013549804688, -0.018700599670410156, -0.018009185791015625, -0.017317771911621094, -0.016626358032226562, -0.01593494415283203, -0.0152435302734375, -0.014552116394042969, -0.013860702514648438, -0.013169288635253906, -0.012477874755859375, -0.011786460876464844, -0.011095046997070312, -0.010403633117675781, -0.00971221923828125, -0.009020805358886719, -0.008329391479492188, -0.007637977600097656, -0.006946563720703125, -0.006255149841308594, -0.0055637359619140625, -0.004872322082519531, -0.004180908203125, -0.0034894943237304688, -0.0027980804443359375, -0.0021066665649414062, -0.001415252685546875, -0.0007238388061523438, -3.24249267578125e-05, 0.0006589889526367188, 0.00135040283203125, 0.0020418167114257812, 0.0027332305908203125, 0.0034246444702148438, 0.004116058349609375, 0.004807472229003906, 0.0054988861083984375, 0.006190299987792969, 0.0068817138671875, 0.007573127746582031, 0.008264541625976562, 0.008955955505371094, 0.009647369384765625, 0.010338783264160156, 0.011030197143554688, 0.011721611022949219, 0.01241302490234375, 0.013104438781738281, 0.013795852661132812, 0.014487266540527344, 0.015178680419921875, 0.015870094299316406, 0.016561508178710938, 0.01725292205810547, 0.0179443359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 8.0, 5.0, 13.0, 7.0, 15.0, 18.0, 16.0, 36.0, 30.0, 48.0, 53.0, 53.0, 57.0, 63.0, 62.0, 68.0, 52.0, 51.0, 56.0, 48.0, 28.0, 40.0, 29.0, 30.0, 17.0, 20.0, 16.0, 19.0, 7.0, 4.0, 4.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01983642578125, -0.019155263900756836, -0.018474102020263672, -0.017792940139770508, -0.017111778259277344, -0.01643061637878418, -0.015749454498291016, -0.015068292617797852, -0.014387130737304688, -0.013705968856811523, -0.01302480697631836, -0.012343645095825195, -0.011662483215332031, -0.010981321334838867, -0.010300159454345703, -0.009618997573852539, -0.008937835693359375, -0.008256673812866211, -0.007575511932373047, -0.006894350051879883, -0.006213188171386719, -0.005532026290893555, -0.004850864410400391, -0.0041697025299072266, -0.0034885406494140625, -0.0028073787689208984, -0.0021262168884277344, -0.0014450550079345703, -0.0007638931274414062, -8.273124694824219e-05, 0.0005984306335449219, 0.001279592514038086, 0.00196075439453125, 0.002641916275024414, 0.003323078155517578, 0.004004240036010742, 0.004685401916503906, 0.00536656379699707, 0.006047725677490234, 0.0067288875579833984, 0.0074100494384765625, 0.008091211318969727, 0.00877237319946289, 0.009453535079956055, 0.010134696960449219, 0.010815858840942383, 0.011497020721435547, 0.012178182601928711, 0.012859344482421875, 0.013540506362915039, 0.014221668243408203, 0.014902830123901367, 0.015583992004394531, 0.016265153884887695, 0.01694631576538086, 0.017627477645874023, 0.018308639526367188, 0.01898980140686035, 0.019670963287353516, 0.02035212516784668, 0.021033287048339844, 0.021714448928833008, 0.022395610809326172, 0.023076772689819336, 0.0237579345703125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 11.0, 11.0, 17.0, 45.0, 71.0, 78.0, 99.0, 130.0, 128.0, 113.0, 101.0, 78.0, 41.0, 26.0, 15.0, 15.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6395614147186279, -0.6244599223136902, -0.6093584895133972, -0.5942569971084595, -0.5791555047035217, -0.564054012298584, -0.548952579498291, -0.5338510870933533, -0.5187495946884155, -0.5036481022834778, -0.4885466396808624, -0.47344517707824707, -0.4583436846733093, -0.44324222207069397, -0.4281407594680786, -0.41303926706314087, -0.3979378342628479, -0.38283637166023254, -0.3677348792552948, -0.35263341665267944, -0.3375319242477417, -0.32243046164512634, -0.307328999042511, -0.29222750663757324, -0.2771260142326355, -0.26202455163002014, -0.2469230592250824, -0.23182159662246704, -0.2167201191186905, -0.20161864161491394, -0.1865171641111374, -0.17141568660736084, -0.15631422400474548, -0.14121274650096893, -0.12611126899719238, -0.11100979894399643, -0.09590832889080048, -0.08080685138702393, -0.06570537388324738, -0.05060390383005142, -0.03550242632627487, -0.02040095254778862, -0.005299476906657219, 0.009801998734474182, 0.024903472512960434, 0.040004946291446686, 0.055106423795223236, 0.07020789384841919, 0.08530937135219574, 0.10041084885597229, 0.11551231890916824, 0.1306138038635254, 0.14571526646614075, 0.1608167439699173, 0.17591822147369385, 0.1910196840763092, 0.20612117648124695, 0.2212226539850235, 0.23632413148880005, 0.2514255940914154, 0.26652708649635315, 0.2816285490989685, 0.29673004150390625, 0.3118315041065216, 0.32693296670913696]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 8.0, 9.0, 8.0, 12.0, 11.0, 11.0, 15.0, 20.0, 23.0, 19.0, 24.0, 37.0, 47.0, 39.0, 27.0, 40.0, 38.0, 47.0, 53.0, 43.0, 38.0, 39.0, 41.0, 39.0, 35.0, 27.0, 26.0, 35.0, 23.0, 33.0, 28.0, 13.0, 17.0, 10.0, 17.0, 11.0, 5.0, 7.0, 7.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.29893815517425537, -0.28897735476493835, -0.2790165841579437, -0.2690557837486267, -0.2590950131416321, -0.24913421273231506, -0.23917342722415924, -0.22921264171600342, -0.2192518413066864, -0.20929105579853058, -0.19933027029037476, -0.18936946988105774, -0.17940868437290192, -0.1694478988647461, -0.15948711335659027, -0.14952632784843445, -0.13956554234027863, -0.1296047568321228, -0.11964396387338638, -0.10968317836523056, -0.09972238540649414, -0.08976159989833832, -0.0798008143901825, -0.06984002143144608, -0.05987923592329025, -0.04991844668984413, -0.03995765745639801, -0.029996871948242188, -0.020036082714796066, -0.010075293481349945, -0.00011450797319412231, 0.009846284985542297, 0.01980707049369812, 0.02976785972714424, 0.03972864896059036, 0.049689434468746185, 0.059650223702192307, 0.06961101293563843, 0.07957179844379425, 0.08953259140253067, 0.09949337691068649, 0.10945416241884232, 0.11941495537757874, 0.12937574088573456, 0.13933652639389038, 0.1492973268032074, 0.15925809741020203, 0.16921889781951904, 0.17917968332767487, 0.1891404688358307, 0.1991012543439865, 0.20906203985214233, 0.21902284026145935, 0.22898362576961517, 0.238944411277771, 0.248905211687088, 0.25886598229408264, 0.26882678270339966, 0.2787875533103943, 0.2887483537197113, 0.29870912432670593, 0.30866992473602295, 0.3186306953430176, 0.3285914957523346, 0.3385522961616516]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 8.0, 13.0, 21.0, 22.0, 32.0, 62.0, 93.0, 144.0, 225.0, 418.0, 789.0, 1614.0, 3422.0, 8149.0, 20763.0, 62480.0, 234725.0, 1214593.0, 1974058.0, 501861.0, 113283.0, 35294.0, 12743.0, 5251.0, 2181.0, 964.0, 488.0, 267.0, 119.0, 84.0, 35.0, 20.0, 17.0, 17.0, 10.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08966064453125, -0.08731555938720703, -0.08497047424316406, -0.0826253890991211, -0.08028030395507812, -0.07793521881103516, -0.07559013366699219, -0.07324504852294922, -0.07089996337890625, -0.06855487823486328, -0.06620979309082031, -0.06386470794677734, -0.061519622802734375, -0.059174537658691406, -0.05682945251464844, -0.05448436737060547, -0.0521392822265625, -0.04979419708251953, -0.04744911193847656, -0.045104026794433594, -0.042758941650390625, -0.040413856506347656, -0.03806877136230469, -0.03572368621826172, -0.03337860107421875, -0.03103351593017578, -0.028688430786132812, -0.026343345642089844, -0.023998260498046875, -0.021653175354003906, -0.019308090209960938, -0.01696300506591797, -0.014617919921875, -0.012272834777832031, -0.009927749633789062, -0.007582664489746094, -0.005237579345703125, -0.0028924942016601562, -0.0005474090576171875, 0.0017976760864257812, 0.00414276123046875, 0.006487846374511719, 0.008832931518554688, 0.011178016662597656, 0.013523101806640625, 0.015868186950683594, 0.018213272094726562, 0.02055835723876953, 0.0229034423828125, 0.02524852752685547, 0.027593612670898438, 0.029938697814941406, 0.032283782958984375, 0.034628868103027344, 0.03697395324707031, 0.03931903839111328, 0.04166412353515625, 0.04400920867919922, 0.04635429382324219, 0.048699378967285156, 0.051044464111328125, 0.053389549255371094, 0.05573463439941406, 0.05807971954345703, 0.0604248046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 2.0, 8.0, 8.0, 15.0, 15.0, 20.0, 23.0, 25.0, 30.0, 20.0, 36.0, 34.0, 50.0, 49.0, 53.0, 58.0, 30.0, 48.0, 48.0, 44.0, 50.0, 38.0, 43.0, 29.0, 22.0, 30.0, 18.0, 24.0, 23.0, 18.0, 15.0, 16.0, 11.0, 8.0, 8.0, 10.0, 2.0, 5.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04766845703125, -0.046422481536865234, -0.04517650604248047, -0.0439305305480957, -0.04268455505371094, -0.04143857955932617, -0.040192604064941406, -0.03894662857055664, -0.037700653076171875, -0.03645467758178711, -0.035208702087402344, -0.03396272659301758, -0.03271675109863281, -0.03147077560424805, -0.03022480010986328, -0.028978824615478516, -0.02773284912109375, -0.026486873626708984, -0.02524089813232422, -0.023994922637939453, -0.022748947143554688, -0.021502971649169922, -0.020256996154785156, -0.01901102066040039, -0.017765045166015625, -0.01651906967163086, -0.015273094177246094, -0.014027118682861328, -0.012781143188476562, -0.011535167694091797, -0.010289192199707031, -0.009043216705322266, -0.0077972412109375, -0.006551265716552734, -0.005305290222167969, -0.004059314727783203, -0.0028133392333984375, -0.0015673637390136719, -0.00032138824462890625, 0.0009245872497558594, 0.002170562744140625, 0.0034165382385253906, 0.004662513732910156, 0.005908489227294922, 0.0071544647216796875, 0.008400440216064453, 0.009646415710449219, 0.010892391204833984, 0.01213836669921875, 0.013384342193603516, 0.014630317687988281, 0.015876293182373047, 0.017122268676757812, 0.018368244171142578, 0.019614219665527344, 0.02086019515991211, 0.022106170654296875, 0.02335214614868164, 0.024598121643066406, 0.025844097137451172, 0.027090072631835938, 0.028336048126220703, 0.02958202362060547, 0.030827999114990234, 0.032073974609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 3.0, 13.0, 6.0, 22.0, 24.0, 41.0, 54.0, 97.0, 156.0, 248.0, 556.0, 1175.0, 2878.0, 7378.0, 20507.0, 61909.0, 202184.0, 711277.0, 1831496.0, 960081.0, 270256.0, 81606.0, 26631.0, 9280.0, 3445.0, 1432.0, 708.0, 316.0, 188.0, 93.0, 79.0, 44.0, 28.0, 16.0, 16.0, 9.0, 7.0, 6.0, 1.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0740966796875, -0.07182502746582031, -0.06955337524414062, -0.06728172302246094, -0.06501007080078125, -0.06273841857910156, -0.060466766357421875, -0.05819511413574219, -0.0559234619140625, -0.05365180969238281, -0.051380157470703125, -0.04910850524902344, -0.04683685302734375, -0.04456520080566406, -0.042293548583984375, -0.04002189636230469, -0.037750244140625, -0.03547859191894531, -0.033206939697265625, -0.030935287475585938, -0.02866363525390625, -0.026391983032226562, -0.024120330810546875, -0.021848678588867188, -0.0195770263671875, -0.017305374145507812, -0.015033721923828125, -0.012762069702148438, -0.01049041748046875, -0.008218765258789062, -0.005947113037109375, -0.0036754608154296875, -0.00140380859375, 0.0008678436279296875, 0.003139495849609375, 0.0054111480712890625, 0.00768280029296875, 0.009954452514648438, 0.012226104736328125, 0.014497756958007812, 0.0167694091796875, 0.019041061401367188, 0.021312713623046875, 0.023584365844726562, 0.02585601806640625, 0.028127670288085938, 0.030399322509765625, 0.03267097473144531, 0.034942626953125, 0.03721427917480469, 0.039485931396484375, 0.04175758361816406, 0.04402923583984375, 0.04630088806152344, 0.048572540283203125, 0.05084419250488281, 0.0531158447265625, 0.05538749694824219, 0.057659149169921875, 0.05993080139160156, 0.06220245361328125, 0.06447410583496094, 0.06674575805664062, 0.06901741027832031, 0.0712890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 2.0, 6.0, 12.0, 14.0, 17.0, 20.0, 32.0, 43.0, 56.0, 78.0, 99.0, 144.0, 225.0, 285.0, 367.0, 500.0, 544.0, 447.0, 324.0, 225.0, 164.0, 144.0, 81.0, 67.0, 48.0, 36.0, 21.0, 17.0, 21.0, 10.0, 10.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0885009765625, -0.0861215591430664, -0.08374214172363281, -0.08136272430419922, -0.07898330688476562, -0.07660388946533203, -0.07422447204589844, -0.07184505462646484, -0.06946563720703125, -0.06708621978759766, -0.06470680236816406, -0.06232738494873047, -0.059947967529296875, -0.05756855010986328, -0.05518913269042969, -0.052809715270996094, -0.0504302978515625, -0.048050880432128906, -0.04567146301269531, -0.04329204559326172, -0.040912628173828125, -0.03853321075439453, -0.03615379333496094, -0.033774375915527344, -0.03139495849609375, -0.029015541076660156, -0.026636123657226562, -0.02425670623779297, -0.021877288818359375, -0.01949787139892578, -0.017118453979492188, -0.014739036560058594, -0.012359619140625, -0.009980201721191406, -0.0076007843017578125, -0.005221366882324219, -0.002841949462890625, -0.00046253204345703125, 0.0019168853759765625, 0.004296302795410156, 0.00667572021484375, 0.009055137634277344, 0.011434555053710938, 0.013813972473144531, 0.016193389892578125, 0.01857280731201172, 0.020952224731445312, 0.023331642150878906, 0.0257110595703125, 0.028090476989746094, 0.030469894409179688, 0.03284931182861328, 0.035228729248046875, 0.03760814666748047, 0.03998756408691406, 0.042366981506347656, 0.04474639892578125, 0.047125816345214844, 0.04950523376464844, 0.05188465118408203, 0.054264068603515625, 0.05664348602294922, 0.05902290344238281, 0.061402320861816406, 0.06378173828125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 8.0, 3.0, 8.0, 17.0, 23.0, 34.0, 40.0, 49.0, 59.0, 67.0, 105.0, 90.0, 93.0, 86.0, 81.0, 65.0, 61.0, 36.0, 21.0, 23.0, 11.0, 10.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.35886165499687195, -0.34757113456726074, -0.33628058433532715, -0.32499006390571594, -0.31369954347610474, -0.30240899324417114, -0.29111847281455994, -0.27982795238494873, -0.26853740215301514, -0.25724688172340393, -0.24595634639263153, -0.23466581106185913, -0.22337529063224792, -0.21208475530147552, -0.20079421997070312, -0.18950369954109192, -0.1782131791114807, -0.1669226437807083, -0.1556321233510971, -0.1443415880203247, -0.1330510675907135, -0.1217605322599411, -0.1104699969291687, -0.0991794690489769, -0.0878889411687851, -0.07659841328859329, -0.06530788540840149, -0.05401735007762909, -0.042726822197437286, -0.03143629431724548, -0.020145758986473083, -0.00885523110628128, 0.0024352967739105225, 0.013725826516747475, 0.025016356259584427, 0.03630688786506653, 0.04759741574525833, 0.058887943625450134, 0.07017847895622253, 0.08146900683641434, 0.09275953471660614, 0.10405006259679794, 0.11534059047698975, 0.12663112580776215, 0.13792166113853455, 0.14921218156814575, 0.16050271689891815, 0.17179325222969055, 0.18308377265930176, 0.19437430799007416, 0.20566482841968536, 0.21695536375045776, 0.22824588418006897, 0.23953641951084137, 0.25082695484161377, 0.262117475271225, 0.2734079957008362, 0.2846985161304474, 0.295989066362381, 0.3072795867919922, 0.3185701072216034, 0.3298606276512146, 0.3411511778831482, 0.3524416983127594, 0.363732248544693]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 5.0, 3.0, 5.0, 6.0, 14.0, 16.0, 14.0, 24.0, 26.0, 24.0, 29.0, 32.0, 40.0, 37.0, 52.0, 40.0, 41.0, 41.0, 39.0, 39.0, 43.0, 50.0, 35.0, 44.0, 38.0, 39.0, 33.0, 27.0, 23.0, 32.0, 19.0, 21.0, 9.0, 8.0, 12.0, 8.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.24597465991973877, -0.23880283534526825, -0.23163102567195892, -0.2244592010974884, -0.21728739142417908, -0.21011556684970856, -0.20294374227523804, -0.1957719326019287, -0.1886001080274582, -0.18142828345298767, -0.17425647377967834, -0.16708464920520782, -0.1599128246307373, -0.15274101495742798, -0.14556919038295746, -0.13839736580848694, -0.1312255561351776, -0.12405373901128769, -0.11688192188739777, -0.10971009731292725, -0.10253828018903732, -0.0953664630651474, -0.08819463849067688, -0.08102282136678696, -0.07385100424289703, -0.06667918711900711, -0.05950736626982689, -0.05233554542064667, -0.045163728296756744, -0.03799191117286682, -0.0308200903236866, -0.023648269474506378, -0.016476452350616455, -0.009304633364081383, -0.0021328143775463104, 0.005039004608988762, 0.012210823595523834, 0.019382640719413757, 0.02655446156859398, 0.0337262824177742, 0.040898099541664124, 0.04806991666555405, 0.05524173751473427, 0.06241355836391449, 0.06958537548780441, 0.07675719261169434, 0.08392901718616486, 0.09110083431005478, 0.0982726514339447, 0.10544446855783463, 0.11261628568172455, 0.11978811025619507, 0.1269599199295044, 0.13413174450397491, 0.14130356907844543, 0.14847537875175476, 0.15564720332622528, 0.1628190279006958, 0.16999083757400513, 0.17716266214847565, 0.18433448672294617, 0.1915062963962555, 0.198678120970726, 0.20584994554519653, 0.21302175521850586]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 1.0, 6.0, 7.0, 6.0, 8.0, 20.0, 20.0, 31.0, 32.0, 67.0, 96.0, 146.0, 237.0, 402.0, 639.0, 1128.0, 1909.0, 3342.0, 6110.0, 11042.0, 21008.0, 38793.0, 70942.0, 121601.0, 179047.0, 200711.0, 161341.0, 102651.0, 58180.0, 31306.0, 16867.0, 9123.0, 5011.0, 2826.0, 1554.0, 921.0, 547.0, 315.0, 183.0, 126.0, 86.0, 50.0, 33.0, 29.0, 17.0, 15.0, 10.0, 3.0, 10.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08575439453125, -0.08261680603027344, -0.07947921752929688, -0.07634162902832031, -0.07320404052734375, -0.07006645202636719, -0.06692886352539062, -0.06379127502441406, -0.0606536865234375, -0.05751609802246094, -0.054378509521484375, -0.05124092102050781, -0.04810333251953125, -0.04496574401855469, -0.041828155517578125, -0.03869056701660156, -0.035552978515625, -0.03241539001464844, -0.029277801513671875, -0.026140213012695312, -0.02300262451171875, -0.019865036010742188, -0.016727447509765625, -0.013589859008789062, -0.0104522705078125, -0.0073146820068359375, -0.004177093505859375, -0.0010395050048828125, 0.00209808349609375, 0.0052356719970703125, 0.008373260498046875, 0.011510848999023438, 0.0146484375, 0.017786026000976562, 0.020923614501953125, 0.024061203002929688, 0.02719879150390625, 0.030336380004882812, 0.033473968505859375, 0.03661155700683594, 0.0397491455078125, 0.04288673400878906, 0.046024322509765625, 0.04916191101074219, 0.05229949951171875, 0.05543708801269531, 0.058574676513671875, 0.06171226501464844, 0.064849853515625, 0.06798744201660156, 0.07112503051757812, 0.07426261901855469, 0.07740020751953125, 0.08053779602050781, 0.08367538452148438, 0.08681297302246094, 0.0899505615234375, 0.09308815002441406, 0.09622573852539062, 0.09936332702636719, 0.10250091552734375, 0.10563850402832031, 0.10877609252929688, 0.11191368103027344, 0.11505126953125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 5.0, 9.0, 14.0, 10.0, 20.0, 14.0, 15.0, 20.0, 26.0, 36.0, 45.0, 39.0, 42.0, 52.0, 38.0, 46.0, 53.0, 45.0, 53.0, 42.0, 49.0, 40.0, 39.0, 28.0, 34.0, 39.0, 27.0, 24.0, 14.0, 11.0, 21.0, 13.0, 9.0, 6.0, 10.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0438232421875, -0.042616844177246094, -0.04141044616699219, -0.04020404815673828, -0.038997650146484375, -0.03779125213623047, -0.03658485412597656, -0.035378456115722656, -0.03417205810546875, -0.032965660095214844, -0.03175926208496094, -0.03055286407470703, -0.029346466064453125, -0.02814006805419922, -0.026933670043945312, -0.025727272033691406, -0.0245208740234375, -0.023314476013183594, -0.022108078002929688, -0.02090167999267578, -0.019695281982421875, -0.01848888397216797, -0.017282485961914062, -0.016076087951660156, -0.01486968994140625, -0.013663291931152344, -0.012456893920898438, -0.011250495910644531, -0.010044097900390625, -0.008837699890136719, -0.0076313018798828125, -0.006424903869628906, -0.005218505859375, -0.004012107849121094, -0.0028057098388671875, -0.0015993118286132812, -0.000392913818359375, 0.0008134841918945312, 0.0020198822021484375, 0.0032262802124023438, 0.00443267822265625, 0.005639076232910156, 0.0068454742431640625, 0.008051872253417969, 0.009258270263671875, 0.010464668273925781, 0.011671066284179688, 0.012877464294433594, 0.0140838623046875, 0.015290260314941406, 0.016496658325195312, 0.01770305633544922, 0.018909454345703125, 0.02011585235595703, 0.021322250366210938, 0.022528648376464844, 0.02373504638671875, 0.024941444396972656, 0.026147842407226562, 0.02735424041748047, 0.028560638427734375, 0.02976703643798828, 0.030973434448242188, 0.032179832458496094, 0.03338623046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 8.0, 9.0, 12.0, 18.0, 17.0, 31.0, 58.0, 64.0, 104.0, 168.0, 225.0, 347.0, 616.0, 1127.0, 2159.0, 4523.0, 9774.0, 22238.0, 51813.0, 111601.0, 198133.0, 247702.0, 196721.0, 108892.0, 50893.0, 22010.0, 9782.0, 4464.0, 2254.0, 1096.0, 610.0, 380.0, 254.0, 152.0, 106.0, 64.0, 30.0, 35.0, 25.0, 18.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.113037109375, -0.10944747924804688, -0.10585784912109375, -0.10226821899414062, -0.0986785888671875, -0.09508895874023438, -0.09149932861328125, -0.08790969848632812, -0.084320068359375, -0.08073043823242188, -0.07714080810546875, -0.07355117797851562, -0.0699615478515625, -0.06637191772460938, -0.06278228759765625, -0.059192657470703125, -0.05560302734375, -0.052013397216796875, -0.04842376708984375, -0.044834136962890625, -0.0412445068359375, -0.037654876708984375, -0.03406524658203125, -0.030475616455078125, -0.026885986328125, -0.023296356201171875, -0.01970672607421875, -0.016117095947265625, -0.0125274658203125, -0.008937835693359375, -0.00534820556640625, -0.001758575439453125, 0.0018310546875, 0.005420684814453125, 0.00901031494140625, 0.012599945068359375, 0.0161895751953125, 0.019779205322265625, 0.02336883544921875, 0.026958465576171875, 0.030548095703125, 0.034137725830078125, 0.03772735595703125, 0.041316986083984375, 0.0449066162109375, 0.048496246337890625, 0.05208587646484375, 0.055675506591796875, 0.05926513671875, 0.06285476684570312, 0.06644439697265625, 0.07003402709960938, 0.0736236572265625, 0.07721328735351562, 0.08080291748046875, 0.08439254760742188, 0.087982177734375, 0.09157180786132812, 0.09516143798828125, 0.09875106811523438, 0.1023406982421875, 0.10593032836914062, 0.10951995849609375, 0.11310958862304688, 0.11669921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 1.0, 9.0, 5.0, 10.0, 14.0, 13.0, 10.0, 27.0, 17.0, 17.0, 33.0, 31.0, 34.0, 31.0, 51.0, 43.0, 41.0, 39.0, 48.0, 54.0, 57.0, 40.0, 38.0, 46.0, 36.0, 31.0, 31.0, 32.0, 29.0, 27.0, 22.0, 11.0, 16.0, 14.0, 9.0, 13.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10076904296875, -0.09743690490722656, -0.09410476684570312, -0.09077262878417969, -0.08744049072265625, -0.08410835266113281, -0.08077621459960938, -0.07744407653808594, -0.0741119384765625, -0.07077980041503906, -0.06744766235351562, -0.06411552429199219, -0.06078338623046875, -0.05745124816894531, -0.054119110107421875, -0.05078697204589844, -0.047454833984375, -0.04412269592285156, -0.040790557861328125, -0.03745841979980469, -0.03412628173828125, -0.030794143676757812, -0.027462005615234375, -0.024129867553710938, -0.0207977294921875, -0.017465591430664062, -0.014133453369140625, -0.010801315307617188, -0.00746917724609375, -0.0041370391845703125, -0.000804901123046875, 0.0025272369384765625, 0.005859375, 0.009191513061523438, 0.012523651123046875, 0.015855789184570312, 0.01918792724609375, 0.022520065307617188, 0.025852203369140625, 0.029184341430664062, 0.0325164794921875, 0.03584861755371094, 0.039180755615234375, 0.04251289367675781, 0.04584503173828125, 0.04917716979980469, 0.052509307861328125, 0.05584144592285156, 0.059173583984375, 0.06250572204589844, 0.06583786010742188, 0.06916999816894531, 0.07250213623046875, 0.07583427429199219, 0.07916641235351562, 0.08249855041503906, 0.0858306884765625, 0.08916282653808594, 0.09249496459960938, 0.09582710266113281, 0.09915924072265625, 0.10249137878417969, 0.10582351684570312, 0.10915565490722656, 0.11248779296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 5.0, 9.0, 24.0, 10.0, 25.0, 34.0, 56.0, 86.0, 118.0, 170.0, 256.0, 331.0, 507.0, 799.0, 1234.0, 1895.0, 3092.0, 5274.0, 8818.0, 15653.0, 28894.0, 53460.0, 99081.0, 163353.0, 208146.0, 184972.0, 121261.0, 67818.0, 36169.0, 19701.0, 10901.0, 6196.0, 3748.0, 2193.0, 1491.0, 905.0, 575.0, 399.0, 254.0, 175.0, 137.0, 107.0, 56.0, 52.0, 35.0, 21.0, 19.0, 14.0, 9.0, 6.0, 2.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.029052734375, -0.02813577651977539, -0.02721881866455078, -0.026301860809326172, -0.025384902954101562, -0.024467945098876953, -0.023550987243652344, -0.022634029388427734, -0.021717071533203125, -0.020800113677978516, -0.019883155822753906, -0.018966197967529297, -0.018049240112304688, -0.017132282257080078, -0.01621532440185547, -0.01529836654663086, -0.01438140869140625, -0.01346445083618164, -0.012547492980957031, -0.011630535125732422, -0.010713577270507812, -0.009796619415283203, -0.008879661560058594, -0.007962703704833984, -0.007045745849609375, -0.006128787994384766, -0.005211830139160156, -0.004294872283935547, -0.0033779144287109375, -0.002460956573486328, -0.0015439987182617188, -0.0006270408630371094, 0.0002899169921875, 0.0012068748474121094, 0.0021238327026367188, 0.003040790557861328, 0.0039577484130859375, 0.004874706268310547, 0.005791664123535156, 0.006708621978759766, 0.007625579833984375, 0.008542537689208984, 0.009459495544433594, 0.010376453399658203, 0.011293411254882812, 0.012210369110107422, 0.013127326965332031, 0.01404428482055664, 0.01496124267578125, 0.01587820053100586, 0.01679515838623047, 0.017712116241455078, 0.018629074096679688, 0.019546031951904297, 0.020462989807128906, 0.021379947662353516, 0.022296905517578125, 0.023213863372802734, 0.024130821228027344, 0.025047779083251953, 0.025964736938476562, 0.026881694793701172, 0.02779865264892578, 0.02871561050415039, 0.029632568359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 6.0, 10.0, 4.0, 7.0, 15.0, 14.0, 11.0, 7.0, 16.0, 15.0, 25.0, 27.0, 24.0, 17.0, 31.0, 32.0, 31.0, 32.0, 50.0, 58.0, 38.0, 57.0, 52.0, 48.0, 45.0, 47.0, 42.0, 29.0, 35.0, 31.0, 27.0, 15.0, 21.0, 18.0, 17.0, 10.0, 10.0, 3.0, 4.0, 6.0, 9.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.4483928680419922e-05, -1.4083459973335266e-05, -1.368299126625061e-05, -1.3282522559165955e-05, -1.2882053852081299e-05, -1.2481585144996643e-05, -1.2081116437911987e-05, -1.1680647730827332e-05, -1.1280179023742676e-05, -1.087971031665802e-05, -1.0479241609573364e-05, -1.0078772902488708e-05, -9.678304195404053e-06, -9.277835488319397e-06, -8.877366781234741e-06, -8.476898074150085e-06, -8.07642936706543e-06, -7.675960659980774e-06, -7.275491952896118e-06, -6.875023245811462e-06, -6.474554538726807e-06, -6.074085831642151e-06, -5.673617124557495e-06, -5.273148417472839e-06, -4.872679710388184e-06, -4.472211003303528e-06, -4.071742296218872e-06, -3.6712735891342163e-06, -3.2708048820495605e-06, -2.8703361749649048e-06, -2.469867467880249e-06, -2.0693987607955933e-06, -1.6689300537109375e-06, -1.2684613466262817e-06, -8.67992639541626e-07, -4.675239324569702e-07, -6.705522537231445e-08, 3.334134817123413e-07, 7.338821887969971e-07, 1.1343508958816528e-06, 1.5348196029663086e-06, 1.9352883100509644e-06, 2.33575701713562e-06, 2.736225724220276e-06, 3.1366944313049316e-06, 3.5371631383895874e-06, 3.937631845474243e-06, 4.338100552558899e-06, 4.738569259643555e-06, 5.1390379667282104e-06, 5.539506673812866e-06, 5.939975380897522e-06, 6.340444087982178e-06, 6.7409127950668335e-06, 7.141381502151489e-06, 7.541850209236145e-06, 7.9423189163208e-06, 8.342787623405457e-06, 8.743256330490112e-06, 9.143725037574768e-06, 9.544193744659424e-06, 9.94466245174408e-06, 1.0345131158828735e-05, 1.0745599865913391e-05, 1.1146068572998047e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 8.0, 8.0, 9.0, 19.0, 27.0, 29.0, 43.0, 72.0, 91.0, 122.0, 182.0, 325.0, 530.0, 799.0, 1443.0, 2648.0, 4917.0, 9754.0, 21323.0, 53518.0, 145531.0, 313570.0, 287651.0, 123409.0, 45422.0, 18383.0, 8466.0, 4446.0, 2325.0, 1281.0, 828.0, 488.0, 296.0, 205.0, 115.0, 79.0, 48.0, 33.0, 19.0, 31.0, 9.0, 14.0, 8.0, 12.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.04595947265625, -0.04460430145263672, -0.04324913024902344, -0.041893959045410156, -0.040538787841796875, -0.039183616638183594, -0.03782844543457031, -0.03647327423095703, -0.03511810302734375, -0.03376293182373047, -0.03240776062011719, -0.031052589416503906, -0.029697418212890625, -0.028342247009277344, -0.026987075805664062, -0.02563190460205078, -0.0242767333984375, -0.02292156219482422, -0.021566390991210938, -0.020211219787597656, -0.018856048583984375, -0.017500877380371094, -0.016145706176757812, -0.014790534973144531, -0.01343536376953125, -0.012080192565917969, -0.010725021362304688, -0.009369850158691406, -0.008014678955078125, -0.006659507751464844, -0.0053043365478515625, -0.003949165344238281, -0.002593994140625, -0.0012388229370117188, 0.0001163482666015625, 0.0014715194702148438, 0.002826690673828125, 0.004181861877441406, 0.0055370330810546875, 0.006892204284667969, 0.00824737548828125, 0.009602546691894531, 0.010957717895507812, 0.012312889099121094, 0.013668060302734375, 0.015023231506347656, 0.016378402709960938, 0.01773357391357422, 0.0190887451171875, 0.02044391632080078, 0.021799087524414062, 0.023154258728027344, 0.024509429931640625, 0.025864601135253906, 0.027219772338867188, 0.02857494354248047, 0.02993011474609375, 0.03128528594970703, 0.03264045715332031, 0.033995628356933594, 0.035350799560546875, 0.036705970764160156, 0.03806114196777344, 0.03941631317138672, 0.040771484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 13.0, 9.0, 16.0, 15.0, 33.0, 39.0, 35.0, 65.0, 69.0, 83.0, 112.0, 108.0, 81.0, 68.0, 73.0, 39.0, 39.0, 27.0, 18.0, 16.0, 13.0, 5.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.048309326171875, -0.047008514404296875, -0.04570770263671875, -0.044406890869140625, -0.0431060791015625, -0.041805267333984375, -0.04050445556640625, -0.039203643798828125, -0.03790283203125, -0.036602020263671875, -0.03530120849609375, -0.034000396728515625, -0.0326995849609375, -0.031398773193359375, -0.03009796142578125, -0.028797149658203125, -0.027496337890625, -0.026195526123046875, -0.02489471435546875, -0.023593902587890625, -0.0222930908203125, -0.020992279052734375, -0.01969146728515625, -0.018390655517578125, -0.01708984375, -0.015789031982421875, -0.01448822021484375, -0.013187408447265625, -0.0118865966796875, -0.010585784912109375, -0.00928497314453125, -0.007984161376953125, -0.006683349609375, -0.005382537841796875, -0.00408172607421875, -0.002780914306640625, -0.0014801025390625, -0.000179290771484375, 0.00112152099609375, 0.002422332763671875, 0.00372314453125, 0.005023956298828125, 0.00632476806640625, 0.007625579833984375, 0.0089263916015625, 0.010227203369140625, 0.01152801513671875, 0.012828826904296875, 0.014129638671875, 0.015430450439453125, 0.01673126220703125, 0.018032073974609375, 0.0193328857421875, 0.020633697509765625, 0.02193450927734375, 0.023235321044921875, 0.0245361328125, 0.025836944580078125, 0.02713775634765625, 0.028438568115234375, 0.0297393798828125, 0.031040191650390625, 0.03234100341796875, 0.033641815185546875, 0.034942626953125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 9.0, 8.0, 8.0, 11.0, 18.0, 24.0, 31.0, 34.0, 40.0, 57.0, 64.0, 69.0, 69.0, 88.0, 84.0, 69.0, 66.0, 51.0, 41.0, 29.0, 36.0, 24.0, 16.0, 19.0, 14.0, 8.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.41167014837265015, -0.3999342918395996, -0.38819846510887146, -0.3764626085758209, -0.3647267818450928, -0.35299092531204224, -0.3412550687789917, -0.32951924204826355, -0.3177834153175354, -0.30604755878448486, -0.2943117320537567, -0.2825758755207062, -0.270840048789978, -0.2591041922569275, -0.24736835062503815, -0.2356325089931488, -0.22389665246009827, -0.21216081082820892, -0.20042496919631958, -0.18868911266326904, -0.1769532859325409, -0.16521742939949036, -0.153481587767601, -0.14174574613571167, -0.13000990450382233, -0.11827406287193298, -0.10653822124004364, -0.0948023721575737, -0.08306653052568436, -0.07133068889379501, -0.05959483981132507, -0.04785899817943573, -0.03612315654754639, -0.024387313053011894, -0.012651469558477402, -0.00091562420129776, 0.010820217430591583, 0.022556059062480927, 0.03429190814495087, 0.04602774977684021, 0.05776359140872955, 0.0694994330406189, 0.08123527467250824, 0.09297112375497818, 0.10470696538686752, 0.11644280701875687, 0.1281786561012268, 0.13991449773311615, 0.1516503393650055, 0.16338618099689484, 0.17512202262878418, 0.18685787916183472, 0.19859370589256287, 0.2103295624256134, 0.22206540405750275, 0.2338012456893921, 0.24553708732128143, 0.2572729289531708, 0.2690087854862213, 0.28074461221694946, 0.29248046875, 0.30421629548072815, 0.3159521520137787, 0.32768797874450684, 0.3394238352775574]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 9.0, 8.0, 8.0, 8.0, 6.0, 14.0, 16.0, 19.0, 15.0, 22.0, 18.0, 25.0, 29.0, 31.0, 30.0, 34.0, 32.0, 49.0, 42.0, 43.0, 35.0, 54.0, 35.0, 47.0, 37.0, 38.0, 45.0, 38.0, 30.0, 21.0, 30.0, 30.0, 12.0, 19.0, 15.0, 12.0, 11.0, 11.0, 3.0, 8.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34467560052871704, -0.334215372800827, -0.323755145072937, -0.3132948875427246, -0.3028346598148346, -0.2923744320869446, -0.2819141745567322, -0.27145394682884216, -0.26099371910095215, -0.25053349137306213, -0.24007324874401093, -0.22961300611495972, -0.2191527783870697, -0.2086925506591797, -0.19823230803012848, -0.18777206540107727, -0.17731183767318726, -0.16685160994529724, -0.15639136731624603, -0.14593112468719482, -0.1354708969593048, -0.1250106692314148, -0.11455042660236359, -0.10409019142389297, -0.09362995624542236, -0.08316972106695175, -0.07270948588848114, -0.06224925071001053, -0.05178901553153992, -0.041328780353069305, -0.030868545174598694, -0.020408309996128082, -0.00994807481765747, 0.0005121603608131409, 0.010972395539283752, 0.021432630717754364, 0.031892865896224976, 0.04235310107469559, 0.0528133362531662, 0.06327357143163681, 0.07373380661010742, 0.08419404178857803, 0.09465427696704865, 0.10511451214551926, 0.11557474732398987, 0.12603497505187988, 0.1364952176809311, 0.1469554603099823, 0.15741568803787231, 0.16787591576576233, 0.17833615839481354, 0.18879640102386475, 0.19925662875175476, 0.20971685647964478, 0.22017709910869598, 0.2306373417377472, 0.2410975694656372, 0.2515577971935272, 0.26201802492141724, 0.27247828245162964, 0.28293851017951965, 0.29339873790740967, 0.30385899543762207, 0.3143192231655121, 0.3247794508934021]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 2.0, 10.0, 11.0, 9.0, 14.0, 15.0, 40.0, 59.0, 73.0, 118.0, 192.0, 332.0, 528.0, 891.0, 1647.0, 2906.0, 5710.0, 11475.0, 24580.0, 58376.0, 167694.0, 621045.0, 1683361.0, 1133477.0, 313124.0, 97331.0, 37352.0, 16524.0, 7879.0, 4149.0, 2226.0, 1294.0, 766.0, 392.0, 248.0, 161.0, 97.0, 51.0, 40.0, 22.0, 19.0, 17.0, 13.0, 6.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05987548828125, -0.05792808532714844, -0.055980682373046875, -0.05403327941894531, -0.05208587646484375, -0.05013847351074219, -0.048191070556640625, -0.04624366760253906, -0.0442962646484375, -0.04234886169433594, -0.040401458740234375, -0.03845405578613281, -0.03650665283203125, -0.03455924987792969, -0.032611846923828125, -0.030664443969726562, -0.028717041015625, -0.026769638061523438, -0.024822235107421875, -0.022874832153320312, -0.02092742919921875, -0.018980026245117188, -0.017032623291015625, -0.015085220336914062, -0.0131378173828125, -0.011190414428710938, -0.009243011474609375, -0.0072956085205078125, -0.00534820556640625, -0.0034008026123046875, -0.001453399658203125, 0.0004940032958984375, 0.00244140625, 0.0043888092041015625, 0.006336212158203125, 0.008283615112304688, 0.01023101806640625, 0.012178421020507812, 0.014125823974609375, 0.016073226928710938, 0.0180206298828125, 0.019968032836914062, 0.021915435791015625, 0.023862838745117188, 0.02581024169921875, 0.027757644653320312, 0.029705047607421875, 0.03165245056152344, 0.033599853515625, 0.03554725646972656, 0.037494659423828125, 0.03944206237792969, 0.04138946533203125, 0.04333686828613281, 0.045284271240234375, 0.04723167419433594, 0.0491790771484375, 0.05112648010253906, 0.053073883056640625, 0.05502128601074219, 0.05696868896484375, 0.05891609191894531, 0.060863494873046875, 0.06281089782714844, 0.06475830078125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 11.0, 3.0, 10.0, 8.0, 13.0, 16.0, 19.0, 26.0, 31.0, 42.0, 28.0, 36.0, 35.0, 33.0, 53.0, 57.0, 38.0, 44.0, 41.0, 45.0, 48.0, 44.0, 36.0, 44.0, 36.0, 30.0, 29.0, 27.0, 24.0, 13.0, 18.0, 11.0, 11.0, 7.0, 8.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0513916015625, -0.04991292953491211, -0.04843425750732422, -0.04695558547973633, -0.04547691345214844, -0.04399824142456055, -0.042519569396972656, -0.041040897369384766, -0.039562225341796875, -0.038083553314208984, -0.036604881286621094, -0.0351262092590332, -0.03364753723144531, -0.03216886520385742, -0.03069019317626953, -0.02921152114868164, -0.02773284912109375, -0.02625417709350586, -0.02477550506591797, -0.023296833038330078, -0.021818161010742188, -0.020339488983154297, -0.018860816955566406, -0.017382144927978516, -0.015903472900390625, -0.014424800872802734, -0.012946128845214844, -0.011467456817626953, -0.009988784790039062, -0.008510112762451172, -0.007031440734863281, -0.005552768707275391, -0.0040740966796875, -0.0025954246520996094, -0.0011167526245117188, 0.0003619194030761719, 0.0018405914306640625, 0.003319263458251953, 0.004797935485839844, 0.006276607513427734, 0.007755279541015625, 0.009233951568603516, 0.010712623596191406, 0.012191295623779297, 0.013669967651367188, 0.015148639678955078, 0.01662731170654297, 0.01810598373413086, 0.01958465576171875, 0.02106332778930664, 0.02254199981689453, 0.024020671844482422, 0.025499343872070312, 0.026978015899658203, 0.028456687927246094, 0.029935359954833984, 0.031414031982421875, 0.032892704010009766, 0.034371376037597656, 0.03585004806518555, 0.03732872009277344, 0.03880739212036133, 0.04028606414794922, 0.04176473617553711, 0.043243408203125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 19.0, 15.0, 31.0, 62.0, 75.0, 122.0, 188.0, 344.0, 691.0, 1335.0, 2809.0, 6705.0, 17524.0, 52284.0, 172968.0, 648075.0, 1999847.0, 942762.0, 239090.0, 70867.0, 23022.0, 8512.0, 3456.0, 1646.0, 775.0, 438.0, 239.0, 142.0, 85.0, 54.0, 35.0, 19.0, 17.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07196044921875, -0.06935596466064453, -0.06675148010253906, -0.0641469955444336, -0.061542510986328125, -0.058938026428222656, -0.05633354187011719, -0.05372905731201172, -0.05112457275390625, -0.04852008819580078, -0.04591560363769531, -0.043311119079589844, -0.040706634521484375, -0.038102149963378906, -0.03549766540527344, -0.03289318084716797, -0.0302886962890625, -0.02768421173095703, -0.025079727172851562, -0.022475242614746094, -0.019870758056640625, -0.017266273498535156, -0.014661788940429688, -0.012057304382324219, -0.00945281982421875, -0.006848335266113281, -0.0042438507080078125, -0.0016393661499023438, 0.000965118408203125, 0.0035696029663085938, 0.0061740875244140625, 0.008778572082519531, 0.011383056640625, 0.013987541198730469, 0.016592025756835938, 0.019196510314941406, 0.021800994873046875, 0.024405479431152344, 0.027009963989257812, 0.02961444854736328, 0.03221893310546875, 0.03482341766357422, 0.03742790222167969, 0.040032386779785156, 0.042636871337890625, 0.045241355895996094, 0.04784584045410156, 0.05045032501220703, 0.0530548095703125, 0.05565929412841797, 0.05826377868652344, 0.060868263244628906, 0.06347274780273438, 0.06607723236083984, 0.06868171691894531, 0.07128620147705078, 0.07389068603515625, 0.07649517059326172, 0.07909965515136719, 0.08170413970947266, 0.08430862426757812, 0.0869131088256836, 0.08951759338378906, 0.09212207794189453, 0.0947265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 9.0, 9.0, 14.0, 17.0, 31.0, 48.0, 54.0, 96.0, 118.0, 189.0, 281.0, 423.0, 582.0, 676.0, 512.0, 350.0, 194.0, 135.0, 109.0, 77.0, 58.0, 27.0, 16.0, 10.0, 11.0, 6.0, 9.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.072021484375, -0.06878471374511719, -0.06554794311523438, -0.06231117248535156, -0.05907440185546875, -0.05583763122558594, -0.052600860595703125, -0.04936408996582031, -0.0461273193359375, -0.04289054870605469, -0.039653778076171875, -0.03641700744628906, -0.03318023681640625, -0.029943466186523438, -0.026706695556640625, -0.023469924926757812, -0.020233154296875, -0.016996383666992188, -0.013759613037109375, -0.010522842407226562, -0.00728607177734375, -0.0040493011474609375, -0.000812530517578125, 0.0024242401123046875, 0.0056610107421875, 0.008897781372070312, 0.012134552001953125, 0.015371322631835938, 0.01860809326171875, 0.021844863891601562, 0.025081634521484375, 0.028318405151367188, 0.03155517578125, 0.03479194641113281, 0.038028717041015625, 0.04126548767089844, 0.04450225830078125, 0.04773902893066406, 0.050975799560546875, 0.05421257019042969, 0.0574493408203125, 0.06068611145019531, 0.06392288208007812, 0.06715965270996094, 0.07039642333984375, 0.07363319396972656, 0.07686996459960938, 0.08010673522949219, 0.083343505859375, 0.08658027648925781, 0.08981704711914062, 0.09305381774902344, 0.09629058837890625, 0.09952735900878906, 0.10276412963867188, 0.10600090026855469, 0.1092376708984375, 0.11247444152832031, 0.11571121215820312, 0.11894798278808594, 0.12218475341796875, 0.12542152404785156, 0.12865829467773438, 0.1318950653076172, 0.1351318359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 12.0, 24.0, 38.0, 56.0, 64.0, 87.0, 140.0, 126.0, 140.0, 114.0, 65.0, 45.0, 30.0, 19.0, 11.0, 12.0, 5.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4022735357284546, -0.38456782698631287, -0.36686211824417114, -0.3491564095020294, -0.3314507007598877, -0.31374502182006836, -0.29603931307792664, -0.2783336043357849, -0.2606278955936432, -0.24292218685150146, -0.22521647810935974, -0.2075107842683792, -0.1898050755262375, -0.17209936678409576, -0.15439367294311523, -0.1366879642009735, -0.11898225545883179, -0.10127654671669006, -0.08357084542512894, -0.06586514413356781, -0.048159435391426086, -0.030453726649284363, -0.012748025357723236, 0.004957675933837891, 0.022663384675979614, 0.04036908969283104, 0.058074794709682465, 0.07578049600124359, 0.09348620474338531, 0.11119191348552704, 0.12889760732650757, 0.1466033160686493, 0.16430902481079102, 0.18201473355293274, 0.19972044229507446, 0.217426136136055, 0.23513184487819672, 0.25283753871917725, 0.27054324746131897, 0.2882489562034607, 0.3059546649456024, 0.32366037368774414, 0.34136608242988586, 0.3590717911720276, 0.3767774701118469, 0.39448320865631104, 0.41218888759613037, 0.4298945963382721, 0.4476003050804138, 0.46530601382255554, 0.48301172256469727, 0.5007174015045166, 0.5184231400489807, 0.5361288189888, 0.5538345575332642, 0.5715402364730835, 0.5892459154129028, 0.6069515943527222, 0.6246573328971863, 0.6423630118370056, 0.6600687503814697, 0.6777744293212891, 0.6954801678657532, 0.7131858468055725, 0.7308915853500366]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 6.0, 7.0, 8.0, 23.0, 12.0, 13.0, 20.0, 21.0, 22.0, 32.0, 28.0, 37.0, 34.0, 29.0, 46.0, 38.0, 44.0, 41.0, 39.0, 40.0, 38.0, 42.0, 40.0, 44.0, 37.0, 35.0, 22.0, 34.0, 12.0, 26.0, 21.0, 21.0, 11.0, 11.0, 18.0, 6.0, 8.0, 10.0, 2.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.28799694776535034, -0.27979883551597595, -0.27160075306892395, -0.26340264081954956, -0.25520452857017517, -0.24700643122196198, -0.23880833387374878, -0.2306102216243744, -0.222412109375, -0.2142140120267868, -0.20601589977741241, -0.19781780242919922, -0.18961969017982483, -0.18142159283161163, -0.17322349548339844, -0.16502538323402405, -0.15682728588581085, -0.14862918853759766, -0.14043107628822327, -0.13223297894001007, -0.12403486669063568, -0.11583676934242249, -0.10763866454362869, -0.0994405597448349, -0.09124245494604111, -0.08304435014724731, -0.07484624534845352, -0.06664814054965973, -0.058450039476156235, -0.05025193467736244, -0.04205383360385895, -0.033855728805065155, -0.025657624006271362, -0.01745951920747757, -0.009261416271328926, -0.0010633133351802826, 0.00713479146361351, 0.015332896262407303, 0.023530997335910797, 0.03172910213470459, 0.03992720693349838, 0.048125311732292175, 0.05632341653108597, 0.06452152132987976, 0.07271961867809296, 0.08091773092746735, 0.08911582827568054, 0.09731393307447433, 0.10551203787326813, 0.11371014267206192, 0.12190824747085571, 0.1301063448190689, 0.1383044570684433, 0.1465025544166565, 0.15470066666603088, 0.16289876401424408, 0.17109686136245728, 0.17929495871067047, 0.18749307096004486, 0.19569116830825806, 0.20388928055763245, 0.21208737790584564, 0.22028547525405884, 0.22848358750343323, 0.23668169975280762]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 11.0, 13.0, 29.0, 36.0, 45.0, 102.0, 139.0, 217.0, 360.0, 688.0, 1176.0, 2040.0, 3972.0, 7334.0, 13932.0, 26706.0, 50431.0, 95767.0, 173658.0, 243074.0, 194441.0, 110266.0, 58678.0, 30927.0, 16049.0, 8476.0, 4464.0, 2421.0, 1256.0, 749.0, 420.0, 262.0, 142.0, 101.0, 55.0, 39.0, 22.0, 20.0, 10.0, 7.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09698486328125, -0.09381675720214844, -0.09064865112304688, -0.08748054504394531, -0.08431243896484375, -0.08114433288574219, -0.07797622680664062, -0.07480812072753906, -0.0716400146484375, -0.06847190856933594, -0.06530380249023438, -0.06213569641113281, -0.05896759033203125, -0.05579948425292969, -0.052631378173828125, -0.04946327209472656, -0.046295166015625, -0.04312705993652344, -0.039958953857421875, -0.03679084777832031, -0.03362274169921875, -0.030454635620117188, -0.027286529541015625, -0.024118423461914062, -0.0209503173828125, -0.017782211303710938, -0.014614105224609375, -0.011445999145507812, -0.00827789306640625, -0.0051097869873046875, -0.001941680908203125, 0.0012264251708984375, 0.00439453125, 0.0075626373291015625, 0.010730743408203125, 0.013898849487304688, 0.01706695556640625, 0.020235061645507812, 0.023403167724609375, 0.026571273803710938, 0.0297393798828125, 0.03290748596191406, 0.036075592041015625, 0.03924369812011719, 0.04241180419921875, 0.04557991027832031, 0.048748016357421875, 0.05191612243652344, 0.055084228515625, 0.05825233459472656, 0.061420440673828125, 0.06458854675292969, 0.06775665283203125, 0.07092475891113281, 0.07409286499023438, 0.07726097106933594, 0.0804290771484375, 0.08359718322753906, 0.08676528930664062, 0.08993339538574219, 0.09310150146484375, 0.09626960754394531, 0.09943771362304688, 0.10260581970214844, 0.10577392578125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 3.0, 8.0, 6.0, 9.0, 13.0, 17.0, 19.0, 24.0, 21.0, 23.0, 26.0, 38.0, 39.0, 48.0, 44.0, 33.0, 30.0, 43.0, 45.0, 33.0, 46.0, 39.0, 36.0, 38.0, 36.0, 35.0, 35.0, 33.0, 25.0, 23.0, 17.0, 17.0, 16.0, 8.0, 9.0, 9.0, 15.0, 5.0, 8.0, 4.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.04510498046875, -0.043860435485839844, -0.04261589050292969, -0.04137134552001953, -0.040126800537109375, -0.03888225555419922, -0.03763771057128906, -0.036393165588378906, -0.03514862060546875, -0.033904075622558594, -0.03265953063964844, -0.03141498565673828, -0.030170440673828125, -0.02892589569091797, -0.027681350708007812, -0.026436805725097656, -0.0251922607421875, -0.023947715759277344, -0.022703170776367188, -0.02145862579345703, -0.020214080810546875, -0.01896953582763672, -0.017724990844726562, -0.016480445861816406, -0.01523590087890625, -0.013991355895996094, -0.012746810913085938, -0.011502265930175781, -0.010257720947265625, -0.009013175964355469, -0.0077686309814453125, -0.006524085998535156, -0.005279541015625, -0.004034996032714844, -0.0027904510498046875, -0.0015459060668945312, -0.000301361083984375, 0.0009431838989257812, 0.0021877288818359375, 0.0034322738647460938, 0.00467681884765625, 0.005921363830566406, 0.0071659088134765625, 0.008410453796386719, 0.009654998779296875, 0.010899543762207031, 0.012144088745117188, 0.013388633728027344, 0.0146331787109375, 0.015877723693847656, 0.017122268676757812, 0.01836681365966797, 0.019611358642578125, 0.02085590362548828, 0.022100448608398438, 0.023344993591308594, 0.02458953857421875, 0.025834083557128906, 0.027078628540039062, 0.02832317352294922, 0.029567718505859375, 0.03081226348876953, 0.03205680847167969, 0.033301353454589844, 0.0345458984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 7.0, 10.0, 11.0, 13.0, 20.0, 21.0, 34.0, 46.0, 56.0, 92.0, 128.0, 195.0, 294.0, 591.0, 1243.0, 3085.0, 8199.0, 24323.0, 69404.0, 177560.0, 328375.0, 258385.0, 112382.0, 41053.0, 14185.0, 5007.0, 1928.0, 790.0, 378.0, 222.0, 180.0, 99.0, 71.0, 43.0, 43.0, 24.0, 13.0, 18.0, 10.0, 10.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.146728515625, -0.1426239013671875, -0.138519287109375, -0.1344146728515625, -0.13031005859375, -0.1262054443359375, -0.122100830078125, -0.1179962158203125, -0.1138916015625, -0.1097869873046875, -0.105682373046875, -0.1015777587890625, -0.09747314453125, -0.0933685302734375, -0.089263916015625, -0.0851593017578125, -0.0810546875, -0.0769500732421875, -0.072845458984375, -0.0687408447265625, -0.06463623046875, -0.0605316162109375, -0.056427001953125, -0.0523223876953125, -0.0482177734375, -0.0441131591796875, -0.040008544921875, -0.0359039306640625, -0.03179931640625, -0.0276947021484375, -0.023590087890625, -0.0194854736328125, -0.015380859375, -0.0112762451171875, -0.007171630859375, -0.0030670166015625, 0.00103759765625, 0.0051422119140625, 0.009246826171875, 0.0133514404296875, 0.0174560546875, 0.0215606689453125, 0.025665283203125, 0.0297698974609375, 0.03387451171875, 0.0379791259765625, 0.042083740234375, 0.0461883544921875, 0.05029296875, 0.0543975830078125, 0.058502197265625, 0.0626068115234375, 0.06671142578125, 0.0708160400390625, 0.074920654296875, 0.0790252685546875, 0.0831298828125, 0.0872344970703125, 0.091339111328125, 0.0954437255859375, 0.09954833984375, 0.1036529541015625, 0.107757568359375, 0.1118621826171875, 0.115966796875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 7.0, 9.0, 5.0, 5.0, 5.0, 9.0, 13.0, 13.0, 17.0, 15.0, 18.0, 21.0, 24.0, 31.0, 31.0, 33.0, 32.0, 31.0, 47.0, 40.0, 54.0, 47.0, 30.0, 43.0, 30.0, 49.0, 28.0, 35.0, 31.0, 28.0, 39.0, 23.0, 24.0, 14.0, 23.0, 20.0, 19.0, 14.0, 11.0, 13.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.10986328125, -0.1063222885131836, -0.10278129577636719, -0.09924030303955078, -0.09569931030273438, -0.09215831756591797, -0.08861732482910156, -0.08507633209228516, -0.08153533935546875, -0.07799434661865234, -0.07445335388183594, -0.07091236114501953, -0.06737136840820312, -0.06383037567138672, -0.06028938293457031, -0.056748390197753906, -0.0532073974609375, -0.049666404724121094, -0.04612541198730469, -0.04258441925048828, -0.039043426513671875, -0.03550243377685547, -0.03196144104003906, -0.028420448303222656, -0.02487945556640625, -0.021338462829589844, -0.017797470092773438, -0.014256477355957031, -0.010715484619140625, -0.007174491882324219, -0.0036334991455078125, -9.250640869140625e-05, 0.003448486328125, 0.006989479064941406, 0.010530471801757812, 0.014071464538574219, 0.017612457275390625, 0.02115345001220703, 0.024694442749023438, 0.028235435485839844, 0.03177642822265625, 0.035317420959472656, 0.03885841369628906, 0.04239940643310547, 0.045940399169921875, 0.04948139190673828, 0.05302238464355469, 0.056563377380371094, 0.0601043701171875, 0.0636453628540039, 0.06718635559082031, 0.07072734832763672, 0.07426834106445312, 0.07780933380126953, 0.08135032653808594, 0.08489131927490234, 0.08843231201171875, 0.09197330474853516, 0.09551429748535156, 0.09905529022216797, 0.10259628295898438, 0.10613727569580078, 0.10967826843261719, 0.1132192611694336, 0.11676025390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 8.0, 12.0, 11.0, 16.0, 38.0, 39.0, 65.0, 102.0, 151.0, 276.0, 425.0, 707.0, 1307.0, 2226.0, 4165.0, 7480.0, 13232.0, 23322.0, 41841.0, 79864.0, 160318.0, 250398.0, 215385.0, 115722.0, 58322.0, 31782.0, 18035.0, 10192.0, 5897.0, 3039.0, 1742.0, 1006.0, 536.0, 325.0, 195.0, 135.0, 63.0, 51.0, 40.0, 26.0, 17.0, 10.0, 11.0, 9.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03326416015625, -0.03224897384643555, -0.031233787536621094, -0.03021860122680664, -0.029203414916992188, -0.028188228607177734, -0.02717304229736328, -0.026157855987548828, -0.025142669677734375, -0.024127483367919922, -0.02311229705810547, -0.022097110748291016, -0.021081924438476562, -0.02006673812866211, -0.019051551818847656, -0.018036365509033203, -0.01702117919921875, -0.016005992889404297, -0.014990806579589844, -0.01397562026977539, -0.012960433959960938, -0.011945247650146484, -0.010930061340332031, -0.009914875030517578, -0.008899688720703125, -0.007884502410888672, -0.006869316101074219, -0.005854129791259766, -0.0048389434814453125, -0.0038237571716308594, -0.0028085708618164062, -0.0017933845520019531, -0.0007781982421875, 0.00023698806762695312, 0.0012521743774414062, 0.0022673606872558594, 0.0032825469970703125, 0.004297733306884766, 0.005312919616699219, 0.006328105926513672, 0.007343292236328125, 0.008358478546142578, 0.009373664855957031, 0.010388851165771484, 0.011404037475585938, 0.01241922378540039, 0.013434410095214844, 0.014449596405029297, 0.01546478271484375, 0.016479969024658203, 0.017495155334472656, 0.01851034164428711, 0.019525527954101562, 0.020540714263916016, 0.02155590057373047, 0.022571086883544922, 0.023586273193359375, 0.024601459503173828, 0.02561664581298828, 0.026631832122802734, 0.027647018432617188, 0.02866220474243164, 0.029677391052246094, 0.030692577362060547, 0.031707763671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 1.0, 4.0, 8.0, 15.0, 14.0, 9.0, 15.0, 10.0, 21.0, 28.0, 24.0, 28.0, 37.0, 31.0, 57.0, 46.0, 59.0, 60.0, 70.0, 47.0, 50.0, 46.0, 49.0, 48.0, 33.0, 34.0, 23.0, 21.0, 21.0, 14.0, 14.0, 7.0, 8.0, 4.0, 5.0, 6.0, 7.0, 7.0, 10.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.4483928680419922e-05, -1.4085322618484497e-05, -1.3686716556549072e-05, -1.3288110494613647e-05, -1.2889504432678223e-05, -1.2490898370742798e-05, -1.2092292308807373e-05, -1.1693686246871948e-05, -1.1295080184936523e-05, -1.0896474123001099e-05, -1.0497868061065674e-05, -1.0099261999130249e-05, -9.700655937194824e-06, -9.3020498752594e-06, -8.903443813323975e-06, -8.50483775138855e-06, -8.106231689453125e-06, -7.7076256275177e-06, -7.309019565582275e-06, -6.910413503646851e-06, -6.511807441711426e-06, -6.113201379776001e-06, -5.714595317840576e-06, -5.315989255905151e-06, -4.9173831939697266e-06, -4.518777132034302e-06, -4.120171070098877e-06, -3.721565008163452e-06, -3.3229589462280273e-06, -2.9243528842926025e-06, -2.5257468223571777e-06, -2.127140760421753e-06, -1.7285346984863281e-06, -1.3299286365509033e-06, -9.313225746154785e-07, -5.327165126800537e-07, -1.341104507446289e-07, 2.644956111907959e-07, 6.631016731262207e-07, 1.0617077350616455e-06, 1.4603137969970703e-06, 1.8589198589324951e-06, 2.25752592086792e-06, 2.6561319828033447e-06, 3.0547380447387695e-06, 3.4533441066741943e-06, 3.851950168609619e-06, 4.250556230545044e-06, 4.649162292480469e-06, 5.0477683544158936e-06, 5.446374416351318e-06, 5.844980478286743e-06, 6.243586540222168e-06, 6.642192602157593e-06, 7.040798664093018e-06, 7.439404726028442e-06, 7.838010787963867e-06, 8.236616849899292e-06, 8.635222911834717e-06, 9.033828973770142e-06, 9.432435035705566e-06, 9.831041097640991e-06, 1.0229647159576416e-05, 1.062825322151184e-05, 1.1026859283447266e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 5.0, 12.0, 13.0, 26.0, 31.0, 59.0, 76.0, 121.0, 203.0, 434.0, 787.0, 1627.0, 3577.0, 7978.0, 16426.0, 34010.0, 72999.0, 192305.0, 358457.0, 210199.0, 79408.0, 36289.0, 17507.0, 8337.0, 3947.0, 1818.0, 850.0, 441.0, 215.0, 128.0, 90.0, 48.0, 37.0, 20.0, 13.0, 16.0, 12.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040130615234375, -0.03885841369628906, -0.037586212158203125, -0.03631401062011719, -0.03504180908203125, -0.03376960754394531, -0.032497406005859375, -0.031225204467773438, -0.0299530029296875, -0.028680801391601562, -0.027408599853515625, -0.026136398315429688, -0.02486419677734375, -0.023591995239257812, -0.022319793701171875, -0.021047592163085938, -0.019775390625, -0.018503189086914062, -0.017230987548828125, -0.015958786010742188, -0.01468658447265625, -0.013414382934570312, -0.012142181396484375, -0.010869979858398438, -0.0095977783203125, -0.008325576782226562, -0.007053375244140625, -0.0057811737060546875, -0.00450897216796875, -0.0032367706298828125, -0.001964569091796875, -0.0006923675537109375, 0.000579833984375, 0.0018520355224609375, 0.003124237060546875, 0.0043964385986328125, 0.00566864013671875, 0.0069408416748046875, 0.008213043212890625, 0.009485244750976562, 0.0107574462890625, 0.012029647827148438, 0.013301849365234375, 0.014574050903320312, 0.01584625244140625, 0.017118453979492188, 0.018390655517578125, 0.019662857055664062, 0.02093505859375, 0.022207260131835938, 0.023479461669921875, 0.024751663208007812, 0.02602386474609375, 0.027296066284179688, 0.028568267822265625, 0.029840469360351562, 0.0311126708984375, 0.03238487243652344, 0.033657073974609375, 0.03492927551269531, 0.03620147705078125, 0.03747367858886719, 0.038745880126953125, 0.04001808166503906, 0.041290283203125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 3.0, 0.0, 3.0, 7.0, 5.0, 8.0, 10.0, 16.0, 18.0, 15.0, 21.0, 29.0, 33.0, 27.0, 51.0, 41.0, 50.0, 82.0, 76.0, 62.0, 59.0, 55.0, 49.0, 55.0, 41.0, 34.0, 28.0, 27.0, 23.0, 14.0, 17.0, 10.0, 3.0, 4.0, 8.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03125, -0.03022623062133789, -0.02920246124267578, -0.028178691864013672, -0.027154922485351562, -0.026131153106689453, -0.025107383728027344, -0.024083614349365234, -0.023059844970703125, -0.022036075592041016, -0.021012306213378906, -0.019988536834716797, -0.018964767456054688, -0.017940998077392578, -0.01691722869873047, -0.01589345932006836, -0.01486968994140625, -0.01384592056274414, -0.012822151184082031, -0.011798381805419922, -0.010774612426757812, -0.009750843048095703, -0.008727073669433594, -0.007703304290771484, -0.006679534912109375, -0.005655765533447266, -0.004631996154785156, -0.003608226776123047, -0.0025844573974609375, -0.0015606880187988281, -0.0005369186401367188, 0.0004868507385253906, 0.0015106201171875, 0.0025343894958496094, 0.0035581588745117188, 0.004581928253173828, 0.0056056976318359375, 0.006629467010498047, 0.007653236389160156, 0.008677005767822266, 0.009700775146484375, 0.010724544525146484, 0.011748313903808594, 0.012772083282470703, 0.013795852661132812, 0.014819622039794922, 0.01584339141845703, 0.01686716079711914, 0.01789093017578125, 0.01891469955444336, 0.01993846893310547, 0.020962238311767578, 0.021986007690429688, 0.023009777069091797, 0.024033546447753906, 0.025057315826416016, 0.026081085205078125, 0.027104854583740234, 0.028128623962402344, 0.029152393341064453, 0.030176162719726562, 0.031199932098388672, 0.03222370147705078, 0.03324747085571289, 0.034271240234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 8.0, 8.0, 4.0, 17.0, 17.0, 34.0, 30.0, 60.0, 78.0, 78.0, 87.0, 103.0, 108.0, 90.0, 79.0, 61.0, 42.0, 29.0, 25.0, 15.0, 15.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46429601311683655, -0.4510050415992737, -0.4377140998840332, -0.42442312836647034, -0.41113215684890747, -0.3978411853313446, -0.38455021381378174, -0.37125927209854126, -0.3579683005809784, -0.3446773290634155, -0.33138638734817505, -0.3180954158306122, -0.3048044443130493, -0.29151347279548645, -0.2782225012779236, -0.2649315595626831, -0.25164058804512024, -0.23834961652755737, -0.2250586599111557, -0.21176770329475403, -0.19847673177719116, -0.1851857602596283, -0.17189480364322662, -0.15860384702682495, -0.14531287550926208, -0.13202190399169922, -0.11873094737529755, -0.10543998330831528, -0.09214901924133301, -0.07885805517435074, -0.06556709110736847, -0.0522761270403862, -0.03898513317108154, -0.025694169104099274, -0.012403205037117004, 0.0008877590298652649, 0.014178723096847534, 0.027469687163829803, 0.04076065123081207, 0.05405161529779434, 0.06734257936477661, 0.08063354343175888, 0.09392450749874115, 0.10721547156572342, 0.12050643563270569, 0.13379740715026855, 0.14708836376667023, 0.1603793203830719, 0.17367029190063477, 0.18696126341819763, 0.2002522200345993, 0.21354317665100098, 0.22683414816856384, 0.2401251196861267, 0.2534160614013672, 0.26670703291893005, 0.2799980044364929, 0.2932889759540558, 0.30657994747161865, 0.31987088918685913, 0.333161860704422, 0.34645283222198486, 0.35974377393722534, 0.3730347454547882, 0.3863257169723511]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 6.0, 7.0, 9.0, 5.0, 9.0, 10.0, 7.0, 23.0, 15.0, 20.0, 18.0, 16.0, 21.0, 22.0, 45.0, 36.0, 41.0, 45.0, 37.0, 34.0, 45.0, 43.0, 33.0, 47.0, 51.0, 56.0, 31.0, 32.0, 26.0, 25.0, 21.0, 25.0, 23.0, 14.0, 21.0, 20.0, 10.0, 15.0, 7.0, 7.0, 3.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31429964303970337, -0.30414900183677673, -0.2939983904361725, -0.28384774923324585, -0.2736971378326416, -0.26354649662971497, -0.2533958852291107, -0.24324524402618408, -0.23309463262557983, -0.2229440063238144, -0.21279338002204895, -0.2026427537202835, -0.19249212741851807, -0.18234150111675262, -0.17219087481498718, -0.16204023361206055, -0.1518896073102951, -0.14173898100852966, -0.13158835470676422, -0.12143772840499878, -0.11128710210323334, -0.1011364758014679, -0.09098584204912186, -0.08083521574735641, -0.07068458944559097, -0.06053396314382553, -0.05038333684206009, -0.04023270681500435, -0.030082080513238907, -0.019931454211473465, -0.009780824184417725, 0.0003698021173477173, 0.01052042841911316, 0.0206710547208786, 0.030821682885289192, 0.04097231104969978, 0.051122937351465225, 0.06127356365323067, 0.07142419368028641, 0.08157481998205185, 0.09172544628381729, 0.10187607258558273, 0.11202669888734818, 0.12217733263969421, 0.13232795894145966, 0.1424785852432251, 0.15262921154499054, 0.16277983784675598, 0.17293046414852142, 0.18308109045028687, 0.1932317167520523, 0.20338234305381775, 0.2135329693555832, 0.22368359565734863, 0.23383423686027527, 0.24398484826087952, 0.25413548946380615, 0.2642861306667328, 0.27443674206733704, 0.28458738327026367, 0.2947379946708679, 0.30488863587379456, 0.3150392472743988, 0.32518988847732544, 0.3353404998779297]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 7.0, 7.0, 8.0, 8.0, 10.0, 8.0, 23.0, 26.0, 45.0, 65.0, 120.0, 212.0, 371.0, 590.0, 1057.0, 2203.0, 4762.0, 10672.0, 26765.0, 74117.0, 254300.0, 1088637.0, 1922876.0, 580901.0, 145769.0, 47399.0, 18269.0, 7757.0, 3585.0, 1671.0, 865.0, 490.0, 280.0, 135.0, 96.0, 45.0, 45.0, 21.0, 22.0, 13.0, 10.0, 5.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0701904296875, -0.0677938461303711, -0.06539726257324219, -0.06300067901611328, -0.060604095458984375, -0.05820751190185547, -0.05581092834472656, -0.053414344787597656, -0.05101776123046875, -0.048621177673339844, -0.04622459411621094, -0.04382801055908203, -0.041431427001953125, -0.03903484344482422, -0.03663825988769531, -0.034241676330566406, -0.0318450927734375, -0.029448509216308594, -0.027051925659179688, -0.02465534210205078, -0.022258758544921875, -0.01986217498779297, -0.017465591430664062, -0.015069007873535156, -0.01267242431640625, -0.010275840759277344, -0.007879257202148438, -0.005482673645019531, -0.003086090087890625, -0.0006895065307617188, 0.0017070770263671875, 0.004103660583496094, 0.006500244140625, 0.008896827697753906, 0.011293411254882812, 0.013689994812011719, 0.016086578369140625, 0.01848316192626953, 0.020879745483398438, 0.023276329040527344, 0.02567291259765625, 0.028069496154785156, 0.030466079711914062, 0.03286266326904297, 0.035259246826171875, 0.03765583038330078, 0.04005241394042969, 0.042448997497558594, 0.0448455810546875, 0.047242164611816406, 0.04963874816894531, 0.05203533172607422, 0.054431915283203125, 0.05682849884033203, 0.05922508239746094, 0.061621665954589844, 0.06401824951171875, 0.06641483306884766, 0.06881141662597656, 0.07120800018310547, 0.07360458374023438, 0.07600116729736328, 0.07839775085449219, 0.0807943344116211, 0.08319091796875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 4.0, 11.0, 11.0, 12.0, 12.0, 10.0, 19.0, 20.0, 22.0, 22.0, 23.0, 26.0, 29.0, 40.0, 37.0, 34.0, 37.0, 43.0, 39.0, 47.0, 31.0, 46.0, 39.0, 37.0, 40.0, 30.0, 32.0, 27.0, 30.0, 23.0, 25.0, 20.0, 14.0, 12.0, 13.0, 14.0, 11.0, 14.0, 5.0, 6.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.040435791015625, -0.03916358947753906, -0.037891387939453125, -0.03661918640136719, -0.03534698486328125, -0.03407478332519531, -0.032802581787109375, -0.03153038024902344, -0.0302581787109375, -0.028985977172851562, -0.027713775634765625, -0.026441574096679688, -0.02516937255859375, -0.023897171020507812, -0.022624969482421875, -0.021352767944335938, -0.02008056640625, -0.018808364868164062, -0.017536163330078125, -0.016263961791992188, -0.01499176025390625, -0.013719558715820312, -0.012447357177734375, -0.011175155639648438, -0.0099029541015625, -0.008630752563476562, -0.007358551025390625, -0.0060863494873046875, -0.00481414794921875, -0.0035419464111328125, -0.002269744873046875, -0.0009975433349609375, 0.000274658203125, 0.0015468597412109375, 0.002819061279296875, 0.0040912628173828125, 0.00536346435546875, 0.0066356658935546875, 0.007907867431640625, 0.009180068969726562, 0.0104522705078125, 0.011724472045898438, 0.012996673583984375, 0.014268875122070312, 0.01554107666015625, 0.016813278198242188, 0.018085479736328125, 0.019357681274414062, 0.0206298828125, 0.021902084350585938, 0.023174285888671875, 0.024446487426757812, 0.02571868896484375, 0.026990890502929688, 0.028263092041015625, 0.029535293579101562, 0.0308074951171875, 0.03207969665527344, 0.033351898193359375, 0.03462409973144531, 0.03589630126953125, 0.03716850280761719, 0.038440704345703125, 0.03971290588378906, 0.040985107421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 3.0, 12.0, 14.0, 21.0, 17.0, 39.0, 75.0, 121.0, 174.0, 342.0, 684.0, 1443.0, 3458.0, 9306.0, 28766.0, 100911.0, 402466.0, 1731385.0, 1463225.0, 329133.0, 84492.0, 24454.0, 7921.0, 3066.0, 1350.0, 621.0, 308.0, 175.0, 90.0, 65.0, 35.0, 29.0, 17.0, 15.0, 9.0, 8.0, 5.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.09820556640625, -0.09512996673583984, -0.09205436706542969, -0.08897876739501953, -0.08590316772460938, -0.08282756805419922, -0.07975196838378906, -0.0766763687133789, -0.07360076904296875, -0.0705251693725586, -0.06744956970214844, -0.06437397003173828, -0.061298370361328125, -0.05822277069091797, -0.05514717102050781, -0.052071571350097656, -0.0489959716796875, -0.045920372009277344, -0.04284477233886719, -0.03976917266845703, -0.036693572998046875, -0.03361797332763672, -0.030542373657226562, -0.027466773986816406, -0.02439117431640625, -0.021315574645996094, -0.018239974975585938, -0.015164375305175781, -0.012088775634765625, -0.009013175964355469, -0.0059375762939453125, -0.0028619766235351562, 0.000213623046875, 0.0032892227172851562, 0.0063648223876953125, 0.009440422058105469, 0.012516021728515625, 0.015591621398925781, 0.018667221069335938, 0.021742820739746094, 0.02481842041015625, 0.027894020080566406, 0.030969619750976562, 0.03404521942138672, 0.037120819091796875, 0.04019641876220703, 0.04327201843261719, 0.046347618103027344, 0.0494232177734375, 0.052498817443847656, 0.05557441711425781, 0.05865001678466797, 0.061725616455078125, 0.06480121612548828, 0.06787681579589844, 0.0709524154663086, 0.07402801513671875, 0.0771036148071289, 0.08017921447753906, 0.08325481414794922, 0.08633041381835938, 0.08940601348876953, 0.09248161315917969, 0.09555721282958984, 0.0986328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 9.0, 4.0, 19.0, 22.0, 20.0, 47.0, 57.0, 82.0, 136.0, 197.0, 328.0, 565.0, 686.0, 620.0, 430.0, 281.0, 192.0, 117.0, 88.0, 55.0, 42.0, 25.0, 12.0, 11.0, 6.0, 6.0, 5.0, 5.0, 4.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.16162109375, -0.1579303741455078, -0.15423965454101562, -0.15054893493652344, -0.14685821533203125, -0.14316749572753906, -0.13947677612304688, -0.1357860565185547, -0.1320953369140625, -0.1284046173095703, -0.12471389770507812, -0.12102317810058594, -0.11733245849609375, -0.11364173889160156, -0.10995101928710938, -0.10626029968261719, -0.102569580078125, -0.09887886047363281, -0.09518814086914062, -0.09149742126464844, -0.08780670166015625, -0.08411598205566406, -0.08042526245117188, -0.07673454284667969, -0.0730438232421875, -0.06935310363769531, -0.06566238403320312, -0.06197166442871094, -0.05828094482421875, -0.05459022521972656, -0.050899505615234375, -0.04720878601074219, -0.04351806640625, -0.03982734680175781, -0.036136627197265625, -0.03244590759277344, -0.02875518798828125, -0.025064468383789062, -0.021373748779296875, -0.017683029174804688, -0.0139923095703125, -0.010301589965820312, -0.006610870361328125, -0.0029201507568359375, 0.00077056884765625, 0.0044612884521484375, 0.008152008056640625, 0.011842727661132812, 0.015533447265625, 0.019224166870117188, 0.022914886474609375, 0.026605606079101562, 0.03029632568359375, 0.03398704528808594, 0.037677764892578125, 0.04136848449707031, 0.0450592041015625, 0.04874992370605469, 0.052440643310546875, 0.05613136291503906, 0.05982208251953125, 0.06351280212402344, 0.06720352172851562, 0.07089424133300781, 0.0745849609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 6.0, 21.0, 45.0, 76.0, 110.0, 145.0, 150.0, 158.0, 123.0, 71.0, 51.0, 27.0, 15.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1953783631324768, -0.17190924286842346, -0.1484401375055313, -0.12497102469205856, -0.10150191187858582, -0.07803279906511307, -0.05456368625164032, -0.03109458088874817, -0.007625460624694824, 0.015843652188777924, 0.03931276500225067, 0.06278187781572342, 0.08625099062919617, 0.10972010344266891, 0.13318921625614166, 0.1566583216190338, 0.18012744188308716, 0.2035965621471405, 0.22706566751003265, 0.2505347728729248, 0.27400389313697815, 0.2974730134010315, 0.32094210386276245, 0.3444112241268158, 0.36788034439086914, 0.3913494646549225, 0.41481858491897583, 0.4382876753807068, 0.46175679564476013, 0.4852259159088135, 0.5086950063705444, 0.5321640968322754, 0.5556333065032959, 0.5791023969650269, 0.6025715470314026, 0.6260406374931335, 0.6495097875595093, 0.6729788780212402, 0.6964479684829712, 0.7199170589447021, 0.7433862090110779, 0.7668552994728088, 0.7903244495391846, 0.8137935400009155, 0.8372626304626465, 0.8607317805290222, 0.8842008709907532, 0.9076700210571289, 0.9311391115188599, 0.9546082019805908, 0.9780773520469666, 1.0015465021133423, 1.0250155925750732, 1.0484846830368042, 1.0719537734985352, 1.0954228639602661, 1.118891954421997, 1.142361044883728, 1.165830135345459, 1.1892993450164795, 1.2127684354782104, 1.2362375259399414, 1.2597066164016724, 1.2831757068634033, 1.3066449165344238]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 8.0, 14.0, 10.0, 10.0, 18.0, 10.0, 17.0, 27.0, 26.0, 30.0, 32.0, 42.0, 39.0, 24.0, 25.0, 45.0, 37.0, 47.0, 37.0, 50.0, 45.0, 40.0, 44.0, 32.0, 38.0, 37.0, 24.0, 26.0, 28.0, 22.0, 21.0, 16.0, 15.0, 12.0, 12.0, 9.0, 12.0, 2.0, 4.0, 5.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3129574656486511, -0.3040841519832611, -0.2952108383178711, -0.2863375246524811, -0.27746421098709106, -0.26859086751937866, -0.25971755385398865, -0.25084424018859863, -0.24197092652320862, -0.2330976128578186, -0.2242242991924286, -0.21535097062587738, -0.20647765696048737, -0.19760434329509735, -0.18873101472854614, -0.17985770106315613, -0.1709843873977661, -0.1621110737323761, -0.15323776006698608, -0.14436443150043488, -0.13549111783504486, -0.12661780416965485, -0.11774448305368423, -0.10887116193771362, -0.09999784827232361, -0.0911245346069336, -0.08225121349096298, -0.07337789237499237, -0.06450457870960236, -0.05563126131892204, -0.04675794392824173, -0.03788462653756142, -0.029011309146881104, -0.02013799175620079, -0.011264674365520477, -0.002391356974840164, 0.006481960415840149, 0.015355277806520462, 0.024228595197200775, 0.03310191258788109, 0.0419752299785614, 0.050848547369241714, 0.05972186475992203, 0.06859518587589264, 0.07746849954128265, 0.08634181320667267, 0.09521513432264328, 0.10408845543861389, 0.1129617691040039, 0.12183508276939392, 0.13070839643478394, 0.13958172500133514, 0.14845503866672516, 0.15732835233211517, 0.16620168089866638, 0.1750749945640564, 0.1839483082294464, 0.19282162189483643, 0.20169493556022644, 0.21056826412677765, 0.21944157779216766, 0.22831489145755768, 0.2371882200241089, 0.2460615336894989, 0.2549348473548889]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 9.0, 22.0, 49.0, 76.0, 114.0, 209.0, 378.0, 701.0, 1379.0, 2698.0, 5333.0, 10707.0, 21220.0, 40409.0, 74818.0, 128446.0, 202851.0, 219333.0, 150020.0, 88712.0, 48797.0, 25523.0, 13239.0, 6505.0, 3349.0, 1727.0, 838.0, 459.0, 265.0, 132.0, 79.0, 62.0, 28.0, 28.0, 10.0, 10.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1212158203125, -0.117767333984375, -0.11431884765625, -0.110870361328125, -0.107421875, -0.103973388671875, -0.10052490234375, -0.097076416015625, -0.0936279296875, -0.090179443359375, -0.08673095703125, -0.083282470703125, -0.079833984375, -0.076385498046875, -0.07293701171875, -0.069488525390625, -0.0660400390625, -0.062591552734375, -0.05914306640625, -0.055694580078125, -0.05224609375, -0.048797607421875, -0.04534912109375, -0.041900634765625, -0.0384521484375, -0.035003662109375, -0.03155517578125, -0.028106689453125, -0.024658203125, -0.021209716796875, -0.01776123046875, -0.014312744140625, -0.0108642578125, -0.007415771484375, -0.00396728515625, -0.000518798828125, 0.0029296875, 0.006378173828125, 0.00982666015625, 0.013275146484375, 0.0167236328125, 0.020172119140625, 0.02362060546875, 0.027069091796875, 0.030517578125, 0.033966064453125, 0.03741455078125, 0.040863037109375, 0.0443115234375, 0.047760009765625, 0.05120849609375, 0.054656982421875, 0.05810546875, 0.061553955078125, 0.06500244140625, 0.068450927734375, 0.0718994140625, 0.075347900390625, 0.07879638671875, 0.082244873046875, 0.085693359375, 0.089141845703125, 0.09259033203125, 0.096038818359375, 0.0994873046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 9.0, 7.0, 9.0, 9.0, 6.0, 6.0, 16.0, 16.0, 13.0, 28.0, 25.0, 22.0, 29.0, 32.0, 30.0, 34.0, 32.0, 36.0, 44.0, 42.0, 49.0, 35.0, 39.0, 38.0, 43.0, 35.0, 26.0, 26.0, 31.0, 31.0, 25.0, 27.0, 16.0, 20.0, 16.0, 19.0, 15.0, 9.0, 12.0, 9.0, 4.0, 9.0, 5.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0396728515625, -0.038448333740234375, -0.03722381591796875, -0.035999298095703125, -0.0347747802734375, -0.033550262451171875, -0.03232574462890625, -0.031101226806640625, -0.029876708984375, -0.028652191162109375, -0.02742767333984375, -0.026203155517578125, -0.0249786376953125, -0.023754119873046875, -0.02252960205078125, -0.021305084228515625, -0.02008056640625, -0.018856048583984375, -0.01763153076171875, -0.016407012939453125, -0.0151824951171875, -0.013957977294921875, -0.01273345947265625, -0.011508941650390625, -0.010284423828125, -0.009059906005859375, -0.00783538818359375, -0.006610870361328125, -0.0053863525390625, -0.004161834716796875, -0.00293731689453125, -0.001712799072265625, -0.00048828125, 0.000736236572265625, 0.00196075439453125, 0.003185272216796875, 0.0044097900390625, 0.005634307861328125, 0.00685882568359375, 0.008083343505859375, 0.009307861328125, 0.010532379150390625, 0.01175689697265625, 0.012981414794921875, 0.0142059326171875, 0.015430450439453125, 0.01665496826171875, 0.017879486083984375, 0.01910400390625, 0.020328521728515625, 0.02155303955078125, 0.022777557373046875, 0.0240020751953125, 0.025226593017578125, 0.02645111083984375, 0.027675628662109375, 0.028900146484375, 0.030124664306640625, 0.03134918212890625, 0.032573699951171875, 0.0337982177734375, 0.035022735595703125, 0.03624725341796875, 0.037471771240234375, 0.0386962890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 15.0, 13.0, 32.0, 34.0, 69.0, 62.0, 109.0, 247.0, 414.0, 992.0, 2137.0, 5097.0, 13209.0, 33592.0, 83273.0, 181134.0, 290227.0, 235657.0, 119073.0, 50106.0, 19632.0, 7631.0, 3083.0, 1278.0, 612.0, 336.0, 173.0, 87.0, 75.0, 44.0, 25.0, 17.0, 19.0, 12.0, 7.0, 8.0, 6.0, 4.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.11360645294189453, -0.10935401916503906, -0.1051015853881836, -0.10084915161132812, -0.09659671783447266, -0.09234428405761719, -0.08809185028076172, -0.08383941650390625, -0.07958698272705078, -0.07533454895019531, -0.07108211517333984, -0.06682968139648438, -0.0625772476196289, -0.05832481384277344, -0.05407238006591797, -0.0498199462890625, -0.04556751251220703, -0.04131507873535156, -0.037062644958496094, -0.032810211181640625, -0.028557777404785156, -0.024305343627929688, -0.02005290985107422, -0.01580047607421875, -0.011548042297363281, -0.0072956085205078125, -0.0030431747436523438, 0.001209259033203125, 0.005461692810058594, 0.009714126586914062, 0.013966560363769531, 0.018218994140625, 0.02247142791748047, 0.026723861694335938, 0.030976295471191406, 0.035228729248046875, 0.039481163024902344, 0.04373359680175781, 0.04798603057861328, 0.05223846435546875, 0.05649089813232422, 0.06074333190917969, 0.06499576568603516, 0.06924819946289062, 0.0735006332397461, 0.07775306701660156, 0.08200550079345703, 0.0862579345703125, 0.09051036834716797, 0.09476280212402344, 0.0990152359008789, 0.10326766967773438, 0.10752010345458984, 0.11177253723144531, 0.11602497100830078, 0.12027740478515625, 0.12452983856201172, 0.1287822723388672, 0.13303470611572266, 0.13728713989257812, 0.1415395736694336, 0.14579200744628906, 0.15004444122314453, 0.154296875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 3.0, 3.0, 5.0, 12.0, 7.0, 9.0, 8.0, 8.0, 17.0, 7.0, 22.0, 21.0, 28.0, 31.0, 15.0, 35.0, 28.0, 30.0, 34.0, 35.0, 33.0, 40.0, 40.0, 41.0, 45.0, 29.0, 40.0, 30.0, 39.0, 32.0, 29.0, 20.0, 28.0, 23.0, 23.0, 25.0, 10.0, 15.0, 19.0, 13.0, 15.0, 13.0, 8.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.11669921875, -0.11330318450927734, -0.10990715026855469, -0.10651111602783203, -0.10311508178710938, -0.09971904754638672, -0.09632301330566406, -0.0929269790649414, -0.08953094482421875, -0.0861349105834961, -0.08273887634277344, -0.07934284210205078, -0.07594680786132812, -0.07255077362060547, -0.06915473937988281, -0.06575870513916016, -0.0623626708984375, -0.058966636657714844, -0.05557060241699219, -0.05217456817626953, -0.048778533935546875, -0.04538249969482422, -0.04198646545410156, -0.038590431213378906, -0.03519439697265625, -0.031798362731933594, -0.028402328491210938, -0.02500629425048828, -0.021610260009765625, -0.01821422576904297, -0.014818191528320312, -0.011422157287597656, -0.008026123046875, -0.004630088806152344, -0.0012340545654296875, 0.0021619796752929688, 0.005558013916015625, 0.008954048156738281, 0.012350082397460938, 0.015746116638183594, 0.01914215087890625, 0.022538185119628906, 0.025934219360351562, 0.02933025360107422, 0.032726287841796875, 0.03612232208251953, 0.03951835632324219, 0.042914390563964844, 0.0463104248046875, 0.049706459045410156, 0.05310249328613281, 0.05649852752685547, 0.059894561767578125, 0.06329059600830078, 0.06668663024902344, 0.0700826644897461, 0.07347869873046875, 0.0768747329711914, 0.08027076721191406, 0.08366680145263672, 0.08706283569335938, 0.09045886993408203, 0.09385490417480469, 0.09725093841552734, 0.10064697265625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 9.0, 3.0, 7.0, 14.0, 25.0, 27.0, 56.0, 81.0, 113.0, 211.0, 288.0, 519.0, 833.0, 1431.0, 2309.0, 3974.0, 6850.0, 11683.0, 19936.0, 33424.0, 55713.0, 89419.0, 133188.0, 172014.0, 170141.0, 129450.0, 85641.0, 53309.0, 31797.0, 19184.0, 10995.0, 6457.0, 3801.0, 2250.0, 1344.0, 812.0, 467.0, 274.0, 192.0, 109.0, 73.0, 45.0, 30.0, 20.0, 12.0, 8.0, 5.0, 10.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0302581787109375, -0.029340028762817383, -0.028421878814697266, -0.02750372886657715, -0.02658557891845703, -0.025667428970336914, -0.024749279022216797, -0.02383112907409668, -0.022912979125976562, -0.021994829177856445, -0.021076679229736328, -0.02015852928161621, -0.019240379333496094, -0.018322229385375977, -0.01740407943725586, -0.016485929489135742, -0.015567779541015625, -0.014649629592895508, -0.01373147964477539, -0.012813329696655273, -0.011895179748535156, -0.010977029800415039, -0.010058879852294922, -0.009140729904174805, -0.008222579956054688, -0.00730443000793457, -0.006386280059814453, -0.005468130111694336, -0.004549980163574219, -0.0036318302154541016, -0.0027136802673339844, -0.0017955303192138672, -0.00087738037109375, 4.076957702636719e-05, 0.0009589195251464844, 0.0018770694732666016, 0.0027952194213867188, 0.003713369369506836, 0.004631519317626953, 0.00554966926574707, 0.0064678192138671875, 0.007385969161987305, 0.008304119110107422, 0.009222269058227539, 0.010140419006347656, 0.011058568954467773, 0.01197671890258789, 0.012894868850708008, 0.013813018798828125, 0.014731168746948242, 0.01564931869506836, 0.016567468643188477, 0.017485618591308594, 0.01840376853942871, 0.019321918487548828, 0.020240068435668945, 0.021158218383789062, 0.02207636833190918, 0.022994518280029297, 0.023912668228149414, 0.02483081817626953, 0.02574896812438965, 0.026667118072509766, 0.027585268020629883, 0.02850341796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 4.0, 8.0, 9.0, 8.0, 8.0, 8.0, 12.0, 10.0, 12.0, 13.0, 21.0, 22.0, 16.0, 30.0, 24.0, 28.0, 44.0, 42.0, 42.0, 50.0, 54.0, 68.0, 41.0, 57.0, 41.0, 49.0, 46.0, 23.0, 29.0, 33.0, 20.0, 25.0, 15.0, 9.0, 11.0, 11.0, 9.0, 8.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.4781951904296875e-05, -1.4328397810459137e-05, -1.3874843716621399e-05, -1.3421289622783661e-05, -1.2967735528945923e-05, -1.2514181435108185e-05, -1.2060627341270447e-05, -1.1607073247432709e-05, -1.115351915359497e-05, -1.0699965059757233e-05, -1.0246410965919495e-05, -9.792856872081757e-06, -9.339302778244019e-06, -8.88574868440628e-06, -8.432194590568542e-06, -7.978640496730804e-06, -7.525086402893066e-06, -7.071532309055328e-06, -6.61797821521759e-06, -6.164424121379852e-06, -5.710870027542114e-06, -5.257315933704376e-06, -4.803761839866638e-06, -4.3502077460289e-06, -3.896653652191162e-06, -3.443099558353424e-06, -2.989545464515686e-06, -2.535991370677948e-06, -2.08243727684021e-06, -1.628883183002472e-06, -1.1753290891647339e-06, -7.217749953269958e-07, -2.682209014892578e-07, 1.8533319234848022e-07, 6.388872861862183e-07, 1.0924413800239563e-06, 1.5459954738616943e-06, 1.9995495676994324e-06, 2.4531036615371704e-06, 2.9066577553749084e-06, 3.3602118492126465e-06, 3.8137659430503845e-06, 4.2673200368881226e-06, 4.720874130725861e-06, 5.174428224563599e-06, 5.627982318401337e-06, 6.081536412239075e-06, 6.535090506076813e-06, 6.988644599914551e-06, 7.442198693752289e-06, 7.895752787590027e-06, 8.349306881427765e-06, 8.802860975265503e-06, 9.256415069103241e-06, 9.709969162940979e-06, 1.0163523256778717e-05, 1.0617077350616455e-05, 1.1070631444454193e-05, 1.1524185538291931e-05, 1.197773963212967e-05, 1.2431293725967407e-05, 1.2884847819805145e-05, 1.3338401913642883e-05, 1.3791956007480621e-05, 1.424551010131836e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 12.0, 15.0, 20.0, 24.0, 43.0, 68.0, 113.0, 157.0, 300.0, 591.0, 1050.0, 2027.0, 3671.0, 7146.0, 13434.0, 26263.0, 50495.0, 94677.0, 167477.0, 232281.0, 196697.0, 118840.0, 63885.0, 33176.0, 17080.0, 8990.0, 4624.0, 2407.0, 1279.0, 713.0, 377.0, 219.0, 125.0, 62.0, 45.0, 34.0, 28.0, 16.0, 20.0, 11.0, 16.0, 10.0, 3.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.037689208984375, -0.03660249710083008, -0.035515785217285156, -0.034429073333740234, -0.03334236145019531, -0.03225564956665039, -0.03116893768310547, -0.030082225799560547, -0.028995513916015625, -0.027908802032470703, -0.02682209014892578, -0.02573537826538086, -0.024648666381835938, -0.023561954498291016, -0.022475242614746094, -0.021388530731201172, -0.02030181884765625, -0.019215106964111328, -0.018128395080566406, -0.017041683197021484, -0.015954971313476562, -0.01486825942993164, -0.013781547546386719, -0.012694835662841797, -0.011608123779296875, -0.010521411895751953, -0.009434700012207031, -0.00834798812866211, -0.0072612762451171875, -0.006174564361572266, -0.005087852478027344, -0.004001140594482422, -0.0029144287109375, -0.0018277168273925781, -0.0007410049438476562, 0.0003457069396972656, 0.0014324188232421875, 0.0025191307067871094, 0.0036058425903320312, 0.004692554473876953, 0.005779266357421875, 0.006865978240966797, 0.007952690124511719, 0.00903940200805664, 0.010126113891601562, 0.011212825775146484, 0.012299537658691406, 0.013386249542236328, 0.01447296142578125, 0.015559673309326172, 0.016646385192871094, 0.017733097076416016, 0.018819808959960938, 0.01990652084350586, 0.02099323272705078, 0.022079944610595703, 0.023166656494140625, 0.024253368377685547, 0.02534008026123047, 0.02642679214477539, 0.027513504028320312, 0.028600215911865234, 0.029686927795410156, 0.030773639678955078, 0.0318603515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 10.0, 6.0, 7.0, 13.0, 13.0, 14.0, 17.0, 28.0, 22.0, 28.0, 30.0, 23.0, 39.0, 51.0, 51.0, 41.0, 52.0, 71.0, 57.0, 54.0, 36.0, 52.0, 38.0, 27.0, 27.0, 24.0, 22.0, 12.0, 15.0, 15.0, 11.0, 11.0, 4.0, 7.0, 11.0, 5.0, 12.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.03192138671875, -0.03090047836303711, -0.02987957000732422, -0.028858661651611328, -0.027837753295898438, -0.026816844940185547, -0.025795936584472656, -0.024775028228759766, -0.023754119873046875, -0.022733211517333984, -0.021712303161621094, -0.020691394805908203, -0.019670486450195312, -0.018649578094482422, -0.01762866973876953, -0.01660776138305664, -0.01558685302734375, -0.01456594467163086, -0.013545036315917969, -0.012524127960205078, -0.011503219604492188, -0.010482311248779297, -0.009461402893066406, -0.008440494537353516, -0.007419586181640625, -0.006398677825927734, -0.005377769470214844, -0.004356861114501953, -0.0033359527587890625, -0.002315044403076172, -0.0012941360473632812, -0.0002732276916503906, 0.0007476806640625, 0.0017685890197753906, 0.0027894973754882812, 0.003810405731201172, 0.0048313140869140625, 0.005852222442626953, 0.006873130798339844, 0.007894039154052734, 0.008914947509765625, 0.009935855865478516, 0.010956764221191406, 0.011977672576904297, 0.012998580932617188, 0.014019489288330078, 0.015040397644042969, 0.01606130599975586, 0.01708221435546875, 0.01810312271118164, 0.01912403106689453, 0.020144939422607422, 0.021165847778320312, 0.022186756134033203, 0.023207664489746094, 0.024228572845458984, 0.025249481201171875, 0.026270389556884766, 0.027291297912597656, 0.028312206268310547, 0.029333114624023438, 0.030354022979736328, 0.03137493133544922, 0.03239583969116211, 0.033416748046875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 6.0, 10.0, 12.0, 14.0, 24.0, 20.0, 45.0, 58.0, 55.0, 75.0, 80.0, 108.0, 79.0, 91.0, 71.0, 50.0, 58.0, 45.0, 21.0, 21.0, 18.0, 13.0, 8.0, 9.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280575692653656, -0.26758620142936707, -0.2545967102050781, -0.241607204079628, -0.22861771285533905, -0.21562820672988892, -0.20263871550559998, -0.18964922428131104, -0.1766597330570221, -0.16367024183273315, -0.15068073570728302, -0.13769124448299408, -0.12470175325870514, -0.1117122545838356, -0.09872275590896606, -0.08573326468467712, -0.07274375855922699, -0.05975426360964775, -0.04676476866006851, -0.033775269985198975, -0.020785775035619736, -0.007796280086040497, 0.0051932185888290405, 0.01818270981311798, 0.03117220848798752, 0.04416170343756676, 0.057151198387145996, 0.07014069706201553, 0.08313019573688507, 0.09611968696117401, 0.10910918563604355, 0.12209867686033249, 0.13508817553520203, 0.14807766675949097, 0.1610671728849411, 0.17405666410923004, 0.18704615533351898, 0.20003566145896912, 0.21302515268325806, 0.226014643907547, 0.23900413513183594, 0.2519936263561249, 0.2649831175804138, 0.27797263860702515, 0.2909621298313141, 0.303951621055603, 0.31694111227989197, 0.3299306035041809, 0.34292012453079224, 0.3559096157550812, 0.3688991069793701, 0.38188862800598145, 0.3948781192302704, 0.4078676104545593, 0.42085710167884827, 0.4338465929031372, 0.44683608412742615, 0.4598255753517151, 0.47281506657600403, 0.48580455780029297, 0.4987940788269043, 0.5117835402488708, 0.5247730612754822, 0.5377625226974487, 0.5507520437240601]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 6.0, 5.0, 7.0, 1.0, 5.0, 10.0, 10.0, 13.0, 12.0, 14.0, 10.0, 15.0, 20.0, 26.0, 22.0, 21.0, 24.0, 39.0, 41.0, 37.0, 33.0, 42.0, 38.0, 30.0, 50.0, 28.0, 48.0, 43.0, 42.0, 27.0, 30.0, 20.0, 26.0, 29.0, 27.0, 15.0, 24.0, 19.0, 16.0, 13.0, 10.0, 10.0, 9.0, 5.0, 5.0, 7.0, 3.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2848557233810425, -0.2759571969509125, -0.26705870032310486, -0.25816017389297485, -0.24926164746284485, -0.24036313593387604, -0.23146462440490723, -0.22256609797477722, -0.21366757154464722, -0.2047690600156784, -0.1958705335855484, -0.1869720220565796, -0.17807349562644958, -0.16917498409748077, -0.16027647256851196, -0.15137794613838196, -0.14247943460941315, -0.13358092308044434, -0.12468239665031433, -0.11578388512134552, -0.10688535869121552, -0.0979868471622467, -0.0890883281826973, -0.08018980920314789, -0.07129129022359848, -0.06239277124404907, -0.053494252264499664, -0.044595737010240555, -0.03569721803069115, -0.02679869905114174, -0.01790018379688263, -0.009001664817333221, -0.00010314583778381348, 0.00879537221044302, 0.017693890258669853, 0.026592407375574112, 0.03549092635512352, 0.04438944533467293, 0.05328796058893204, 0.062186479568481445, 0.07108499854803085, 0.07998351752758026, 0.08888203650712967, 0.09778055548667908, 0.10667906701564789, 0.1155775934457779, 0.1244761049747467, 0.1333746314048767, 0.14227314293384552, 0.15117165446281433, 0.16007018089294434, 0.16896869242191315, 0.17786721885204315, 0.18676573038101196, 0.19566425681114197, 0.20456276834011078, 0.2134612798690796, 0.2223597913980484, 0.2312583178281784, 0.24015682935714722, 0.24905535578727722, 0.2579538822174072, 0.26685237884521484, 0.27575090527534485, 0.28464943170547485]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 18.0, 15.0, 20.0, 26.0, 34.0, 64.0, 79.0, 111.0, 160.0, 202.0, 292.0, 355.0, 613.0, 958.0, 1575.0, 2526.0, 4360.0, 8081.0, 15272.0, 31293.0, 69678.0, 177315.0, 556419.0, 1685366.0, 1096133.0, 329558.0, 116336.0, 48209.0, 22714.0, 11396.0, 6026.0, 3404.0, 2035.0, 1204.0, 789.0, 502.0, 329.0, 233.0, 163.0, 111.0, 78.0, 56.0, 41.0, 33.0, 25.0, 21.0, 14.0, 3.0, 9.0, 0.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.058837890625, -0.056986331939697266, -0.05513477325439453, -0.0532832145690918, -0.05143165588378906, -0.04958009719848633, -0.047728538513183594, -0.04587697982788086, -0.044025421142578125, -0.04217386245727539, -0.040322303771972656, -0.03847074508666992, -0.03661918640136719, -0.03476762771606445, -0.03291606903076172, -0.031064510345458984, -0.02921295166015625, -0.027361392974853516, -0.02550983428955078, -0.023658275604248047, -0.021806716918945312, -0.019955158233642578, -0.018103599548339844, -0.01625204086303711, -0.014400482177734375, -0.01254892349243164, -0.010697364807128906, -0.008845806121826172, -0.0069942474365234375, -0.005142688751220703, -0.0032911300659179688, -0.0014395713806152344, 0.0004119873046875, 0.0022635459899902344, 0.004115104675292969, 0.005966663360595703, 0.007818222045898438, 0.009669780731201172, 0.011521339416503906, 0.01337289810180664, 0.015224456787109375, 0.01707601547241211, 0.018927574157714844, 0.020779132843017578, 0.022630691528320312, 0.024482250213623047, 0.02633380889892578, 0.028185367584228516, 0.03003692626953125, 0.031888484954833984, 0.03374004364013672, 0.03559160232543945, 0.03744316101074219, 0.03929471969604492, 0.041146278381347656, 0.04299783706665039, 0.044849395751953125, 0.04670095443725586, 0.048552513122558594, 0.05040407180786133, 0.05225563049316406, 0.0541071891784668, 0.05595874786376953, 0.057810306549072266, 0.059661865234375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 4.0, 12.0, 6.0, 10.0, 10.0, 12.0, 16.0, 11.0, 28.0, 18.0, 22.0, 25.0, 19.0, 33.0, 19.0, 37.0, 28.0, 34.0, 41.0, 39.0, 43.0, 43.0, 36.0, 39.0, 39.0, 27.0, 29.0, 27.0, 35.0, 33.0, 23.0, 22.0, 23.0, 15.0, 18.0, 21.0, 16.0, 14.0, 14.0, 16.0, 7.0, 6.0, 9.0, 3.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0390625, -0.03779411315917969, -0.036525726318359375, -0.03525733947753906, -0.03398895263671875, -0.03272056579589844, -0.031452178955078125, -0.030183792114257812, -0.0289154052734375, -0.027647018432617188, -0.026378631591796875, -0.025110244750976562, -0.02384185791015625, -0.022573471069335938, -0.021305084228515625, -0.020036697387695312, -0.018768310546875, -0.017499923706054688, -0.016231536865234375, -0.014963150024414062, -0.01369476318359375, -0.012426376342773438, -0.011157989501953125, -0.009889602661132812, -0.0086212158203125, -0.0073528289794921875, -0.006084442138671875, -0.0048160552978515625, -0.00354766845703125, -0.0022792816162109375, -0.001010894775390625, 0.0002574920654296875, 0.00152587890625, 0.0027942657470703125, 0.004062652587890625, 0.0053310394287109375, 0.00659942626953125, 0.007867813110351562, 0.009136199951171875, 0.010404586791992188, 0.0116729736328125, 0.012941360473632812, 0.014209747314453125, 0.015478134155273438, 0.01674652099609375, 0.018014907836914062, 0.019283294677734375, 0.020551681518554688, 0.021820068359375, 0.023088455200195312, 0.024356842041015625, 0.025625228881835938, 0.02689361572265625, 0.028162002563476562, 0.029430389404296875, 0.030698776245117188, 0.0319671630859375, 0.03323554992675781, 0.034503936767578125, 0.03577232360839844, 0.03704071044921875, 0.03830909729003906, 0.039577484130859375, 0.04084587097167969, 0.0421142578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 9.0, 16.0, 25.0, 26.0, 39.0, 44.0, 92.0, 95.0, 160.0, 247.0, 370.0, 586.0, 873.0, 1663.0, 2973.0, 5890.0, 12129.0, 26958.0, 64570.0, 168004.0, 493936.0, 1528070.0, 1258020.0, 393253.0, 137575.0, 53546.0, 22912.0, 10465.0, 5171.0, 2662.0, 1478.0, 855.0, 481.0, 341.0, 235.0, 148.0, 85.0, 67.0, 62.0, 43.0, 22.0, 21.0, 17.0, 12.0, 7.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.07366943359375, -0.07128524780273438, -0.06890106201171875, -0.06651687622070312, -0.0641326904296875, -0.061748504638671875, -0.05936431884765625, -0.056980133056640625, -0.054595947265625, -0.052211761474609375, -0.04982757568359375, -0.047443389892578125, -0.0450592041015625, -0.042675018310546875, -0.04029083251953125, -0.037906646728515625, -0.0355224609375, -0.033138275146484375, -0.03075408935546875, -0.028369903564453125, -0.0259857177734375, -0.023601531982421875, -0.02121734619140625, -0.018833160400390625, -0.016448974609375, -0.014064788818359375, -0.01168060302734375, -0.009296417236328125, -0.0069122314453125, -0.004528045654296875, -0.00214385986328125, 0.000240325927734375, 0.00262451171875, 0.005008697509765625, 0.00739288330078125, 0.009777069091796875, 0.0121612548828125, 0.014545440673828125, 0.01692962646484375, 0.019313812255859375, 0.021697998046875, 0.024082183837890625, 0.02646636962890625, 0.028850555419921875, 0.0312347412109375, 0.033618927001953125, 0.03600311279296875, 0.038387298583984375, 0.040771484375, 0.043155670166015625, 0.04553985595703125, 0.047924041748046875, 0.0503082275390625, 0.052692413330078125, 0.05507659912109375, 0.057460784912109375, 0.059844970703125, 0.062229156494140625, 0.06461334228515625, 0.06699752807617188, 0.0693817138671875, 0.07176589965820312, 0.07415008544921875, 0.07653427124023438, 0.07891845703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 8.0, 7.0, 15.0, 18.0, 19.0, 33.0, 37.0, 46.0, 74.0, 107.0, 163.0, 196.0, 290.0, 435.0, 587.0, 626.0, 442.0, 281.0, 214.0, 151.0, 88.0, 67.0, 49.0, 24.0, 21.0, 14.0, 18.0, 8.0, 11.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08856201171875, -0.0857076644897461, -0.08285331726074219, -0.07999897003173828, -0.07714462280273438, -0.07429027557373047, -0.07143592834472656, -0.06858158111572266, -0.06572723388671875, -0.06287288665771484, -0.06001853942871094, -0.05716419219970703, -0.054309844970703125, -0.05145549774169922, -0.04860115051269531, -0.045746803283691406, -0.0428924560546875, -0.040038108825683594, -0.03718376159667969, -0.03432941436767578, -0.031475067138671875, -0.02862071990966797, -0.025766372680664062, -0.022912025451660156, -0.02005767822265625, -0.017203330993652344, -0.014348983764648438, -0.011494636535644531, -0.008640289306640625, -0.005785942077636719, -0.0029315948486328125, -7.724761962890625e-05, 0.002777099609375, 0.005631446838378906, 0.008485794067382812, 0.011340141296386719, 0.014194488525390625, 0.01704883575439453, 0.019903182983398438, 0.022757530212402344, 0.02561187744140625, 0.028466224670410156, 0.03132057189941406, 0.03417491912841797, 0.037029266357421875, 0.03988361358642578, 0.04273796081542969, 0.045592308044433594, 0.0484466552734375, 0.051301002502441406, 0.05415534973144531, 0.05700969696044922, 0.059864044189453125, 0.06271839141845703, 0.06557273864746094, 0.06842708587646484, 0.07128143310546875, 0.07413578033447266, 0.07699012756347656, 0.07984447479248047, 0.08269882202148438, 0.08555316925048828, 0.08840751647949219, 0.0912618637084961, 0.0941162109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 4.0, 11.0, 9.0, 6.0, 13.0, 16.0, 33.0, 36.0, 41.0, 49.0, 51.0, 62.0, 81.0, 77.0, 77.0, 87.0, 69.0, 55.0, 54.0, 43.0, 32.0, 25.0, 19.0, 10.0, 7.0, 4.0, 8.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31754857301712036, -0.30716583132743835, -0.29678308963775635, -0.28640034794807434, -0.27601760625839233, -0.2656348943710327, -0.2552521526813507, -0.2448694109916687, -0.2344866693019867, -0.2241039276123047, -0.21372118592262268, -0.20333845913410187, -0.19295571744441986, -0.18257297575473785, -0.17219024896621704, -0.16180750727653503, -0.15142476558685303, -0.14104202389717102, -0.130659282207489, -0.1202765554189682, -0.1098938137292862, -0.09951107203960419, -0.08912833780050278, -0.07874560356140137, -0.06836286187171936, -0.05798012390732765, -0.047597385942935944, -0.037214647978544235, -0.026831910014152527, -0.01644917204976082, -0.00606643408536911, 0.0043163001537323, 0.014699041843414307, 0.025081779807806015, 0.03546451777219772, 0.04584725573658943, 0.05622999370098114, 0.06661273539066315, 0.07699546962976456, 0.08737820386886597, 0.09776094555854797, 0.10814368724822998, 0.11852642148733139, 0.1289091557264328, 0.1392918974161148, 0.14967463910579681, 0.16005736589431763, 0.17044010758399963, 0.18082284927368164, 0.19120559096336365, 0.20158833265304565, 0.21197105944156647, 0.22235380113124847, 0.23273654282093048, 0.2431192696094513, 0.2535020112991333, 0.2638847529888153, 0.2742674946784973, 0.2846502363681793, 0.29503297805786133, 0.30541568994522095, 0.31579843163490295, 0.32618117332458496, 0.33656391501426697, 0.346946656703949]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 1.0, 14.0, 7.0, 9.0, 10.0, 13.0, 13.0, 20.0, 26.0, 18.0, 23.0, 30.0, 24.0, 28.0, 31.0, 31.0, 27.0, 38.0, 29.0, 33.0, 26.0, 29.0, 44.0, 39.0, 43.0, 38.0, 35.0, 26.0, 28.0, 39.0, 25.0, 32.0, 27.0, 12.0, 22.0, 19.0, 14.0, 11.0, 6.0, 19.0, 6.0, 5.0, 3.0, 6.0, 6.0, 4.0, 5.0, 0.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.21680021286010742, -0.21019044518470764, -0.20358067750930786, -0.19697090983390808, -0.1903611421585083, -0.18375137448310852, -0.17714160680770874, -0.17053183913230896, -0.16392207145690918, -0.1573123037815094, -0.15070253610610962, -0.14409276843070984, -0.13748300075531006, -0.13087323307991028, -0.1242634579539299, -0.11765369027853012, -0.11104391515254974, -0.10443414747714996, -0.09782437980175018, -0.0912146121263504, -0.08460484445095062, -0.07799507677555084, -0.07138530164957047, -0.06477553397417068, -0.058165766298770905, -0.051555998623371124, -0.044946230947971344, -0.038336459547281265, -0.031726691871881485, -0.025116924196481705, -0.018507152795791626, -0.011897385120391846, -0.005287617444992065, 0.0013221511617302895, 0.007931919768452644, 0.014541689306497574, 0.021151456981897354, 0.027761224657297134, 0.03437099605798721, 0.04098076373338699, 0.047590531408786774, 0.054200299084186554, 0.060810066759586334, 0.06741984188556671, 0.07402960956096649, 0.08063937723636627, 0.08724914491176605, 0.09385891258716583, 0.10046868026256561, 0.1070784479379654, 0.11368821561336517, 0.12029798328876495, 0.12690775096416473, 0.13351751863956451, 0.1401273012161255, 0.14673706889152527, 0.15334683656692505, 0.15995660424232483, 0.1665663719177246, 0.1731761395931244, 0.17978590726852417, 0.18639567494392395, 0.19300544261932373, 0.1996152102947235, 0.2062249779701233]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 7.0, 17.0, 11.0, 19.0, 35.0, 62.0, 65.0, 94.0, 148.0, 278.0, 409.0, 666.0, 1102.0, 1815.0, 3038.0, 5036.0, 8701.0, 14374.0, 24643.0, 42832.0, 72425.0, 121642.0, 180194.0, 197349.0, 149066.0, 92623.0, 54410.0, 31460.0, 18526.0, 10962.0, 6588.0, 3921.0, 2243.0, 1483.0, 855.0, 519.0, 334.0, 220.0, 140.0, 86.0, 54.0, 40.0, 18.0, 14.0, 7.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07720947265625, -0.07465553283691406, -0.07210159301757812, -0.06954765319824219, -0.06699371337890625, -0.06443977355957031, -0.061885833740234375, -0.05933189392089844, -0.0567779541015625, -0.05422401428222656, -0.051670074462890625, -0.04911613464355469, -0.04656219482421875, -0.04400825500488281, -0.041454315185546875, -0.03890037536621094, -0.036346435546875, -0.03379249572753906, -0.031238555908203125, -0.028684616088867188, -0.02613067626953125, -0.023576736450195312, -0.021022796630859375, -0.018468856811523438, -0.0159149169921875, -0.013360977172851562, -0.010807037353515625, -0.008253097534179688, -0.00569915771484375, -0.0031452178955078125, -0.000591278076171875, 0.0019626617431640625, 0.0045166015625, 0.0070705413818359375, 0.009624481201171875, 0.012178421020507812, 0.01473236083984375, 0.017286300659179688, 0.019840240478515625, 0.022394180297851562, 0.0249481201171875, 0.027502059936523438, 0.030055999755859375, 0.03260993957519531, 0.03516387939453125, 0.03771781921386719, 0.040271759033203125, 0.04282569885253906, 0.045379638671875, 0.04793357849121094, 0.050487518310546875, 0.05304145812988281, 0.05559539794921875, 0.05814933776855469, 0.060703277587890625, 0.06325721740722656, 0.0658111572265625, 0.06836509704589844, 0.07091903686523438, 0.07347297668457031, 0.07602691650390625, 0.07858085632324219, 0.08113479614257812, 0.08368873596191406, 0.08624267578125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 1.0, 7.0, 3.0, 8.0, 14.0, 16.0, 14.0, 15.0, 15.0, 18.0, 20.0, 19.0, 27.0, 26.0, 28.0, 38.0, 31.0, 40.0, 27.0, 38.0, 33.0, 37.0, 38.0, 46.0, 37.0, 46.0, 37.0, 30.0, 32.0, 26.0, 28.0, 23.0, 16.0, 25.0, 16.0, 26.0, 11.0, 9.0, 14.0, 12.0, 7.0, 10.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.03912353515625, -0.03788423538208008, -0.036644935607910156, -0.035405635833740234, -0.03416633605957031, -0.03292703628540039, -0.03168773651123047, -0.030448436737060547, -0.029209136962890625, -0.027969837188720703, -0.02673053741455078, -0.02549123764038086, -0.024251937866210938, -0.023012638092041016, -0.021773338317871094, -0.020534038543701172, -0.01929473876953125, -0.018055438995361328, -0.016816139221191406, -0.015576839447021484, -0.014337539672851562, -0.01309823989868164, -0.011858940124511719, -0.010619640350341797, -0.009380340576171875, -0.008141040802001953, -0.006901741027832031, -0.005662441253662109, -0.0044231414794921875, -0.0031838417053222656, -0.0019445419311523438, -0.0007052421569824219, 0.0005340576171875, 0.0017733573913574219, 0.0030126571655273438, 0.004251956939697266, 0.0054912567138671875, 0.006730556488037109, 0.007969856262207031, 0.009209156036376953, 0.010448455810546875, 0.011687755584716797, 0.012927055358886719, 0.01416635513305664, 0.015405654907226562, 0.016644954681396484, 0.017884254455566406, 0.019123554229736328, 0.02036285400390625, 0.021602153778076172, 0.022841453552246094, 0.024080753326416016, 0.025320053100585938, 0.02655935287475586, 0.02779865264892578, 0.029037952423095703, 0.030277252197265625, 0.03151655197143555, 0.03275585174560547, 0.03399515151977539, 0.03523445129394531, 0.036473751068115234, 0.037713050842285156, 0.03895235061645508, 0.040191650390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 5.0, 13.0, 12.0, 18.0, 27.0, 36.0, 49.0, 91.0, 112.0, 175.0, 283.0, 561.0, 1109.0, 2601.0, 5873.0, 14383.0, 35658.0, 89588.0, 219777.0, 337805.0, 202548.0, 82084.0, 32517.0, 13185.0, 5423.0, 2234.0, 1055.0, 508.0, 279.0, 180.0, 108.0, 74.0, 51.0, 36.0, 18.0, 25.0, 16.0, 11.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12197113037109375, -0.1179656982421875, -0.11396026611328125, -0.109954833984375, -0.10594940185546875, -0.1019439697265625, -0.09793853759765625, -0.09393310546875, -0.08992767333984375, -0.0859222412109375, -0.08191680908203125, -0.077911376953125, -0.07390594482421875, -0.0699005126953125, -0.06589508056640625, -0.0618896484375, -0.05788421630859375, -0.0538787841796875, -0.04987335205078125, -0.045867919921875, -0.04186248779296875, -0.0378570556640625, -0.03385162353515625, -0.02984619140625, -0.02584075927734375, -0.0218353271484375, -0.01782989501953125, -0.013824462890625, -0.00981903076171875, -0.0058135986328125, -0.00180816650390625, 0.002197265625, 0.00620269775390625, 0.0102081298828125, 0.01421356201171875, 0.018218994140625, 0.02222442626953125, 0.0262298583984375, 0.03023529052734375, 0.03424072265625, 0.03824615478515625, 0.0422515869140625, 0.04625701904296875, 0.050262451171875, 0.05426788330078125, 0.0582733154296875, 0.06227874755859375, 0.0662841796875, 0.07028961181640625, 0.0742950439453125, 0.07830047607421875, 0.082305908203125, 0.08631134033203125, 0.0903167724609375, 0.09432220458984375, 0.09832763671875, 0.10233306884765625, 0.1063385009765625, 0.11034393310546875, 0.114349365234375, 0.11835479736328125, 0.1223602294921875, 0.12636566162109375, 0.13037109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 4.0, 0.0, 4.0, 1.0, 8.0, 9.0, 8.0, 10.0, 13.0, 6.0, 16.0, 34.0, 19.0, 27.0, 36.0, 28.0, 28.0, 35.0, 30.0, 37.0, 49.0, 36.0, 48.0, 51.0, 49.0, 50.0, 46.0, 32.0, 39.0, 34.0, 26.0, 25.0, 29.0, 15.0, 21.0, 20.0, 18.0, 18.0, 12.0, 8.0, 5.0, 4.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.102294921875, -0.0985260009765625, -0.094757080078125, -0.0909881591796875, -0.08721923828125, -0.0834503173828125, -0.079681396484375, -0.0759124755859375, -0.0721435546875, -0.0683746337890625, -0.064605712890625, -0.0608367919921875, -0.05706787109375, -0.0532989501953125, -0.049530029296875, -0.0457611083984375, -0.0419921875, -0.0382232666015625, -0.034454345703125, -0.0306854248046875, -0.02691650390625, -0.0231475830078125, -0.019378662109375, -0.0156097412109375, -0.0118408203125, -0.0080718994140625, -0.004302978515625, -0.0005340576171875, 0.00323486328125, 0.0070037841796875, 0.010772705078125, 0.0145416259765625, 0.018310546875, 0.0220794677734375, 0.025848388671875, 0.0296173095703125, 0.03338623046875, 0.0371551513671875, 0.040924072265625, 0.0446929931640625, 0.0484619140625, 0.0522308349609375, 0.055999755859375, 0.0597686767578125, 0.06353759765625, 0.0673065185546875, 0.071075439453125, 0.0748443603515625, 0.07861328125, 0.0823822021484375, 0.086151123046875, 0.0899200439453125, 0.09368896484375, 0.0974578857421875, 0.101226806640625, 0.1049957275390625, 0.1087646484375, 0.1125335693359375, 0.116302490234375, 0.1200714111328125, 0.12384033203125, 0.1276092529296875, 0.131378173828125, 0.1351470947265625, 0.138916015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 4.0, 6.0, 17.0, 18.0, 32.0, 67.0, 86.0, 151.0, 223.0, 394.0, 691.0, 1093.0, 1778.0, 2895.0, 4849.0, 8337.0, 13945.0, 23730.0, 41694.0, 73532.0, 130247.0, 205509.0, 212006.0, 140207.0, 79302.0, 44777.0, 25491.0, 15204.0, 8944.0, 5335.0, 3183.0, 1863.0, 1174.0, 667.0, 415.0, 247.0, 162.0, 98.0, 69.0, 40.0, 24.0, 20.0, 8.0, 12.0, 6.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0297088623046875, -0.028752565383911133, -0.027796268463134766, -0.0268399715423584, -0.02588367462158203, -0.024927377700805664, -0.023971080780029297, -0.02301478385925293, -0.022058486938476562, -0.021102190017700195, -0.020145893096923828, -0.01918959617614746, -0.018233299255371094, -0.017277002334594727, -0.01632070541381836, -0.015364408493041992, -0.014408111572265625, -0.013451814651489258, -0.01249551773071289, -0.011539220809936523, -0.010582923889160156, -0.009626626968383789, -0.008670330047607422, -0.007714033126831055, -0.0067577362060546875, -0.00580143928527832, -0.004845142364501953, -0.003888845443725586, -0.0029325485229492188, -0.0019762516021728516, -0.0010199546813964844, -6.365776062011719e-05, 0.00089263916015625, 0.0018489360809326172, 0.0028052330017089844, 0.0037615299224853516, 0.004717826843261719, 0.005674123764038086, 0.006630420684814453, 0.00758671760559082, 0.008543014526367188, 0.009499311447143555, 0.010455608367919922, 0.011411905288696289, 0.012368202209472656, 0.013324499130249023, 0.01428079605102539, 0.015237092971801758, 0.016193389892578125, 0.017149686813354492, 0.01810598373413086, 0.019062280654907227, 0.020018577575683594, 0.02097487449645996, 0.021931171417236328, 0.022887468338012695, 0.023843765258789062, 0.02480006217956543, 0.025756359100341797, 0.026712656021118164, 0.02766895294189453, 0.0286252498626709, 0.029581546783447266, 0.030537843704223633, 0.031494140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 2.0, 5.0, 5.0, 9.0, 13.0, 12.0, 19.0, 29.0, 26.0, 20.0, 40.0, 46.0, 58.0, 59.0, 50.0, 56.0, 62.0, 70.0, 49.0, 53.0, 57.0, 56.0, 42.0, 23.0, 26.0, 20.0, 20.0, 16.0, 12.0, 6.0, 6.0, 4.0, 10.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3649463653564453e-05, -1.3178214430809021e-05, -1.2706965208053589e-05, -1.2235715985298157e-05, -1.1764466762542725e-05, -1.1293217539787292e-05, -1.082196831703186e-05, -1.0350719094276428e-05, -9.879469871520996e-06, -9.408220648765564e-06, -8.936971426010132e-06, -8.4657222032547e-06, -7.994472980499268e-06, -7.5232237577438354e-06, -7.051974534988403e-06, -6.580725312232971e-06, -6.109476089477539e-06, -5.638226866722107e-06, -5.166977643966675e-06, -4.695728421211243e-06, -4.2244791984558105e-06, -3.7532299757003784e-06, -3.2819807529449463e-06, -2.810731530189514e-06, -2.339482307434082e-06, -1.86823308467865e-06, -1.3969838619232178e-06, -9.257346391677856e-07, -4.544854164123535e-07, 1.6763806343078613e-08, 4.880130290985107e-07, 9.592622518539429e-07, 1.430511474609375e-06, 1.9017606973648071e-06, 2.3730099201202393e-06, 2.8442591428756714e-06, 3.3155083656311035e-06, 3.7867575883865356e-06, 4.258006811141968e-06, 4.7292560338974e-06, 5.200505256652832e-06, 5.671754479408264e-06, 6.143003702163696e-06, 6.614252924919128e-06, 7.0855021476745605e-06, 7.556751370429993e-06, 8.028000593185425e-06, 8.499249815940857e-06, 8.970499038696289e-06, 9.441748261451721e-06, 9.912997484207153e-06, 1.0384246706962585e-05, 1.0855495929718018e-05, 1.132674515247345e-05, 1.1797994375228882e-05, 1.2269243597984314e-05, 1.2740492820739746e-05, 1.3211742043495178e-05, 1.368299126625061e-05, 1.4154240489006042e-05, 1.4625489711761475e-05, 1.5096738934516907e-05, 1.556798815727234e-05, 1.603923738002777e-05, 1.6510486602783203e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 9.0, 9.0, 14.0, 18.0, 41.0, 48.0, 77.0, 143.0, 222.0, 450.0, 896.0, 1719.0, 3735.0, 7940.0, 16984.0, 37281.0, 83385.0, 183229.0, 297936.0, 222838.0, 104268.0, 46734.0, 21499.0, 9943.0, 4576.0, 2166.0, 1096.0, 538.0, 311.0, 169.0, 99.0, 55.0, 39.0, 31.0, 11.0, 12.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0390625, -0.03782796859741211, -0.03659343719482422, -0.03535890579223633, -0.03412437438964844, -0.03288984298706055, -0.031655311584472656, -0.030420780181884766, -0.029186248779296875, -0.027951717376708984, -0.026717185974121094, -0.025482654571533203, -0.024248123168945312, -0.023013591766357422, -0.02177906036376953, -0.02054452896118164, -0.01930999755859375, -0.01807546615600586, -0.01684093475341797, -0.015606403350830078, -0.014371871948242188, -0.013137340545654297, -0.011902809143066406, -0.010668277740478516, -0.009433746337890625, -0.008199214935302734, -0.006964683532714844, -0.005730152130126953, -0.0044956207275390625, -0.003261089324951172, -0.0020265579223632812, -0.0007920265197753906, 0.0004425048828125, 0.0016770362854003906, 0.0029115676879882812, 0.004146099090576172, 0.0053806304931640625, 0.006615161895751953, 0.007849693298339844, 0.009084224700927734, 0.010318756103515625, 0.011553287506103516, 0.012787818908691406, 0.014022350311279297, 0.015256881713867188, 0.016491413116455078, 0.01772594451904297, 0.01896047592163086, 0.02019500732421875, 0.02142953872680664, 0.02266407012939453, 0.023898601531982422, 0.025133132934570312, 0.026367664337158203, 0.027602195739746094, 0.028836727142333984, 0.030071258544921875, 0.031305789947509766, 0.032540321350097656, 0.03377485275268555, 0.03500938415527344, 0.03624391555786133, 0.03747844696044922, 0.03871297836303711, 0.039947509765625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 5.0, 6.0, 11.0, 4.0, 5.0, 14.0, 18.0, 23.0, 13.0, 19.0, 28.0, 24.0, 50.0, 52.0, 55.0, 48.0, 61.0, 63.0, 63.0, 54.0, 62.0, 46.0, 49.0, 49.0, 31.0, 26.0, 27.0, 20.0, 17.0, 7.0, 15.0, 4.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.041961669921875, -0.04085278511047363, -0.039743900299072266, -0.0386350154876709, -0.03752613067626953, -0.036417245864868164, -0.0353083610534668, -0.03419947624206543, -0.03309059143066406, -0.031981706619262695, -0.030872821807861328, -0.02976393699645996, -0.028655052185058594, -0.027546167373657227, -0.02643728256225586, -0.025328397750854492, -0.024219512939453125, -0.023110628128051758, -0.02200174331665039, -0.020892858505249023, -0.019783973693847656, -0.01867508888244629, -0.017566204071044922, -0.016457319259643555, -0.015348434448242188, -0.01423954963684082, -0.013130664825439453, -0.012021780014038086, -0.010912895202636719, -0.009804010391235352, -0.008695125579833984, -0.007586240768432617, -0.00647735595703125, -0.005368471145629883, -0.004259586334228516, -0.0031507015228271484, -0.0020418167114257812, -0.0009329319000244141, 0.00017595291137695312, 0.0012848377227783203, 0.0023937225341796875, 0.0035026073455810547, 0.004611492156982422, 0.005720376968383789, 0.006829261779785156, 0.007938146591186523, 0.00904703140258789, 0.010155916213989258, 0.011264801025390625, 0.012373685836791992, 0.01348257064819336, 0.014591455459594727, 0.015700340270996094, 0.01680922508239746, 0.017918109893798828, 0.019026994705200195, 0.020135879516601562, 0.02124476432800293, 0.022353649139404297, 0.023462533950805664, 0.02457141876220703, 0.0256803035736084, 0.026789188385009766, 0.027898073196411133, 0.0290069580078125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 11.0, 21.0, 38.0, 45.0, 73.0, 85.0, 103.0, 99.0, 109.0, 87.0, 102.0, 85.0, 41.0, 30.0, 35.0, 15.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6966410875320435, -0.6796780228614807, -0.6627150177955627, -0.645751953125, -0.628788948059082, -0.6118258833885193, -0.5948628783226013, -0.5778998136520386, -0.5609368085861206, -0.5439737439155579, -0.5270107388496399, -0.5100476741790771, -0.4930846691131592, -0.47612160444259644, -0.4591585695743561, -0.4421955347061157, -0.425232470035553, -0.4082694351673126, -0.39130640029907227, -0.3743433654308319, -0.35738033056259155, -0.3404172658920288, -0.32345423102378845, -0.3064911961555481, -0.28952816128730774, -0.2725651264190674, -0.255602091550827, -0.23863904178142548, -0.22167600691318512, -0.20471297204494476, -0.1877499222755432, -0.17078688740730286, -0.1538238525390625, -0.13686081767082214, -0.11989777535200119, -0.10293473303318024, -0.08597169816493988, -0.06900866329669952, -0.05204562097787857, -0.03508257865905762, -0.01811954379081726, -0.0011565051972866058, 0.01580653339624405, 0.032769571989774704, 0.04973261058330536, 0.06669564545154572, 0.08365868777036667, 0.10062173008918762, 0.11758476495742798, 0.13454779982566833, 0.1515108346939087, 0.16847388446331024, 0.1854369193315506, 0.20239995419979095, 0.2193630039691925, 0.23632603883743286, 0.2532890737056732, 0.2702521085739136, 0.28721514344215393, 0.3041781783103943, 0.32114124298095703, 0.338104248046875, 0.35506731271743774, 0.3720303475856781, 0.38899338245391846]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 13.0, 9.0, 8.0, 9.0, 17.0, 10.0, 24.0, 22.0, 16.0, 31.0, 34.0, 24.0, 37.0, 26.0, 34.0, 27.0, 47.0, 43.0, 44.0, 39.0, 44.0, 48.0, 28.0, 45.0, 41.0, 34.0, 41.0, 25.0, 21.0, 21.0, 15.0, 20.0, 26.0, 16.0, 15.0, 11.0, 7.0, 9.0, 5.0, 7.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31484436988830566, -0.3046812415122986, -0.2945181131362915, -0.2843549847602844, -0.27419185638427734, -0.26402872800827026, -0.2538655996322632, -0.2437024861574173, -0.23353935778141022, -0.22337622940540314, -0.21321310102939606, -0.20304997265338898, -0.1928868591785431, -0.182723730802536, -0.17256060242652893, -0.16239747405052185, -0.15223434567451477, -0.1420712172985077, -0.1319080889225006, -0.12174496799707413, -0.11158183962106705, -0.10141871124505997, -0.09125559031963348, -0.0810924619436264, -0.07092933356761932, -0.060766205191612244, -0.05060308054089546, -0.04043995589017868, -0.0302768275141716, -0.02011369913816452, -0.009950574487447739, 0.00021255016326904297, 0.010375678539276123, 0.020538805052638054, 0.030701931565999985, 0.040865056216716766, 0.051028184592723846, 0.061191312968730927, 0.07135443389415741, 0.08151756227016449, 0.09168069064617157, 0.10184381902217865, 0.11200694739818573, 0.12217006832361221, 0.1323331892490387, 0.14249631762504578, 0.15265944600105286, 0.16282257437705994, 0.17298570275306702, 0.1831488311290741, 0.19331195950508118, 0.20347508788108826, 0.21363821625709534, 0.22380134463310242, 0.2339644581079483, 0.24412758648395538, 0.25429069995880127, 0.26445382833480835, 0.27461695671081543, 0.2847800850868225, 0.2949432134628296, 0.30510634183883667, 0.31526947021484375, 0.32543259859085083, 0.3355957269668579]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 6.0, 9.0, 7.0, 12.0, 14.0, 11.0, 20.0, 22.0, 43.0, 41.0, 44.0, 116.0, 191.0, 343.0, 894.0, 2575.0, 9923.0, 46257.0, 378411.0, 3186339.0, 496524.0, 56469.0, 11035.0, 2952.0, 986.0, 404.0, 218.0, 107.0, 79.0, 61.0, 34.0, 27.0, 21.0, 20.0, 15.0, 11.0, 3.0, 6.0, 5.0, 8.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1348876953125, -0.13016319274902344, -0.12543869018554688, -0.12071418762207031, -0.11598968505859375, -0.11126518249511719, -0.10654067993164062, -0.10181617736816406, -0.0970916748046875, -0.09236717224121094, -0.08764266967773438, -0.08291816711425781, -0.07819366455078125, -0.07346916198730469, -0.06874465942382812, -0.06402015686035156, -0.059295654296875, -0.05457115173339844, -0.049846649169921875, -0.04512214660644531, -0.04039764404296875, -0.03567314147949219, -0.030948638916015625, -0.026224136352539062, -0.0214996337890625, -0.016775131225585938, -0.012050628662109375, -0.0073261260986328125, -0.00260162353515625, 0.0021228790283203125, 0.006847381591796875, 0.011571884155273438, 0.01629638671875, 0.021020889282226562, 0.025745391845703125, 0.030469894409179688, 0.03519439697265625, 0.03991889953613281, 0.044643402099609375, 0.04936790466308594, 0.0540924072265625, 0.05881690979003906, 0.06354141235351562, 0.06826591491699219, 0.07299041748046875, 0.07771492004394531, 0.08243942260742188, 0.08716392517089844, 0.091888427734375, 0.09661293029785156, 0.10133743286132812, 0.10606193542480469, 0.11078643798828125, 0.11551094055175781, 0.12023544311523438, 0.12495994567871094, 0.1296844482421875, 0.13440895080566406, 0.13913345336914062, 0.1438579559326172, 0.14858245849609375, 0.1533069610595703, 0.15803146362304688, 0.16275596618652344, 0.16748046875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 7.0, 4.0, 3.0, 6.0, 7.0, 6.0, 13.0, 13.0, 12.0, 14.0, 14.0, 20.0, 21.0, 27.0, 34.0, 30.0, 29.0, 33.0, 30.0, 36.0, 45.0, 37.0, 37.0, 30.0, 39.0, 42.0, 42.0, 36.0, 30.0, 31.0, 31.0, 37.0, 31.0, 20.0, 23.0, 17.0, 20.0, 21.0, 18.0, 7.0, 11.0, 5.0, 8.0, 6.0, 2.0, 5.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.04376220703125, -0.0423741340637207, -0.040986061096191406, -0.03959798812866211, -0.03820991516113281, -0.036821842193603516, -0.03543376922607422, -0.03404569625854492, -0.032657623291015625, -0.03126955032348633, -0.02988147735595703, -0.028493404388427734, -0.027105331420898438, -0.02571725845336914, -0.024329185485839844, -0.022941112518310547, -0.02155303955078125, -0.020164966583251953, -0.018776893615722656, -0.01738882064819336, -0.016000747680664062, -0.014612674713134766, -0.013224601745605469, -0.011836528778076172, -0.010448455810546875, -0.009060382843017578, -0.007672309875488281, -0.006284236907958984, -0.0048961639404296875, -0.0035080909729003906, -0.0021200180053710938, -0.0007319450378417969, 0.0006561279296875, 0.002044200897216797, 0.0034322738647460938, 0.004820346832275391, 0.0062084197998046875, 0.007596492767333984, 0.008984565734863281, 0.010372638702392578, 0.011760711669921875, 0.013148784637451172, 0.014536857604980469, 0.015924930572509766, 0.017313003540039062, 0.01870107650756836, 0.020089149475097656, 0.021477222442626953, 0.02286529541015625, 0.024253368377685547, 0.025641441345214844, 0.02702951431274414, 0.028417587280273438, 0.029805660247802734, 0.03119373321533203, 0.03258180618286133, 0.033969879150390625, 0.03535795211791992, 0.03674602508544922, 0.038134098052978516, 0.03952217102050781, 0.04091024398803711, 0.042298316955566406, 0.0436863899230957, 0.045074462890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 9.0, 6.0, 14.0, 8.0, 26.0, 26.0, 37.0, 57.0, 81.0, 152.0, 206.0, 311.0, 517.0, 841.0, 1537.0, 2648.0, 5325.0, 10503.0, 21946.0, 48422.0, 113888.0, 294059.0, 856464.0, 1701799.0, 708078.0, 247889.0, 97577.0, 42181.0, 19527.0, 9391.0, 4646.0, 2509.0, 1486.0, 801.0, 460.0, 292.0, 178.0, 114.0, 85.0, 54.0, 32.0, 29.0, 21.0, 12.0, 12.0, 11.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07440185546875, -0.07195568084716797, -0.06950950622558594, -0.0670633316040039, -0.06461715698242188, -0.062170982360839844, -0.05972480773925781, -0.05727863311767578, -0.05483245849609375, -0.05238628387451172, -0.04994010925292969, -0.047493934631347656, -0.045047760009765625, -0.042601585388183594, -0.04015541076660156, -0.03770923614501953, -0.0352630615234375, -0.03281688690185547, -0.030370712280273438, -0.027924537658691406, -0.025478363037109375, -0.023032188415527344, -0.020586013793945312, -0.01813983917236328, -0.01569366455078125, -0.013247489929199219, -0.010801315307617188, -0.008355140686035156, -0.005908966064453125, -0.0034627914428710938, -0.0010166168212890625, 0.0014295578002929688, 0.003875732421875, 0.006321907043457031, 0.008768081665039062, 0.011214256286621094, 0.013660430908203125, 0.016106605529785156, 0.018552780151367188, 0.02099895477294922, 0.02344512939453125, 0.02589130401611328, 0.028337478637695312, 0.030783653259277344, 0.033229827880859375, 0.035676002502441406, 0.03812217712402344, 0.04056835174560547, 0.0430145263671875, 0.04546070098876953, 0.04790687561035156, 0.050353050231933594, 0.052799224853515625, 0.055245399475097656, 0.05769157409667969, 0.06013774871826172, 0.06258392333984375, 0.06503009796142578, 0.06747627258300781, 0.06992244720458984, 0.07236862182617188, 0.0748147964477539, 0.07726097106933594, 0.07970714569091797, 0.0821533203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 6.0, 10.0, 28.0, 27.0, 41.0, 48.0, 76.0, 104.0, 156.0, 236.0, 332.0, 525.0, 707.0, 619.0, 383.0, 288.0, 162.0, 112.0, 68.0, 44.0, 26.0, 22.0, 20.0, 13.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11578369140625, -0.11253643035888672, -0.10928916931152344, -0.10604190826416016, -0.10279464721679688, -0.0995473861694336, -0.09630012512207031, -0.09305286407470703, -0.08980560302734375, -0.08655834197998047, -0.08331108093261719, -0.0800638198852539, -0.07681655883789062, -0.07356929779052734, -0.07032203674316406, -0.06707477569580078, -0.0638275146484375, -0.06058025360107422, -0.05733299255371094, -0.054085731506347656, -0.050838470458984375, -0.047591209411621094, -0.04434394836425781, -0.04109668731689453, -0.03784942626953125, -0.03460216522216797, -0.03135490417480469, -0.028107643127441406, -0.024860382080078125, -0.021613121032714844, -0.018365859985351562, -0.015118598937988281, -0.011871337890625, -0.008624076843261719, -0.0053768157958984375, -0.0021295547485351562, 0.001117706298828125, 0.004364967346191406, 0.0076122283935546875, 0.010859489440917969, 0.01410675048828125, 0.01735401153564453, 0.020601272583007812, 0.023848533630371094, 0.027095794677734375, 0.030343055725097656, 0.03359031677246094, 0.03683757781982422, 0.0400848388671875, 0.04333209991455078, 0.04657936096191406, 0.049826622009277344, 0.053073883056640625, 0.056321144104003906, 0.05956840515136719, 0.06281566619873047, 0.06606292724609375, 0.06931018829345703, 0.07255744934082031, 0.0758047103881836, 0.07905197143554688, 0.08229923248291016, 0.08554649353027344, 0.08879375457763672, 0.092041015625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 12.0, 15.0, 16.0, 21.0, 28.0, 27.0, 39.0, 46.0, 55.0, 70.0, 46.0, 53.0, 77.0, 75.0, 61.0, 53.0, 50.0, 46.0, 34.0, 35.0, 21.0, 27.0, 18.0, 15.0, 16.0, 6.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25698065757751465, -0.2487000674009323, -0.24041947722434998, -0.23213888704776764, -0.2238582968711853, -0.21557770669460297, -0.20729711651802063, -0.1990165263414383, -0.19073593616485596, -0.18245534598827362, -0.17417475581169128, -0.16589416563510895, -0.1576135754585266, -0.14933298528194427, -0.14105239510536194, -0.1327718049287796, -0.12449121475219727, -0.11621062457561493, -0.10793003439903259, -0.09964944422245026, -0.09136885404586792, -0.08308826386928558, -0.07480767369270325, -0.06652708351612091, -0.058246493339538574, -0.04996590316295624, -0.0416853129863739, -0.033404722809791565, -0.02512413263320923, -0.016843542456626892, -0.008562952280044556, -0.00028236210346221924, 0.007998228073120117, 0.016278818249702454, 0.02455940842628479, 0.032839998602867126, 0.04112058877944946, 0.0494011789560318, 0.057681769132614136, 0.06596235930919647, 0.07424294948577881, 0.08252353966236115, 0.09080412983894348, 0.09908472001552582, 0.10736531019210815, 0.11564590036869049, 0.12392649054527283, 0.13220708072185516, 0.1404876708984375, 0.14876826107501984, 0.15704885125160217, 0.1653294414281845, 0.17361003160476685, 0.18189062178134918, 0.19017121195793152, 0.19845180213451385, 0.2067323923110962, 0.21501298248767853, 0.22329357266426086, 0.2315741628408432, 0.23985475301742554, 0.24813534319400787, 0.2564159333705902, 0.26469653844833374, 0.2729771137237549]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 7.0, 4.0, 4.0, 9.0, 6.0, 16.0, 14.0, 16.0, 17.0, 16.0, 27.0, 29.0, 26.0, 32.0, 23.0, 30.0, 45.0, 37.0, 42.0, 49.0, 56.0, 46.0, 36.0, 51.0, 31.0, 39.0, 38.0, 34.0, 30.0, 26.0, 23.0, 18.0, 22.0, 13.0, 19.0, 14.0, 7.0, 15.0, 10.0, 6.0, 6.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.21432888507843018, -0.20741678774356842, -0.20050470530986786, -0.1935926079750061, -0.18668051064014435, -0.1797684133052826, -0.17285633087158203, -0.16594423353672028, -0.15903213620185852, -0.15212003886699677, -0.1452079564332962, -0.13829585909843445, -0.1313837617635727, -0.12447167187929153, -0.11755958199501038, -0.11064748466014862, -0.10373540222644806, -0.0968233123421669, -0.08991121500730515, -0.08299912512302399, -0.07608702778816223, -0.06917493790388107, -0.062262848019599915, -0.05535075441002846, -0.048438660800457, -0.041526567190885544, -0.03461447358131409, -0.02770238369703293, -0.02079029008746147, -0.013878196477890015, -0.006966106593608856, -5.401298403739929e-05, 0.006858080625534058, 0.01377017330378294, 0.020682265982031822, 0.02759435772895813, 0.03450645133852959, 0.041418544948101044, 0.0483306348323822, 0.05524272844195366, 0.062154822051525116, 0.06906691193580627, 0.07597900927066803, 0.08289109915494919, 0.08980318903923035, 0.0967152863740921, 0.10362737625837326, 0.11053946614265442, 0.11745156347751617, 0.12436365336179733, 0.1312757432460785, 0.13818784058094025, 0.145099937915802, 0.15201202034950256, 0.15892411768436432, 0.16583621501922607, 0.17274829745292664, 0.1796603947877884, 0.18657247722148895, 0.1934845745563507, 0.20039667189121246, 0.20730876922607422, 0.21422085165977478, 0.22113294899463654, 0.2280450463294983]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 3.0, 15.0, 13.0, 31.0, 42.0, 71.0, 113.0, 202.0, 322.0, 480.0, 770.0, 1210.0, 2060.0, 3230.0, 5140.0, 8007.0, 12460.0, 19731.0, 31571.0, 52003.0, 90785.0, 160969.0, 227034.0, 178652.0, 101910.0, 57965.0, 34564.0, 21807.0, 13562.0, 8849.0, 5642.0, 3536.0, 2209.0, 1363.0, 831.0, 493.0, 337.0, 216.0, 137.0, 79.0, 44.0, 33.0, 17.0, 17.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.07293701171875, -0.07069969177246094, -0.06846237182617188, -0.06622505187988281, -0.06398773193359375, -0.06175041198730469, -0.059513092041015625, -0.05727577209472656, -0.0550384521484375, -0.05280113220214844, -0.050563812255859375, -0.04832649230957031, -0.04608917236328125, -0.04385185241699219, -0.041614532470703125, -0.03937721252441406, -0.037139892578125, -0.03490257263183594, -0.032665252685546875, -0.030427932739257812, -0.02819061279296875, -0.025953292846679688, -0.023715972900390625, -0.021478652954101562, -0.0192413330078125, -0.017004013061523438, -0.014766693115234375, -0.012529373168945312, -0.01029205322265625, -0.008054733276367188, -0.005817413330078125, -0.0035800933837890625, -0.0013427734375, 0.0008945465087890625, 0.003131866455078125, 0.0053691864013671875, 0.00760650634765625, 0.009843826293945312, 0.012081146240234375, 0.014318466186523438, 0.0165557861328125, 0.018793106079101562, 0.021030426025390625, 0.023267745971679688, 0.02550506591796875, 0.027742385864257812, 0.029979705810546875, 0.03221702575683594, 0.034454345703125, 0.03669166564941406, 0.038928985595703125, 0.04116630554199219, 0.04340362548828125, 0.04564094543457031, 0.047878265380859375, 0.05011558532714844, 0.0523529052734375, 0.05459022521972656, 0.056827545166015625, 0.05906486511230469, 0.06130218505859375, 0.06353950500488281, 0.06577682495117188, 0.06801414489746094, 0.07025146484375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 8.0, 9.0, 14.0, 7.0, 13.0, 14.0, 18.0, 19.0, 20.0, 24.0, 23.0, 33.0, 29.0, 25.0, 28.0, 42.0, 46.0, 31.0, 39.0, 37.0, 41.0, 36.0, 32.0, 49.0, 31.0, 35.0, 30.0, 33.0, 33.0, 18.0, 21.0, 20.0, 25.0, 22.0, 18.0, 8.0, 10.0, 11.0, 7.0, 12.0, 3.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.044586181640625, -0.04315996170043945, -0.041733741760253906, -0.04030752182006836, -0.03888130187988281, -0.037455081939697266, -0.03602886199951172, -0.03460264205932617, -0.033176422119140625, -0.03175020217895508, -0.03032398223876953, -0.028897762298583984, -0.027471542358398438, -0.02604532241821289, -0.024619102478027344, -0.023192882537841797, -0.02176666259765625, -0.020340442657470703, -0.018914222717285156, -0.01748800277709961, -0.016061782836914062, -0.014635562896728516, -0.013209342956542969, -0.011783123016357422, -0.010356903076171875, -0.008930683135986328, -0.007504463195800781, -0.006078243255615234, -0.0046520233154296875, -0.0032258033752441406, -0.0017995834350585938, -0.0003733634948730469, 0.0010528564453125, 0.002479076385498047, 0.0039052963256835938, 0.005331516265869141, 0.0067577362060546875, 0.008183956146240234, 0.009610176086425781, 0.011036396026611328, 0.012462615966796875, 0.013888835906982422, 0.015315055847167969, 0.016741275787353516, 0.018167495727539062, 0.01959371566772461, 0.021019935607910156, 0.022446155548095703, 0.02387237548828125, 0.025298595428466797, 0.026724815368652344, 0.02815103530883789, 0.029577255249023438, 0.031003475189208984, 0.03242969512939453, 0.03385591506958008, 0.035282135009765625, 0.03670835494995117, 0.03813457489013672, 0.039560794830322266, 0.04098701477050781, 0.04241323471069336, 0.043839454650878906, 0.04526567459106445, 0.04669189453125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 5.0, 7.0, 8.0, 10.0, 15.0, 19.0, 24.0, 37.0, 39.0, 61.0, 85.0, 117.0, 205.0, 411.0, 963.0, 3010.0, 10719.0, 36797.0, 144492.0, 541758.0, 232627.0, 54200.0, 15614.0, 4641.0, 1341.0, 575.0, 266.0, 160.0, 81.0, 71.0, 65.0, 31.0, 34.0, 14.0, 20.0, 7.0, 9.0, 1.0, 3.0, 1.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1640625, -0.15790557861328125, -0.1517486572265625, -0.14559173583984375, -0.139434814453125, -0.13327789306640625, -0.1271209716796875, -0.12096405029296875, -0.11480712890625, -0.10865020751953125, -0.1024932861328125, -0.09633636474609375, -0.090179443359375, -0.08402252197265625, -0.0778656005859375, -0.07170867919921875, -0.0655517578125, -0.05939483642578125, -0.0532379150390625, -0.04708099365234375, -0.040924072265625, -0.03476715087890625, -0.0286102294921875, -0.02245330810546875, -0.01629638671875, -0.01013946533203125, -0.0039825439453125, 0.00217437744140625, 0.008331298828125, 0.01448822021484375, 0.0206451416015625, 0.02680206298828125, 0.032958984375, 0.03911590576171875, 0.0452728271484375, 0.05142974853515625, 0.057586669921875, 0.06374359130859375, 0.0699005126953125, 0.07605743408203125, 0.08221435546875, 0.08837127685546875, 0.0945281982421875, 0.10068511962890625, 0.106842041015625, 0.11299896240234375, 0.1191558837890625, 0.12531280517578125, 0.1314697265625, 0.13762664794921875, 0.1437835693359375, 0.14994049072265625, 0.156097412109375, 0.16225433349609375, 0.1684112548828125, 0.17456817626953125, 0.18072509765625, 0.18688201904296875, 0.1930389404296875, 0.19919586181640625, 0.205352783203125, 0.21150970458984375, 0.2176666259765625, 0.22382354736328125, 0.22998046875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 8.0, 3.0, 7.0, 4.0, 20.0, 19.0, 25.0, 29.0, 33.0, 40.0, 28.0, 47.0, 51.0, 44.0, 51.0, 55.0, 52.0, 48.0, 44.0, 54.0, 52.0, 58.0, 45.0, 36.0, 37.0, 21.0, 18.0, 22.0, 11.0, 10.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.15933990478515625, -0.1536407470703125, -0.14794158935546875, -0.142242431640625, -0.13654327392578125, -0.1308441162109375, -0.12514495849609375, -0.11944580078125, -0.11374664306640625, -0.1080474853515625, -0.10234832763671875, -0.096649169921875, -0.09095001220703125, -0.0852508544921875, -0.07955169677734375, -0.0738525390625, -0.06815338134765625, -0.0624542236328125, -0.05675506591796875, -0.051055908203125, -0.04535675048828125, -0.0396575927734375, -0.03395843505859375, -0.02825927734375, -0.02256011962890625, -0.0168609619140625, -0.01116180419921875, -0.005462646484375, 0.00023651123046875, 0.0059356689453125, 0.01163482666015625, 0.017333984375, 0.02303314208984375, 0.0287322998046875, 0.03443145751953125, 0.040130615234375, 0.04582977294921875, 0.0515289306640625, 0.05722808837890625, 0.06292724609375, 0.06862640380859375, 0.0743255615234375, 0.08002471923828125, 0.085723876953125, 0.09142303466796875, 0.0971221923828125, 0.10282135009765625, 0.1085205078125, 0.11421966552734375, 0.1199188232421875, 0.12561798095703125, 0.131317138671875, 0.13701629638671875, 0.1427154541015625, 0.14841461181640625, 0.15411376953125, 0.15981292724609375, 0.1655120849609375, 0.17121124267578125, 0.176910400390625, 0.18260955810546875, 0.1883087158203125, 0.19400787353515625, 0.19970703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 6.0, 8.0, 18.0, 25.0, 30.0, 44.0, 97.0, 153.0, 285.0, 518.0, 1009.0, 2126.0, 4380.0, 9101.0, 18875.0, 41601.0, 123219.0, 461207.0, 264647.0, 67969.0, 27837.0, 13035.0, 6315.0, 2997.0, 1499.0, 693.0, 407.0, 183.0, 115.0, 54.0, 31.0, 23.0, 14.0, 11.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06646728515625, -0.06437397003173828, -0.06228065490722656, -0.060187339782714844, -0.058094024658203125, -0.056000709533691406, -0.05390739440917969, -0.05181407928466797, -0.04972076416015625, -0.04762744903564453, -0.04553413391113281, -0.043440818786621094, -0.041347503662109375, -0.039254188537597656, -0.03716087341308594, -0.03506755828857422, -0.0329742431640625, -0.03088092803955078, -0.028787612915039062, -0.026694297790527344, -0.024600982666015625, -0.022507667541503906, -0.020414352416992188, -0.01832103729248047, -0.01622772216796875, -0.014134407043457031, -0.012041091918945312, -0.009947776794433594, -0.007854461669921875, -0.005761146545410156, -0.0036678314208984375, -0.0015745162963867188, 0.000518798828125, 0.0026121139526367188, 0.0047054290771484375, 0.006798744201660156, 0.008892059326171875, 0.010985374450683594, 0.013078689575195312, 0.015172004699707031, 0.01726531982421875, 0.01935863494873047, 0.021451950073242188, 0.023545265197753906, 0.025638580322265625, 0.027731895446777344, 0.029825210571289062, 0.03191852569580078, 0.0340118408203125, 0.03610515594482422, 0.03819847106933594, 0.040291786193847656, 0.042385101318359375, 0.044478416442871094, 0.04657173156738281, 0.04866504669189453, 0.05075836181640625, 0.05285167694091797, 0.05494499206542969, 0.057038307189941406, 0.059131622314453125, 0.061224937438964844, 0.06331825256347656, 0.06541156768798828, 0.0675048828125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 2.0, 4.0, 9.0, 5.0, 13.0, 10.0, 11.0, 14.0, 17.0, 28.0, 32.0, 38.0, 34.0, 61.0, 59.0, 79.0, 79.0, 57.0, 59.0, 61.0, 60.0, 52.0, 37.0, 31.0, 27.0, 16.0, 21.0, 21.0, 10.0, 4.0, 6.0, 6.0, 6.0, 5.0, 1.0, 8.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7523765563964844e-05, -1.70096755027771e-05, -1.6495585441589355e-05, -1.598149538040161e-05, -1.5467405319213867e-05, -1.4953315258026123e-05, -1.4439225196838379e-05, -1.3925135135650635e-05, -1.341104507446289e-05, -1.2896955013275146e-05, -1.2382864952087402e-05, -1.1868774890899658e-05, -1.1354684829711914e-05, -1.084059476852417e-05, -1.0326504707336426e-05, -9.812414646148682e-06, -9.298324584960938e-06, -8.784234523773193e-06, -8.27014446258545e-06, -7.756054401397705e-06, -7.241964340209961e-06, -6.727874279022217e-06, -6.213784217834473e-06, -5.6996941566467285e-06, -5.185604095458984e-06, -4.67151403427124e-06, -4.157423973083496e-06, -3.643333911895752e-06, -3.129243850708008e-06, -2.6151537895202637e-06, -2.1010637283325195e-06, -1.5869736671447754e-06, -1.0728836059570312e-06, -5.587935447692871e-07, -4.470348358154297e-08, 4.6938657760620117e-07, 9.834766387939453e-07, 1.4975666999816895e-06, 2.0116567611694336e-06, 2.5257468223571777e-06, 3.039836883544922e-06, 3.553926944732666e-06, 4.06801700592041e-06, 4.582107067108154e-06, 5.0961971282958984e-06, 5.610287189483643e-06, 6.124377250671387e-06, 6.638467311859131e-06, 7.152557373046875e-06, 7.666647434234619e-06, 8.180737495422363e-06, 8.694827556610107e-06, 9.208917617797852e-06, 9.723007678985596e-06, 1.023709774017334e-05, 1.0751187801361084e-05, 1.1265277862548828e-05, 1.1779367923736572e-05, 1.2293457984924316e-05, 1.280754804611206e-05, 1.3321638107299805e-05, 1.3835728168487549e-05, 1.4349818229675293e-05, 1.4863908290863037e-05, 1.537799835205078e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 1.0, 12.0, 15.0, 16.0, 22.0, 30.0, 45.0, 62.0, 126.0, 238.0, 483.0, 1121.0, 3125.0, 8430.0, 23011.0, 70029.0, 305723.0, 471536.0, 111597.0, 33588.0, 12124.0, 4246.0, 1595.0, 691.0, 297.0, 140.0, 90.0, 55.0, 29.0, 31.0, 15.0, 13.0, 8.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08905029296875, -0.0867772102355957, -0.0845041275024414, -0.08223104476928711, -0.07995796203613281, -0.07768487930297852, -0.07541179656982422, -0.07313871383666992, -0.07086563110351562, -0.06859254837036133, -0.06631946563720703, -0.06404638290405273, -0.06177330017089844, -0.05950021743774414, -0.057227134704589844, -0.05495405197143555, -0.05268096923828125, -0.05040788650512695, -0.048134803771972656, -0.04586172103881836, -0.04358863830566406, -0.041315555572509766, -0.03904247283935547, -0.03676939010620117, -0.034496307373046875, -0.03222322463989258, -0.02995014190673828, -0.027677059173583984, -0.025403976440429688, -0.02313089370727539, -0.020857810974121094, -0.018584728240966797, -0.0163116455078125, -0.014038562774658203, -0.011765480041503906, -0.00949239730834961, -0.0072193145751953125, -0.004946231842041016, -0.0026731491088867188, -0.0004000663757324219, 0.001873016357421875, 0.004146099090576172, 0.006419181823730469, 0.008692264556884766, 0.010965347290039062, 0.01323843002319336, 0.015511512756347656, 0.017784595489501953, 0.02005767822265625, 0.022330760955810547, 0.024603843688964844, 0.02687692642211914, 0.029150009155273438, 0.031423091888427734, 0.03369617462158203, 0.03596925735473633, 0.038242340087890625, 0.04051542282104492, 0.04278850555419922, 0.045061588287353516, 0.04733467102050781, 0.04960775375366211, 0.051880836486816406, 0.0541539192199707, 0.056427001953125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 5.0, 5.0, 7.0, 13.0, 6.0, 16.0, 21.0, 26.0, 31.0, 58.0, 71.0, 93.0, 101.0, 109.0, 98.0, 85.0, 61.0, 42.0, 33.0, 26.0, 13.0, 18.0, 11.0, 7.0, 7.0, 3.0, 7.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06085205078125, -0.05918312072753906, -0.057514190673828125, -0.05584526062011719, -0.05417633056640625, -0.05250740051269531, -0.050838470458984375, -0.04916954040527344, -0.0475006103515625, -0.04583168029785156, -0.044162750244140625, -0.04249382019042969, -0.04082489013671875, -0.03915596008300781, -0.037487030029296875, -0.03581809997558594, -0.034149169921875, -0.03248023986816406, -0.030811309814453125, -0.029142379760742188, -0.02747344970703125, -0.025804519653320312, -0.024135589599609375, -0.022466659545898438, -0.0207977294921875, -0.019128799438476562, -0.017459869384765625, -0.015790939331054688, -0.01412200927734375, -0.012453079223632812, -0.010784149169921875, -0.009115219116210938, -0.0074462890625, -0.0057773590087890625, -0.004108428955078125, -0.0024394989013671875, -0.00077056884765625, 0.0008983612060546875, 0.002567291259765625, 0.0042362213134765625, 0.0059051513671875, 0.0075740814208984375, 0.009243011474609375, 0.010911941528320312, 0.01258087158203125, 0.014249801635742188, 0.015918731689453125, 0.017587661743164062, 0.019256591796875, 0.020925521850585938, 0.022594451904296875, 0.024263381958007812, 0.02593231201171875, 0.027601242065429688, 0.029270172119140625, 0.030939102172851562, 0.0326080322265625, 0.03427696228027344, 0.035945892333984375, 0.03761482238769531, 0.03928375244140625, 0.04095268249511719, 0.042621612548828125, 0.04429054260253906, 0.04595947265625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 15.0, 35.0, 59.0, 115.0, 179.0, 169.0, 170.0, 114.0, 95.0, 27.0, 15.0, 9.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389845073223114, -0.3586246967315674, -0.32740435004234314, -0.2961840033531189, -0.26496362686157227, -0.23374326527118683, -0.2025229036808014, -0.17130254209041595, -0.14008218050003052, -0.10886181890964508, -0.07764145731925964, -0.04642109572887421, -0.01520073413848877, 0.016019627451896667, 0.047239989042282104, 0.07846035063266754, 0.10968071222305298, 0.14090107381343842, 0.17212143540382385, 0.2033417969942093, 0.23456215858459473, 0.26578253507614136, 0.2970028817653656, 0.32822322845458984, 0.3594436049461365, 0.3906639814376831, 0.42188432812690735, 0.4531046748161316, 0.4843250513076782, 0.5155454277992249, 0.5467658042907715, 0.5779861211776733, 0.6092064380645752, 0.6404268145561218, 0.6716471910476685, 0.7028675079345703, 0.7340878844261169, 0.7653082609176636, 0.7965285778045654, 0.8277489542961121, 0.8589693307876587, 0.8901897072792053, 0.921410083770752, 0.9526304006576538, 0.9838507771492004, 1.015071153640747, 1.046291470527649, 1.0775119066238403, 1.1087322235107422, 1.139952540397644, 1.1711729764938354, 1.2023932933807373, 1.2336137294769287, 1.2648340463638306, 1.2960543632507324, 1.3272747993469238, 1.3584951162338257, 1.3897154331207275, 1.420935869216919, 1.4521561861038208, 1.4833765029907227, 1.514596939086914, 1.545817255973816, 1.5770376920700073, 1.6082580089569092]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 4.0, 6.0, 7.0, 9.0, 10.0, 14.0, 9.0, 10.0, 22.0, 23.0, 29.0, 33.0, 36.0, 29.0, 37.0, 30.0, 43.0, 39.0, 44.0, 43.0, 33.0, 43.0, 48.0, 34.0, 41.0, 46.0, 39.0, 31.0, 38.0, 21.0, 24.0, 25.0, 16.0, 14.0, 15.0, 12.0, 12.0, 10.0, 4.0, 9.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4383001923561096, -0.4258387088775635, -0.4133772552013397, -0.40091580152511597, -0.3884543180465698, -0.3759928345680237, -0.3635313808917999, -0.35106992721557617, -0.33860844373703003, -0.3261469602584839, -0.31368550658226013, -0.3012240529060364, -0.28876256942749023, -0.2763010859489441, -0.26383963227272034, -0.2513781785964966, -0.23891669511795044, -0.2264552265405655, -0.21399375796318054, -0.2015322893857956, -0.18907082080841064, -0.1766093522310257, -0.16414788365364075, -0.1516864150762558, -0.13922494649887085, -0.1267634779214859, -0.11430200934410095, -0.101840540766716, -0.08937907218933105, -0.0769176036119461, -0.06445613503456116, -0.05199466645717621, -0.03953319787979126, -0.02707172930240631, -0.014610260725021362, -0.0021487921476364136, 0.010312676429748535, 0.022774145007133484, 0.03523561358451843, 0.04769708216190338, 0.06015855073928833, 0.07262001931667328, 0.08508148789405823, 0.09754295647144318, 0.11000442504882812, 0.12246589362621307, 0.13492736220359802, 0.14738883078098297, 0.15985029935836792, 0.17231176793575287, 0.18477323651313782, 0.19723470509052277, 0.20969617366790771, 0.22215764224529266, 0.2346191108226776, 0.24708057940006256, 0.2595420479774475, 0.27200353145599365, 0.2844649851322174, 0.29692643880844116, 0.3093879222869873, 0.32184940576553345, 0.3343108594417572, 0.34677231311798096, 0.3592337965965271]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 9.0, 12.0, 12.0, 13.0, 18.0, 34.0, 46.0, 56.0, 94.0, 126.0, 242.0, 400.0, 680.0, 1153.0, 2205.0, 4067.0, 8372.0, 17294.0, 38702.0, 90198.0, 237473.0, 758514.0, 2019100.0, 652329.0, 212959.0, 82805.0, 34984.0, 16013.0, 7741.0, 3795.0, 2052.0, 1142.0, 638.0, 354.0, 218.0, 121.0, 84.0, 62.0, 36.0, 32.0, 26.0, 20.0, 14.0, 10.0, 9.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06524658203125, -0.06310367584228516, -0.06096076965332031, -0.05881786346435547, -0.056674957275390625, -0.05453205108642578, -0.05238914489746094, -0.050246238708496094, -0.04810333251953125, -0.045960426330566406, -0.04381752014160156, -0.04167461395263672, -0.039531707763671875, -0.03738880157470703, -0.03524589538574219, -0.033102989196777344, -0.0309600830078125, -0.028817176818847656, -0.026674270629882812, -0.02453136444091797, -0.022388458251953125, -0.02024555206298828, -0.018102645874023438, -0.015959739685058594, -0.01381683349609375, -0.011673927307128906, -0.009531021118164062, -0.007388114929199219, -0.005245208740234375, -0.0031023025512695312, -0.0009593963623046875, 0.0011835098266601562, 0.003326416015625, 0.005469322204589844, 0.0076122283935546875, 0.009755134582519531, 0.011898040771484375, 0.014040946960449219, 0.016183853149414062, 0.018326759338378906, 0.02046966552734375, 0.022612571716308594, 0.024755477905273438, 0.02689838409423828, 0.029041290283203125, 0.03118419647216797, 0.03332710266113281, 0.035470008850097656, 0.0376129150390625, 0.039755821228027344, 0.04189872741699219, 0.04404163360595703, 0.046184539794921875, 0.04832744598388672, 0.05047035217285156, 0.052613258361816406, 0.05475616455078125, 0.056899070739746094, 0.05904197692871094, 0.06118488311767578, 0.06332778930664062, 0.06547069549560547, 0.06761360168457031, 0.06975650787353516, 0.0718994140625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 12.0, 8.0, 14.0, 12.0, 18.0, 19.0, 18.0, 17.0, 27.0, 29.0, 26.0, 27.0, 31.0, 38.0, 45.0, 34.0, 39.0, 43.0, 50.0, 51.0, 46.0, 30.0, 43.0, 42.0, 37.0, 25.0, 32.0, 34.0, 24.0, 15.0, 16.0, 15.0, 17.0, 12.0, 16.0, 8.0, 9.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.06494140625, -0.06314706802368164, -0.06135272979736328, -0.05955839157104492, -0.05776405334472656, -0.0559697151184082, -0.054175376892089844, -0.052381038665771484, -0.050586700439453125, -0.048792362213134766, -0.046998023986816406, -0.04520368576049805, -0.04340934753417969, -0.04161500930786133, -0.03982067108154297, -0.03802633285522461, -0.03623199462890625, -0.03443765640258789, -0.03264331817626953, -0.030848979949951172, -0.029054641723632812, -0.027260303497314453, -0.025465965270996094, -0.023671627044677734, -0.021877288818359375, -0.020082950592041016, -0.018288612365722656, -0.016494274139404297, -0.014699935913085938, -0.012905597686767578, -0.011111259460449219, -0.00931692123413086, -0.0075225830078125, -0.005728244781494141, -0.003933906555175781, -0.002139568328857422, -0.0003452301025390625, 0.0014491081237792969, 0.0032434463500976562, 0.005037784576416016, 0.006832122802734375, 0.008626461029052734, 0.010420799255371094, 0.012215137481689453, 0.014009475708007812, 0.015803813934326172, 0.01759815216064453, 0.01939249038696289, 0.02118682861328125, 0.02298116683959961, 0.02477550506591797, 0.026569843292236328, 0.028364181518554688, 0.030158519744873047, 0.031952857971191406, 0.033747196197509766, 0.035541534423828125, 0.037335872650146484, 0.039130210876464844, 0.0409245491027832, 0.04271888732910156, 0.04451322555541992, 0.04630756378173828, 0.04810190200805664, 0.049896240234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 3.0, 14.0, 13.0, 26.0, 34.0, 74.0, 86.0, 102.0, 167.0, 271.0, 384.0, 605.0, 898.0, 1409.0, 2090.0, 3554.0, 5915.0, 10194.0, 18638.0, 35483.0, 69969.0, 145649.0, 319326.0, 786014.0, 1516821.0, 709975.0, 291808.0, 134336.0, 65179.0, 33065.0, 17582.0, 9604.0, 5671.0, 3320.0, 2097.0, 1321.0, 826.0, 606.0, 368.0, 241.0, 158.0, 118.0, 67.0, 67.0, 37.0, 34.0, 25.0, 11.0, 8.0, 8.0, 8.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0711669921875, -0.06890392303466797, -0.06664085388183594, -0.0643777847290039, -0.062114715576171875, -0.059851646423339844, -0.05758857727050781, -0.05532550811767578, -0.05306243896484375, -0.05079936981201172, -0.04853630065917969, -0.046273231506347656, -0.044010162353515625, -0.041747093200683594, -0.03948402404785156, -0.03722095489501953, -0.0349578857421875, -0.03269481658935547, -0.030431747436523438, -0.028168678283691406, -0.025905609130859375, -0.023642539978027344, -0.021379470825195312, -0.01911640167236328, -0.01685333251953125, -0.014590263366699219, -0.012327194213867188, -0.010064125061035156, -0.007801055908203125, -0.005537986755371094, -0.0032749176025390625, -0.0010118484497070312, 0.001251220703125, 0.0035142898559570312, 0.0057773590087890625, 0.008040428161621094, 0.010303497314453125, 0.012566566467285156, 0.014829635620117188, 0.01709270477294922, 0.01935577392578125, 0.02161884307861328, 0.023881912231445312, 0.026144981384277344, 0.028408050537109375, 0.030671119689941406, 0.03293418884277344, 0.03519725799560547, 0.0374603271484375, 0.03972339630126953, 0.04198646545410156, 0.044249534606933594, 0.046512603759765625, 0.048775672912597656, 0.05103874206542969, 0.05330181121826172, 0.05556488037109375, 0.05782794952392578, 0.06009101867675781, 0.062354087829589844, 0.06461715698242188, 0.0668802261352539, 0.06914329528808594, 0.07140636444091797, 0.07366943359375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 8.0, 9.0, 7.0, 11.0, 9.0, 14.0, 23.0, 34.0, 37.0, 51.0, 71.0, 104.0, 132.0, 172.0, 266.0, 358.0, 563.0, 589.0, 506.0, 307.0, 215.0, 151.0, 104.0, 75.0, 72.0, 47.0, 27.0, 20.0, 27.0, 12.0, 20.0, 7.0, 7.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.099853515625, -0.09702587127685547, -0.09419822692871094, -0.0913705825805664, -0.08854293823242188, -0.08571529388427734, -0.08288764953613281, -0.08006000518798828, -0.07723236083984375, -0.07440471649169922, -0.07157707214355469, -0.06874942779541016, -0.06592178344726562, -0.0630941390991211, -0.06026649475097656, -0.05743885040283203, -0.0546112060546875, -0.05178356170654297, -0.04895591735839844, -0.046128273010253906, -0.043300628662109375, -0.040472984313964844, -0.03764533996582031, -0.03481769561767578, -0.03199005126953125, -0.02916240692138672, -0.026334762573242188, -0.023507118225097656, -0.020679473876953125, -0.017851829528808594, -0.015024185180664062, -0.012196540832519531, -0.009368896484375, -0.006541252136230469, -0.0037136077880859375, -0.0008859634399414062, 0.001941680908203125, 0.004769325256347656, 0.0075969696044921875, 0.010424613952636719, 0.01325225830078125, 0.01607990264892578, 0.018907546997070312, 0.021735191345214844, 0.024562835693359375, 0.027390480041503906, 0.030218124389648438, 0.03304576873779297, 0.0358734130859375, 0.03870105743408203, 0.04152870178222656, 0.044356346130371094, 0.047183990478515625, 0.050011634826660156, 0.05283927917480469, 0.05566692352294922, 0.05849456787109375, 0.06132221221923828, 0.06414985656738281, 0.06697750091552734, 0.06980514526367188, 0.0726327896118164, 0.07546043395996094, 0.07828807830810547, 0.08111572265625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 3.0, 5.0, 6.0, 11.0, 13.0, 15.0, 32.0, 33.0, 45.0, 57.0, 59.0, 75.0, 75.0, 77.0, 91.0, 76.0, 73.0, 52.0, 53.0, 41.0, 36.0, 12.0, 21.0, 13.0, 3.0, 8.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3206601142883301, -0.3084813356399536, -0.29630255699157715, -0.2841237783432007, -0.2719449996948242, -0.25976622104644775, -0.2475874423980713, -0.23540866374969482, -0.22322988510131836, -0.2110511064529419, -0.19887232780456543, -0.18669354915618896, -0.1745147705078125, -0.16233599185943604, -0.15015721321105957, -0.1379784345626831, -0.12579967081546783, -0.11362089216709137, -0.1014421135187149, -0.08926333487033844, -0.07708455622196198, -0.06490577757358551, -0.05272700637578964, -0.04054822772741318, -0.028369449079036713, -0.016190670430660248, -0.004011893644928932, 0.008166883140802383, 0.02034566178917885, 0.03252444043755531, 0.04470321536064148, 0.056881994009017944, 0.06906077265739441, 0.08123955130577087, 0.09341832995414734, 0.1055971086025238, 0.11777588725090027, 0.12995466589927673, 0.1421334445476532, 0.15431222319602966, 0.16649100184440613, 0.1786697804927826, 0.19084855914115906, 0.20302733778953552, 0.215206116437912, 0.22738489508628845, 0.23956367373466492, 0.2517424523830414, 0.26392120122909546, 0.2760999798774719, 0.2882787585258484, 0.30045753717422485, 0.3126363158226013, 0.3248150944709778, 0.33699387311935425, 0.3491726517677307, 0.3613514304161072, 0.37353020906448364, 0.3857089877128601, 0.3978877663612366, 0.41006654500961304, 0.4222453236579895, 0.43442410230636597, 0.44660288095474243, 0.4587816596031189]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 11.0, 6.0, 6.0, 13.0, 12.0, 13.0, 16.0, 25.0, 14.0, 28.0, 26.0, 24.0, 36.0, 40.0, 44.0, 30.0, 47.0, 38.0, 45.0, 58.0, 40.0, 49.0, 43.0, 33.0, 41.0, 37.0, 41.0, 18.0, 17.0, 17.0, 29.0, 21.0, 20.0, 16.0, 10.0, 9.0, 11.0, 4.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29413020610809326, -0.2850360572338104, -0.27594193816185, -0.26684778928756714, -0.2577536404132843, -0.24865950644016266, -0.23956537246704102, -0.23047122359275818, -0.22137708961963654, -0.2122829556465149, -0.20318880677223206, -0.1940946727991104, -0.18500053882598877, -0.17590638995170593, -0.1668122559785843, -0.15771812200546265, -0.1486239731311798, -0.13952983915805817, -0.13043569028377533, -0.12134155631065369, -0.11224741488695145, -0.1031532734632492, -0.09405913949012756, -0.08496499806642532, -0.07587085664272308, -0.06677671521902084, -0.0576825775206089, -0.04858843982219696, -0.03949429839849472, -0.03040015697479248, -0.02130601927638054, -0.012211881577968597, -0.0031177401542663574, 0.005976399406790733, 0.015070538967847824, 0.024164678528904915, 0.033258818089962006, 0.042352959513664246, 0.05144709721207619, 0.06054123491048813, 0.06963537633419037, 0.07872951775789261, 0.08782365918159485, 0.09691779315471649, 0.10601193457841873, 0.11510607600212097, 0.12420020997524261, 0.13329434394836426, 0.1423884928226471, 0.15148262679576874, 0.16057677567005157, 0.16967090964317322, 0.17876505851745605, 0.1878591924905777, 0.19695332646369934, 0.20604747533798218, 0.21514160931110382, 0.22423574328422546, 0.2333298921585083, 0.24242402613162994, 0.2515181601047516, 0.2606123089790344, 0.26970645785331726, 0.2788005769252777, 0.28789472579956055]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 7.0, 7.0, 19.0, 11.0, 23.0, 41.0, 61.0, 99.0, 157.0, 283.0, 532.0, 990.0, 1733.0, 3175.0, 6101.0, 11763.0, 22771.0, 43793.0, 87335.0, 176514.0, 284369.0, 203599.0, 100198.0, 50614.0, 25977.0, 13329.0, 7028.0, 3556.0, 1975.0, 1047.0, 622.0, 342.0, 177.0, 109.0, 64.0, 40.0, 31.0, 12.0, 13.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08294677734375, -0.0800466537475586, -0.07714653015136719, -0.07424640655517578, -0.07134628295898438, -0.06844615936279297, -0.06554603576660156, -0.06264591217041016, -0.05974578857421875, -0.056845664978027344, -0.05394554138183594, -0.05104541778564453, -0.048145294189453125, -0.04524517059326172, -0.04234504699707031, -0.039444923400878906, -0.0365447998046875, -0.033644676208496094, -0.030744552612304688, -0.02784442901611328, -0.024944305419921875, -0.02204418182373047, -0.019144058227539062, -0.016243934631347656, -0.01334381103515625, -0.010443687438964844, -0.0075435638427734375, -0.004643440246582031, -0.001743316650390625, 0.0011568069458007812, 0.0040569305419921875, 0.006957054138183594, 0.009857177734375, 0.012757301330566406, 0.015657424926757812, 0.01855754852294922, 0.021457672119140625, 0.02435779571533203, 0.027257919311523438, 0.030158042907714844, 0.03305816650390625, 0.035958290100097656, 0.03885841369628906, 0.04175853729248047, 0.044658660888671875, 0.04755878448486328, 0.05045890808105469, 0.053359031677246094, 0.0562591552734375, 0.059159278869628906, 0.06205940246582031, 0.06495952606201172, 0.06785964965820312, 0.07075977325439453, 0.07365989685058594, 0.07656002044677734, 0.07946014404296875, 0.08236026763916016, 0.08526039123535156, 0.08816051483154297, 0.09106063842773438, 0.09396076202392578, 0.09686088562011719, 0.0997610092163086, 0.1026611328125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 0.0, 5.0, 8.0, 10.0, 7.0, 6.0, 10.0, 6.0, 13.0, 17.0, 24.0, 28.0, 17.0, 24.0, 33.0, 28.0, 37.0, 37.0, 43.0, 41.0, 38.0, 45.0, 44.0, 42.0, 45.0, 26.0, 39.0, 40.0, 39.0, 34.0, 36.0, 26.0, 22.0, 22.0, 22.0, 15.0, 9.0, 15.0, 7.0, 10.0, 6.0, 6.0, 2.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.052215576171875, -0.050501346588134766, -0.04878711700439453, -0.0470728874206543, -0.04535865783691406, -0.04364442825317383, -0.041930198669433594, -0.04021596908569336, -0.038501739501953125, -0.03678750991821289, -0.035073280334472656, -0.03335905075073242, -0.03164482116699219, -0.029930591583251953, -0.02821636199951172, -0.026502132415771484, -0.02478790283203125, -0.023073673248291016, -0.02135944366455078, -0.019645214080810547, -0.017930984497070312, -0.016216754913330078, -0.014502525329589844, -0.01278829574584961, -0.011074066162109375, -0.00935983657836914, -0.007645606994628906, -0.005931377410888672, -0.0042171478271484375, -0.002502918243408203, -0.0007886886596679688, 0.0009255409240722656, 0.0026397705078125, 0.004354000091552734, 0.006068229675292969, 0.007782459259033203, 0.009496688842773438, 0.011210918426513672, 0.012925148010253906, 0.01463937759399414, 0.016353607177734375, 0.01806783676147461, 0.019782066345214844, 0.021496295928955078, 0.023210525512695312, 0.024924755096435547, 0.02663898468017578, 0.028353214263916016, 0.03006744384765625, 0.031781673431396484, 0.03349590301513672, 0.03521013259887695, 0.03692436218261719, 0.03863859176635742, 0.040352821350097656, 0.04206705093383789, 0.043781280517578125, 0.04549551010131836, 0.047209739685058594, 0.04892396926879883, 0.05063819885253906, 0.0523524284362793, 0.05406665802001953, 0.055780887603759766, 0.0574951171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 10.0, 7.0, 10.0, 18.0, 27.0, 26.0, 31.0, 50.0, 54.0, 58.0, 116.0, 164.0, 264.0, 571.0, 1415.0, 3806.0, 11909.0, 37257.0, 118694.0, 409357.0, 329859.0, 91801.0, 28547.0, 9086.0, 3014.0, 1105.0, 464.0, 257.0, 140.0, 100.0, 74.0, 65.0, 55.0, 20.0, 27.0, 19.0, 14.0, 11.0, 16.0, 7.0, 9.0, 4.0, 4.0, 5.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.1929931640625, -0.18761634826660156, -0.18223953247070312, -0.1768627166748047, -0.17148590087890625, -0.1661090850830078, -0.16073226928710938, -0.15535545349121094, -0.1499786376953125, -0.14460182189941406, -0.13922500610351562, -0.1338481903076172, -0.12847137451171875, -0.12309455871582031, -0.11771774291992188, -0.11234092712402344, -0.106964111328125, -0.10158729553222656, -0.09621047973632812, -0.09083366394042969, -0.08545684814453125, -0.08008003234863281, -0.07470321655273438, -0.06932640075683594, -0.0639495849609375, -0.05857276916503906, -0.053195953369140625, -0.04781913757324219, -0.04244232177734375, -0.03706550598144531, -0.031688690185546875, -0.026311874389648438, -0.02093505859375, -0.015558242797851562, -0.010181427001953125, -0.0048046112060546875, 0.00057220458984375, 0.0059490203857421875, 0.011325836181640625, 0.016702651977539062, 0.0220794677734375, 0.027456283569335938, 0.032833099365234375, 0.03820991516113281, 0.04358673095703125, 0.04896354675292969, 0.054340362548828125, 0.05971717834472656, 0.065093994140625, 0.07047080993652344, 0.07584762573242188, 0.08122444152832031, 0.08660125732421875, 0.09197807312011719, 0.09735488891601562, 0.10273170471191406, 0.1081085205078125, 0.11348533630371094, 0.11886215209960938, 0.12423896789550781, 0.12961578369140625, 0.1349925994873047, 0.14036941528320312, 0.14574623107910156, 0.151123046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 5.0, 11.0, 12.0, 12.0, 10.0, 19.0, 19.0, 23.0, 37.0, 25.0, 23.0, 42.0, 40.0, 38.0, 35.0, 39.0, 45.0, 43.0, 51.0, 42.0, 48.0, 49.0, 37.0, 57.0, 31.0, 32.0, 28.0, 23.0, 16.0, 17.0, 16.0, 17.0, 10.0, 10.0, 7.0, 6.0, 8.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.169189453125, -0.1636810302734375, -0.158172607421875, -0.1526641845703125, -0.14715576171875, -0.1416473388671875, -0.136138916015625, -0.1306304931640625, -0.1251220703125, -0.1196136474609375, -0.114105224609375, -0.1085968017578125, -0.10308837890625, -0.0975799560546875, -0.092071533203125, -0.0865631103515625, -0.0810546875, -0.0755462646484375, -0.070037841796875, -0.0645294189453125, -0.05902099609375, -0.0535125732421875, -0.048004150390625, -0.0424957275390625, -0.0369873046875, -0.0314788818359375, -0.025970458984375, -0.0204620361328125, -0.01495361328125, -0.0094451904296875, -0.003936767578125, 0.0015716552734375, 0.007080078125, 0.0125885009765625, 0.018096923828125, 0.0236053466796875, 0.02911376953125, 0.0346221923828125, 0.040130615234375, 0.0456390380859375, 0.0511474609375, 0.0566558837890625, 0.062164306640625, 0.0676727294921875, 0.07318115234375, 0.0786895751953125, 0.084197998046875, 0.0897064208984375, 0.09521484375, 0.1007232666015625, 0.106231689453125, 0.1117401123046875, 0.11724853515625, 0.1227569580078125, 0.128265380859375, 0.1337738037109375, 0.1392822265625, 0.1447906494140625, 0.150299072265625, 0.1558074951171875, 0.16131591796875, 0.1668243408203125, 0.172332763671875, 0.1778411865234375, 0.183349609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 10.0, 6.0, 11.0, 29.0, 23.0, 66.0, 86.0, 131.0, 210.0, 386.0, 876.0, 2041.0, 5536.0, 14806.0, 39112.0, 107972.0, 357033.0, 352239.0, 105571.0, 38316.0, 14835.0, 5428.0, 2087.0, 826.0, 368.0, 193.0, 126.0, 78.0, 50.0, 37.0, 20.0, 14.0, 14.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07843017578125, -0.07625102996826172, -0.07407188415527344, -0.07189273834228516, -0.06971359252929688, -0.0675344467163086, -0.06535530090332031, -0.06317615509033203, -0.06099700927734375, -0.05881786346435547, -0.05663871765136719, -0.054459571838378906, -0.052280426025390625, -0.050101280212402344, -0.04792213439941406, -0.04574298858642578, -0.0435638427734375, -0.04138469696044922, -0.03920555114746094, -0.037026405334472656, -0.034847259521484375, -0.032668113708496094, -0.030488967895507812, -0.02830982208251953, -0.02613067626953125, -0.02395153045654297, -0.021772384643554688, -0.019593238830566406, -0.017414093017578125, -0.015234947204589844, -0.013055801391601562, -0.010876655578613281, -0.008697509765625, -0.006518363952636719, -0.0043392181396484375, -0.0021600723266601562, 1.9073486328125e-05, 0.0021982192993164062, 0.0043773651123046875, 0.006556510925292969, 0.00873565673828125, 0.010914802551269531, 0.013093948364257812, 0.015273094177246094, 0.017452239990234375, 0.019631385803222656, 0.021810531616210938, 0.02398967742919922, 0.0261688232421875, 0.02834796905517578, 0.030527114868164062, 0.032706260681152344, 0.034885406494140625, 0.037064552307128906, 0.03924369812011719, 0.04142284393310547, 0.04360198974609375, 0.04578113555908203, 0.04796028137207031, 0.050139427185058594, 0.052318572998046875, 0.054497718811035156, 0.05667686462402344, 0.05885601043701172, 0.06103515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 8.0, 3.0, 11.0, 13.0, 15.0, 26.0, 25.0, 26.0, 40.0, 51.0, 79.0, 76.0, 90.0, 94.0, 83.0, 65.0, 48.0, 53.0, 55.0, 30.0, 26.0, 19.0, 11.0, 7.0, 9.0, 3.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9729137420654297e-05, -1.9137747585773468e-05, -1.854635775089264e-05, -1.795496791601181e-05, -1.736357808113098e-05, -1.6772188246250153e-05, -1.6180798411369324e-05, -1.5589408576488495e-05, -1.4998018741607666e-05, -1.4406628906726837e-05, -1.3815239071846008e-05, -1.322384923696518e-05, -1.263245940208435e-05, -1.2041069567203522e-05, -1.1449679732322693e-05, -1.0858289897441864e-05, -1.0266900062561035e-05, -9.675510227680206e-06, -9.084120392799377e-06, -8.492730557918549e-06, -7.90134072303772e-06, -7.309950888156891e-06, -6.718561053276062e-06, -6.127171218395233e-06, -5.535781383514404e-06, -4.9443915486335754e-06, -4.353001713752747e-06, -3.7616118788719177e-06, -3.170222043991089e-06, -2.57883220911026e-06, -1.987442374229431e-06, -1.3960525393486023e-06, -8.046627044677734e-07, -2.1327286958694458e-07, 3.781169652938843e-07, 9.695068001747131e-07, 1.560896635055542e-06, 2.152286469936371e-06, 2.7436763048171997e-06, 3.3350661396980286e-06, 3.926455974578857e-06, 4.517845809459686e-06, 5.109235644340515e-06, 5.700625479221344e-06, 6.292015314102173e-06, 6.883405148983002e-06, 7.4747949838638306e-06, 8.06618481874466e-06, 8.657574653625488e-06, 9.248964488506317e-06, 9.840354323387146e-06, 1.0431744158267975e-05, 1.1023133993148804e-05, 1.1614523828029633e-05, 1.2205913662910461e-05, 1.279730349779129e-05, 1.3388693332672119e-05, 1.3980083167552948e-05, 1.4571473002433777e-05, 1.5162862837314606e-05, 1.5754252672195435e-05, 1.6345642507076263e-05, 1.6937032341957092e-05, 1.752842217683792e-05, 1.811981201171875e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 14.0, 25.0, 30.0, 56.0, 94.0, 149.0, 319.0, 798.0, 3224.0, 17064.0, 106708.0, 605336.0, 265297.0, 40098.0, 6821.0, 1497.0, 506.0, 216.0, 136.0, 62.0, 42.0, 22.0, 15.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11846923828125, -0.11485004425048828, -0.11123085021972656, -0.10761165618896484, -0.10399246215820312, -0.1003732681274414, -0.09675407409667969, -0.09313488006591797, -0.08951568603515625, -0.08589649200439453, -0.08227729797363281, -0.0786581039428711, -0.07503890991210938, -0.07141971588134766, -0.06780052185058594, -0.06418132781982422, -0.0605621337890625, -0.05694293975830078, -0.05332374572753906, -0.049704551696777344, -0.046085357666015625, -0.042466163635253906, -0.03884696960449219, -0.03522777557373047, -0.03160858154296875, -0.02798938751220703, -0.024370193481445312, -0.020750999450683594, -0.017131805419921875, -0.013512611389160156, -0.009893417358398438, -0.006274223327636719, -0.002655029296875, 0.0009641647338867188, 0.0045833587646484375, 0.008202552795410156, 0.011821746826171875, 0.015440940856933594, 0.019060134887695312, 0.02267932891845703, 0.02629852294921875, 0.02991771697998047, 0.03353691101074219, 0.037156105041503906, 0.040775299072265625, 0.044394493103027344, 0.04801368713378906, 0.05163288116455078, 0.0552520751953125, 0.05887126922607422, 0.06249046325683594, 0.06610965728759766, 0.06972885131835938, 0.0733480453491211, 0.07696723937988281, 0.08058643341064453, 0.08420562744140625, 0.08782482147216797, 0.09144401550292969, 0.0950632095336914, 0.09868240356445312, 0.10230159759521484, 0.10592079162597656, 0.10953998565673828, 0.1131591796875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 5.0, 3.0, 10.0, 11.0, 12.0, 16.0, 17.0, 22.0, 22.0, 39.0, 40.0, 47.0, 67.0, 76.0, 106.0, 89.0, 95.0, 65.0, 52.0, 41.0, 36.0, 26.0, 25.0, 21.0, 13.0, 5.0, 11.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0523681640625, -0.05062532424926758, -0.048882484436035156, -0.047139644622802734, -0.04539680480957031, -0.04365396499633789, -0.04191112518310547, -0.04016828536987305, -0.038425445556640625, -0.0366826057434082, -0.03493976593017578, -0.03319692611694336, -0.03145408630371094, -0.029711246490478516, -0.027968406677246094, -0.026225566864013672, -0.02448272705078125, -0.022739887237548828, -0.020997047424316406, -0.019254207611083984, -0.017511367797851562, -0.01576852798461914, -0.014025688171386719, -0.012282848358154297, -0.010540008544921875, -0.008797168731689453, -0.007054328918457031, -0.005311489105224609, -0.0035686492919921875, -0.0018258094787597656, -8.296966552734375e-05, 0.0016598701477050781, 0.0034027099609375, 0.005145549774169922, 0.006888389587402344, 0.008631229400634766, 0.010374069213867188, 0.01211690902709961, 0.013859748840332031, 0.015602588653564453, 0.017345428466796875, 0.019088268280029297, 0.02083110809326172, 0.02257394790649414, 0.024316787719726562, 0.026059627532958984, 0.027802467346191406, 0.029545307159423828, 0.03128814697265625, 0.03303098678588867, 0.034773826599121094, 0.036516666412353516, 0.03825950622558594, 0.04000234603881836, 0.04174518585205078, 0.0434880256652832, 0.045230865478515625, 0.04697370529174805, 0.04871654510498047, 0.05045938491821289, 0.05220222473144531, 0.053945064544677734, 0.055687904357910156, 0.05743074417114258, 0.059173583984375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 13.0, 28.0, 65.0, 129.0, 215.0, 226.0, 170.0, 106.0, 34.0, 13.0, 4.0, 4.0, 2.0, 0.0, 1.0], "bins": [-2.140767812728882, -2.101344347000122, -2.0619211196899414, -2.0224976539611816, -1.983074426651001, -1.9436509609222412, -1.904227614402771, -1.8648042678833008, -1.8253809213638306, -1.7859575748443604, -1.7465342283248901, -1.70711088180542, -1.6676874160766602, -1.62826406955719, -1.5888407230377197, -1.5494173765182495, -1.5099940299987793, -1.470570683479309, -1.4311473369598389, -1.3917239904403687, -1.3523006439208984, -1.3128771781921387, -1.2734538316726685, -1.2340304851531982, -1.194607138633728, -1.1551837921142578, -1.1157604455947876, -1.0763370990753174, -1.0369136333465576, -0.9974903464317322, -0.9580669403076172, -0.918643593788147, -0.879220187664032, -0.8397968411445618, -0.8003734350204468, -0.7609500885009766, -0.7215267419815063, -0.6821033954620361, -0.6426800489425659, -0.6032566428184509, -0.5638332962989807, -0.5244099497795105, -0.4849865734577179, -0.4455631971359253, -0.4061398506164551, -0.36671650409698486, -0.32729312777519226, -0.28786975145339966, -0.24844640493392944, -0.20902304351329803, -0.16959968209266663, -0.13017632067203522, -0.09075295925140381, -0.0513295978307724, -0.011906236410140991, 0.02751713991165161, 0.06694048643112183, 0.10636384785175323, 0.14578720927238464, 0.18521057069301605, 0.22463393211364746, 0.2640572786331177, 0.3034806549549103, 0.3429040312767029, 0.3823273777961731]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 7.0, 10.0, 19.0, 13.0, 21.0, 16.0, 31.0, 27.0, 44.0, 43.0, 28.0, 37.0, 50.0, 44.0, 50.0, 53.0, 40.0, 48.0, 47.0, 36.0, 46.0, 36.0, 35.0, 34.0, 29.0, 27.0, 24.0, 19.0, 18.0, 14.0, 8.0, 7.0, 7.0, 5.0, 6.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4714987874031067, -0.4570818245410919, -0.44266486167907715, -0.42824786901474, -0.4138309061527252, -0.39941394329071045, -0.3849969804286957, -0.3705800175666809, -0.35616302490234375, -0.341746062040329, -0.3273290991783142, -0.31291210651397705, -0.2984951436519623, -0.2840781807899475, -0.26966121792793274, -0.25524425506591797, -0.2408272922039032, -0.22641032934188843, -0.21199335157871246, -0.1975763887166977, -0.18315941095352173, -0.16874244809150696, -0.1543254852294922, -0.13990852236747742, -0.12549154460430145, -0.11107457429170609, -0.09665760397911072, -0.08224064111709595, -0.06782367080450058, -0.05340670049190521, -0.03898973762989044, -0.024572767317295074, -0.010155797004699707, 0.004261171445250511, 0.01867813989520073, 0.0330951064825058, 0.047512076795101166, 0.06192904710769653, 0.0763460099697113, 0.09076298028230667, 0.10517995059490204, 0.1195969209074974, 0.13401389122009277, 0.14843085408210754, 0.16284781694412231, 0.17726479470729828, 0.19168175756931305, 0.206098735332489, 0.22051569819450378, 0.23493266105651855, 0.24934963881969452, 0.2637665867805481, 0.27818357944488525, 0.2926005423069, 0.3070175051689148, 0.32143446803092957, 0.33585143089294434, 0.3502683937549591, 0.3646853566169739, 0.37910234928131104, 0.3935193121433258, 0.4079362750053406, 0.42235323786735535, 0.4367702007293701, 0.4511871933937073]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 1.0, 9.0, 12.0, 14.0, 20.0, 22.0, 46.0, 57.0, 101.0, 118.0, 220.0, 345.0, 599.0, 1064.0, 1909.0, 3300.0, 6045.0, 11485.0, 22437.0, 45206.0, 96256.0, 222717.0, 591815.0, 1520102.0, 1026428.0, 364044.0, 147088.0, 65978.0, 32139.0, 16041.0, 8167.0, 4511.0, 2495.0, 1381.0, 805.0, 474.0, 274.0, 194.0, 119.0, 91.0, 60.0, 25.0, 24.0, 17.0, 4.0, 4.0, 7.0, 9.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.06201171875, -0.059927940368652344, -0.05784416198730469, -0.05576038360595703, -0.053676605224609375, -0.05159282684326172, -0.04950904846191406, -0.047425270080566406, -0.04534149169921875, -0.043257713317871094, -0.04117393493652344, -0.03909015655517578, -0.037006378173828125, -0.03492259979248047, -0.03283882141113281, -0.030755043029785156, -0.0286712646484375, -0.026587486267089844, -0.024503707885742188, -0.02241992950439453, -0.020336151123046875, -0.01825237274169922, -0.016168594360351562, -0.014084815979003906, -0.01200103759765625, -0.009917259216308594, -0.007833480834960938, -0.005749702453613281, -0.003665924072265625, -0.0015821456909179688, 0.0005016326904296875, 0.0025854110717773438, 0.004669189453125, 0.006752967834472656, 0.008836746215820312, 0.010920524597167969, 0.013004302978515625, 0.015088081359863281, 0.017171859741210938, 0.019255638122558594, 0.02133941650390625, 0.023423194885253906, 0.025506973266601562, 0.02759075164794922, 0.029674530029296875, 0.03175830841064453, 0.03384208679199219, 0.035925865173339844, 0.0380096435546875, 0.040093421936035156, 0.04217720031738281, 0.04426097869873047, 0.046344757080078125, 0.04842853546142578, 0.05051231384277344, 0.052596092224121094, 0.05467987060546875, 0.056763648986816406, 0.05884742736816406, 0.06093120574951172, 0.06301498413085938, 0.06509876251220703, 0.06718254089355469, 0.06926631927490234, 0.07135009765625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 6.0, 7.0, 11.0, 13.0, 11.0, 19.0, 19.0, 24.0, 18.0, 29.0, 29.0, 24.0, 32.0, 32.0, 45.0, 35.0, 35.0, 57.0, 46.0, 48.0, 56.0, 44.0, 45.0, 41.0, 33.0, 28.0, 33.0, 30.0, 26.0, 23.0, 19.0, 10.0, 16.0, 7.0, 6.0, 7.0, 5.0, 9.0, 4.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05718994140625, -0.05518913269042969, -0.053188323974609375, -0.05118751525878906, -0.04918670654296875, -0.04718589782714844, -0.045185089111328125, -0.04318428039550781, -0.0411834716796875, -0.03918266296386719, -0.037181854248046875, -0.03518104553222656, -0.03318023681640625, -0.031179428100585938, -0.029178619384765625, -0.027177810668945312, -0.025177001953125, -0.023176193237304688, -0.021175384521484375, -0.019174575805664062, -0.01717376708984375, -0.015172958374023438, -0.013172149658203125, -0.011171340942382812, -0.0091705322265625, -0.0071697235107421875, -0.005168914794921875, -0.0031681060791015625, -0.00116729736328125, 0.0008335113525390625, 0.002834320068359375, 0.0048351287841796875, 0.0068359375, 0.008836746215820312, 0.010837554931640625, 0.012838363647460938, 0.01483917236328125, 0.016839981079101562, 0.018840789794921875, 0.020841598510742188, 0.0228424072265625, 0.024843215942382812, 0.026844024658203125, 0.028844833374023438, 0.03084564208984375, 0.03284645080566406, 0.034847259521484375, 0.03684806823730469, 0.038848876953125, 0.04084968566894531, 0.042850494384765625, 0.04485130310058594, 0.04685211181640625, 0.04885292053222656, 0.050853729248046875, 0.05285453796386719, 0.0548553466796875, 0.05685615539550781, 0.058856964111328125, 0.06085777282714844, 0.06285858154296875, 0.06485939025878906, 0.06686019897460938, 0.06886100769042969, 0.07086181640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 6.0, 9.0, 9.0, 25.0, 27.0, 44.0, 71.0, 93.0, 145.0, 199.0, 336.0, 473.0, 834.0, 1326.0, 2282.0, 3996.0, 7221.0, 14640.0, 30310.0, 66291.0, 156797.0, 410652.0, 1275361.0, 1436501.0, 470418.0, 175821.0, 73126.0, 33209.0, 15765.0, 7949.0, 4087.0, 2450.0, 1400.0, 837.0, 534.0, 329.0, 232.0, 142.0, 107.0, 60.0, 64.0, 41.0, 24.0, 8.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0931396484375, -0.09023475646972656, -0.08732986450195312, -0.08442497253417969, -0.08152008056640625, -0.07861518859863281, -0.07571029663085938, -0.07280540466308594, -0.0699005126953125, -0.06699562072753906, -0.06409072875976562, -0.06118583679199219, -0.05828094482421875, -0.05537605285644531, -0.052471160888671875, -0.04956626892089844, -0.046661376953125, -0.04375648498535156, -0.040851593017578125, -0.03794670104980469, -0.03504180908203125, -0.03213691711425781, -0.029232025146484375, -0.026327133178710938, -0.0234222412109375, -0.020517349243164062, -0.017612457275390625, -0.014707565307617188, -0.01180267333984375, -0.008897781372070312, -0.005992889404296875, -0.0030879974365234375, -0.00018310546875, 0.0027217864990234375, 0.005626678466796875, 0.008531570434570312, 0.01143646240234375, 0.014341354370117188, 0.017246246337890625, 0.020151138305664062, 0.0230560302734375, 0.025960922241210938, 0.028865814208984375, 0.03177070617675781, 0.03467559814453125, 0.03758049011230469, 0.040485382080078125, 0.04339027404785156, 0.046295166015625, 0.04920005798339844, 0.052104949951171875, 0.05500984191894531, 0.05791473388671875, 0.06081962585449219, 0.06372451782226562, 0.06662940979003906, 0.0695343017578125, 0.07243919372558594, 0.07534408569335938, 0.07824897766113281, 0.08115386962890625, 0.08405876159667969, 0.08696365356445312, 0.08986854553222656, 0.0927734375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 6.0, 3.0, 5.0, 19.0, 27.0, 25.0, 50.0, 79.0, 103.0, 166.0, 248.0, 417.0, 627.0, 749.0, 557.0, 336.0, 232.0, 131.0, 86.0, 58.0, 46.0, 37.0, 14.0, 16.0, 7.0, 7.0, 2.0, 6.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1256103515625, -0.12064552307128906, -0.11568069458007812, -0.11071586608886719, -0.10575103759765625, -0.10078620910644531, -0.09582138061523438, -0.09085655212402344, -0.0858917236328125, -0.08092689514160156, -0.07596206665039062, -0.07099723815917969, -0.06603240966796875, -0.06106758117675781, -0.056102752685546875, -0.05113792419433594, -0.046173095703125, -0.04120826721191406, -0.036243438720703125, -0.03127861022949219, -0.02631378173828125, -0.021348953247070312, -0.016384124755859375, -0.011419296264648438, -0.0064544677734375, -0.0014896392822265625, 0.003475189208984375, 0.008440017700195312, 0.01340484619140625, 0.018369674682617188, 0.023334503173828125, 0.028299331665039062, 0.03326416015625, 0.03822898864746094, 0.043193817138671875, 0.04815864562988281, 0.05312347412109375, 0.05808830261230469, 0.06305313110351562, 0.06801795959472656, 0.0729827880859375, 0.07794761657714844, 0.08291244506835938, 0.08787727355957031, 0.09284210205078125, 0.09780693054199219, 0.10277175903320312, 0.10773658752441406, 0.112701416015625, 0.11766624450683594, 0.12263107299804688, 0.1275959014892578, 0.13256072998046875, 0.1375255584716797, 0.14249038696289062, 0.14745521545410156, 0.1524200439453125, 0.15738487243652344, 0.16234970092773438, 0.1673145294189453, 0.17227935791015625, 0.1772441864013672, 0.18220901489257812, 0.18717384338378906, 0.192138671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 15.0, 26.0, 50.0, 42.0, 84.0, 99.0, 120.0, 124.0, 115.0, 94.0, 72.0, 59.0, 45.0, 24.0, 10.0, 10.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0500328540802002, -1.024706482887268, -0.9993801712989807, -0.9740538597106934, -0.9487274885177612, -0.9234011769294739, -0.8980748653411865, -0.8727484941482544, -0.847422182559967, -0.8220958709716797, -0.7967694997787476, -0.7714431881904602, -0.7461168169975281, -0.7207905054092407, -0.6954641342163086, -0.6701378226280212, -0.6448115110397339, -0.6194851994514465, -0.5941588282585144, -0.568832516670227, -0.5435061454772949, -0.5181798338890076, -0.4928534924983978, -0.4675271511077881, -0.44220077991485596, -0.4168744385242462, -0.3915480971336365, -0.3662217855453491, -0.3408954441547394, -0.31556910276412964, -0.2902427613735199, -0.26491641998291016, -0.2395901083946228, -0.21426376700401306, -0.18893744051456451, -0.16361109912395477, -0.13828477263450623, -0.11295843124389648, -0.08763208985328674, -0.062305763363838196, -0.036979421973228455, -0.011653086170554161, 0.013673249632120132, 0.038999587297439575, 0.06432592123746872, 0.08965225517749786, 0.1149785965681076, 0.14030492305755615, 0.1656312644481659, 0.19095760583877563, 0.21628393232822418, 0.24161027371883392, 0.26693660020828247, 0.2922629415988922, 0.31758928298950195, 0.3429155945777893, 0.36824196577072144, 0.3935683071613312, 0.4188946485519409, 0.44422096014022827, 0.469547301530838, 0.49487364292144775, 0.5202000141143799, 0.5455263257026672, 0.5708526372909546]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 8.0, 8.0, 7.0, 7.0, 10.0, 15.0, 18.0, 19.0, 20.0, 25.0, 36.0, 28.0, 34.0, 37.0, 35.0, 40.0, 39.0, 44.0, 41.0, 39.0, 48.0, 39.0, 37.0, 39.0, 39.0, 36.0, 29.0, 31.0, 28.0, 31.0, 26.0, 16.0, 19.0, 13.0, 8.0, 11.0, 5.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.38728368282318115, -0.3750231862068176, -0.3627626895904541, -0.35050222277641296, -0.33824172616004944, -0.3259812295436859, -0.3137207329273224, -0.30146026611328125, -0.2891997694969177, -0.2769392728805542, -0.2646787762641907, -0.25241830945014954, -0.240157812833786, -0.22789731621742249, -0.21563681960105896, -0.20337633788585663, -0.1911158412694931, -0.17885534465312958, -0.16659486293792725, -0.15433436632156372, -0.1420738846063614, -0.12981338798999786, -0.11755289882421494, -0.105292409658432, -0.09303192049264908, -0.08077143132686615, -0.06851094216108322, -0.056250449270009995, -0.043989960104227066, -0.03172947093844414, -0.01946897804737091, -0.007208488881587982, 0.005052000284194946, 0.017312489449977875, 0.029572980478405952, 0.04183347150683403, 0.05409396067261696, 0.06635445356369019, 0.07861494272947311, 0.09087543189525604, 0.10313592106103897, 0.1153964102268219, 0.12765690684318542, 0.13991738855838776, 0.15217788517475128, 0.1644383668899536, 0.17669886350631714, 0.18895936012268066, 0.201219841837883, 0.21348033845424652, 0.22574082016944885, 0.23800131678581238, 0.2502618134021759, 0.26252228021621704, 0.27478277683258057, 0.2870432734489441, 0.2993037700653076, 0.31156426668167114, 0.32382476329803467, 0.3360852301120758, 0.34834572672843933, 0.36060622334480286, 0.3728667199611664, 0.3851271867752075, 0.39738768339157104]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 11.0, 13.0, 18.0, 34.0, 39.0, 70.0, 118.0, 142.0, 294.0, 430.0, 687.0, 1015.0, 1618.0, 2513.0, 4057.0, 6210.0, 9620.0, 14848.0, 23489.0, 37911.0, 62632.0, 107178.0, 177346.0, 217001.0, 151513.0, 88854.0, 52507.0, 32270.0, 20066.0, 12936.0, 8233.0, 5400.0, 3444.0, 2155.0, 1356.0, 930.0, 521.0, 405.0, 228.0, 166.0, 91.0, 68.0, 46.0, 28.0, 13.0, 12.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.074462890625, -0.0721597671508789, -0.06985664367675781, -0.06755352020263672, -0.06525039672851562, -0.06294727325439453, -0.06064414978027344, -0.058341026306152344, -0.05603790283203125, -0.053734779357910156, -0.05143165588378906, -0.04912853240966797, -0.046825408935546875, -0.04452228546142578, -0.04221916198730469, -0.039916038513183594, -0.0376129150390625, -0.035309791564941406, -0.03300666809082031, -0.03070354461669922, -0.028400421142578125, -0.02609729766845703, -0.023794174194335938, -0.021491050720214844, -0.01918792724609375, -0.016884803771972656, -0.014581680297851562, -0.012278556823730469, -0.009975433349609375, -0.007672309875488281, -0.0053691864013671875, -0.0030660629272460938, -0.000762939453125, 0.0015401840209960938, 0.0038433074951171875, 0.006146430969238281, 0.008449554443359375, 0.010752677917480469, 0.013055801391601562, 0.015358924865722656, 0.01766204833984375, 0.019965171813964844, 0.022268295288085938, 0.02457141876220703, 0.026874542236328125, 0.02917766571044922, 0.03148078918457031, 0.033783912658691406, 0.0360870361328125, 0.038390159606933594, 0.04069328308105469, 0.04299640655517578, 0.045299530029296875, 0.04760265350341797, 0.04990577697753906, 0.052208900451660156, 0.05451202392578125, 0.056815147399902344, 0.05911827087402344, 0.06142139434814453, 0.06372451782226562, 0.06602764129638672, 0.06833076477050781, 0.0706338882446289, 0.07293701171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 12.0, 5.0, 9.0, 9.0, 10.0, 22.0, 21.0, 26.0, 30.0, 23.0, 28.0, 27.0, 40.0, 38.0, 50.0, 37.0, 41.0, 42.0, 38.0, 47.0, 35.0, 40.0, 37.0, 45.0, 30.0, 40.0, 32.0, 30.0, 28.0, 19.0, 25.0, 9.0, 13.0, 9.0, 5.0, 4.0, 12.0, 3.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05621337890625, -0.054299354553222656, -0.05238533020019531, -0.05047130584716797, -0.048557281494140625, -0.04664325714111328, -0.04472923278808594, -0.042815208435058594, -0.04090118408203125, -0.038987159729003906, -0.03707313537597656, -0.03515911102294922, -0.033245086669921875, -0.03133106231689453, -0.029417037963867188, -0.027503013610839844, -0.0255889892578125, -0.023674964904785156, -0.021760940551757812, -0.01984691619873047, -0.017932891845703125, -0.01601886749267578, -0.014104843139648438, -0.012190818786621094, -0.01027679443359375, -0.008362770080566406, -0.0064487457275390625, -0.004534721374511719, -0.002620697021484375, -0.0007066726684570312, 0.0012073516845703125, 0.0031213760375976562, 0.005035400390625, 0.006949424743652344, 0.008863449096679688, 0.010777473449707031, 0.012691497802734375, 0.014605522155761719, 0.016519546508789062, 0.018433570861816406, 0.02034759521484375, 0.022261619567871094, 0.024175643920898438, 0.02608966827392578, 0.028003692626953125, 0.02991771697998047, 0.03183174133300781, 0.033745765686035156, 0.0356597900390625, 0.037573814392089844, 0.03948783874511719, 0.04140186309814453, 0.043315887451171875, 0.04522991180419922, 0.04714393615722656, 0.049057960510253906, 0.05097198486328125, 0.052886009216308594, 0.05480003356933594, 0.05671405792236328, 0.058628082275390625, 0.06054210662841797, 0.06245613098144531, 0.06437015533447266, 0.0662841796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 10.0, 6.0, 8.0, 9.0, 15.0, 31.0, 24.0, 39.0, 50.0, 62.0, 96.0, 145.0, 234.0, 324.0, 607.0, 1592.0, 4950.0, 17198.0, 61364.0, 225380.0, 485938.0, 180014.0, 49755.0, 13856.0, 4021.0, 1335.0, 538.0, 298.0, 182.0, 139.0, 93.0, 64.0, 39.0, 36.0, 25.0, 20.0, 17.0, 10.0, 15.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1871337890625, -0.18117713928222656, -0.17522048950195312, -0.1692638397216797, -0.16330718994140625, -0.1573505401611328, -0.15139389038085938, -0.14543724060058594, -0.1394805908203125, -0.13352394104003906, -0.12756729125976562, -0.12161064147949219, -0.11565399169921875, -0.10969734191894531, -0.10374069213867188, -0.09778404235839844, -0.091827392578125, -0.08587074279785156, -0.07991409301757812, -0.07395744323730469, -0.06800079345703125, -0.06204414367675781, -0.056087493896484375, -0.05013084411621094, -0.0441741943359375, -0.03821754455566406, -0.032260894775390625, -0.026304244995117188, -0.02034759521484375, -0.014390945434570312, -0.008434295654296875, -0.0024776458740234375, 0.00347900390625, 0.009435653686523438, 0.015392303466796875, 0.021348953247070312, 0.02730560302734375, 0.03326225280761719, 0.039218902587890625, 0.04517555236816406, 0.0511322021484375, 0.05708885192871094, 0.06304550170898438, 0.06900215148925781, 0.07495880126953125, 0.08091545104980469, 0.08687210083007812, 0.09282875061035156, 0.098785400390625, 0.10474205017089844, 0.11069869995117188, 0.11665534973144531, 0.12261199951171875, 0.1285686492919922, 0.13452529907226562, 0.14048194885253906, 0.1464385986328125, 0.15239524841308594, 0.15835189819335938, 0.1643085479736328, 0.17026519775390625, 0.1762218475341797, 0.18217849731445312, 0.18813514709472656, 0.194091796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 8.0, 12.0, 11.0, 8.0, 13.0, 7.0, 12.0, 14.0, 21.0, 14.0, 33.0, 24.0, 34.0, 31.0, 32.0, 35.0, 40.0, 32.0, 44.0, 35.0, 43.0, 40.0, 38.0, 32.0, 34.0, 38.0, 33.0, 28.0, 35.0, 32.0, 20.0, 23.0, 17.0, 22.0, 7.0, 20.0, 13.0, 17.0, 7.0, 10.0, 8.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1563720703125, -0.15104103088378906, -0.14570999145507812, -0.1403789520263672, -0.13504791259765625, -0.1297168731689453, -0.12438583374023438, -0.11905479431152344, -0.1137237548828125, -0.10839271545410156, -0.10306167602539062, -0.09773063659667969, -0.09239959716796875, -0.08706855773925781, -0.08173751831054688, -0.07640647888183594, -0.071075439453125, -0.06574440002441406, -0.060413360595703125, -0.05508232116699219, -0.04975128173828125, -0.04442024230957031, -0.039089202880859375, -0.03375816345214844, -0.0284271240234375, -0.023096084594726562, -0.017765045166015625, -0.012434005737304688, -0.00710296630859375, -0.0017719268798828125, 0.003559112548828125, 0.008890151977539062, 0.01422119140625, 0.019552230834960938, 0.024883270263671875, 0.030214309692382812, 0.03554534912109375, 0.04087638854980469, 0.046207427978515625, 0.05153846740722656, 0.0568695068359375, 0.06220054626464844, 0.06753158569335938, 0.07286262512207031, 0.07819366455078125, 0.08352470397949219, 0.08885574340820312, 0.09418678283691406, 0.099517822265625, 0.10484886169433594, 0.11017990112304688, 0.11551094055175781, 0.12084197998046875, 0.1261730194091797, 0.13150405883789062, 0.13683509826660156, 0.1421661376953125, 0.14749717712402344, 0.15282821655273438, 0.1581592559814453, 0.16349029541015625, 0.1688213348388672, 0.17415237426757812, 0.17948341369628906, 0.184814453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 4.0, 5.0, 10.0, 15.0, 24.0, 18.0, 27.0, 35.0, 42.0, 69.0, 110.0, 167.0, 342.0, 642.0, 1359.0, 3348.0, 8279.0, 22345.0, 59686.0, 159243.0, 390613.0, 253169.0, 92293.0, 34831.0, 13092.0, 4858.0, 1981.0, 826.0, 412.0, 247.0, 135.0, 92.0, 72.0, 44.0, 28.0, 21.0, 15.0, 11.0, 8.0, 12.0, 4.0, 6.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07373046875, -0.07160711288452148, -0.06948375701904297, -0.06736040115356445, -0.06523704528808594, -0.06311368942260742, -0.060990333557128906, -0.05886697769165039, -0.056743621826171875, -0.05462026596069336, -0.052496910095214844, -0.05037355422973633, -0.04825019836425781, -0.0461268424987793, -0.04400348663330078, -0.041880130767822266, -0.03975677490234375, -0.037633419036865234, -0.03551006317138672, -0.0333867073059082, -0.03126335144042969, -0.029139995574951172, -0.027016639709472656, -0.02489328384399414, -0.022769927978515625, -0.02064657211303711, -0.018523216247558594, -0.016399860382080078, -0.014276504516601562, -0.012153148651123047, -0.010029792785644531, -0.007906436920166016, -0.0057830810546875, -0.0036597251892089844, -0.0015363693237304688, 0.0005869865417480469, 0.0027103424072265625, 0.004833698272705078, 0.006957054138183594, 0.00908041000366211, 0.011203765869140625, 0.01332712173461914, 0.015450477600097656, 0.017573833465576172, 0.019697189331054688, 0.021820545196533203, 0.02394390106201172, 0.026067256927490234, 0.02819061279296875, 0.030313968658447266, 0.03243732452392578, 0.0345606803894043, 0.03668403625488281, 0.03880739212036133, 0.040930747985839844, 0.04305410385131836, 0.045177459716796875, 0.04730081558227539, 0.049424171447753906, 0.05154752731323242, 0.05367088317871094, 0.05579423904418945, 0.05791759490966797, 0.060040950775146484, 0.062164306640625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 4.0, 7.0, 17.0, 11.0, 20.0, 20.0, 37.0, 41.0, 50.0, 84.0, 85.0, 84.0, 107.0, 93.0, 69.0, 73.0, 48.0, 50.0, 24.0, 18.0, 17.0, 13.0, 5.0, 10.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.682209014892578e-05, -2.6103109121322632e-05, -2.5384128093719482e-05, -2.4665147066116333e-05, -2.3946166038513184e-05, -2.3227185010910034e-05, -2.2508203983306885e-05, -2.1789222955703735e-05, -2.1070241928100586e-05, -2.0351260900497437e-05, -1.9632279872894287e-05, -1.8913298845291138e-05, -1.8194317817687988e-05, -1.747533679008484e-05, -1.675635576248169e-05, -1.603737473487854e-05, -1.531839370727539e-05, -1.4599412679672241e-05, -1.3880431652069092e-05, -1.3161450624465942e-05, -1.2442469596862793e-05, -1.1723488569259644e-05, -1.1004507541656494e-05, -1.0285526514053345e-05, -9.566545486450195e-06, -8.847564458847046e-06, -8.128583431243896e-06, -7.409602403640747e-06, -6.690621376037598e-06, -5.971640348434448e-06, -5.252659320831299e-06, -4.533678293228149e-06, -3.814697265625e-06, -3.0957162380218506e-06, -2.376735210418701e-06, -1.6577541828155518e-06, -9.387731552124023e-07, -2.1979212760925293e-07, 4.991888999938965e-07, 1.218169927597046e-06, 1.9371509552001953e-06, 2.6561319828033447e-06, 3.375113010406494e-06, 4.0940940380096436e-06, 4.813075065612793e-06, 5.532056093215942e-06, 6.251037120819092e-06, 6.970018148422241e-06, 7.68899917602539e-06, 8.40798020362854e-06, 9.12696123123169e-06, 9.845942258834839e-06, 1.0564923286437988e-05, 1.1283904314041138e-05, 1.2002885341644287e-05, 1.2721866369247437e-05, 1.3440847396850586e-05, 1.4159828424453735e-05, 1.4878809452056885e-05, 1.5597790479660034e-05, 1.6316771507263184e-05, 1.7035752534866333e-05, 1.7754733562469482e-05, 1.8473714590072632e-05, 1.919269561767578e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 9.0, 9.0, 10.0, 18.0, 17.0, 26.0, 37.0, 49.0, 81.0, 119.0, 153.0, 231.0, 507.0, 979.0, 2401.0, 6772.0, 19930.0, 57189.0, 156206.0, 363475.0, 276235.0, 105243.0, 37883.0, 13131.0, 4393.0, 1725.0, 742.0, 373.0, 201.0, 113.0, 90.0, 61.0, 43.0, 36.0, 20.0, 11.0, 9.0, 9.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0687255859375, -0.06663036346435547, -0.06453514099121094, -0.062439918518066406, -0.060344696044921875, -0.058249473571777344, -0.05615425109863281, -0.05405902862548828, -0.05196380615234375, -0.04986858367919922, -0.04777336120605469, -0.045678138732910156, -0.043582916259765625, -0.041487693786621094, -0.03939247131347656, -0.03729724884033203, -0.0352020263671875, -0.03310680389404297, -0.031011581420898438, -0.028916358947753906, -0.026821136474609375, -0.024725914001464844, -0.022630691528320312, -0.02053546905517578, -0.01844024658203125, -0.01634502410888672, -0.014249801635742188, -0.012154579162597656, -0.010059356689453125, -0.007964134216308594, -0.0058689117431640625, -0.0037736892700195312, -0.001678466796875, 0.00041675567626953125, 0.0025119781494140625, 0.004607200622558594, 0.006702423095703125, 0.008797645568847656, 0.010892868041992188, 0.012988090515136719, 0.01508331298828125, 0.01717853546142578, 0.019273757934570312, 0.021368980407714844, 0.023464202880859375, 0.025559425354003906, 0.027654647827148438, 0.02974987030029297, 0.0318450927734375, 0.03394031524658203, 0.03603553771972656, 0.038130760192871094, 0.040225982666015625, 0.042321205139160156, 0.04441642761230469, 0.04651165008544922, 0.04860687255859375, 0.05070209503173828, 0.05279731750488281, 0.054892539978027344, 0.056987762451171875, 0.059082984924316406, 0.06117820739746094, 0.06327342987060547, 0.06536865234375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 5.0, 4.0, 5.0, 5.0, 6.0, 15.0, 10.0, 9.0, 22.0, 20.0, 23.0, 43.0, 39.0, 36.0, 79.0, 95.0, 113.0, 116.0, 77.0, 62.0, 43.0, 39.0, 31.0, 32.0, 15.0, 14.0, 10.0, 14.0, 9.0, 7.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.09942626953125, -0.09714698791503906, -0.09486770629882812, -0.09258842468261719, -0.09030914306640625, -0.08802986145019531, -0.08575057983398438, -0.08347129821777344, -0.0811920166015625, -0.07891273498535156, -0.07663345336914062, -0.07435417175292969, -0.07207489013671875, -0.06979560852050781, -0.06751632690429688, -0.06523704528808594, -0.062957763671875, -0.06067848205566406, -0.058399200439453125, -0.05611991882324219, -0.05384063720703125, -0.05156135559082031, -0.049282073974609375, -0.04700279235839844, -0.0447235107421875, -0.04244422912597656, -0.040164947509765625, -0.03788566589355469, -0.03560638427734375, -0.03332710266113281, -0.031047821044921875, -0.028768539428710938, -0.0264892578125, -0.024209976196289062, -0.021930694580078125, -0.019651412963867188, -0.01737213134765625, -0.015092849731445312, -0.012813568115234375, -0.010534286499023438, -0.0082550048828125, -0.0059757232666015625, -0.003696441650390625, -0.0014171600341796875, 0.00086212158203125, 0.0031414031982421875, 0.005420684814453125, 0.0076999664306640625, 0.009979248046875, 0.012258529663085938, 0.014537811279296875, 0.016817092895507812, 0.01909637451171875, 0.021375656127929688, 0.023654937744140625, 0.025934219360351562, 0.0282135009765625, 0.030492782592773438, 0.032772064208984375, 0.03505134582519531, 0.03733062744140625, 0.03960990905761719, 0.041889190673828125, 0.04416847229003906, 0.04644775390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 11.0, 35.0, 50.0, 80.0, 98.0, 137.0, 149.0, 142.0, 112.0, 76.0, 50.0, 27.0, 10.0, 6.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6319550275802612, -0.6007624864578247, -0.569570004940033, -0.5383774638175964, -0.5071849822998047, -0.47599244117736816, -0.44479990005493164, -0.4136073887348175, -0.38241487741470337, -0.35122236609458923, -0.3200298547744751, -0.2888373136520386, -0.25764480233192444, -0.2264522910118103, -0.19525976479053497, -0.16406723856925964, -0.1328747272491455, -0.10168220847845078, -0.07048968970775604, -0.03929717093706131, -0.008104652166366577, 0.02308785915374756, 0.05428038537502289, 0.08547291159629822, 0.11666542291641235, 0.1478579342365265, 0.17905046045780182, 0.21024298667907715, 0.24143549799919128, 0.2726280093193054, 0.30382055044174194, 0.3350130617618561, 0.3662055730819702, 0.39739808440208435, 0.4285905957221985, 0.459783136844635, 0.49097564816474915, 0.5221681594848633, 0.5533607006072998, 0.5845532417297363, 0.6157457232475281, 0.6469382643699646, 0.6781307458877563, 0.7093232870101929, 0.7405158281326294, 0.7717083096504211, 0.8029008507728577, 0.8340933322906494, 0.8652858734130859, 0.8964784145355225, 0.9276708960533142, 0.9588634371757507, 0.9900559186935425, 1.021248459815979, 1.0524410009384155, 1.083633542060852, 1.114825963973999, 1.1460185050964355, 1.177211046218872, 1.208403468132019, 1.2395960092544556, 1.270788550376892, 1.3019810914993286, 1.3331736326217651, 1.3643661737442017]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 6.0, 6.0, 10.0, 11.0, 15.0, 17.0, 18.0, 15.0, 25.0, 26.0, 26.0, 27.0, 33.0, 28.0, 39.0, 36.0, 41.0, 46.0, 48.0, 31.0, 41.0, 42.0, 41.0, 39.0, 34.0, 30.0, 36.0, 29.0, 28.0, 37.0, 18.0, 23.0, 12.0, 16.0, 16.0, 12.0, 10.0, 5.0, 6.0, 6.0, 7.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.54017174243927, -0.5241564512252808, -0.5081411004066467, -0.49212580919265747, -0.4761105179786682, -0.46009519696235657, -0.4440798759460449, -0.42806458473205566, -0.412049263715744, -0.3960339426994324, -0.3800186514854431, -0.36400333046913147, -0.3479880094528198, -0.33197271823883057, -0.3159573972225189, -0.2999420762062073, -0.283926784992218, -0.26791146397590637, -0.2518961727619171, -0.23588085174560547, -0.21986554563045502, -0.20385023951530457, -0.18783491849899292, -0.17181961238384247, -0.15580430626869202, -0.13978900015354156, -0.12377368658781052, -0.10775837302207947, -0.09174306690692902, -0.07572776079177856, -0.059712447226047516, -0.04369713366031647, -0.027681827545166016, -0.011666517704725266, 0.004348792135715485, 0.020364101976156235, 0.036379411816596985, 0.052394717931747437, 0.06841003149747849, 0.08442534506320953, 0.10044065117835999, 0.11645595729351044, 0.1324712634086609, 0.14848658442497253, 0.16450189054012299, 0.18051719665527344, 0.19653251767158508, 0.21254782378673553, 0.228563129901886, 0.24457843601703644, 0.2605937421321869, 0.27660906314849854, 0.2926243543624878, 0.30863967537879944, 0.3246549963951111, 0.34067028760910034, 0.356685608625412, 0.37270092964172363, 0.3887162208557129, 0.40473154187202454, 0.4207468628883362, 0.43676215410232544, 0.4527774751186371, 0.46879279613494873, 0.484808087348938]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 8.0, 9.0, 14.0, 19.0, 34.0, 42.0, 55.0, 103.0, 169.0, 306.0, 495.0, 810.0, 1550.0, 2781.0, 5417.0, 10370.0, 19787.0, 40330.0, 83473.0, 184631.0, 473966.0, 1387776.0, 1237716.0, 424122.0, 168866.0, 76203.0, 36696.0, 18539.0, 9277.0, 4873.0, 2562.0, 1430.0, 782.0, 424.0, 269.0, 146.0, 84.0, 49.0, 33.0, 23.0, 12.0, 10.0, 8.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.08477783203125, -0.08248281478881836, -0.08018779754638672, -0.07789278030395508, -0.07559776306152344, -0.0733027458190918, -0.07100772857666016, -0.06871271133422852, -0.06641769409179688, -0.06412267684936523, -0.061827659606933594, -0.05953264236450195, -0.05723762512207031, -0.05494260787963867, -0.05264759063720703, -0.05035257339477539, -0.04805755615234375, -0.04576253890991211, -0.04346752166748047, -0.04117250442504883, -0.03887748718261719, -0.03658246994018555, -0.034287452697753906, -0.031992435455322266, -0.029697418212890625, -0.027402400970458984, -0.025107383728027344, -0.022812366485595703, -0.020517349243164062, -0.018222332000732422, -0.01592731475830078, -0.01363229751586914, -0.0113372802734375, -0.00904226303100586, -0.006747245788574219, -0.004452228546142578, -0.0021572113037109375, 0.00013780593872070312, 0.0024328231811523438, 0.004727840423583984, 0.007022857666015625, 0.009317874908447266, 0.011612892150878906, 0.013907909393310547, 0.016202926635742188, 0.018497943878173828, 0.02079296112060547, 0.02308797836303711, 0.02538299560546875, 0.02767801284790039, 0.02997303009033203, 0.03226804733276367, 0.03456306457519531, 0.03685808181762695, 0.039153099060058594, 0.041448116302490234, 0.043743133544921875, 0.046038150787353516, 0.048333168029785156, 0.0506281852722168, 0.05292320251464844, 0.05521821975708008, 0.05751323699951172, 0.05980825424194336, 0.062103271484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 6.0, 6.0, 10.0, 6.0, 7.0, 6.0, 5.0, 10.0, 13.0, 14.0, 18.0, 27.0, 20.0, 20.0, 29.0, 32.0, 37.0, 33.0, 35.0, 33.0, 38.0, 45.0, 52.0, 49.0, 40.0, 41.0, 38.0, 39.0, 27.0, 35.0, 32.0, 28.0, 24.0, 26.0, 22.0, 12.0, 12.0, 13.0, 9.0, 9.0, 8.0, 6.0, 8.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.06884765625, -0.06691455841064453, -0.06498146057128906, -0.0630483627319336, -0.061115264892578125, -0.059182167053222656, -0.05724906921386719, -0.05531597137451172, -0.05338287353515625, -0.05144977569580078, -0.04951667785644531, -0.047583580017089844, -0.045650482177734375, -0.043717384338378906, -0.04178428649902344, -0.03985118865966797, -0.0379180908203125, -0.03598499298095703, -0.03405189514160156, -0.032118797302246094, -0.030185699462890625, -0.028252601623535156, -0.026319503784179688, -0.02438640594482422, -0.02245330810546875, -0.02052021026611328, -0.018587112426757812, -0.016654014587402344, -0.014720916748046875, -0.012787818908691406, -0.010854721069335938, -0.008921623229980469, -0.006988525390625, -0.005055427551269531, -0.0031223297119140625, -0.0011892318725585938, 0.000743865966796875, 0.0026769638061523438, 0.0046100616455078125, 0.006543159484863281, 0.00847625732421875, 0.010409355163574219, 0.012342453002929688, 0.014275550842285156, 0.016208648681640625, 0.018141746520996094, 0.020074844360351562, 0.02200794219970703, 0.0239410400390625, 0.02587413787841797, 0.027807235717773438, 0.029740333557128906, 0.031673431396484375, 0.033606529235839844, 0.03553962707519531, 0.03747272491455078, 0.03940582275390625, 0.04133892059326172, 0.04327201843261719, 0.045205116271972656, 0.047138214111328125, 0.049071311950683594, 0.05100440979003906, 0.05293750762939453, 0.05487060546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 19.0, 23.0, 29.0, 43.0, 58.0, 81.0, 121.0, 163.0, 232.0, 452.0, 740.0, 1152.0, 2193.0, 3799.0, 7018.0, 12786.0, 23495.0, 44234.0, 84756.0, 169561.0, 371409.0, 925195.0, 1383059.0, 630435.0, 265364.0, 127690.0, 64674.0, 34193.0, 18193.0, 10022.0, 5611.0, 3119.0, 1672.0, 981.0, 575.0, 373.0, 229.0, 162.0, 109.0, 67.0, 60.0, 32.0, 23.0, 25.0, 10.0, 9.0, 9.0, 7.0, 3.0, 3.0, 2.0], "bins": [-0.0902099609375, -0.08765411376953125, -0.0850982666015625, -0.08254241943359375, -0.079986572265625, -0.07743072509765625, -0.0748748779296875, -0.07231903076171875, -0.06976318359375, -0.06720733642578125, -0.0646514892578125, -0.06209564208984375, -0.059539794921875, -0.05698394775390625, -0.0544281005859375, -0.05187225341796875, -0.04931640625, -0.04676055908203125, -0.0442047119140625, -0.04164886474609375, -0.039093017578125, -0.03653717041015625, -0.0339813232421875, -0.03142547607421875, -0.02886962890625, -0.02631378173828125, -0.0237579345703125, -0.02120208740234375, -0.018646240234375, -0.01609039306640625, -0.0135345458984375, -0.01097869873046875, -0.0084228515625, -0.00586700439453125, -0.0033111572265625, -0.00075531005859375, 0.001800537109375, 0.00435638427734375, 0.0069122314453125, 0.00946807861328125, 0.01202392578125, 0.01457977294921875, 0.0171356201171875, 0.01969146728515625, 0.022247314453125, 0.02480316162109375, 0.0273590087890625, 0.02991485595703125, 0.032470703125, 0.03502655029296875, 0.0375823974609375, 0.04013824462890625, 0.042694091796875, 0.04524993896484375, 0.0478057861328125, 0.05036163330078125, 0.05291748046875, 0.05547332763671875, 0.0580291748046875, 0.06058502197265625, 0.063140869140625, 0.06569671630859375, 0.0682525634765625, 0.07080841064453125, 0.0733642578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 9.0, 13.0, 9.0, 13.0, 16.0, 23.0, 45.0, 57.0, 72.0, 102.0, 162.0, 187.0, 316.0, 405.0, 596.0, 590.0, 442.0, 312.0, 192.0, 146.0, 95.0, 69.0, 48.0, 43.0, 34.0, 25.0, 14.0, 15.0, 13.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0926513671875, -0.08822250366210938, -0.08379364013671875, -0.07936477661132812, -0.0749359130859375, -0.07050704956054688, -0.06607818603515625, -0.061649322509765625, -0.057220458984375, -0.052791595458984375, -0.04836273193359375, -0.043933868408203125, -0.0395050048828125, -0.035076141357421875, -0.03064727783203125, -0.026218414306640625, -0.02178955078125, -0.017360687255859375, -0.01293182373046875, -0.008502960205078125, -0.0040740966796875, 0.000354766845703125, 0.00478363037109375, 0.009212493896484375, 0.013641357421875, 0.018070220947265625, 0.02249908447265625, 0.026927947998046875, 0.0313568115234375, 0.035785675048828125, 0.04021453857421875, 0.044643402099609375, 0.049072265625, 0.053501129150390625, 0.05792999267578125, 0.062358856201171875, 0.0667877197265625, 0.07121658325195312, 0.07564544677734375, 0.08007431030273438, 0.084503173828125, 0.08893203735351562, 0.09336090087890625, 0.09778976440429688, 0.1022186279296875, 0.10664749145507812, 0.11107635498046875, 0.11550521850585938, 0.11993408203125, 0.12436294555664062, 0.12879180908203125, 0.13322067260742188, 0.1376495361328125, 0.14207839965820312, 0.14650726318359375, 0.15093612670898438, 0.155364990234375, 0.15979385375976562, 0.16422271728515625, 0.16865158081054688, 0.1730804443359375, 0.17750930786132812, 0.18193817138671875, 0.18636703491210938, 0.1907958984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 10.0, 18.0, 43.0, 70.0, 109.0, 143.0, 167.0, 122.0, 112.0, 103.0, 48.0, 22.0, 18.0, 5.0, 9.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.579384684562683, -1.5455328226089478, -1.5116808414459229, -1.4778289794921875, -1.4439771175384521, -1.4101252555847168, -1.376273274421692, -1.3424214124679565, -1.3085694313049316, -1.2747175693511963, -1.2408655881881714, -1.207013726234436, -1.1731618642807007, -1.1393098831176758, -1.1054580211639404, -1.071606159210205, -1.0377542972564697, -1.0039024353027344, -0.9700505137443542, -0.9361985921859741, -0.9023467302322388, -0.8684948086738586, -0.8346428871154785, -0.8007910251617432, -0.766939103603363, -0.7330871820449829, -0.6992353200912476, -0.6653833985328674, -0.6315314769744873, -0.597679615020752, -0.5638276934623718, -0.5299757719039917, -0.4961237907409668, -0.46227189898490906, -0.4284200072288513, -0.3945680856704712, -0.36071619391441345, -0.3268643021583557, -0.2930123805999756, -0.25916048884391785, -0.2253085970878601, -0.19145670533180237, -0.15760479867458344, -0.1237528994679451, -0.08990100026130676, -0.05604910850524902, -0.02219720184803009, 0.011654704809188843, 0.04550659656524658, 0.07935849577188492, 0.11321039497852325, 0.1470623016357422, 0.18091419339179993, 0.21476608514785767, 0.2486179918050766, 0.28246989846229553, 0.31632179021835327, 0.350173681974411, 0.38402557373046875, 0.4178774952888489, 0.4517293870449066, 0.48558127880096436, 0.5194332003593445, 0.5532851219177246, 0.58713698387146]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 3.0, 7.0, 8.0, 9.0, 17.0, 23.0, 18.0, 27.0, 17.0, 28.0, 22.0, 34.0, 34.0, 33.0, 35.0, 40.0, 29.0, 39.0, 41.0, 38.0, 42.0, 38.0, 37.0, 30.0, 36.0, 34.0, 34.0, 23.0, 29.0, 34.0, 20.0, 23.0, 12.0, 14.0, 9.0, 11.0, 8.0, 14.0, 9.0, 6.0, 3.0, 5.0, 5.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3596317768096924, -0.34799695014953613, -0.3363621234893799, -0.32472729682922363, -0.3130924701690674, -0.30145764350891113, -0.2898228168487549, -0.27818799018859863, -0.2665531635284424, -0.25491833686828613, -0.24328351020812988, -0.23164868354797363, -0.22001385688781738, -0.20837903022766113, -0.1967441886663437, -0.18510936200618744, -0.17347452044487, -0.16183969378471375, -0.1502048671245575, -0.13857004046440125, -0.126935213804245, -0.11530037969350815, -0.1036655455827713, -0.09203071892261505, -0.0803958922624588, -0.06876106560230255, -0.057126235216856, -0.045491404831409454, -0.033856578171253204, -0.022221751511096954, -0.010586917400360107, 0.0010479092597961426, 0.012682735919952393, 0.024317564442753792, 0.03595239296555519, 0.04758722335100174, 0.05922205001115799, 0.07085687667131424, 0.08249171078205109, 0.09412653744220734, 0.10576136410236359, 0.11739619076251984, 0.1290310174226761, 0.14066585898399353, 0.15230068564414978, 0.16393551230430603, 0.17557033896446228, 0.18720516562461853, 0.19883999228477478, 0.21047481894493103, 0.22210964560508728, 0.23374447226524353, 0.24537929892539978, 0.25701412558555603, 0.26864898204803467, 0.2802838087081909, 0.29191863536834717, 0.3035534620285034, 0.31518828868865967, 0.3268231153488159, 0.33845794200897217, 0.3500927686691284, 0.36172759532928467, 0.3733624219894409, 0.38499724864959717]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 6.0, 15.0, 33.0, 35.0, 57.0, 101.0, 136.0, 191.0, 276.0, 404.0, 659.0, 1021.0, 1506.0, 2178.0, 3259.0, 4889.0, 7498.0, 11199.0, 17090.0, 26896.0, 45161.0, 85018.0, 187736.0, 288263.0, 170193.0, 78764.0, 42318.0, 25618.0, 16151.0, 10596.0, 7196.0, 4762.0, 3151.0, 2044.0, 1364.0, 943.0, 609.0, 388.0, 285.0, 162.0, 113.0, 96.0, 49.0, 34.0, 27.0, 18.0, 11.0, 12.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0], "bins": [-0.0821533203125, -0.0796966552734375, -0.077239990234375, -0.0747833251953125, -0.07232666015625, -0.0698699951171875, -0.067413330078125, -0.0649566650390625, -0.0625, -0.0600433349609375, -0.057586669921875, -0.0551300048828125, -0.05267333984375, -0.0502166748046875, -0.047760009765625, -0.0453033447265625, -0.0428466796875, -0.0403900146484375, -0.037933349609375, -0.0354766845703125, -0.03302001953125, -0.0305633544921875, -0.028106689453125, -0.0256500244140625, -0.023193359375, -0.0207366943359375, -0.018280029296875, -0.0158233642578125, -0.01336669921875, -0.0109100341796875, -0.008453369140625, -0.0059967041015625, -0.0035400390625, -0.0010833740234375, 0.001373291015625, 0.0038299560546875, 0.00628662109375, 0.0087432861328125, 0.011199951171875, 0.0136566162109375, 0.01611328125, 0.0185699462890625, 0.021026611328125, 0.0234832763671875, 0.02593994140625, 0.0283966064453125, 0.030853271484375, 0.0333099365234375, 0.0357666015625, 0.0382232666015625, 0.040679931640625, 0.0431365966796875, 0.04559326171875, 0.0480499267578125, 0.050506591796875, 0.0529632568359375, 0.055419921875, 0.0578765869140625, 0.060333251953125, 0.0627899169921875, 0.06524658203125, 0.0677032470703125, 0.070159912109375, 0.0726165771484375, 0.0750732421875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 10.0, 10.0, 12.0, 7.0, 13.0, 21.0, 20.0, 24.0, 28.0, 28.0, 27.0, 41.0, 34.0, 48.0, 40.0, 37.0, 50.0, 43.0, 54.0, 58.0, 55.0, 46.0, 35.0, 32.0, 42.0, 30.0, 21.0, 23.0, 21.0, 24.0, 10.0, 13.0, 11.0, 9.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0726318359375, -0.07032394409179688, -0.06801605224609375, -0.06570816040039062, -0.0634002685546875, -0.061092376708984375, -0.05878448486328125, -0.056476593017578125, -0.054168701171875, -0.051860809326171875, -0.04955291748046875, -0.047245025634765625, -0.0449371337890625, -0.042629241943359375, -0.04032135009765625, -0.038013458251953125, -0.03570556640625, -0.033397674560546875, -0.03108978271484375, -0.028781890869140625, -0.0264739990234375, -0.024166107177734375, -0.02185821533203125, -0.019550323486328125, -0.017242431640625, -0.014934539794921875, -0.01262664794921875, -0.010318756103515625, -0.0080108642578125, -0.005702972412109375, -0.00339508056640625, -0.001087188720703125, 0.001220703125, 0.003528594970703125, 0.00583648681640625, 0.008144378662109375, 0.0104522705078125, 0.012760162353515625, 0.01506805419921875, 0.017375946044921875, 0.019683837890625, 0.021991729736328125, 0.02429962158203125, 0.026607513427734375, 0.0289154052734375, 0.031223297119140625, 0.03353118896484375, 0.035839080810546875, 0.03814697265625, 0.040454864501953125, 0.04276275634765625, 0.045070648193359375, 0.0473785400390625, 0.049686431884765625, 0.05199432373046875, 0.054302215576171875, 0.056610107421875, 0.058917999267578125, 0.06122589111328125, 0.06353378295898438, 0.0658416748046875, 0.06814956665039062, 0.07045745849609375, 0.07276535034179688, 0.0750732421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 12.0, 10.0, 15.0, 28.0, 41.0, 55.0, 105.0, 181.0, 355.0, 859.0, 2310.0, 6863.0, 19861.0, 60269.0, 267566.0, 524987.0, 113685.0, 33579.0, 11295.0, 3935.0, 1403.0, 501.0, 256.0, 135.0, 81.0, 43.0, 37.0, 21.0, 15.0, 11.0, 16.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.176025390625, -0.17000579833984375, -0.1639862060546875, -0.15796661376953125, -0.151947021484375, -0.14592742919921875, -0.1399078369140625, -0.13388824462890625, -0.12786865234375, -0.12184906005859375, -0.1158294677734375, -0.10980987548828125, -0.103790283203125, -0.09777069091796875, -0.0917510986328125, -0.08573150634765625, -0.0797119140625, -0.07369232177734375, -0.0676727294921875, -0.06165313720703125, -0.055633544921875, -0.04961395263671875, -0.0435943603515625, -0.03757476806640625, -0.03155517578125, -0.02553558349609375, -0.0195159912109375, -0.01349639892578125, -0.007476806640625, -0.00145721435546875, 0.0045623779296875, 0.01058197021484375, 0.0166015625, 0.02262115478515625, 0.0286407470703125, 0.03466033935546875, 0.040679931640625, 0.04669952392578125, 0.0527191162109375, 0.05873870849609375, 0.06475830078125, 0.07077789306640625, 0.0767974853515625, 0.08281707763671875, 0.088836669921875, 0.09485626220703125, 0.1008758544921875, 0.10689544677734375, 0.1129150390625, 0.11893463134765625, 0.1249542236328125, 0.13097381591796875, 0.136993408203125, 0.14301300048828125, 0.1490325927734375, 0.15505218505859375, 0.16107177734375, 0.16709136962890625, 0.1731109619140625, 0.17913055419921875, 0.185150146484375, 0.19116973876953125, 0.1971893310546875, 0.20320892333984375, 0.209228515625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 6.0, 5.0, 6.0, 14.0, 17.0, 18.0, 15.0, 19.0, 12.0, 25.0, 27.0, 31.0, 33.0, 32.0, 32.0, 41.0, 32.0, 33.0, 34.0, 31.0, 44.0, 45.0, 38.0, 44.0, 38.0, 30.0, 38.0, 34.0, 30.0, 29.0, 28.0, 21.0, 23.0, 17.0, 14.0, 9.0, 12.0, 12.0, 7.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.178955078125, -0.1733245849609375, -0.167694091796875, -0.1620635986328125, -0.15643310546875, -0.1508026123046875, -0.145172119140625, -0.1395416259765625, -0.1339111328125, -0.1282806396484375, -0.122650146484375, -0.1170196533203125, -0.11138916015625, -0.1057586669921875, -0.100128173828125, -0.0944976806640625, -0.0888671875, -0.0832366943359375, -0.077606201171875, -0.0719757080078125, -0.06634521484375, -0.0607147216796875, -0.055084228515625, -0.0494537353515625, -0.0438232421875, -0.0381927490234375, -0.032562255859375, -0.0269317626953125, -0.02130126953125, -0.0156707763671875, -0.010040283203125, -0.0044097900390625, 0.001220703125, 0.0068511962890625, 0.012481689453125, 0.0181121826171875, 0.02374267578125, 0.0293731689453125, 0.035003662109375, 0.0406341552734375, 0.0462646484375, 0.0518951416015625, 0.057525634765625, 0.0631561279296875, 0.06878662109375, 0.0744171142578125, 0.080047607421875, 0.0856781005859375, 0.09130859375, 0.0969390869140625, 0.102569580078125, 0.1082000732421875, 0.11383056640625, 0.1194610595703125, 0.125091552734375, 0.1307220458984375, 0.1363525390625, 0.1419830322265625, 0.147613525390625, 0.1532440185546875, 0.15887451171875, 0.1645050048828125, 0.170135498046875, 0.1757659912109375, 0.181396484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 10.0, 8.0, 9.0, 27.0, 68.0, 107.0, 167.0, 316.0, 687.0, 1454.0, 3334.0, 7706.0, 17647.0, 43870.0, 111834.0, 339274.0, 337110.0, 110167.0, 43351.0, 17796.0, 7561.0, 3253.0, 1386.0, 700.0, 330.0, 189.0, 71.0, 50.0, 25.0, 25.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052764892578125, -0.05100584030151367, -0.049246788024902344, -0.047487735748291016, -0.04572868347167969, -0.04396963119506836, -0.04221057891845703, -0.0404515266418457, -0.038692474365234375, -0.03693342208862305, -0.03517436981201172, -0.03341531753540039, -0.03165626525878906, -0.029897212982177734, -0.028138160705566406, -0.026379108428955078, -0.02462005615234375, -0.022861003875732422, -0.021101951599121094, -0.019342899322509766, -0.017583847045898438, -0.01582479476928711, -0.014065742492675781, -0.012306690216064453, -0.010547637939453125, -0.008788585662841797, -0.007029533386230469, -0.005270481109619141, -0.0035114288330078125, -0.0017523765563964844, 6.67572021484375e-06, 0.0017657279968261719, 0.0035247802734375, 0.005283832550048828, 0.007042884826660156, 0.008801937103271484, 0.010560989379882812, 0.01232004165649414, 0.014079093933105469, 0.015838146209716797, 0.017597198486328125, 0.019356250762939453, 0.02111530303955078, 0.02287435531616211, 0.024633407592773438, 0.026392459869384766, 0.028151512145996094, 0.029910564422607422, 0.03166961669921875, 0.03342866897583008, 0.035187721252441406, 0.036946773529052734, 0.03870582580566406, 0.04046487808227539, 0.04222393035888672, 0.04398298263549805, 0.045742034912109375, 0.0475010871887207, 0.04926013946533203, 0.05101919174194336, 0.05277824401855469, 0.054537296295166016, 0.056296348571777344, 0.05805540084838867, 0.059814453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 10.0, 11.0, 14.0, 24.0, 19.0, 32.0, 43.0, 63.0, 75.0, 71.0, 98.0, 114.0, 105.0, 81.0, 42.0, 49.0, 34.0, 32.0, 15.0, 10.0, 6.0, 6.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7821788787841797e-05, -1.7228536307811737e-05, -1.6635283827781677e-05, -1.6042031347751617e-05, -1.5448778867721558e-05, -1.4855526387691498e-05, -1.4262273907661438e-05, -1.3669021427631378e-05, -1.3075768947601318e-05, -1.2482516467571259e-05, -1.1889263987541199e-05, -1.1296011507511139e-05, -1.0702759027481079e-05, -1.010950654745102e-05, -9.51625406742096e-06, -8.9230015873909e-06, -8.32974910736084e-06, -7.73649662733078e-06, -7.14324414730072e-06, -6.54999166727066e-06, -5.956739187240601e-06, -5.363486707210541e-06, -4.770234227180481e-06, -4.176981747150421e-06, -3.5837292671203613e-06, -2.9904767870903015e-06, -2.3972243070602417e-06, -1.8039718270301819e-06, -1.210719347000122e-06, -6.174668669700623e-07, -2.421438694000244e-08, 5.690380930900574e-07, 1.1622905731201172e-06, 1.755543053150177e-06, 2.348795533180237e-06, 2.9420480132102966e-06, 3.5353004932403564e-06, 4.128552973270416e-06, 4.721805453300476e-06, 5.315057933330536e-06, 5.908310413360596e-06, 6.5015628933906555e-06, 7.094815373420715e-06, 7.688067853450775e-06, 8.281320333480835e-06, 8.874572813510895e-06, 9.467825293540955e-06, 1.0061077773571014e-05, 1.0654330253601074e-05, 1.1247582733631134e-05, 1.1840835213661194e-05, 1.2434087693691254e-05, 1.3027340173721313e-05, 1.3620592653751373e-05, 1.4213845133781433e-05, 1.4807097613811493e-05, 1.5400350093841553e-05, 1.5993602573871613e-05, 1.6586855053901672e-05, 1.7180107533931732e-05, 1.7773360013961792e-05, 1.8366612493991852e-05, 1.895986497402191e-05, 1.955311745405197e-05, 2.014636993408203e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 15.0, 26.0, 47.0, 76.0, 184.0, 352.0, 990.0, 3382.0, 15860.0, 93057.0, 572780.0, 305128.0, 45157.0, 8448.0, 1920.0, 603.0, 250.0, 131.0, 72.0, 33.0, 14.0, 12.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10308837890625, -0.09962940216064453, -0.09617042541503906, -0.0927114486694336, -0.08925247192382812, -0.08579349517822266, -0.08233451843261719, -0.07887554168701172, -0.07541656494140625, -0.07195758819580078, -0.06849861145019531, -0.06503963470458984, -0.061580657958984375, -0.058121681213378906, -0.05466270446777344, -0.05120372772216797, -0.0477447509765625, -0.04428577423095703, -0.04082679748535156, -0.037367820739746094, -0.033908843994140625, -0.030449867248535156, -0.026990890502929688, -0.02353191375732422, -0.02007293701171875, -0.01661396026611328, -0.013154983520507812, -0.009696006774902344, -0.006237030029296875, -0.0027780532836914062, 0.0006809234619140625, 0.004139900207519531, 0.007598876953125, 0.011057853698730469, 0.014516830444335938, 0.017975807189941406, 0.021434783935546875, 0.024893760681152344, 0.028352737426757812, 0.03181171417236328, 0.03527069091796875, 0.03872966766357422, 0.04218864440917969, 0.045647621154785156, 0.049106597900390625, 0.052565574645996094, 0.05602455139160156, 0.05948352813720703, 0.0629425048828125, 0.06640148162841797, 0.06986045837402344, 0.0733194351196289, 0.07677841186523438, 0.08023738861083984, 0.08369636535644531, 0.08715534210205078, 0.09061431884765625, 0.09407329559326172, 0.09753227233886719, 0.10099124908447266, 0.10445022583007812, 0.1079092025756836, 0.11136817932128906, 0.11482715606689453, 0.1182861328125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 8.0, 5.0, 6.0, 7.0, 16.0, 14.0, 18.0, 28.0, 29.0, 32.0, 50.0, 73.0, 62.0, 84.0, 91.0, 93.0, 71.0, 58.0, 50.0, 27.0, 31.0, 26.0, 26.0, 18.0, 15.0, 15.0, 8.0, 12.0, 8.0, 2.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.058380126953125, -0.05678367614746094, -0.055187225341796875, -0.05359077453613281, -0.05199432373046875, -0.05039787292480469, -0.048801422119140625, -0.04720497131347656, -0.0456085205078125, -0.04401206970214844, -0.042415618896484375, -0.04081916809082031, -0.03922271728515625, -0.03762626647949219, -0.036029815673828125, -0.03443336486816406, -0.0328369140625, -0.031240463256835938, -0.029644012451171875, -0.028047561645507812, -0.02645111083984375, -0.024854660034179688, -0.023258209228515625, -0.021661758422851562, -0.0200653076171875, -0.018468856811523438, -0.016872406005859375, -0.015275955200195312, -0.01367950439453125, -0.012083053588867188, -0.010486602783203125, -0.008890151977539062, -0.007293701171875, -0.0056972503662109375, -0.004100799560546875, -0.0025043487548828125, -0.00090789794921875, 0.0006885528564453125, 0.002285003662109375, 0.0038814544677734375, 0.0054779052734375, 0.0070743560791015625, 0.008670806884765625, 0.010267257690429688, 0.01186370849609375, 0.013460159301757812, 0.015056610107421875, 0.016653060913085938, 0.01824951171875, 0.019845962524414062, 0.021442413330078125, 0.023038864135742188, 0.02463531494140625, 0.026231765747070312, 0.027828216552734375, 0.029424667358398438, 0.0310211181640625, 0.03261756896972656, 0.034214019775390625, 0.03581047058105469, 0.03740692138671875, 0.03900337219238281, 0.040599822998046875, 0.04219627380371094, 0.043792724609375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 39.0, 202.0, 424.0, 271.0, 48.0, 13.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2217077016830444, -1.1432862281799316, -1.0648647546768188, -0.9864432215690613, -0.9080216884613037, -0.8296002149581909, -0.7511787414550781, -0.6727572083473206, -0.5943357348442078, -0.515914261341095, -0.4374927282333374, -0.3590712547302246, -0.28064975142478943, -0.20222824811935425, -0.12380677461624146, -0.04538524150848389, 0.033036231994628906, 0.11145772784948349, 0.18987922370433807, 0.26830071210861206, 0.34672221541404724, 0.4251437187194824, 0.5035651922225952, 0.5819867253303528, 0.6604081988334656, 0.7388296723365784, 0.8172512054443359, 0.8956726789474487, 0.9740941524505615, 1.0525157451629639, 1.130937099456787, 1.2093586921691895, 1.2877800464630127, 1.3662015199661255, 1.4446229934692383, 1.5230445861816406, 1.6014660596847534, 1.6798875331878662, 1.758309006690979, 1.8367304801940918, 1.9151520729064941, 1.993573546409607, 2.0719950199127197, 2.150416612625122, 2.2288379669189453, 2.3072595596313477, 2.38568115234375, 2.4641025066375732, 2.5425238609313965, 2.620945453643799, 2.699366807937622, 2.7777884006500244, 2.8562097549438477, 2.93463134765625, 3.0130529403686523, 3.0914742946624756, 3.169895887374878, 3.2483174800872803, 3.3267388343811035, 3.405160427093506, 3.483581781387329, 3.5620033740997314, 3.6404247283935547, 3.718846321105957, 3.7972679138183594]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 15.0, 14.0, 8.0, 12.0, 10.0, 17.0, 30.0, 20.0, 26.0, 31.0, 44.0, 29.0, 34.0, 47.0, 47.0, 50.0, 50.0, 48.0, 42.0, 42.0, 46.0, 44.0, 33.0, 47.0, 26.0, 40.0, 23.0, 26.0, 21.0, 11.0, 12.0, 4.0, 9.0, 6.0, 5.0, 7.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48663830757141113, -0.4705071449279785, -0.4543759524822235, -0.4382447898387909, -0.4221135973930359, -0.40598243474960327, -0.38985127210617065, -0.37372010946273804, -0.35758891701698303, -0.3414577543735504, -0.3253265619277954, -0.3091953992843628, -0.2930642366409302, -0.27693304419517517, -0.26080188155174255, -0.24467070400714874, -0.22853952646255493, -0.21240834891796112, -0.1962771713733673, -0.1801460087299347, -0.16401483118534088, -0.14788365364074707, -0.13175249099731445, -0.11562131345272064, -0.09949013590812683, -0.08335895836353302, -0.0672277882695198, -0.05109661445021629, -0.03496544063091278, -0.01883426308631897, -0.0027030929923057556, 0.013428077101707458, 0.029559195041656494, 0.04569036886096001, 0.06182154268026352, 0.07795271277427673, 0.09408389031887054, 0.11021506786346436, 0.12634623050689697, 0.14247740805149078, 0.1586085855960846, 0.1747397631406784, 0.19087094068527222, 0.20700210332870483, 0.22313328087329865, 0.23926445841789246, 0.2553956210613251, 0.2715268135070801, 0.2876579761505127, 0.3037891387939453, 0.3199203312397003, 0.33605149388313293, 0.35218268632888794, 0.36831384897232056, 0.3844450116157532, 0.4005761742591858, 0.4167073667049408, 0.4328385293483734, 0.4489697217941284, 0.46510088443756104, 0.48123204708099365, 0.49736323952674866, 0.5134944319725037, 0.5296255946159363, 0.5457567572593689]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 17.0, 21.0, 30.0, 31.0, 54.0, 110.0, 167.0, 291.0, 401.0, 694.0, 1183.0, 1990.0, 3392.0, 5904.0, 10205.0, 17766.0, 31877.0, 57207.0, 108609.0, 225366.0, 574937.0, 1476711.0, 996300.0, 352142.0, 152888.0, 78360.0, 42093.0, 23456.0, 13364.0, 7834.0, 4405.0, 2615.0, 1536.0, 839.0, 537.0, 333.0, 185.0, 128.0, 87.0, 53.0, 43.0, 34.0, 23.0, 21.0, 8.0, 12.0, 9.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06256103515625, -0.06052684783935547, -0.05849266052246094, -0.056458473205566406, -0.054424285888671875, -0.052390098571777344, -0.05035591125488281, -0.04832172393798828, -0.04628753662109375, -0.04425334930419922, -0.04221916198730469, -0.040184974670410156, -0.038150787353515625, -0.036116600036621094, -0.03408241271972656, -0.03204822540283203, -0.0300140380859375, -0.02797985076904297, -0.025945663452148438, -0.023911476135253906, -0.021877288818359375, -0.019843101501464844, -0.017808914184570312, -0.01577472686767578, -0.01374053955078125, -0.011706352233886719, -0.009672164916992188, -0.007637977600097656, -0.005603790283203125, -0.0035696029663085938, -0.0015354156494140625, 0.0004987716674804688, 0.002532958984375, 0.004567146301269531, 0.0066013336181640625, 0.008635520935058594, 0.010669708251953125, 0.012703895568847656, 0.014738082885742188, 0.01677227020263672, 0.01880645751953125, 0.02084064483642578, 0.022874832153320312, 0.024909019470214844, 0.026943206787109375, 0.028977394104003906, 0.031011581420898438, 0.03304576873779297, 0.0350799560546875, 0.03711414337158203, 0.03914833068847656, 0.041182518005371094, 0.043216705322265625, 0.045250892639160156, 0.04728507995605469, 0.04931926727294922, 0.05135345458984375, 0.05338764190673828, 0.05542182922363281, 0.057456016540527344, 0.059490203857421875, 0.061524391174316406, 0.06355857849121094, 0.06559276580810547, 0.067626953125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 11.0, 3.0, 5.0, 7.0, 11.0, 12.0, 18.0, 12.0, 13.0, 17.0, 24.0, 26.0, 27.0, 25.0, 31.0, 28.0, 47.0, 38.0, 50.0, 36.0, 37.0, 39.0, 47.0, 46.0, 41.0, 31.0, 33.0, 32.0, 31.0, 35.0, 28.0, 27.0, 16.0, 23.0, 19.0, 13.0, 11.0, 13.0, 11.0, 7.0, 5.0, 5.0, 6.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.06317138671875, -0.06129026412963867, -0.059409141540527344, -0.057528018951416016, -0.05564689636230469, -0.05376577377319336, -0.05188465118408203, -0.0500035285949707, -0.048122406005859375, -0.04624128341674805, -0.04436016082763672, -0.04247903823852539, -0.04059791564941406, -0.038716793060302734, -0.036835670471191406, -0.03495454788208008, -0.03307342529296875, -0.031192302703857422, -0.029311180114746094, -0.027430057525634766, -0.025548934936523438, -0.02366781234741211, -0.02178668975830078, -0.019905567169189453, -0.018024444580078125, -0.016143321990966797, -0.014262199401855469, -0.01238107681274414, -0.010499954223632812, -0.008618831634521484, -0.006737709045410156, -0.004856586456298828, -0.0029754638671875, -0.0010943412780761719, 0.0007867813110351562, 0.0026679039001464844, 0.0045490264892578125, 0.006430149078369141, 0.008311271667480469, 0.010192394256591797, 0.012073516845703125, 0.013954639434814453, 0.01583576202392578, 0.01771688461303711, 0.019598007202148438, 0.021479129791259766, 0.023360252380371094, 0.025241374969482422, 0.02712249755859375, 0.029003620147705078, 0.030884742736816406, 0.032765865325927734, 0.03464698791503906, 0.03652811050415039, 0.03840923309326172, 0.04029035568237305, 0.042171478271484375, 0.0440526008605957, 0.04593372344970703, 0.04781484603881836, 0.04969596862792969, 0.051577091217041016, 0.053458213806152344, 0.05533933639526367, 0.057220458984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 14.0, 17.0, 10.0, 28.0, 59.0, 96.0, 130.0, 239.0, 443.0, 749.0, 1343.0, 2308.0, 4425.0, 8720.0, 17362.0, 36099.0, 74752.0, 168885.0, 437954.0, 1482179.0, 1292682.0, 380746.0, 150799.0, 68466.0, 32522.0, 16182.0, 8077.0, 4119.0, 2130.0, 1180.0, 635.0, 355.0, 216.0, 121.0, 84.0, 51.0, 30.0, 28.0, 10.0, 13.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10089111328125, -0.09782791137695312, -0.09476470947265625, -0.09170150756835938, -0.0886383056640625, -0.08557510375976562, -0.08251190185546875, -0.07944869995117188, -0.076385498046875, -0.07332229614257812, -0.07025909423828125, -0.06719589233398438, -0.0641326904296875, -0.061069488525390625, -0.05800628662109375, -0.054943084716796875, -0.0518798828125, -0.048816680908203125, -0.04575347900390625, -0.042690277099609375, -0.0396270751953125, -0.036563873291015625, -0.03350067138671875, -0.030437469482421875, -0.027374267578125, -0.024311065673828125, -0.02124786376953125, -0.018184661865234375, -0.0151214599609375, -0.012058258056640625, -0.00899505615234375, -0.005931854248046875, -0.00286865234375, 0.000194549560546875, 0.00325775146484375, 0.006320953369140625, 0.0093841552734375, 0.012447357177734375, 0.01551055908203125, 0.018573760986328125, 0.021636962890625, 0.024700164794921875, 0.02776336669921875, 0.030826568603515625, 0.0338897705078125, 0.036952972412109375, 0.04001617431640625, 0.043079376220703125, 0.046142578125, 0.049205780029296875, 0.05226898193359375, 0.055332183837890625, 0.0583953857421875, 0.061458587646484375, 0.06452178955078125, 0.06758499145507812, 0.070648193359375, 0.07371139526367188, 0.07677459716796875, 0.07983779907226562, 0.0829010009765625, 0.08596420288085938, 0.08902740478515625, 0.09209060668945312, 0.09515380859375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 4.0, 6.0, 15.0, 8.0, 25.0, 27.0, 38.0, 35.0, 48.0, 72.0, 97.0, 126.0, 170.0, 240.0, 351.0, 553.0, 572.0, 491.0, 306.0, 232.0, 144.0, 121.0, 82.0, 58.0, 57.0, 39.0, 35.0, 24.0, 19.0, 18.0, 10.0, 9.0, 8.0, 5.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13818359375, -0.13439655303955078, -0.13060951232910156, -0.12682247161865234, -0.12303543090820312, -0.1192483901977539, -0.11546134948730469, -0.11167430877685547, -0.10788726806640625, -0.10410022735595703, -0.10031318664550781, -0.0965261459350586, -0.09273910522460938, -0.08895206451416016, -0.08516502380371094, -0.08137798309326172, -0.0775909423828125, -0.07380390167236328, -0.07001686096191406, -0.06622982025146484, -0.062442779541015625, -0.058655738830566406, -0.05486869812011719, -0.05108165740966797, -0.04729461669921875, -0.04350757598876953, -0.03972053527832031, -0.035933494567871094, -0.032146453857421875, -0.028359413146972656, -0.024572372436523438, -0.02078533172607422, -0.016998291015625, -0.013211250305175781, -0.009424209594726562, -0.005637168884277344, -0.001850128173828125, 0.0019369125366210938, 0.0057239532470703125, 0.009510993957519531, 0.01329803466796875, 0.01708507537841797, 0.020872116088867188, 0.024659156799316406, 0.028446197509765625, 0.032233238220214844, 0.03602027893066406, 0.03980731964111328, 0.0435943603515625, 0.04738140106201172, 0.05116844177246094, 0.054955482482910156, 0.058742523193359375, 0.0625295639038086, 0.06631660461425781, 0.07010364532470703, 0.07389068603515625, 0.07767772674560547, 0.08146476745605469, 0.0852518081665039, 0.08903884887695312, 0.09282588958740234, 0.09661293029785156, 0.10039997100830078, 0.10418701171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 7.0, 8.0, 26.0, 47.0, 48.0, 68.0, 75.0, 92.0, 95.0, 84.0, 92.0, 101.0, 81.0, 55.0, 36.0, 29.0, 13.0, 19.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8095172643661499, -0.7883503437042236, -0.7671834826469421, -0.7460165619850159, -0.7248496413230896, -0.7036827802658081, -0.6825158596038818, -0.6613489389419556, -0.6401820182800293, -0.619015097618103, -0.5978482365608215, -0.5766813158988953, -0.555514395236969, -0.5343475341796875, -0.5131806135177612, -0.49201369285583496, -0.47084683179855347, -0.4496799409389496, -0.4285130202770233, -0.40734612941741943, -0.38617920875549316, -0.3650123178958893, -0.3438454270362854, -0.32267850637435913, -0.30151161551475525, -0.28034472465515137, -0.2591778039932251, -0.23801091313362122, -0.21684400737285614, -0.19567710161209106, -0.17451021075248718, -0.1533433049917221, -0.13217639923095703, -0.11100949347019196, -0.08984259516000748, -0.068675696849823, -0.04750879108905792, -0.026341885328292847, -0.005174994468688965, 0.01599191129207611, 0.037158817052841187, 0.058325719088315964, 0.07949262112379074, 0.10065951943397522, 0.1218264251947403, 0.14299333095550537, 0.16416022181510925, 0.18532712757587433, 0.2064940333366394, 0.22766093909740448, 0.24882784485816956, 0.26999473571777344, 0.2911616563796997, 0.3123285472393036, 0.33349543809890747, 0.35466235876083374, 0.3758292496204376, 0.3969961404800415, 0.4181630611419678, 0.43932995200157166, 0.46049684286117554, 0.4816637635231018, 0.5028306245803833, 0.5239975452423096, 0.5451644659042358]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 12.0, 9.0, 15.0, 16.0, 18.0, 15.0, 20.0, 26.0, 30.0, 37.0, 39.0, 35.0, 47.0, 39.0, 47.0, 44.0, 37.0, 46.0, 45.0, 35.0, 42.0, 37.0, 32.0, 44.0, 31.0, 29.0, 30.0, 31.0, 14.0, 14.0, 16.0, 16.0, 9.0, 7.0, 7.0, 10.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.4762831926345825, -0.463061660528183, -0.44984012842178345, -0.4366185963153839, -0.4233970642089844, -0.41017553210258484, -0.3969539999961853, -0.38373246788978577, -0.37051093578338623, -0.3572894036769867, -0.34406787157058716, -0.3308463394641876, -0.3176248073577881, -0.30440327525138855, -0.291181743144989, -0.2779602110385895, -0.26473867893218994, -0.2515171468257904, -0.23829561471939087, -0.22507408261299133, -0.2118525505065918, -0.19863101840019226, -0.18540948629379272, -0.1721879541873932, -0.15896639227867126, -0.14574486017227173, -0.1325233280658722, -0.11930179595947266, -0.10608026385307312, -0.09285872429609299, -0.07963719218969345, -0.06641566008329391, -0.053194135427474976, -0.03997260332107544, -0.026751069352030754, -0.013529535382986069, -0.0003080032765865326, 0.012913532555103302, 0.026135064661502838, 0.039356596767902374, 0.05257812887430191, 0.06579966098070145, 0.07902119308710098, 0.09224273264408112, 0.10546426475048065, 0.11868579685688019, 0.13190732896327972, 0.14512886106967926, 0.1583503931760788, 0.17157192528247833, 0.18479345738887787, 0.1980149894952774, 0.21123652160167694, 0.22445806860923767, 0.2376796007156372, 0.25090113282203674, 0.2641226649284363, 0.2773441970348358, 0.29056572914123535, 0.3037872612476349, 0.3170087933540344, 0.33023032546043396, 0.3434518575668335, 0.35667338967323303, 0.36989492177963257]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 11.0, 19.0, 17.0, 29.0, 49.0, 74.0, 104.0, 146.0, 265.0, 434.0, 601.0, 1003.0, 1514.0, 2307.0, 3677.0, 5537.0, 8890.0, 14854.0, 28469.0, 61712.0, 153084.0, 309788.0, 251593.0, 105712.0, 44535.0, 21501.0, 12223.0, 7245.0, 4594.0, 3042.0, 1981.0, 1304.0, 797.0, 506.0, 341.0, 222.0, 132.0, 97.0, 43.0, 36.0, 22.0, 16.0, 9.0, 7.0, 1.0, 6.0, 3.0, 0.0, 3.0], "bins": [-0.0985107421875, -0.09583377838134766, -0.09315681457519531, -0.09047985076904297, -0.08780288696289062, -0.08512592315673828, -0.08244895935058594, -0.0797719955444336, -0.07709503173828125, -0.0744180679321289, -0.07174110412597656, -0.06906414031982422, -0.06638717651367188, -0.06371021270751953, -0.06103324890136719, -0.058356285095214844, -0.0556793212890625, -0.053002357482910156, -0.05032539367675781, -0.04764842987060547, -0.044971466064453125, -0.04229450225830078, -0.03961753845214844, -0.036940574645996094, -0.03426361083984375, -0.031586647033691406, -0.028909683227539062, -0.02623271942138672, -0.023555755615234375, -0.02087879180908203, -0.018201828002929688, -0.015524864196777344, -0.012847900390625, -0.010170936584472656, -0.0074939727783203125, -0.004817008972167969, -0.002140045166015625, 0.0005369186401367188, 0.0032138824462890625, 0.005890846252441406, 0.00856781005859375, 0.011244773864746094, 0.013921737670898438, 0.01659870147705078, 0.019275665283203125, 0.02195262908935547, 0.024629592895507812, 0.027306556701660156, 0.0299835205078125, 0.032660484313964844, 0.03533744812011719, 0.03801441192626953, 0.040691375732421875, 0.04336833953857422, 0.04604530334472656, 0.048722267150878906, 0.05139923095703125, 0.054076194763183594, 0.05675315856933594, 0.05943012237548828, 0.062107086181640625, 0.06478404998779297, 0.06746101379394531, 0.07013797760009766, 0.07281494140625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 5.0, 8.0, 11.0, 7.0, 9.0, 15.0, 13.0, 14.0, 21.0, 21.0, 30.0, 30.0, 25.0, 27.0, 34.0, 26.0, 38.0, 38.0, 42.0, 45.0, 33.0, 28.0, 35.0, 43.0, 47.0, 38.0, 33.0, 31.0, 30.0, 24.0, 19.0, 27.0, 24.0, 21.0, 16.0, 12.0, 17.0, 15.0, 5.0, 8.0, 5.0, 3.0, 2.0, 11.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.059112548828125, -0.05726814270019531, -0.055423736572265625, -0.05357933044433594, -0.05173492431640625, -0.04989051818847656, -0.048046112060546875, -0.04620170593261719, -0.0443572998046875, -0.04251289367675781, -0.040668487548828125, -0.03882408142089844, -0.03697967529296875, -0.03513526916503906, -0.033290863037109375, -0.03144645690917969, -0.02960205078125, -0.027757644653320312, -0.025913238525390625, -0.024068832397460938, -0.02222442626953125, -0.020380020141601562, -0.018535614013671875, -0.016691207885742188, -0.0148468017578125, -0.013002395629882812, -0.011157989501953125, -0.009313583374023438, -0.00746917724609375, -0.0056247711181640625, -0.003780364990234375, -0.0019359588623046875, -9.1552734375e-05, 0.0017528533935546875, 0.003597259521484375, 0.0054416656494140625, 0.00728607177734375, 0.009130477905273438, 0.010974884033203125, 0.012819290161132812, 0.0146636962890625, 0.016508102416992188, 0.018352508544921875, 0.020196914672851562, 0.02204132080078125, 0.023885726928710938, 0.025730133056640625, 0.027574539184570312, 0.0294189453125, 0.03126335144042969, 0.033107757568359375, 0.03495216369628906, 0.03679656982421875, 0.03864097595214844, 0.040485382080078125, 0.04232978820800781, 0.0441741943359375, 0.04601860046386719, 0.047863006591796875, 0.04970741271972656, 0.05155181884765625, 0.05339622497558594, 0.055240631103515625, 0.05708503723144531, 0.058929443359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 5.0, 6.0, 9.0, 17.0, 18.0, 21.0, 33.0, 34.0, 52.0, 83.0, 109.0, 216.0, 348.0, 604.0, 1192.0, 2529.0, 5561.0, 12320.0, 30000.0, 84748.0, 275409.0, 403617.0, 148902.0, 48660.0, 18736.0, 7972.0, 3731.0, 1605.0, 817.0, 440.0, 266.0, 146.0, 95.0, 57.0, 47.0, 35.0, 26.0, 24.0, 19.0, 9.0, 13.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.125732421875, -0.12170791625976562, -0.11768341064453125, -0.11365890502929688, -0.1096343994140625, -0.10560989379882812, -0.10158538818359375, -0.09756088256835938, -0.093536376953125, -0.08951187133789062, -0.08548736572265625, -0.08146286010742188, -0.0774383544921875, -0.07341384887695312, -0.06938934326171875, -0.06536483764648438, -0.06134033203125, -0.057315826416015625, -0.05329132080078125, -0.049266815185546875, -0.0452423095703125, -0.041217803955078125, -0.03719329833984375, -0.033168792724609375, -0.029144287109375, -0.025119781494140625, -0.02109527587890625, -0.017070770263671875, -0.0130462646484375, -0.009021759033203125, -0.00499725341796875, -0.000972747802734375, 0.0030517578125, 0.007076263427734375, 0.01110076904296875, 0.015125274658203125, 0.0191497802734375, 0.023174285888671875, 0.02719879150390625, 0.031223297119140625, 0.035247802734375, 0.039272308349609375, 0.04329681396484375, 0.047321319580078125, 0.0513458251953125, 0.055370330810546875, 0.05939483642578125, 0.06341934204101562, 0.06744384765625, 0.07146835327148438, 0.07549285888671875, 0.07951736450195312, 0.0835418701171875, 0.08756637573242188, 0.09159088134765625, 0.09561538696289062, 0.099639892578125, 0.10366439819335938, 0.10768890380859375, 0.11171340942382812, 0.1157379150390625, 0.11976242065429688, 0.12378692626953125, 0.12781143188476562, 0.1318359375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 8.0, 7.0, 6.0, 8.0, 10.0, 13.0, 15.0, 14.0, 16.0, 17.0, 26.0, 34.0, 33.0, 38.0, 34.0, 33.0, 35.0, 46.0, 32.0, 43.0, 46.0, 53.0, 47.0, 51.0, 36.0, 37.0, 32.0, 34.0, 33.0, 36.0, 21.0, 22.0, 21.0, 3.0, 18.0, 9.0, 8.0, 4.0, 3.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.2298583984375, -0.22360801696777344, -0.21735763549804688, -0.2111072540283203, -0.20485687255859375, -0.1986064910888672, -0.19235610961914062, -0.18610572814941406, -0.1798553466796875, -0.17360496520996094, -0.16735458374023438, -0.1611042022705078, -0.15485382080078125, -0.1486034393310547, -0.14235305786132812, -0.13610267639160156, -0.129852294921875, -0.12360191345214844, -0.11735153198242188, -0.11110115051269531, -0.10485076904296875, -0.09860038757324219, -0.09235000610351562, -0.08609962463378906, -0.0798492431640625, -0.07359886169433594, -0.06734848022460938, -0.06109809875488281, -0.05484771728515625, -0.04859733581542969, -0.042346954345703125, -0.03609657287597656, -0.02984619140625, -0.023595809936523438, -0.017345428466796875, -0.011095046997070312, -0.00484466552734375, 0.0014057159423828125, 0.007656097412109375, 0.013906478881835938, 0.0201568603515625, 0.026407241821289062, 0.032657623291015625, 0.03890800476074219, 0.04515838623046875, 0.05140876770019531, 0.057659149169921875, 0.06390953063964844, 0.070159912109375, 0.07641029357910156, 0.08266067504882812, 0.08891105651855469, 0.09516143798828125, 0.10141181945800781, 0.10766220092773438, 0.11391258239746094, 0.1201629638671875, 0.12641334533691406, 0.13266372680664062, 0.1389141082763672, 0.14516448974609375, 0.1514148712158203, 0.15766525268554688, 0.16391563415527344, 0.170166015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 9.0, 11.0, 15.0, 33.0, 60.0, 130.0, 425.0, 1312.0, 4810.0, 15647.0, 54053.0, 241431.0, 533636.0, 145200.0, 36487.0, 10754.0, 3091.0, 940.0, 270.0, 125.0, 46.0, 29.0, 17.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0697021484375, -0.0671529769897461, -0.06460380554199219, -0.06205463409423828, -0.059505462646484375, -0.05695629119873047, -0.05440711975097656, -0.051857948303222656, -0.04930877685546875, -0.046759605407714844, -0.04421043395996094, -0.04166126251220703, -0.039112091064453125, -0.03656291961669922, -0.03401374816894531, -0.031464576721191406, -0.0289154052734375, -0.026366233825683594, -0.023817062377929688, -0.02126789093017578, -0.018718719482421875, -0.01616954803466797, -0.013620376586914062, -0.011071205139160156, -0.00852203369140625, -0.005972862243652344, -0.0034236907958984375, -0.0008745193481445312, 0.001674652099609375, 0.004223823547363281, 0.0067729949951171875, 0.009322166442871094, 0.011871337890625, 0.014420509338378906, 0.016969680786132812, 0.01951885223388672, 0.022068023681640625, 0.02461719512939453, 0.027166366577148438, 0.029715538024902344, 0.03226470947265625, 0.034813880920410156, 0.03736305236816406, 0.03991222381591797, 0.042461395263671875, 0.04501056671142578, 0.04755973815917969, 0.050108909606933594, 0.0526580810546875, 0.055207252502441406, 0.05775642395019531, 0.06030559539794922, 0.06285476684570312, 0.06540393829345703, 0.06795310974121094, 0.07050228118896484, 0.07305145263671875, 0.07560062408447266, 0.07814979553222656, 0.08069896697998047, 0.08324813842773438, 0.08579730987548828, 0.08834648132324219, 0.0908956527709961, 0.09344482421875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 7.0, 14.0, 9.0, 24.0, 32.0, 30.0, 39.0, 72.0, 73.0, 78.0, 100.0, 95.0, 83.0, 73.0, 73.0, 61.0, 24.0, 30.0, 15.0, 11.0, 6.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.609325408935547e-05, -1.5541911125183105e-05, -1.4990568161010742e-05, -1.4439225196838379e-05, -1.3887882232666016e-05, -1.3336539268493652e-05, -1.2785196304321289e-05, -1.2233853340148926e-05, -1.1682510375976562e-05, -1.11311674118042e-05, -1.0579824447631836e-05, -1.0028481483459473e-05, -9.47713851928711e-06, -8.925795555114746e-06, -8.374452590942383e-06, -7.82310962677002e-06, -7.271766662597656e-06, -6.720423698425293e-06, -6.16908073425293e-06, -5.617737770080566e-06, -5.066394805908203e-06, -4.51505184173584e-06, -3.9637088775634766e-06, -3.4123659133911133e-06, -2.86102294921875e-06, -2.3096799850463867e-06, -1.7583370208740234e-06, -1.2069940567016602e-06, -6.556510925292969e-07, -1.043081283569336e-07, 4.470348358154297e-07, 9.98377799987793e-07, 1.5497207641601562e-06, 2.1010637283325195e-06, 2.652406692504883e-06, 3.203749656677246e-06, 3.7550926208496094e-06, 4.306435585021973e-06, 4.857778549194336e-06, 5.409121513366699e-06, 5.9604644775390625e-06, 6.511807441711426e-06, 7.063150405883789e-06, 7.614493370056152e-06, 8.165836334228516e-06, 8.717179298400879e-06, 9.268522262573242e-06, 9.819865226745605e-06, 1.0371208190917969e-05, 1.0922551155090332e-05, 1.1473894119262695e-05, 1.2025237083435059e-05, 1.2576580047607422e-05, 1.3127923011779785e-05, 1.3679265975952148e-05, 1.4230608940124512e-05, 1.4781951904296875e-05, 1.5333294868469238e-05, 1.58846378326416e-05, 1.6435980796813965e-05, 1.6987323760986328e-05, 1.753866672515869e-05, 1.8090009689331055e-05, 1.8641352653503418e-05, 1.919269561767578e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 5.0, 13.0, 10.0, 13.0, 14.0, 35.0, 41.0, 60.0, 108.0, 132.0, 222.0, 367.0, 687.0, 1286.0, 2522.0, 5207.0, 11319.0, 24828.0, 58599.0, 142623.0, 304341.0, 280171.0, 123483.0, 50660.0, 22362.0, 9830.0, 4632.0, 2286.0, 1183.0, 584.0, 380.0, 180.0, 108.0, 85.0, 55.0, 30.0, 26.0, 19.0, 17.0, 11.0, 2.0, 2.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.048248291015625, -0.046736717224121094, -0.04522514343261719, -0.04371356964111328, -0.042201995849609375, -0.04069042205810547, -0.03917884826660156, -0.037667274475097656, -0.03615570068359375, -0.034644126892089844, -0.03313255310058594, -0.03162097930908203, -0.030109405517578125, -0.02859783172607422, -0.027086257934570312, -0.025574684143066406, -0.0240631103515625, -0.022551536560058594, -0.021039962768554688, -0.01952838897705078, -0.018016815185546875, -0.01650524139404297, -0.014993667602539062, -0.013482093811035156, -0.01197052001953125, -0.010458946228027344, -0.008947372436523438, -0.007435798645019531, -0.005924224853515625, -0.004412651062011719, -0.0029010772705078125, -0.0013895034790039062, 0.0001220703125, 0.0016336441040039062, 0.0031452178955078125, 0.004656791687011719, 0.006168365478515625, 0.007679939270019531, 0.009191513061523438, 0.010703086853027344, 0.01221466064453125, 0.013726234436035156, 0.015237808227539062, 0.01674938201904297, 0.018260955810546875, 0.01977252960205078, 0.021284103393554688, 0.022795677185058594, 0.0243072509765625, 0.025818824768066406, 0.027330398559570312, 0.02884197235107422, 0.030353546142578125, 0.03186511993408203, 0.03337669372558594, 0.034888267517089844, 0.03639984130859375, 0.037911415100097656, 0.03942298889160156, 0.04093456268310547, 0.042446136474609375, 0.04395771026611328, 0.04546928405761719, 0.046980857849121094, 0.048492431640625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 5.0, 10.0, 7.0, 17.0, 9.0, 13.0, 11.0, 24.0, 23.0, 39.0, 44.0, 49.0, 52.0, 63.0, 64.0, 75.0, 76.0, 70.0, 58.0, 52.0, 38.0, 37.0, 30.0, 21.0, 23.0, 15.0, 15.0, 13.0, 12.0, 6.0, 6.0, 2.0, 7.0, 1.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04058837890625, -0.038956642150878906, -0.03732490539550781, -0.03569316864013672, -0.034061431884765625, -0.03242969512939453, -0.030797958374023438, -0.029166221618652344, -0.02753448486328125, -0.025902748107910156, -0.024271011352539062, -0.02263927459716797, -0.021007537841796875, -0.01937580108642578, -0.017744064331054688, -0.016112327575683594, -0.0144805908203125, -0.012848854064941406, -0.011217117309570312, -0.009585380554199219, -0.007953643798828125, -0.006321907043457031, -0.0046901702880859375, -0.0030584335327148438, -0.00142669677734375, 0.00020503997802734375, 0.0018367767333984375, 0.0034685134887695312, 0.005100250244140625, 0.006731986999511719, 0.008363723754882812, 0.009995460510253906, 0.011627197265625, 0.013258934020996094, 0.014890670776367188, 0.01652240753173828, 0.018154144287109375, 0.01978588104248047, 0.021417617797851562, 0.023049354553222656, 0.02468109130859375, 0.026312828063964844, 0.027944564819335938, 0.02957630157470703, 0.031208038330078125, 0.03283977508544922, 0.03447151184082031, 0.036103248596191406, 0.0377349853515625, 0.039366722106933594, 0.04099845886230469, 0.04263019561767578, 0.044261932373046875, 0.04589366912841797, 0.04752540588378906, 0.049157142639160156, 0.05078887939453125, 0.052420616149902344, 0.05405235290527344, 0.05568408966064453, 0.057315826416015625, 0.05894756317138672, 0.06057929992675781, 0.062211036682128906, 0.0638427734375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 13.0, 37.0, 88.0, 133.0, 166.0, 197.0, 169.0, 89.0, 52.0, 31.0, 10.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7692256569862366, -0.7388582229614258, -0.708490788936615, -0.6781233549118042, -0.6477559804916382, -0.6173884868621826, -0.5870211124420166, -0.5566536784172058, -0.526286244392395, -0.49591881036758423, -0.46555137634277344, -0.43518397212028503, -0.40481653809547424, -0.37444910407066345, -0.34408169984817505, -0.31371426582336426, -0.28334683179855347, -0.2529793977737427, -0.22261197865009308, -0.19224455952644348, -0.1618771255016327, -0.1315096914768219, -0.1011422723531723, -0.0707748532295227, -0.040407419204711914, -0.01003999263048172, 0.020327433943748474, 0.05069486051797867, 0.08106228709220886, 0.11142972111701965, 0.14179714024066925, 0.17216455936431885, 0.20253205299377441, 0.2328994870185852, 0.263266921043396, 0.2936343252658844, 0.3240017592906952, 0.354369193315506, 0.3847365975379944, 0.4151040315628052, 0.44547146558761597, 0.47583889961242676, 0.5062063336372375, 0.5365737676620483, 0.5669411420822144, 0.5973086357116699, 0.6276760101318359, 0.6580434441566467, 0.6884108781814575, 0.7187783122062683, 0.7491457462310791, 0.7795131802558899, 0.8098806142807007, 0.8402479887008667, 0.8706154227256775, 0.9009828567504883, 0.9313502907752991, 0.9617177248001099, 0.9920851588249207, 1.0224525928497314, 1.0528199672698975, 1.083187460899353, 1.113554835319519, 1.1439223289489746, 1.1742897033691406]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 6.0, 9.0, 10.0, 11.0, 9.0, 19.0, 18.0, 14.0, 19.0, 27.0, 24.0, 34.0, 22.0, 27.0, 29.0, 26.0, 30.0, 25.0, 51.0, 55.0, 36.0, 43.0, 43.0, 43.0, 32.0, 43.0, 39.0, 20.0, 29.0, 31.0, 20.0, 17.0, 28.0, 11.0, 17.0, 13.0, 13.0, 8.0, 10.0, 6.0, 6.0, 3.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.4376823902130127, -0.4242086708545685, -0.41073498129844666, -0.39726126194000244, -0.3837875425815582, -0.370313823223114, -0.3568401336669922, -0.343366414308548, -0.32989269495010376, -0.31641897559165955, -0.3029452860355377, -0.2894715666770935, -0.2759978473186493, -0.2625241279602051, -0.24905043840408325, -0.23557671904563904, -0.22210301458835602, -0.208629310131073, -0.19515559077262878, -0.18168188631534576, -0.16820816695690155, -0.15473446249961853, -0.14126074314117432, -0.1277870386838913, -0.11431332677602768, -0.10083961486816406, -0.08736590296030045, -0.07389219105243683, -0.06041848286986351, -0.04694477468729019, -0.033471062779426575, -0.019997350871562958, -0.006523638963699341, 0.0069500720128417015, 0.020423782989382744, 0.03389749303460121, 0.04737120494246483, 0.06084491312503815, 0.07431862503290176, 0.08779233694076538, 0.101266048848629, 0.11473976075649261, 0.12821346521377563, 0.14168718457221985, 0.15516088902950287, 0.1686345934867859, 0.1821083128452301, 0.19558203220367432, 0.20905573666095734, 0.22252944111824036, 0.23600316047668457, 0.2494768649339676, 0.2629505693912506, 0.2764242887496948, 0.28989800810813904, 0.30337172746658325, 0.3168454170227051, 0.3303191363811493, 0.3437928259372711, 0.35726654529571533, 0.37074026465415955, 0.38421398401260376, 0.3976876735687256, 0.4111613929271698, 0.424635112285614]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 11.0, 18.0, 20.0, 29.0, 48.0, 57.0, 90.0, 160.0, 301.0, 498.0, 926.0, 1814.0, 3586.0, 7394.0, 15461.0, 33440.0, 74647.0, 174964.0, 479842.0, 1390819.0, 1296196.0, 427737.0, 158337.0, 67796.0, 31336.0, 14516.0, 6837.0, 3440.0, 1786.0, 908.0, 493.0, 298.0, 160.0, 106.0, 69.0, 34.0, 22.0, 22.0, 16.0, 15.0, 9.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07769775390625, -0.07501411437988281, -0.07233047485351562, -0.06964683532714844, -0.06696319580078125, -0.06427955627441406, -0.061595916748046875, -0.05891227722167969, -0.0562286376953125, -0.05354499816894531, -0.050861358642578125, -0.04817771911621094, -0.04549407958984375, -0.04281044006347656, -0.040126800537109375, -0.03744316101074219, -0.034759521484375, -0.03207588195800781, -0.029392242431640625, -0.026708602905273438, -0.02402496337890625, -0.021341323852539062, -0.018657684326171875, -0.015974044799804688, -0.0132904052734375, -0.010606765747070312, -0.007923126220703125, -0.0052394866943359375, -0.00255584716796875, 0.0001277923583984375, 0.002811431884765625, 0.0054950714111328125, 0.0081787109375, 0.010862350463867188, 0.013545989990234375, 0.016229629516601562, 0.01891326904296875, 0.021596908569335938, 0.024280548095703125, 0.026964187622070312, 0.0296478271484375, 0.03233146667480469, 0.035015106201171875, 0.03769874572753906, 0.04038238525390625, 0.04306602478027344, 0.045749664306640625, 0.04843330383300781, 0.051116943359375, 0.05380058288574219, 0.056484222412109375, 0.05916786193847656, 0.06185150146484375, 0.06453514099121094, 0.06721878051757812, 0.06990242004394531, 0.0725860595703125, 0.07526969909667969, 0.07795333862304688, 0.08063697814941406, 0.08332061767578125, 0.08600425720214844, 0.08868789672851562, 0.09137153625488281, 0.09405517578125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 14.0, 14.0, 15.0, 11.0, 26.0, 21.0, 32.0, 24.0, 42.0, 28.0, 31.0, 23.0, 46.0, 41.0, 51.0, 49.0, 42.0, 39.0, 43.0, 28.0, 30.0, 34.0, 38.0, 30.0, 29.0, 27.0, 27.0, 21.0, 22.0, 18.0, 18.0, 3.0, 12.0, 12.0, 6.0, 5.0, 10.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06451416015625, -0.06258296966552734, -0.06065177917480469, -0.05872058868408203, -0.056789398193359375, -0.05485820770263672, -0.05292701721191406, -0.050995826721191406, -0.04906463623046875, -0.047133445739746094, -0.04520225524902344, -0.04327106475830078, -0.041339874267578125, -0.03940868377685547, -0.03747749328613281, -0.035546302795410156, -0.0336151123046875, -0.031683921813964844, -0.029752731323242188, -0.02782154083251953, -0.025890350341796875, -0.02395915985107422, -0.022027969360351562, -0.020096778869628906, -0.01816558837890625, -0.016234397888183594, -0.014303207397460938, -0.012372016906738281, -0.010440826416015625, -0.008509635925292969, -0.0065784454345703125, -0.004647254943847656, -0.002716064453125, -0.0007848739624023438, 0.0011463165283203125, 0.0030775070190429688, 0.005008697509765625, 0.006939888000488281, 0.008871078491210938, 0.010802268981933594, 0.01273345947265625, 0.014664649963378906, 0.016595840454101562, 0.01852703094482422, 0.020458221435546875, 0.02238941192626953, 0.024320602416992188, 0.026251792907714844, 0.0281829833984375, 0.030114173889160156, 0.03204536437988281, 0.03397655487060547, 0.035907745361328125, 0.03783893585205078, 0.03977012634277344, 0.041701316833496094, 0.04363250732421875, 0.045563697814941406, 0.04749488830566406, 0.04942607879638672, 0.051357269287109375, 0.05328845977783203, 0.05521965026855469, 0.057150840759277344, 0.05908203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 13.0, 22.0, 43.0, 53.0, 104.0, 140.0, 290.0, 466.0, 867.0, 1680.0, 2998.0, 6077.0, 12265.0, 24470.0, 49708.0, 106767.0, 241818.0, 655306.0, 1652122.0, 884365.0, 305739.0, 130285.0, 60485.0, 28871.0, 14171.0, 7296.0, 3662.0, 1855.0, 980.0, 573.0, 294.0, 194.0, 109.0, 71.0, 40.0, 28.0, 19.0, 12.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0953369140625, -0.09266090393066406, -0.08998489379882812, -0.08730888366699219, -0.08463287353515625, -0.08195686340332031, -0.07928085327148438, -0.07660484313964844, -0.0739288330078125, -0.07125282287597656, -0.06857681274414062, -0.06590080261230469, -0.06322479248046875, -0.06054878234863281, -0.057872772216796875, -0.05519676208496094, -0.052520751953125, -0.04984474182128906, -0.047168731689453125, -0.04449272155761719, -0.04181671142578125, -0.03914070129394531, -0.036464691162109375, -0.03378868103027344, -0.0311126708984375, -0.028436660766601562, -0.025760650634765625, -0.023084640502929688, -0.02040863037109375, -0.017732620239257812, -0.015056610107421875, -0.012380599975585938, -0.00970458984375, -0.0070285797119140625, -0.004352569580078125, -0.0016765594482421875, 0.00099945068359375, 0.0036754608154296875, 0.006351470947265625, 0.009027481079101562, 0.0117034912109375, 0.014379501342773438, 0.017055511474609375, 0.019731521606445312, 0.02240753173828125, 0.025083541870117188, 0.027759552001953125, 0.030435562133789062, 0.033111572265625, 0.03578758239746094, 0.038463592529296875, 0.04113960266113281, 0.04381561279296875, 0.04649162292480469, 0.049167633056640625, 0.05184364318847656, 0.0545196533203125, 0.05719566345214844, 0.059871673583984375, 0.06254768371582031, 0.06522369384765625, 0.06789970397949219, 0.07057571411132812, 0.07325172424316406, 0.075927734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 8.0, 18.0, 18.0, 17.0, 29.0, 22.0, 48.0, 31.0, 66.0, 70.0, 100.0, 104.0, 185.0, 243.0, 311.0, 416.0, 509.0, 485.0, 355.0, 256.0, 173.0, 139.0, 100.0, 88.0, 60.0, 60.0, 35.0, 28.0, 26.0, 13.0, 18.0, 6.0, 7.0, 10.0, 3.0, 4.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10858154296875, -0.10491275787353516, -0.10124397277832031, -0.09757518768310547, -0.09390640258789062, -0.09023761749267578, -0.08656883239746094, -0.0829000473022461, -0.07923126220703125, -0.0755624771118164, -0.07189369201660156, -0.06822490692138672, -0.06455612182617188, -0.06088733673095703, -0.05721855163574219, -0.053549766540527344, -0.0498809814453125, -0.046212196350097656, -0.04254341125488281, -0.03887462615966797, -0.035205841064453125, -0.03153705596923828, -0.027868270874023438, -0.024199485778808594, -0.02053070068359375, -0.016861915588378906, -0.013193130493164062, -0.009524345397949219, -0.005855560302734375, -0.0021867752075195312, 0.0014820098876953125, 0.005150794982910156, 0.008819580078125, 0.012488365173339844, 0.016157150268554688, 0.01982593536376953, 0.023494720458984375, 0.02716350555419922, 0.030832290649414062, 0.034501075744628906, 0.03816986083984375, 0.041838645935058594, 0.04550743103027344, 0.04917621612548828, 0.052845001220703125, 0.05651378631591797, 0.06018257141113281, 0.06385135650634766, 0.0675201416015625, 0.07118892669677734, 0.07485771179199219, 0.07852649688720703, 0.08219528198242188, 0.08586406707763672, 0.08953285217285156, 0.0932016372680664, 0.09687042236328125, 0.1005392074584961, 0.10420799255371094, 0.10787677764892578, 0.11154556274414062, 0.11521434783935547, 0.11888313293457031, 0.12255191802978516, 0.126220703125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 7.0, 8.0, 8.0, 23.0, 30.0, 50.0, 50.0, 75.0, 97.0, 84.0, 98.0, 103.0, 90.0, 59.0, 67.0, 63.0, 36.0, 17.0, 7.0, 11.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6537379026412964, -0.6325673460960388, -0.6113967895507812, -0.5902261734008789, -0.5690556168556213, -0.5478850603103638, -0.5267145037651062, -0.5055439472198486, -0.4843733608722687, -0.4632028043270111, -0.44203221797943115, -0.4208616614341736, -0.399691104888916, -0.37852051854133606, -0.3573499619960785, -0.33617937564849854, -0.31500881910324097, -0.2938382625579834, -0.27266767621040344, -0.2514971196651459, -0.2303265482187271, -0.20915597677230835, -0.18798542022705078, -0.16681484878063202, -0.14564427733421326, -0.1244737058877945, -0.10330314189195633, -0.08213257789611816, -0.0609620064496994, -0.03979143500328064, -0.01862087845802307, 0.002549692988395691, 0.023720204830169678, 0.04489077255129814, 0.0660613402724266, 0.08723190426826477, 0.10840247571468353, 0.1295730471611023, 0.15074360370635986, 0.17191417515277863, 0.1930847465991974, 0.21425531804561615, 0.2354258894920349, 0.2565964460372925, 0.27776700258255005, 0.29893758893013, 0.3201081454753876, 0.34127873182296753, 0.3624492883682251, 0.38361984491348267, 0.4047904312610626, 0.4259609878063202, 0.44713157415390015, 0.4683021306991577, 0.4894726872444153, 0.5106432437896729, 0.5318138599395752, 0.5529844164848328, 0.5741549730300903, 0.5953255891799927, 0.6164961457252502, 0.6376667022705078, 0.6588372588157654, 0.680007815361023, 0.7011783719062805]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 6.0, 5.0, 7.0, 5.0, 23.0, 13.0, 13.0, 20.0, 25.0, 24.0, 24.0, 29.0, 35.0, 33.0, 35.0, 33.0, 34.0, 42.0, 43.0, 37.0, 42.0, 42.0, 35.0, 44.0, 40.0, 38.0, 39.0, 20.0, 32.0, 33.0, 17.0, 22.0, 22.0, 15.0, 9.0, 5.0, 13.0, 12.0, 7.0, 7.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.3592570424079895, -0.34792518615722656, -0.3365933299064636, -0.3252614736557007, -0.31392964720726013, -0.3025977909564972, -0.29126593470573425, -0.2799340784549713, -0.26860225200653076, -0.2572703957557678, -0.24593855440616608, -0.23460669815540314, -0.2232748568058014, -0.21194300055503845, -0.2006111443042755, -0.18927928805351257, -0.17794743180274963, -0.1666155755519867, -0.15528373420238495, -0.143951877951622, -0.13262003660202026, -0.12128818035125732, -0.10995632410049438, -0.09862447530031204, -0.0872926265001297, -0.07596077769994736, -0.06462892889976501, -0.053297072649002075, -0.04196522384881973, -0.03063337504863739, -0.01930151879787445, -0.007969669997692108, 0.0033621788024902344, 0.014694029465317726, 0.026025880128145218, 0.03735773265361786, 0.0486895814538002, 0.060021430253982544, 0.07135328650474548, 0.08268513530492783, 0.09401698410511017, 0.10534883290529251, 0.11668068170547485, 0.1280125379562378, 0.13934439420700073, 0.15067623555660248, 0.16200809180736542, 0.17333993315696716, 0.1846717894077301, 0.19600364565849304, 0.2073354870080948, 0.21866734325885773, 0.22999918460845947, 0.2413310408592224, 0.25266289710998535, 0.2639947533607483, 0.27532660961151123, 0.28665846586227417, 0.2979903221130371, 0.30932217836380005, 0.3206540048122406, 0.33198586106300354, 0.3433177173137665, 0.3546495735645294, 0.36598140001296997]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 7.0, 9.0, 9.0, 20.0, 34.0, 51.0, 74.0, 98.0, 166.0, 231.0, 302.0, 479.0, 667.0, 906.0, 1369.0, 1749.0, 2516.0, 3359.0, 4955.0, 6664.0, 9492.0, 14605.0, 23792.0, 46993.0, 123014.0, 306828.0, 282633.0, 107380.0, 42559.0, 22110.0, 13700.0, 9201.0, 6315.0, 4596.0, 3327.0, 2399.0, 1843.0, 1181.0, 905.0, 630.0, 444.0, 309.0, 210.0, 147.0, 116.0, 65.0, 33.0, 23.0, 19.0, 13.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0858154296875, -0.08284950256347656, -0.07988357543945312, -0.07691764831542969, -0.07395172119140625, -0.07098579406738281, -0.06801986694335938, -0.06505393981933594, -0.0620880126953125, -0.05912208557128906, -0.056156158447265625, -0.05319023132324219, -0.05022430419921875, -0.04725837707519531, -0.044292449951171875, -0.04132652282714844, -0.038360595703125, -0.03539466857910156, -0.032428741455078125, -0.029462814331054688, -0.02649688720703125, -0.023530960083007812, -0.020565032958984375, -0.017599105834960938, -0.0146331787109375, -0.011667251586914062, -0.008701324462890625, -0.0057353973388671875, -0.00276947021484375, 0.0001964569091796875, 0.003162384033203125, 0.0061283111572265625, 0.00909423828125, 0.012060165405273438, 0.015026092529296875, 0.017992019653320312, 0.02095794677734375, 0.023923873901367188, 0.026889801025390625, 0.029855728149414062, 0.0328216552734375, 0.03578758239746094, 0.038753509521484375, 0.04171943664550781, 0.04468536376953125, 0.04765129089355469, 0.050617218017578125, 0.05358314514160156, 0.056549072265625, 0.05951499938964844, 0.062480926513671875, 0.06544685363769531, 0.06841278076171875, 0.07137870788574219, 0.07434463500976562, 0.07731056213378906, 0.0802764892578125, 0.08324241638183594, 0.08620834350585938, 0.08917427062988281, 0.09214019775390625, 0.09510612487792969, 0.09807205200195312, 0.10103797912597656, 0.10400390625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 5.0, 8.0, 4.0, 8.0, 9.0, 18.0, 12.0, 20.0, 19.0, 24.0, 37.0, 24.0, 25.0, 32.0, 28.0, 32.0, 38.0, 38.0, 42.0, 37.0, 48.0, 41.0, 38.0, 33.0, 42.0, 34.0, 30.0, 28.0, 31.0, 27.0, 24.0, 24.0, 19.0, 23.0, 19.0, 10.0, 12.0, 9.0, 10.0, 5.0, 8.0, 8.0, 4.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.06451416015625, -0.0626683235168457, -0.060822486877441406, -0.05897665023803711, -0.05713081359863281, -0.055284976959228516, -0.05343914031982422, -0.05159330368041992, -0.049747467041015625, -0.04790163040161133, -0.04605579376220703, -0.044209957122802734, -0.04236412048339844, -0.04051828384399414, -0.038672447204589844, -0.03682661056518555, -0.03498077392578125, -0.03313493728637695, -0.031289100646972656, -0.02944326400756836, -0.027597427368164062, -0.025751590728759766, -0.02390575408935547, -0.022059917449951172, -0.020214080810546875, -0.018368244171142578, -0.01652240753173828, -0.014676570892333984, -0.012830734252929688, -0.01098489761352539, -0.009139060974121094, -0.007293224334716797, -0.0054473876953125, -0.003601551055908203, -0.0017557144165039062, 9.012222290039062e-05, 0.0019359588623046875, 0.0037817955017089844, 0.005627632141113281, 0.007473468780517578, 0.009319305419921875, 0.011165142059326172, 0.013010978698730469, 0.014856815338134766, 0.016702651977539062, 0.01854848861694336, 0.020394325256347656, 0.022240161895751953, 0.02408599853515625, 0.025931835174560547, 0.027777671813964844, 0.02962350845336914, 0.03146934509277344, 0.033315181732177734, 0.03516101837158203, 0.03700685501098633, 0.038852691650390625, 0.04069852828979492, 0.04254436492919922, 0.044390201568603516, 0.04623603820800781, 0.04808187484741211, 0.049927711486816406, 0.0517735481262207, 0.053619384765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 6.0, 3.0, 7.0, 3.0, 5.0, 15.0, 19.0, 28.0, 37.0, 42.0, 60.0, 94.0, 172.0, 241.0, 432.0, 899.0, 2004.0, 4828.0, 11774.0, 28912.0, 85595.0, 426469.0, 367379.0, 74747.0, 26110.0, 10604.0, 4439.0, 1773.0, 798.0, 413.0, 215.0, 140.0, 85.0, 50.0, 45.0, 40.0, 25.0, 9.0, 14.0, 10.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1719970703125, -0.16643905639648438, -0.16088104248046875, -0.15532302856445312, -0.1497650146484375, -0.14420700073242188, -0.13864898681640625, -0.13309097290039062, -0.127532958984375, -0.12197494506835938, -0.11641693115234375, -0.11085891723632812, -0.1053009033203125, -0.09974288940429688, -0.09418487548828125, -0.08862686157226562, -0.08306884765625, -0.07751083374023438, -0.07195281982421875, -0.06639480590820312, -0.0608367919921875, -0.055278778076171875, -0.04972076416015625, -0.044162750244140625, -0.038604736328125, -0.033046722412109375, -0.02748870849609375, -0.021930694580078125, -0.0163726806640625, -0.010814666748046875, -0.00525665283203125, 0.000301361083984375, 0.005859375, 0.011417388916015625, 0.01697540283203125, 0.022533416748046875, 0.0280914306640625, 0.033649444580078125, 0.03920745849609375, 0.044765472412109375, 0.050323486328125, 0.055881500244140625, 0.06143951416015625, 0.06699752807617188, 0.0725555419921875, 0.07811355590820312, 0.08367156982421875, 0.08922958374023438, 0.09478759765625, 0.10034561157226562, 0.10590362548828125, 0.11146163940429688, 0.1170196533203125, 0.12257766723632812, 0.12813568115234375, 0.13369369506835938, 0.139251708984375, 0.14480972290039062, 0.15036773681640625, 0.15592575073242188, 0.1614837646484375, 0.16704177856445312, 0.17259979248046875, 0.17815780639648438, 0.1837158203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 9.0, 9.0, 2.0, 9.0, 11.0, 8.0, 9.0, 16.0, 21.0, 20.0, 33.0, 23.0, 16.0, 34.0, 27.0, 31.0, 35.0, 44.0, 46.0, 36.0, 38.0, 39.0, 35.0, 41.0, 55.0, 46.0, 39.0, 36.0, 31.0, 30.0, 21.0, 21.0, 19.0, 18.0, 17.0, 14.0, 14.0, 5.0, 10.0, 3.0, 11.0, 9.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1522216796875, -0.14736175537109375, -0.1425018310546875, -0.13764190673828125, -0.132781982421875, -0.12792205810546875, -0.1230621337890625, -0.11820220947265625, -0.11334228515625, -0.10848236083984375, -0.1036224365234375, -0.09876251220703125, -0.093902587890625, -0.08904266357421875, -0.0841827392578125, -0.07932281494140625, -0.074462890625, -0.06960296630859375, -0.0647430419921875, -0.05988311767578125, -0.055023193359375, -0.05016326904296875, -0.0453033447265625, -0.04044342041015625, -0.03558349609375, -0.03072357177734375, -0.0258636474609375, -0.02100372314453125, -0.016143798828125, -0.01128387451171875, -0.0064239501953125, -0.00156402587890625, 0.0032958984375, 0.00815582275390625, 0.0130157470703125, 0.01787567138671875, 0.022735595703125, 0.02759552001953125, 0.0324554443359375, 0.03731536865234375, 0.04217529296875, 0.04703521728515625, 0.0518951416015625, 0.05675506591796875, 0.061614990234375, 0.06647491455078125, 0.0713348388671875, 0.07619476318359375, 0.0810546875, 0.08591461181640625, 0.0907745361328125, 0.09563446044921875, 0.100494384765625, 0.10535430908203125, 0.1102142333984375, 0.11507415771484375, 0.11993408203125, 0.12479400634765625, 0.1296539306640625, 0.13451385498046875, 0.139373779296875, 0.14423370361328125, 0.1490936279296875, 0.15395355224609375, 0.1588134765625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 8.0, 15.0, 22.0, 37.0, 60.0, 80.0, 156.0, 253.0, 437.0, 648.0, 1133.0, 1839.0, 2944.0, 4822.0, 7853.0, 13739.0, 27855.0, 69603.0, 217873.0, 393962.0, 187463.0, 61206.0, 24736.0, 12752.0, 7392.0, 4511.0, 2759.0, 1717.0, 1083.0, 610.0, 346.0, 224.0, 147.0, 88.0, 53.0, 43.0, 28.0, 19.0, 12.0, 2.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.045928955078125, -0.0445551872253418, -0.043181419372558594, -0.04180765151977539, -0.04043388366699219, -0.039060115814208984, -0.03768634796142578, -0.03631258010864258, -0.034938812255859375, -0.03356504440307617, -0.03219127655029297, -0.030817508697509766, -0.029443740844726562, -0.02806997299194336, -0.026696205139160156, -0.025322437286376953, -0.02394866943359375, -0.022574901580810547, -0.021201133728027344, -0.01982736587524414, -0.018453598022460938, -0.017079830169677734, -0.01570606231689453, -0.014332294464111328, -0.012958526611328125, -0.011584758758544922, -0.010210990905761719, -0.008837223052978516, -0.0074634552001953125, -0.006089687347412109, -0.004715919494628906, -0.003342151641845703, -0.0019683837890625, -0.0005946159362792969, 0.0007791519165039062, 0.0021529197692871094, 0.0035266876220703125, 0.004900455474853516, 0.006274223327636719, 0.007647991180419922, 0.009021759033203125, 0.010395526885986328, 0.011769294738769531, 0.013143062591552734, 0.014516830444335938, 0.01589059829711914, 0.017264366149902344, 0.018638134002685547, 0.02001190185546875, 0.021385669708251953, 0.022759437561035156, 0.02413320541381836, 0.025506973266601562, 0.026880741119384766, 0.02825450897216797, 0.029628276824951172, 0.031002044677734375, 0.03237581253051758, 0.03374958038330078, 0.035123348236083984, 0.03649711608886719, 0.03787088394165039, 0.039244651794433594, 0.0406184196472168, 0.0419921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 6.0, 3.0, 7.0, 6.0, 14.0, 22.0, 21.0, 33.0, 53.0, 80.0, 92.0, 117.0, 109.0, 112.0, 98.0, 60.0, 35.0, 40.0, 17.0, 19.0, 5.0, 10.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0205974578857422e-05, -1.955777406692505e-05, -1.8909573554992676e-05, -1.8261373043060303e-05, -1.761317253112793e-05, -1.6964972019195557e-05, -1.6316771507263184e-05, -1.566857099533081e-05, -1.5020370483398438e-05, -1.4372169971466064e-05, -1.3723969459533691e-05, -1.3075768947601318e-05, -1.2427568435668945e-05, -1.1779367923736572e-05, -1.11311674118042e-05, -1.0482966899871826e-05, -9.834766387939453e-06, -9.18656587600708e-06, -8.538365364074707e-06, -7.890164852142334e-06, -7.241964340209961e-06, -6.593763828277588e-06, -5.945563316345215e-06, -5.297362804412842e-06, -4.649162292480469e-06, -4.000961780548096e-06, -3.3527612686157227e-06, -2.7045607566833496e-06, -2.0563602447509766e-06, -1.4081597328186035e-06, -7.599592208862305e-07, -1.1175870895385742e-07, 5.364418029785156e-07, 1.1846423149108887e-06, 1.8328428268432617e-06, 2.4810433387756348e-06, 3.129243850708008e-06, 3.777444362640381e-06, 4.425644874572754e-06, 5.073845386505127e-06, 5.7220458984375e-06, 6.370246410369873e-06, 7.018446922302246e-06, 7.666647434234619e-06, 8.314847946166992e-06, 8.963048458099365e-06, 9.611248970031738e-06, 1.0259449481964111e-05, 1.0907649993896484e-05, 1.1555850505828857e-05, 1.220405101776123e-05, 1.2852251529693604e-05, 1.3500452041625977e-05, 1.414865255355835e-05, 1.4796853065490723e-05, 1.5445053577423096e-05, 1.609325408935547e-05, 1.6741454601287842e-05, 1.7389655113220215e-05, 1.8037855625152588e-05, 1.868605613708496e-05, 1.9334256649017334e-05, 1.9982457160949707e-05, 2.063065767288208e-05, 2.1278858184814453e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 7.0, 10.0, 8.0, 19.0, 17.0, 32.0, 43.0, 70.0, 103.0, 166.0, 255.0, 425.0, 875.0, 1705.0, 3175.0, 6099.0, 12757.0, 28552.0, 81552.0, 247954.0, 377174.0, 184813.0, 59467.0, 22002.0, 10272.0, 5183.0, 2708.0, 1338.0, 731.0, 401.0, 211.0, 144.0, 81.0, 57.0, 39.0, 25.0, 15.0, 19.0, 5.0, 9.0, 5.0, 7.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.04620361328125, -0.044730186462402344, -0.04325675964355469, -0.04178333282470703, -0.040309906005859375, -0.03883647918701172, -0.03736305236816406, -0.035889625549316406, -0.03441619873046875, -0.032942771911621094, -0.03146934509277344, -0.02999591827392578, -0.028522491455078125, -0.02704906463623047, -0.025575637817382812, -0.024102210998535156, -0.0226287841796875, -0.021155357360839844, -0.019681930541992188, -0.01820850372314453, -0.016735076904296875, -0.015261650085449219, -0.013788223266601562, -0.012314796447753906, -0.01084136962890625, -0.009367942810058594, -0.007894515991210938, -0.006421089172363281, -0.004947662353515625, -0.0034742355346679688, -0.0020008087158203125, -0.0005273818969726562, 0.000946044921875, 0.0024194717407226562, 0.0038928985595703125, 0.005366325378417969, 0.006839752197265625, 0.008313179016113281, 0.009786605834960938, 0.011260032653808594, 0.01273345947265625, 0.014206886291503906, 0.015680313110351562, 0.01715373992919922, 0.018627166748046875, 0.02010059356689453, 0.021574020385742188, 0.023047447204589844, 0.0245208740234375, 0.025994300842285156, 0.027467727661132812, 0.02894115447998047, 0.030414581298828125, 0.03188800811767578, 0.03336143493652344, 0.034834861755371094, 0.03630828857421875, 0.037781715393066406, 0.03925514221191406, 0.04072856903076172, 0.042201995849609375, 0.04367542266845703, 0.04514884948730469, 0.046622276306152344, 0.048095703125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 9.0, 6.0, 9.0, 12.0, 9.0, 14.0, 26.0, 43.0, 41.0, 75.0, 77.0, 76.0, 95.0, 93.0, 85.0, 74.0, 54.0, 36.0, 36.0, 20.0, 20.0, 18.0, 18.0, 17.0, 5.0, 6.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042755126953125, -0.041228294372558594, -0.03970146179199219, -0.03817462921142578, -0.036647796630859375, -0.03512096405029297, -0.03359413146972656, -0.032067298889160156, -0.03054046630859375, -0.029013633728027344, -0.027486801147460938, -0.02595996856689453, -0.024433135986328125, -0.02290630340576172, -0.021379470825195312, -0.019852638244628906, -0.0183258056640625, -0.016798973083496094, -0.015272140502929688, -0.013745307922363281, -0.012218475341796875, -0.010691642761230469, -0.009164810180664062, -0.007637977600097656, -0.00611114501953125, -0.004584312438964844, -0.0030574798583984375, -0.0015306472778320312, -3.814697265625e-06, 0.0015230178833007812, 0.0030498504638671875, 0.004576683044433594, 0.006103515625, 0.007630348205566406, 0.009157180786132812, 0.010684013366699219, 0.012210845947265625, 0.013737678527832031, 0.015264511108398438, 0.016791343688964844, 0.01831817626953125, 0.019845008850097656, 0.021371841430664062, 0.02289867401123047, 0.024425506591796875, 0.02595233917236328, 0.027479171752929688, 0.029006004333496094, 0.0305328369140625, 0.032059669494628906, 0.03358650207519531, 0.03511333465576172, 0.036640167236328125, 0.03816699981689453, 0.03969383239746094, 0.041220664978027344, 0.04274749755859375, 0.044274330139160156, 0.04580116271972656, 0.04732799530029297, 0.048854827880859375, 0.05038166046142578, 0.05190849304199219, 0.053435325622558594, 0.054962158203125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 8.0, 10.0, 32.0, 48.0, 78.0, 103.0, 144.0, 135.0, 138.0, 113.0, 73.0, 51.0, 28.0, 16.0, 12.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.9762471914291382, -0.9521121382713318, -0.9279770851135254, -0.9038420915603638, -0.8797070384025574, -0.855571985244751, -0.8314369916915894, -0.807301938533783, -0.7831668853759766, -0.7590318322181702, -0.7348967790603638, -0.7107617855072021, -0.6866267323493958, -0.6624916791915894, -0.6383566856384277, -0.6142216324806213, -0.5900865793228149, -0.5659515261650085, -0.5418164730072021, -0.5176814794540405, -0.49354642629623413, -0.46941137313842773, -0.4452763497829437, -0.4211413264274597, -0.3970062732696533, -0.3728712201118469, -0.3487361967563629, -0.3246011734008789, -0.3004661202430725, -0.2763310670852661, -0.2521960437297821, -0.2280610054731369, -0.2039259672164917, -0.1797909289598465, -0.1556558907032013, -0.1315208524465561, -0.10738581418991089, -0.08325077593326569, -0.05911573767662048, -0.03498069941997528, -0.010845661163330078, 0.013289377093315125, 0.03742441534996033, 0.06155945360660553, 0.08569449186325073, 0.10982953011989594, 0.13396456837654114, 0.15809960663318634, 0.18223464488983154, 0.20636968314647675, 0.23050472140312195, 0.25463974475860596, 0.27877479791641235, 0.30290985107421875, 0.32704487442970276, 0.35117989778518677, 0.37531495094299316, 0.39945000410079956, 0.42358502745628357, 0.4477200508117676, 0.471855103969574, 0.49599015712738037, 0.520125150680542, 0.5442602038383484, 0.5683952569961548]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 6.0, 2.0, 7.0, 8.0, 17.0, 11.0, 18.0, 14.0, 18.0, 19.0, 22.0, 27.0, 34.0, 21.0, 30.0, 40.0, 44.0, 46.0, 40.0, 45.0, 51.0, 51.0, 42.0, 46.0, 43.0, 40.0, 40.0, 27.0, 23.0, 34.0, 18.0, 25.0, 18.0, 18.0, 10.0, 11.0, 8.0, 7.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.4616820216178894, -0.4485746920108795, -0.43546736240386963, -0.42236006259918213, -0.40925273299217224, -0.39614540338516235, -0.38303810358047485, -0.36993077397346497, -0.3568234443664551, -0.3437161147594452, -0.3306087851524353, -0.3175014853477478, -0.3043941557407379, -0.291286826133728, -0.2781795263290405, -0.26507219672203064, -0.25196486711502075, -0.23885753750801086, -0.22575022280216217, -0.21264290809631348, -0.1995355784893036, -0.1864282488822937, -0.173320934176445, -0.1602136194705963, -0.14710628986358643, -0.13399896025657654, -0.12089164555072784, -0.10778432339429855, -0.09467700123786926, -0.08156967908143997, -0.06846235692501068, -0.05535503476858139, -0.0422477126121521, -0.02914039045572281, -0.016033068299293518, -0.0029257461428642273, 0.010181576013565063, 0.023288898169994354, 0.036396220326423645, 0.049503542482852936, 0.06261086463928223, 0.07571818679571152, 0.08882550895214081, 0.1019328311085701, 0.11504015326499939, 0.12814748287200928, 0.14125479757785797, 0.15436211228370667, 0.16746944189071655, 0.18057677149772644, 0.19368408620357513, 0.20679140090942383, 0.21989873051643372, 0.2330060601234436, 0.2461133748292923, 0.259220689535141, 0.2723280191421509, 0.28543534874916077, 0.29854267835617065, 0.31164997816085815, 0.32475730776786804, 0.33786463737487793, 0.35097193717956543, 0.3640792667865753, 0.3771865963935852]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 1.0, 7.0, 7.0, 6.0, 9.0, 14.0, 27.0, 29.0, 63.0, 65.0, 107.0, 193.0, 314.0, 557.0, 1065.0, 2066.0, 4127.0, 8268.0, 17335.0, 37143.0, 85546.0, 227379.0, 765036.0, 1733876.0, 880342.0, 260882.0, 94215.0, 39942.0, 18259.0, 8618.0, 4225.0, 2092.0, 1048.0, 555.0, 323.0, 192.0, 117.0, 71.0, 55.0, 34.0, 22.0, 21.0, 15.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.08978271484375, -0.08710670471191406, -0.08443069458007812, -0.08175468444824219, -0.07907867431640625, -0.07640266418457031, -0.07372665405273438, -0.07105064392089844, -0.0683746337890625, -0.06569862365722656, -0.06302261352539062, -0.06034660339355469, -0.05767059326171875, -0.05499458312988281, -0.052318572998046875, -0.04964256286621094, -0.046966552734375, -0.04429054260253906, -0.041614532470703125, -0.03893852233886719, -0.03626251220703125, -0.03358650207519531, -0.030910491943359375, -0.028234481811523438, -0.0255584716796875, -0.022882461547851562, -0.020206451416015625, -0.017530441284179688, -0.01485443115234375, -0.012178421020507812, -0.009502410888671875, -0.0068264007568359375, -0.004150390625, -0.0014743804931640625, 0.001201629638671875, 0.0038776397705078125, 0.00655364990234375, 0.009229660034179688, 0.011905670166015625, 0.014581680297851562, 0.0172576904296875, 0.019933700561523438, 0.022609710693359375, 0.025285720825195312, 0.02796173095703125, 0.030637741088867188, 0.033313751220703125, 0.03598976135253906, 0.038665771484375, 0.04134178161621094, 0.044017791748046875, 0.04669380187988281, 0.04936981201171875, 0.05204582214355469, 0.054721832275390625, 0.05739784240722656, 0.0600738525390625, 0.06274986267089844, 0.06542587280273438, 0.06810188293457031, 0.07077789306640625, 0.07345390319824219, 0.07612991333007812, 0.07880592346191406, 0.08148193359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 8.0, 5.0, 5.0, 11.0, 16.0, 17.0, 18.0, 24.0, 23.0, 18.0, 31.0, 25.0, 30.0, 33.0, 47.0, 32.0, 34.0, 46.0, 38.0, 41.0, 44.0, 29.0, 40.0, 28.0, 44.0, 29.0, 32.0, 27.0, 34.0, 32.0, 22.0, 18.0, 25.0, 9.0, 13.0, 16.0, 11.0, 8.0, 5.0, 10.0, 1.0, 4.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0631103515625, -0.06129598617553711, -0.05948162078857422, -0.05766725540161133, -0.05585289001464844, -0.05403852462768555, -0.052224159240722656, -0.050409793853759766, -0.048595428466796875, -0.046781063079833984, -0.044966697692871094, -0.0431523323059082, -0.04133796691894531, -0.03952360153198242, -0.03770923614501953, -0.03589487075805664, -0.03408050537109375, -0.03226613998413086, -0.03045177459716797, -0.028637409210205078, -0.026823043823242188, -0.025008678436279297, -0.023194313049316406, -0.021379947662353516, -0.019565582275390625, -0.017751216888427734, -0.015936851501464844, -0.014122486114501953, -0.012308120727539062, -0.010493755340576172, -0.008679389953613281, -0.006865024566650391, -0.0050506591796875, -0.0032362937927246094, -0.0014219284057617188, 0.0003924369812011719, 0.0022068023681640625, 0.004021167755126953, 0.005835533142089844, 0.007649898529052734, 0.009464263916015625, 0.011278629302978516, 0.013092994689941406, 0.014907360076904297, 0.016721725463867188, 0.018536090850830078, 0.02035045623779297, 0.02216482162475586, 0.02397918701171875, 0.02579355239868164, 0.02760791778564453, 0.029422283172607422, 0.031236648559570312, 0.0330510139465332, 0.034865379333496094, 0.036679744720458984, 0.038494110107421875, 0.040308475494384766, 0.042122840881347656, 0.04393720626831055, 0.04575157165527344, 0.04756593704223633, 0.04938030242919922, 0.05119466781616211, 0.053009033203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 11.0, 14.0, 17.0, 20.0, 43.0, 68.0, 93.0, 176.0, 322.0, 611.0, 1131.0, 2183.0, 4725.0, 10273.0, 23629.0, 56655.0, 144599.0, 445675.0, 1743557.0, 1257429.0, 314668.0, 109739.0, 43657.0, 18850.0, 8223.0, 3829.0, 1869.0, 960.0, 522.0, 250.0, 178.0, 102.0, 62.0, 52.0, 35.0, 16.0, 16.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09344196319580078, -0.09020423889160156, -0.08696651458740234, -0.08372879028320312, -0.0804910659790039, -0.07725334167480469, -0.07401561737060547, -0.07077789306640625, -0.06754016876220703, -0.06430244445800781, -0.061064720153808594, -0.057826995849609375, -0.054589271545410156, -0.05135154724121094, -0.04811382293701172, -0.0448760986328125, -0.04163837432861328, -0.03840065002441406, -0.035162925720214844, -0.031925201416015625, -0.028687477111816406, -0.025449752807617188, -0.02221202850341797, -0.01897430419921875, -0.01573657989501953, -0.012498855590820312, -0.009261131286621094, -0.006023406982421875, -0.0027856826782226562, 0.0004520416259765625, 0.0036897659301757812, 0.006927490234375, 0.010165214538574219, 0.013402938842773438, 0.016640663146972656, 0.019878387451171875, 0.023116111755371094, 0.026353836059570312, 0.02959156036376953, 0.03282928466796875, 0.03606700897216797, 0.03930473327636719, 0.042542457580566406, 0.045780181884765625, 0.049017906188964844, 0.05225563049316406, 0.05549335479736328, 0.0587310791015625, 0.06196880340576172, 0.06520652770996094, 0.06844425201416016, 0.07168197631835938, 0.0749197006225586, 0.07815742492675781, 0.08139514923095703, 0.08463287353515625, 0.08787059783935547, 0.09110832214355469, 0.0943460464477539, 0.09758377075195312, 0.10082149505615234, 0.10405921936035156, 0.10729694366455078, 0.11053466796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 3.0, 8.0, 14.0, 18.0, 17.0, 26.0, 34.0, 44.0, 60.0, 60.0, 92.0, 112.0, 162.0, 228.0, 347.0, 487.0, 524.0, 503.0, 373.0, 257.0, 184.0, 111.0, 74.0, 83.0, 52.0, 38.0, 34.0, 25.0, 13.0, 21.0, 14.0, 15.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.12353515625, -0.1197509765625, -0.115966796875, -0.1121826171875, -0.1083984375, -0.1046142578125, -0.100830078125, -0.0970458984375, -0.09326171875, -0.0894775390625, -0.085693359375, -0.0819091796875, -0.078125, -0.0743408203125, -0.070556640625, -0.0667724609375, -0.06298828125, -0.0592041015625, -0.055419921875, -0.0516357421875, -0.0478515625, -0.0440673828125, -0.040283203125, -0.0364990234375, -0.03271484375, -0.0289306640625, -0.025146484375, -0.0213623046875, -0.017578125, -0.0137939453125, -0.010009765625, -0.0062255859375, -0.00244140625, 0.0013427734375, 0.005126953125, 0.0089111328125, 0.0126953125, 0.0164794921875, 0.020263671875, 0.0240478515625, 0.02783203125, 0.0316162109375, 0.035400390625, 0.0391845703125, 0.04296875, 0.0467529296875, 0.050537109375, 0.0543212890625, 0.05810546875, 0.0618896484375, 0.065673828125, 0.0694580078125, 0.0732421875, 0.0770263671875, 0.080810546875, 0.0845947265625, 0.08837890625, 0.0921630859375, 0.095947265625, 0.0997314453125, 0.103515625, 0.1072998046875, 0.111083984375, 0.1148681640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 7.0, 3.0, 6.0, 7.0, 16.0, 23.0, 42.0, 65.0, 73.0, 99.0, 122.0, 145.0, 114.0, 98.0, 71.0, 58.0, 28.0, 12.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8450343608856201, -0.8171789050102234, -0.7893233895301819, -0.7614679336547852, -0.7336124181747437, -0.7057569622993469, -0.6779014468193054, -0.6500459909439087, -0.6221904754638672, -0.5943350195884705, -0.566479504108429, -0.5386240482330322, -0.5107685327529907, -0.482913076877594, -0.4550575613975525, -0.42720210552215576, -0.39934661984443665, -0.37149113416671753, -0.3436356484889984, -0.3157801628112793, -0.2879246771335602, -0.26006919145584106, -0.23221372067928314, -0.20435823500156403, -0.1765027493238449, -0.1486472636461258, -0.12079177796840668, -0.09293629974126816, -0.06508081406354904, -0.03722533583641052, -0.009369850158691406, 0.01848563551902771, 0.046341121196746826, 0.07419660687446594, 0.10205209255218506, 0.12990757822990417, 0.1577630639076233, 0.1856185346841812, 0.21347402036190033, 0.24132950603961945, 0.26918500661849976, 0.29704049229621887, 0.324895977973938, 0.3527514636516571, 0.3806069493293762, 0.40846240520477295, 0.43631792068481445, 0.4641733765602112, 0.4920288622379303, 0.5198843479156494, 0.5477398037910461, 0.5755953192710876, 0.6034507751464844, 0.6313062906265259, 0.6591617465019226, 0.6870172619819641, 0.7148727178573608, 0.7427281737327576, 0.7705836892127991, 0.7984391450881958, 0.8262946605682373, 0.854150116443634, 0.8820056319236755, 0.9098610877990723, 0.9377166032791138]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 7.0, 7.0, 8.0, 8.0, 12.0, 12.0, 12.0, 25.0, 17.0, 22.0, 21.0, 30.0, 36.0, 32.0, 42.0, 44.0, 38.0, 52.0, 39.0, 47.0, 36.0, 37.0, 44.0, 51.0, 40.0, 47.0, 30.0, 36.0, 26.0, 21.0, 15.0, 25.0, 19.0, 11.0, 15.0, 8.0, 14.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36221349239349365, -0.34868741035461426, -0.3351612985134125, -0.3216352164745331, -0.3081091046333313, -0.2945830225944519, -0.2810569405555725, -0.2675308287143707, -0.25400471687316895, -0.24047861993312836, -0.22695252299308777, -0.21342644095420837, -0.1999003291130066, -0.1863742470741272, -0.1728481501340866, -0.15932205319404602, -0.14579597115516663, -0.13226987421512604, -0.11874377727508545, -0.10521768778562546, -0.09169159084558487, -0.07816549390554428, -0.06463940441608429, -0.0511133074760437, -0.03758721053600311, -0.024061115458607674, -0.010535020381212234, 0.0029910728335380554, 0.016517169773578644, 0.030043266713619232, 0.043569356203079224, 0.05709545314311981, 0.0706215500831604, 0.08414764702320099, 0.09767374396324158, 0.11119983345270157, 0.12472593039274216, 0.13825201988220215, 0.15177811682224274, 0.16530421376228333, 0.1788303107023239, 0.1923564076423645, 0.2058825045824051, 0.21940860152244568, 0.23293468356132507, 0.24646079540252686, 0.25998687744140625, 0.27351295948028564, 0.2870390713214874, 0.3005651533603668, 0.3140912652015686, 0.327617347240448, 0.3411434590816498, 0.3546695411205292, 0.36819565296173096, 0.38172173500061035, 0.39524781703948975, 0.40877389907836914, 0.4223000109195709, 0.4358260929584503, 0.4493522047996521, 0.4628782868385315, 0.4764043688774109, 0.48993048071861267, 0.5034565925598145]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 11.0, 21.0, 33.0, 49.0, 66.0, 95.0, 187.0, 254.0, 426.0, 602.0, 977.0, 1592.0, 2457.0, 3802.0, 5673.0, 8589.0, 12920.0, 19648.0, 32807.0, 71819.0, 196762.0, 330310.0, 196810.0, 72198.0, 33051.0, 19482.0, 13009.0, 8688.0, 5676.0, 3753.0, 2361.0, 1576.0, 1011.0, 709.0, 402.0, 252.0, 147.0, 116.0, 69.0, 30.0, 39.0, 25.0, 11.0, 9.0, 8.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.09515380859375, -0.09222602844238281, -0.08929824829101562, -0.08637046813964844, -0.08344268798828125, -0.08051490783691406, -0.07758712768554688, -0.07465934753417969, -0.0717315673828125, -0.06880378723144531, -0.06587600708007812, -0.06294822692871094, -0.06002044677734375, -0.05709266662597656, -0.054164886474609375, -0.05123710632324219, -0.048309326171875, -0.04538154602050781, -0.042453765869140625, -0.03952598571777344, -0.03659820556640625, -0.03367042541503906, -0.030742645263671875, -0.027814865112304688, -0.0248870849609375, -0.021959304809570312, -0.019031524658203125, -0.016103744506835938, -0.01317596435546875, -0.010248184204101562, -0.007320404052734375, -0.0043926239013671875, -0.00146484375, 0.0014629364013671875, 0.004390716552734375, 0.0073184967041015625, 0.01024627685546875, 0.013174057006835938, 0.016101837158203125, 0.019029617309570312, 0.0219573974609375, 0.024885177612304688, 0.027812957763671875, 0.030740737915039062, 0.03366851806640625, 0.03659629821777344, 0.039524078369140625, 0.04245185852050781, 0.045379638671875, 0.04830741882324219, 0.051235198974609375, 0.05416297912597656, 0.05709075927734375, 0.06001853942871094, 0.06294631958007812, 0.06587409973144531, 0.0688018798828125, 0.07172966003417969, 0.07465744018554688, 0.07758522033691406, 0.08051300048828125, 0.08344078063964844, 0.08636856079101562, 0.08929634094238281, 0.09222412109375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 4.0, 7.0, 11.0, 15.0, 17.0, 15.0, 19.0, 17.0, 19.0, 29.0, 31.0, 29.0, 44.0, 44.0, 38.0, 44.0, 52.0, 45.0, 45.0, 44.0, 52.0, 49.0, 48.0, 45.0, 32.0, 40.0, 40.0, 22.0, 11.0, 18.0, 18.0, 9.0, 7.0, 9.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0743408203125, -0.07226181030273438, -0.07018280029296875, -0.06810379028320312, -0.0660247802734375, -0.06394577026367188, -0.06186676025390625, -0.059787750244140625, -0.057708740234375, -0.055629730224609375, -0.05355072021484375, -0.051471710205078125, -0.0493927001953125, -0.047313690185546875, -0.04523468017578125, -0.043155670166015625, -0.04107666015625, -0.038997650146484375, -0.03691864013671875, -0.034839630126953125, -0.0327606201171875, -0.030681610107421875, -0.02860260009765625, -0.026523590087890625, -0.024444580078125, -0.022365570068359375, -0.02028656005859375, -0.018207550048828125, -0.0161285400390625, -0.014049530029296875, -0.01197052001953125, -0.009891510009765625, -0.0078125, -0.005733489990234375, -0.00365447998046875, -0.001575469970703125, 0.0005035400390625, 0.002582550048828125, 0.00466156005859375, 0.006740570068359375, 0.008819580078125, 0.010898590087890625, 0.01297760009765625, 0.015056610107421875, 0.0171356201171875, 0.019214630126953125, 0.02129364013671875, 0.023372650146484375, 0.02545166015625, 0.027530670166015625, 0.02960968017578125, 0.031688690185546875, 0.0337677001953125, 0.035846710205078125, 0.03792572021484375, 0.040004730224609375, 0.042083740234375, 0.044162750244140625, 0.04624176025390625, 0.048320770263671875, 0.0503997802734375, 0.052478790283203125, 0.05455780029296875, 0.056636810302734375, 0.0587158203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 9.0, 12.0, 4.0, 13.0, 14.0, 32.0, 58.0, 94.0, 121.0, 201.0, 364.0, 690.0, 1836.0, 5647.0, 19490.0, 75789.0, 534318.0, 337566.0, 51728.0, 13879.0, 4007.0, 1342.0, 557.0, 303.0, 180.0, 103.0, 61.0, 45.0, 35.0, 22.0, 16.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2216796875, -0.21400070190429688, -0.20632171630859375, -0.19864273071289062, -0.1909637451171875, -0.18328475952148438, -0.17560577392578125, -0.16792678833007812, -0.160247802734375, -0.15256881713867188, -0.14488983154296875, -0.13721084594726562, -0.1295318603515625, -0.12185287475585938, -0.11417388916015625, -0.10649490356445312, -0.09881591796875, -0.09113693237304688, -0.08345794677734375, -0.07577896118164062, -0.0680999755859375, -0.060420989990234375, -0.05274200439453125, -0.045063018798828125, -0.037384033203125, -0.029705047607421875, -0.02202606201171875, -0.014347076416015625, -0.0066680908203125, 0.001010894775390625, 0.00868988037109375, 0.016368865966796875, 0.0240478515625, 0.031726837158203125, 0.03940582275390625, 0.047084808349609375, 0.0547637939453125, 0.062442779541015625, 0.07012176513671875, 0.07780075073242188, 0.085479736328125, 0.09315872192382812, 0.10083770751953125, 0.10851669311523438, 0.1161956787109375, 0.12387466430664062, 0.13155364990234375, 0.13923263549804688, 0.14691162109375, 0.15459060668945312, 0.16226959228515625, 0.16994857788085938, 0.1776275634765625, 0.18530654907226562, 0.19298553466796875, 0.20066452026367188, 0.208343505859375, 0.21602249145507812, 0.22370147705078125, 0.23138046264648438, 0.2390594482421875, 0.24673843383789062, 0.25441741943359375, 0.2620964050292969, 0.269775390625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 9.0, 8.0, 7.0, 13.0, 13.0, 13.0, 16.0, 19.0, 22.0, 20.0, 24.0, 25.0, 26.0, 41.0, 44.0, 38.0, 44.0, 54.0, 36.0, 40.0, 41.0, 47.0, 38.0, 42.0, 37.0, 38.0, 36.0, 30.0, 25.0, 20.0, 14.0, 11.0, 21.0, 16.0, 17.0, 7.0, 13.0, 8.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169189453125, -0.16368484497070312, -0.15818023681640625, -0.15267562866210938, -0.1471710205078125, -0.14166641235351562, -0.13616180419921875, -0.13065719604492188, -0.125152587890625, -0.11964797973632812, -0.11414337158203125, -0.10863876342773438, -0.1031341552734375, -0.09762954711914062, -0.09212493896484375, -0.08662033081054688, -0.08111572265625, -0.07561111450195312, -0.07010650634765625, -0.06460189819335938, -0.0590972900390625, -0.053592681884765625, -0.04808807373046875, -0.042583465576171875, -0.037078857421875, -0.031574249267578125, -0.02606964111328125, -0.020565032958984375, -0.0150604248046875, -0.009555816650390625, -0.00405120849609375, 0.001453399658203125, 0.0069580078125, 0.012462615966796875, 0.01796722412109375, 0.023471832275390625, 0.0289764404296875, 0.034481048583984375, 0.03998565673828125, 0.045490264892578125, 0.050994873046875, 0.056499481201171875, 0.06200408935546875, 0.06750869750976562, 0.0730133056640625, 0.07851791381835938, 0.08402252197265625, 0.08952713012695312, 0.09503173828125, 0.10053634643554688, 0.10604095458984375, 0.11154556274414062, 0.1170501708984375, 0.12255477905273438, 0.12805938720703125, 0.13356399536132812, 0.139068603515625, 0.14457321166992188, 0.15007781982421875, 0.15558242797851562, 0.1610870361328125, 0.16659164428710938, 0.17209625244140625, 0.17760086059570312, 0.18310546875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 9.0, 8.0, 7.0, 18.0, 42.0, 57.0, 60.0, 106.0, 205.0, 403.0, 723.0, 1383.0, 2758.0, 5527.0, 10717.0, 20390.0, 40584.0, 105673.0, 392825.0, 312707.0, 82529.0, 34791.0, 17985.0, 9288.0, 4696.0, 2394.0, 1221.0, 606.0, 374.0, 204.0, 96.0, 55.0, 37.0, 19.0, 16.0, 12.0, 9.0, 9.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.057861328125, -0.05610227584838867, -0.054343223571777344, -0.052584171295166016, -0.05082511901855469, -0.04906606674194336, -0.04730701446533203, -0.0455479621887207, -0.043788909912109375, -0.04202985763549805, -0.04027080535888672, -0.03851175308227539, -0.03675270080566406, -0.034993648529052734, -0.033234596252441406, -0.03147554397583008, -0.02971649169921875, -0.027957439422607422, -0.026198387145996094, -0.024439334869384766, -0.022680282592773438, -0.02092123031616211, -0.01916217803955078, -0.017403125762939453, -0.015644073486328125, -0.013885021209716797, -0.012125968933105469, -0.01036691665649414, -0.008607864379882812, -0.006848812103271484, -0.005089759826660156, -0.003330707550048828, -0.0015716552734375, 0.00018739700317382812, 0.0019464492797851562, 0.0037055015563964844, 0.0054645538330078125, 0.007223606109619141, 0.008982658386230469, 0.010741710662841797, 0.012500762939453125, 0.014259815216064453, 0.01601886749267578, 0.01777791976928711, 0.019536972045898438, 0.021296024322509766, 0.023055076599121094, 0.024814128875732422, 0.02657318115234375, 0.028332233428955078, 0.030091285705566406, 0.031850337982177734, 0.03360939025878906, 0.03536844253540039, 0.03712749481201172, 0.03888654708862305, 0.040645599365234375, 0.0424046516418457, 0.04416370391845703, 0.04592275619506836, 0.04768180847167969, 0.049440860748291016, 0.051199913024902344, 0.05295896530151367, 0.054718017578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 7.0, 6.0, 3.0, 9.0, 11.0, 10.0, 19.0, 20.0, 34.0, 66.0, 77.0, 108.0, 135.0, 118.0, 94.0, 71.0, 54.0, 31.0, 17.0, 18.0, 10.0, 13.0, 13.0, 9.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1338462829589844e-05, -2.055242657661438e-05, -1.9766390323638916e-05, -1.8980354070663452e-05, -1.8194317817687988e-05, -1.7408281564712524e-05, -1.662224531173706e-05, -1.5836209058761597e-05, -1.5050172805786133e-05, -1.4264136552810669e-05, -1.3478100299835205e-05, -1.2692064046859741e-05, -1.1906027793884277e-05, -1.1119991540908813e-05, -1.033395528793335e-05, -9.547919034957886e-06, -8.761882781982422e-06, -7.975846529006958e-06, -7.189810276031494e-06, -6.40377402305603e-06, -5.617737770080566e-06, -4.8317015171051025e-06, -4.045665264129639e-06, -3.259629011154175e-06, -2.473592758178711e-06, -1.687556505203247e-06, -9.015202522277832e-07, -1.1548399925231934e-07, 6.705522537231445e-07, 1.4565885066986084e-06, 2.2426247596740723e-06, 3.028661012649536e-06, 3.814697265625e-06, 4.600733518600464e-06, 5.386769771575928e-06, 6.172806024551392e-06, 6.9588422775268555e-06, 7.74487853050232e-06, 8.530914783477783e-06, 9.316951036453247e-06, 1.0102987289428711e-05, 1.0889023542404175e-05, 1.1675059795379639e-05, 1.2461096048355103e-05, 1.3247132301330566e-05, 1.403316855430603e-05, 1.4819204807281494e-05, 1.5605241060256958e-05, 1.6391277313232422e-05, 1.7177313566207886e-05, 1.796334981918335e-05, 1.8749386072158813e-05, 1.9535422325134277e-05, 2.032145857810974e-05, 2.1107494831085205e-05, 2.189353108406067e-05, 2.2679567337036133e-05, 2.3465603590011597e-05, 2.425163984298706e-05, 2.5037676095962524e-05, 2.5823712348937988e-05, 2.6609748601913452e-05, 2.7395784854888916e-05, 2.818182110786438e-05, 2.8967857360839844e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 7.0, 7.0, 8.0, 4.0, 18.0, 19.0, 30.0, 47.0, 51.0, 82.0, 148.0, 217.0, 403.0, 651.0, 1297.0, 2756.0, 6824.0, 17497.0, 44681.0, 133912.0, 440771.0, 274384.0, 76494.0, 28506.0, 11200.0, 4502.0, 1904.0, 931.0, 450.0, 272.0, 173.0, 93.0, 62.0, 42.0, 36.0, 26.0, 13.0, 12.0, 11.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06610107421875, -0.06419944763183594, -0.062297821044921875, -0.06039619445800781, -0.05849456787109375, -0.05659294128417969, -0.054691314697265625, -0.05278968811035156, -0.0508880615234375, -0.04898643493652344, -0.047084808349609375, -0.04518318176269531, -0.04328155517578125, -0.04137992858886719, -0.039478302001953125, -0.03757667541503906, -0.035675048828125, -0.03377342224121094, -0.031871795654296875, -0.029970169067382812, -0.02806854248046875, -0.026166915893554688, -0.024265289306640625, -0.022363662719726562, -0.0204620361328125, -0.018560409545898438, -0.016658782958984375, -0.014757156372070312, -0.01285552978515625, -0.010953903198242188, -0.009052276611328125, -0.0071506500244140625, -0.0052490234375, -0.0033473968505859375, -0.001445770263671875, 0.0004558563232421875, 0.00235748291015625, 0.0042591094970703125, 0.006160736083984375, 0.008062362670898438, 0.0099639892578125, 0.011865615844726562, 0.013767242431640625, 0.015668869018554688, 0.01757049560546875, 0.019472122192382812, 0.021373748779296875, 0.023275375366210938, 0.025177001953125, 0.027078628540039062, 0.028980255126953125, 0.030881881713867188, 0.03278350830078125, 0.03468513488769531, 0.036586761474609375, 0.03848838806152344, 0.0403900146484375, 0.04229164123535156, 0.044193267822265625, 0.04609489440917969, 0.04799652099609375, 0.04989814758300781, 0.051799774169921875, 0.05370140075683594, 0.05560302734375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 7.0, 2.0, 11.0, 6.0, 7.0, 5.0, 14.0, 7.0, 14.0, 18.0, 21.0, 28.0, 29.0, 35.0, 62.0, 55.0, 74.0, 77.0, 85.0, 72.0, 53.0, 53.0, 44.0, 36.0, 31.0, 22.0, 19.0, 16.0, 16.0, 13.0, 12.0, 8.0, 5.0, 4.0, 4.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.046112060546875, -0.044704437255859375, -0.04329681396484375, -0.041889190673828125, -0.0404815673828125, -0.039073944091796875, -0.03766632080078125, -0.036258697509765625, -0.03485107421875, -0.033443450927734375, -0.03203582763671875, -0.030628204345703125, -0.0292205810546875, -0.027812957763671875, -0.02640533447265625, -0.024997711181640625, -0.023590087890625, -0.022182464599609375, -0.02077484130859375, -0.019367218017578125, -0.0179595947265625, -0.016551971435546875, -0.01514434814453125, -0.013736724853515625, -0.0123291015625, -0.010921478271484375, -0.00951385498046875, -0.008106231689453125, -0.0066986083984375, -0.005290985107421875, -0.00388336181640625, -0.002475738525390625, -0.001068115234375, 0.000339508056640625, 0.00174713134765625, 0.003154754638671875, 0.0045623779296875, 0.005970001220703125, 0.00737762451171875, 0.008785247802734375, 0.01019287109375, 0.011600494384765625, 0.01300811767578125, 0.014415740966796875, 0.0158233642578125, 0.017230987548828125, 0.01863861083984375, 0.020046234130859375, 0.021453857421875, 0.022861480712890625, 0.02426910400390625, 0.025676727294921875, 0.0270843505859375, 0.028491973876953125, 0.02989959716796875, 0.031307220458984375, 0.03271484375, 0.034122467041015625, 0.03553009033203125, 0.036937713623046875, 0.0383453369140625, 0.039752960205078125, 0.04116058349609375, 0.042568206787109375, 0.043975830078125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 13.0, 18.0, 65.0, 125.0, 194.0, 226.0, 178.0, 108.0, 34.0, 13.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7120633125305176, -1.6716995239257812, -1.6313356161117554, -1.5909717082977295, -1.5506079196929932, -1.5102441310882568, -1.469880223274231, -1.429516315460205, -1.3891525268554688, -1.3487887382507324, -1.3084248304367065, -1.2680609226226807, -1.2276971340179443, -1.187333345413208, -1.1469694375991821, -1.1066055297851562, -1.06624174118042, -1.0258779525756836, -0.9855140447616577, -0.9451501965522766, -0.9047863483428955, -0.8644225001335144, -0.8240586519241333, -0.7836948037147522, -0.7433309555053711, -0.70296710729599, -0.6626032590866089, -0.6222394108772278, -0.5818755626678467, -0.5415117144584656, -0.5011478662490845, -0.46078401803970337, -0.4204202890396118, -0.3800564408302307, -0.3396925926208496, -0.2993287444114685, -0.2589648962020874, -0.2186010479927063, -0.1782371997833252, -0.1378733515739441, -0.09750950336456299, -0.057145655155181885, -0.01678180694580078, 0.023582041263580322, 0.06394588947296143, 0.10430973768234253, 0.14467358589172363, 0.18503743410110474, 0.22540128231048584, 0.26576513051986694, 0.30612897872924805, 0.34649282693862915, 0.38685667514801025, 0.42722052335739136, 0.46758437156677246, 0.5079482197761536, 0.5483120679855347, 0.5886759161949158, 0.6290397644042969, 0.669403612613678, 0.7097674608230591, 0.7501313090324402, 0.7904951572418213, 0.8308590054512024, 0.8712228536605835]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 9.0, 2.0, 5.0, 4.0, 5.0, 9.0, 11.0, 11.0, 16.0, 11.0, 29.0, 25.0, 27.0, 20.0, 29.0, 23.0, 34.0, 22.0, 31.0, 32.0, 25.0, 45.0, 40.0, 55.0, 51.0, 40.0, 32.0, 39.0, 33.0, 39.0, 19.0, 26.0, 24.0, 26.0, 17.0, 25.0, 14.0, 18.0, 14.0, 9.0, 19.0, 9.0, 13.0, 2.0, 4.0, 8.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.39768993854522705, -0.38538652658462524, -0.37308311462402344, -0.36077970266342163, -0.3484762907028198, -0.336172878742218, -0.3238694667816162, -0.311566025018692, -0.2992626130580902, -0.2869592010974884, -0.2746557891368866, -0.2623523771762848, -0.250048965215683, -0.23774553835391998, -0.22544212639331818, -0.21313869953155518, -0.20083530247211456, -0.18853189051151276, -0.17622847855091095, -0.16392505168914795, -0.15162163972854614, -0.13931822776794434, -0.12701481580734253, -0.11471139639616013, -0.10240798443555832, -0.09010457247495651, -0.07780115306377411, -0.0654977411031723, -0.0531943254172802, -0.04089090973138809, -0.028587497770786285, -0.016284078359603882, -0.003980666399002075, 0.008322748355567455, 0.020626163110136986, 0.03292957693338394, 0.04523299261927605, 0.05753640830516815, 0.06983982026576996, 0.08214323967695236, 0.09444665163755417, 0.10675006359815598, 0.11905348300933838, 0.13135689496994019, 0.143660306930542, 0.1559637188911438, 0.1682671308517456, 0.1805705577135086, 0.1928739696741104, 0.20517738163471222, 0.21748079359531403, 0.22978422045707703, 0.24208763241767883, 0.25439104437828064, 0.26669445633888245, 0.27899786829948425, 0.29130128026008606, 0.30360469222068787, 0.3159081041812897, 0.3282115161418915, 0.3405149281024933, 0.3528183698654175, 0.3651217818260193, 0.3774251937866211, 0.3897286057472229]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 6.0, 8.0, 5.0, 15.0, 22.0, 32.0, 65.0, 93.0, 174.0, 294.0, 560.0, 984.0, 1824.0, 3371.0, 6430.0, 12408.0, 23788.0, 47052.0, 99021.0, 236291.0, 614397.0, 1224278.0, 1075287.0, 487142.0, 195678.0, 83788.0, 39640.0, 20012.0, 10292.0, 5323.0, 2788.0, 1460.0, 765.0, 443.0, 261.0, 127.0, 73.0, 36.0, 22.0, 15.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.080078125, -0.07796382904052734, -0.07584953308105469, -0.07373523712158203, -0.07162094116210938, -0.06950664520263672, -0.06739234924316406, -0.0652780532836914, -0.06316375732421875, -0.061049461364746094, -0.05893516540527344, -0.05682086944580078, -0.054706573486328125, -0.05259227752685547, -0.05047798156738281, -0.048363685607910156, -0.0462493896484375, -0.044135093688964844, -0.04202079772949219, -0.03990650177001953, -0.037792205810546875, -0.03567790985107422, -0.03356361389160156, -0.031449317932128906, -0.02933502197265625, -0.027220726013183594, -0.025106430053710938, -0.02299213409423828, -0.020877838134765625, -0.01876354217529297, -0.016649246215820312, -0.014534950256347656, -0.012420654296875, -0.010306358337402344, -0.008192062377929688, -0.006077766418457031, -0.003963470458984375, -0.0018491744995117188, 0.0002651214599609375, 0.0023794174194335938, 0.00449371337890625, 0.006608009338378906, 0.008722305297851562, 0.010836601257324219, 0.012950897216796875, 0.015065193176269531, 0.017179489135742188, 0.019293785095214844, 0.0214080810546875, 0.023522377014160156, 0.025636672973632812, 0.02775096893310547, 0.029865264892578125, 0.03197956085205078, 0.03409385681152344, 0.036208152770996094, 0.03832244873046875, 0.040436744689941406, 0.04255104064941406, 0.04466533660888672, 0.046779632568359375, 0.04889392852783203, 0.05100822448730469, 0.053122520446777344, 0.05523681640625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 1.0, 4.0, 2.0, 9.0, 4.0, 8.0, 12.0, 18.0, 6.0, 21.0, 21.0, 25.0, 21.0, 26.0, 32.0, 30.0, 32.0, 37.0, 41.0, 42.0, 40.0, 61.0, 50.0, 43.0, 50.0, 40.0, 39.0, 36.0, 34.0, 38.0, 24.0, 20.0, 21.0, 22.0, 16.0, 18.0, 16.0, 9.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06402587890625, -0.06201171875, -0.05999755859375, -0.0579833984375, -0.05596923828125, -0.053955078125, -0.05194091796875, -0.0499267578125, -0.04791259765625, -0.0458984375, -0.04388427734375, -0.0418701171875, -0.03985595703125, -0.037841796875, -0.03582763671875, -0.0338134765625, -0.03179931640625, -0.02978515625, -0.02777099609375, -0.0257568359375, -0.02374267578125, -0.021728515625, -0.01971435546875, -0.0177001953125, -0.01568603515625, -0.013671875, -0.01165771484375, -0.0096435546875, -0.00762939453125, -0.005615234375, -0.00360107421875, -0.0015869140625, 0.00042724609375, 0.00244140625, 0.00445556640625, 0.0064697265625, 0.00848388671875, 0.010498046875, 0.01251220703125, 0.0145263671875, 0.01654052734375, 0.0185546875, 0.02056884765625, 0.0225830078125, 0.02459716796875, 0.026611328125, 0.02862548828125, 0.0306396484375, 0.03265380859375, 0.03466796875, 0.03668212890625, 0.0386962890625, 0.04071044921875, 0.042724609375, 0.04473876953125, 0.0467529296875, 0.04876708984375, 0.05078125, 0.05279541015625, 0.0548095703125, 0.05682373046875, 0.058837890625, 0.06085205078125, 0.0628662109375, 0.06488037109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 4.0, 16.0, 17.0, 22.0, 26.0, 44.0, 66.0, 106.0, 150.0, 285.0, 452.0, 896.0, 1895.0, 4609.0, 12672.0, 35699.0, 106722.0, 360781.0, 1574127.0, 1570973.0, 360427.0, 106471.0, 35830.0, 13016.0, 4843.0, 1892.0, 935.0, 473.0, 313.0, 183.0, 118.0, 77.0, 46.0, 29.0, 19.0, 13.0, 6.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1297607421875, -0.1259441375732422, -0.12212753295898438, -0.11831092834472656, -0.11449432373046875, -0.11067771911621094, -0.10686111450195312, -0.10304450988769531, -0.0992279052734375, -0.09541130065917969, -0.09159469604492188, -0.08777809143066406, -0.08396148681640625, -0.08014488220214844, -0.07632827758789062, -0.07251167297363281, -0.068695068359375, -0.06487846374511719, -0.061061859130859375, -0.05724525451660156, -0.05342864990234375, -0.04961204528808594, -0.045795440673828125, -0.04197883605957031, -0.0381622314453125, -0.03434562683105469, -0.030529022216796875, -0.026712417602539062, -0.02289581298828125, -0.019079208374023438, -0.015262603759765625, -0.011445999145507812, -0.00762939453125, -0.0038127899169921875, 3.814697265625e-06, 0.0038204193115234375, 0.00763702392578125, 0.011453628540039062, 0.015270233154296875, 0.019086837768554688, 0.0229034423828125, 0.026720046997070312, 0.030536651611328125, 0.03435325622558594, 0.03816986083984375, 0.04198646545410156, 0.045803070068359375, 0.04961967468261719, 0.053436279296875, 0.05725288391113281, 0.061069488525390625, 0.06488609313964844, 0.06870269775390625, 0.07251930236816406, 0.07633590698242188, 0.08015251159667969, 0.0839691162109375, 0.08778572082519531, 0.09160232543945312, 0.09541893005371094, 0.09923553466796875, 0.10305213928222656, 0.10686874389648438, 0.11068534851074219, 0.114501953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 6.0, 7.0, 9.0, 8.0, 14.0, 11.0, 17.0, 29.0, 31.0, 41.0, 64.0, 62.0, 93.0, 105.0, 145.0, 210.0, 276.0, 375.0, 411.0, 452.0, 361.0, 286.0, 239.0, 208.0, 124.0, 89.0, 77.0, 63.0, 52.0, 47.0, 37.0, 29.0, 18.0, 14.0, 18.0, 13.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09564208984375, -0.09200382232666016, -0.08836555480957031, -0.08472728729248047, -0.08108901977539062, -0.07745075225830078, -0.07381248474121094, -0.0701742172241211, -0.06653594970703125, -0.0628976821899414, -0.05925941467285156, -0.05562114715576172, -0.051982879638671875, -0.04834461212158203, -0.04470634460449219, -0.041068077087402344, -0.0374298095703125, -0.033791542053222656, -0.030153274536132812, -0.02651500701904297, -0.022876739501953125, -0.01923847198486328, -0.015600204467773438, -0.011961936950683594, -0.00832366943359375, -0.004685401916503906, -0.0010471343994140625, 0.0025911331176757812, 0.006229400634765625, 0.009867668151855469, 0.013505935668945312, 0.017144203186035156, 0.020782470703125, 0.024420738220214844, 0.028059005737304688, 0.03169727325439453, 0.035335540771484375, 0.03897380828857422, 0.04261207580566406, 0.046250343322753906, 0.04988861083984375, 0.053526878356933594, 0.05716514587402344, 0.06080341339111328, 0.06444168090820312, 0.06807994842529297, 0.07171821594238281, 0.07535648345947266, 0.0789947509765625, 0.08263301849365234, 0.08627128601074219, 0.08990955352783203, 0.09354782104492188, 0.09718608856201172, 0.10082435607910156, 0.1044626235961914, 0.10810089111328125, 0.1117391586303711, 0.11537742614746094, 0.11901569366455078, 0.12265396118164062, 0.12629222869873047, 0.1299304962158203, 0.13356876373291016, 0.13720703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 9.0, 14.0, 44.0, 71.0, 142.0, 187.0, 197.0, 165.0, 82.0, 54.0, 19.0, 9.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8802762031555176, -1.837556004524231, -1.7948358058929443, -1.7521157264709473, -1.7093955278396606, -1.666675329208374, -1.623955249786377, -1.5812350511550903, -1.5385148525238037, -1.495794653892517, -1.4530744552612305, -1.4103543758392334, -1.3676341772079468, -1.3249139785766602, -1.282193899154663, -1.2394737005233765, -1.1967535018920898, -1.1540333032608032, -1.1113131046295166, -1.0685930252075195, -1.025872826576233, -0.9831526279449463, -0.9404324889183044, -0.8977123498916626, -0.854992151260376, -0.8122719526290894, -0.7695518136024475, -0.7268316745758057, -0.684111475944519, -0.6413912773132324, -0.5986711382865906, -0.5559509992599487, -0.5132307410240173, -0.4705105721950531, -0.42779040336608887, -0.38507023453712463, -0.3423500657081604, -0.29962989687919617, -0.25690972805023193, -0.2141895592212677, -0.17146939039230347, -0.12874922156333923, -0.086029052734375, -0.04330888390541077, -0.0005887150764465332, 0.0421314537525177, 0.08485162258148193, 0.12757179141044617, 0.1702919602394104, 0.21301212906837463, 0.25573229789733887, 0.2984524667263031, 0.34117263555526733, 0.38389280438423157, 0.4266129732131958, 0.46933314204216003, 0.5120533108711243, 0.5547734498977661, 0.5974936485290527, 0.6402138471603394, 0.6829339861869812, 0.725654125213623, 0.7683743238449097, 0.8110945224761963, 0.8538146615028381]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 2.0, 9.0, 3.0, 12.0, 8.0, 16.0, 9.0, 17.0, 16.0, 11.0, 22.0, 18.0, 28.0, 29.0, 35.0, 30.0, 36.0, 34.0, 36.0, 39.0, 30.0, 41.0, 44.0, 33.0, 43.0, 40.0, 40.0, 37.0, 29.0, 31.0, 24.0, 28.0, 24.0, 23.0, 17.0, 18.0, 21.0, 11.0, 11.0, 6.0, 10.0, 5.0, 1.0, 6.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.3717927932739258, -0.359464555978775, -0.3471362888813019, -0.3348080515861511, -0.322479784488678, -0.3101515471935272, -0.29782330989837646, -0.2854950428009033, -0.27316680550575256, -0.2608385682106018, -0.24851030111312866, -0.2361820638179779, -0.22385381162166595, -0.211525559425354, -0.19919732213020325, -0.1868690699338913, -0.17454081773757935, -0.1622125655412674, -0.14988431334495544, -0.1375560760498047, -0.12522782385349274, -0.11289957165718079, -0.10057132691144943, -0.08824308216571808, -0.07591482996940613, -0.06358657777309418, -0.051258333027362823, -0.03893008455634117, -0.02660183608531952, -0.014273587614297867, -0.0019453391432762146, 0.01038290560245514, 0.02271115779876709, 0.03503940626978874, 0.047367654740810394, 0.059695903211832047, 0.0720241516828537, 0.08435240387916565, 0.096680648624897, 0.10900889337062836, 0.12133714556694031, 0.13366539776325226, 0.1459936499595642, 0.15832188725471497, 0.17065013945102692, 0.18297839164733887, 0.19530662894248962, 0.20763488113880157, 0.21996313333511353, 0.23229138553142548, 0.24461963772773743, 0.2569478750228882, 0.26927614212036133, 0.2816043794155121, 0.29393261671066284, 0.306260883808136, 0.31858912110328674, 0.3309173583984375, 0.34324562549591064, 0.3555738627910614, 0.36790210008621216, 0.3802303671836853, 0.39255860447883606, 0.4048868417739868, 0.41721510887145996]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 17.0, 18.0, 38.0, 50.0, 94.0, 136.0, 253.0, 435.0, 686.0, 1268.0, 2372.0, 4338.0, 7748.0, 13839.0, 23824.0, 44284.0, 96363.0, 230495.0, 311308.0, 164630.0, 68521.0, 33980.0, 18844.0, 10986.0, 6158.0, 3393.0, 1929.0, 1063.0, 553.0, 351.0, 215.0, 117.0, 78.0, 36.0, 42.0, 25.0, 13.0, 12.0, 12.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09552001953125, -0.09236717224121094, -0.08921432495117188, -0.08606147766113281, -0.08290863037109375, -0.07975578308105469, -0.07660293579101562, -0.07345008850097656, -0.0702972412109375, -0.06714439392089844, -0.06399154663085938, -0.06083869934082031, -0.05768585205078125, -0.05453300476074219, -0.051380157470703125, -0.04822731018066406, -0.045074462890625, -0.04192161560058594, -0.038768768310546875, -0.03561592102050781, -0.03246307373046875, -0.029310226440429688, -0.026157379150390625, -0.023004531860351562, -0.0198516845703125, -0.016698837280273438, -0.013545989990234375, -0.010393142700195312, -0.00724029541015625, -0.0040874481201171875, -0.000934600830078125, 0.0022182464599609375, 0.00537109375, 0.008523941040039062, 0.011676788330078125, 0.014829635620117188, 0.01798248291015625, 0.021135330200195312, 0.024288177490234375, 0.027441024780273438, 0.0305938720703125, 0.03374671936035156, 0.036899566650390625, 0.04005241394042969, 0.04320526123046875, 0.04635810852050781, 0.049510955810546875, 0.05266380310058594, 0.055816650390625, 0.05896949768066406, 0.062122344970703125, 0.06527519226074219, 0.06842803955078125, 0.07158088684082031, 0.07473373413085938, 0.07788658142089844, 0.0810394287109375, 0.08419227600097656, 0.08734512329101562, 0.09049797058105469, 0.09365081787109375, 0.09680366516113281, 0.09995651245117188, 0.10310935974121094, 0.10626220703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 9.0, 11.0, 11.0, 15.0, 19.0, 15.0, 20.0, 15.0, 21.0, 30.0, 34.0, 22.0, 29.0, 35.0, 24.0, 42.0, 37.0, 41.0, 31.0, 35.0, 35.0, 34.0, 27.0, 31.0, 39.0, 27.0, 34.0, 23.0, 40.0, 29.0, 23.0, 20.0, 19.0, 20.0, 12.0, 12.0, 15.0, 14.0, 7.0, 8.0, 5.0, 5.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0562744140625, -0.05449390411376953, -0.05271339416503906, -0.050932884216308594, -0.049152374267578125, -0.047371864318847656, -0.04559135437011719, -0.04381084442138672, -0.04203033447265625, -0.04024982452392578, -0.03846931457519531, -0.036688804626464844, -0.034908294677734375, -0.033127784729003906, -0.03134727478027344, -0.02956676483154297, -0.0277862548828125, -0.02600574493408203, -0.024225234985351562, -0.022444725036621094, -0.020664215087890625, -0.018883705139160156, -0.017103195190429688, -0.015322685241699219, -0.01354217529296875, -0.011761665344238281, -0.009981155395507812, -0.008200645446777344, -0.006420135498046875, -0.004639625549316406, -0.0028591156005859375, -0.0010786056518554688, 0.000701904296875, 0.0024824142456054688, 0.0042629241943359375, 0.006043434143066406, 0.007823944091796875, 0.009604454040527344, 0.011384963989257812, 0.013165473937988281, 0.01494598388671875, 0.01672649383544922, 0.018507003784179688, 0.020287513732910156, 0.022068023681640625, 0.023848533630371094, 0.025629043579101562, 0.02740955352783203, 0.0291900634765625, 0.03097057342529297, 0.03275108337402344, 0.034531593322753906, 0.036312103271484375, 0.038092613220214844, 0.03987312316894531, 0.04165363311767578, 0.04343414306640625, 0.04521465301513672, 0.04699516296386719, 0.048775672912597656, 0.050556182861328125, 0.052336692810058594, 0.05411720275878906, 0.05589771270751953, 0.05767822265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 8.0, 6.0, 8.0, 19.0, 24.0, 37.0, 36.0, 55.0, 90.0, 112.0, 165.0, 282.0, 463.0, 736.0, 1518.0, 3513.0, 8957.0, 23760.0, 66787.0, 238742.0, 471313.0, 154519.0, 47705.0, 17349.0, 6609.0, 2732.0, 1226.0, 629.0, 371.0, 230.0, 176.0, 116.0, 77.0, 48.0, 32.0, 26.0, 22.0, 18.0, 7.0, 5.0, 9.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.18408203125, -0.1783905029296875, -0.172698974609375, -0.1670074462890625, -0.16131591796875, -0.1556243896484375, -0.149932861328125, -0.1442413330078125, -0.1385498046875, -0.1328582763671875, -0.127166748046875, -0.1214752197265625, -0.11578369140625, -0.1100921630859375, -0.104400634765625, -0.0987091064453125, -0.093017578125, -0.0873260498046875, -0.081634521484375, -0.0759429931640625, -0.07025146484375, -0.0645599365234375, -0.058868408203125, -0.0531768798828125, -0.0474853515625, -0.0417938232421875, -0.036102294921875, -0.0304107666015625, -0.02471923828125, -0.0190277099609375, -0.013336181640625, -0.0076446533203125, -0.001953125, 0.0037384033203125, 0.009429931640625, 0.0151214599609375, 0.02081298828125, 0.0265045166015625, 0.032196044921875, 0.0378875732421875, 0.0435791015625, 0.0492706298828125, 0.054962158203125, 0.0606536865234375, 0.06634521484375, 0.0720367431640625, 0.077728271484375, 0.0834197998046875, 0.089111328125, 0.0948028564453125, 0.100494384765625, 0.1061859130859375, 0.11187744140625, 0.1175689697265625, 0.123260498046875, 0.1289520263671875, 0.1346435546875, 0.1403350830078125, 0.146026611328125, 0.1517181396484375, 0.15740966796875, 0.1631011962890625, 0.168792724609375, 0.1744842529296875, 0.18017578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 10.0, 6.0, 8.0, 11.0, 9.0, 18.0, 8.0, 16.0, 19.0, 25.0, 28.0, 38.0, 28.0, 31.0, 39.0, 47.0, 43.0, 43.0, 55.0, 35.0, 57.0, 40.0, 41.0, 38.0, 31.0, 31.0, 32.0, 22.0, 35.0, 25.0, 22.0, 11.0, 17.0, 13.0, 20.0, 5.0, 8.0, 9.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2109375, -0.20474815368652344, -0.19855880737304688, -0.1923694610595703, -0.18618011474609375, -0.1799907684326172, -0.17380142211914062, -0.16761207580566406, -0.1614227294921875, -0.15523338317871094, -0.14904403686523438, -0.1428546905517578, -0.13666534423828125, -0.1304759979248047, -0.12428665161132812, -0.11809730529785156, -0.111907958984375, -0.10571861267089844, -0.09952926635742188, -0.09333992004394531, -0.08715057373046875, -0.08096122741699219, -0.07477188110351562, -0.06858253479003906, -0.0623931884765625, -0.05620384216308594, -0.050014495849609375, -0.04382514953613281, -0.03763580322265625, -0.03144645690917969, -0.025257110595703125, -0.019067764282226562, -0.01287841796875, -0.0066890716552734375, -0.000499725341796875, 0.0056896209716796875, 0.01187896728515625, 0.018068313598632812, 0.024257659912109375, 0.030447006225585938, 0.0366363525390625, 0.04282569885253906, 0.049015045166015625, 0.05520439147949219, 0.06139373779296875, 0.06758308410644531, 0.07377243041992188, 0.07996177673339844, 0.086151123046875, 0.09234046936035156, 0.09852981567382812, 0.10471916198730469, 0.11090850830078125, 0.11709785461425781, 0.12328720092773438, 0.12947654724121094, 0.1356658935546875, 0.14185523986816406, 0.14804458618164062, 0.1542339324951172, 0.16042327880859375, 0.1666126251220703, 0.17280197143554688, 0.17899131774902344, 0.1851806640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 2.0, 9.0, 17.0, 18.0, 39.0, 50.0, 68.0, 102.0, 201.0, 320.0, 608.0, 1150.0, 2204.0, 4389.0, 8763.0, 17548.0, 36897.0, 89578.0, 247247.0, 357992.0, 165990.0, 61607.0, 26822.0, 13114.0, 6589.0, 3425.0, 1702.0, 938.0, 473.0, 273.0, 152.0, 99.0, 54.0, 43.0, 27.0, 11.0, 11.0, 14.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04937744140625, -0.04784870147705078, -0.04631996154785156, -0.044791221618652344, -0.043262481689453125, -0.041733741760253906, -0.04020500183105469, -0.03867626190185547, -0.03714752197265625, -0.03561878204345703, -0.03409004211425781, -0.032561302185058594, -0.031032562255859375, -0.029503822326660156, -0.027975082397460938, -0.02644634246826172, -0.0249176025390625, -0.02338886260986328, -0.021860122680664062, -0.020331382751464844, -0.018802642822265625, -0.017273902893066406, -0.015745162963867188, -0.014216423034667969, -0.01268768310546875, -0.011158943176269531, -0.009630203247070312, -0.008101463317871094, -0.006572723388671875, -0.005043983459472656, -0.0035152435302734375, -0.0019865036010742188, -0.000457763671875, 0.0010709762573242188, 0.0025997161865234375, 0.004128456115722656, 0.005657196044921875, 0.007185935974121094, 0.008714675903320312, 0.010243415832519531, 0.01177215576171875, 0.013300895690917969, 0.014829635620117188, 0.016358375549316406, 0.017887115478515625, 0.019415855407714844, 0.020944595336914062, 0.02247333526611328, 0.0240020751953125, 0.02553081512451172, 0.027059555053710938, 0.028588294982910156, 0.030117034912109375, 0.031645774841308594, 0.03317451477050781, 0.03470325469970703, 0.03623199462890625, 0.03776073455810547, 0.03928947448730469, 0.040818214416503906, 0.042346954345703125, 0.043875694274902344, 0.04540443420410156, 0.04693317413330078, 0.0484619140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 5.0, 4.0, 8.0, 11.0, 13.0, 13.0, 13.0, 11.0, 25.0, 24.0, 33.0, 49.0, 53.0, 67.0, 73.0, 94.0, 76.0, 81.0, 58.0, 60.0, 50.0, 36.0, 23.0, 19.0, 16.0, 8.0, 16.0, 14.0, 5.0, 14.0, 10.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.627206802368164e-05, -1.5676021575927734e-05, -1.5079975128173828e-05, -1.4483928680419922e-05, -1.3887882232666016e-05, -1.329183578491211e-05, -1.2695789337158203e-05, -1.2099742889404297e-05, -1.150369644165039e-05, -1.0907649993896484e-05, -1.0311603546142578e-05, -9.715557098388672e-06, -9.119510650634766e-06, -8.52346420288086e-06, -7.927417755126953e-06, -7.331371307373047e-06, -6.735324859619141e-06, -6.139278411865234e-06, -5.543231964111328e-06, -4.947185516357422e-06, -4.351139068603516e-06, -3.7550926208496094e-06, -3.159046173095703e-06, -2.562999725341797e-06, -1.9669532775878906e-06, -1.3709068298339844e-06, -7.748603820800781e-07, -1.7881393432617188e-07, 4.172325134277344e-07, 1.0132789611816406e-06, 1.6093254089355469e-06, 2.205371856689453e-06, 2.8014183044433594e-06, 3.3974647521972656e-06, 3.993511199951172e-06, 4.589557647705078e-06, 5.185604095458984e-06, 5.781650543212891e-06, 6.377696990966797e-06, 6.973743438720703e-06, 7.569789886474609e-06, 8.165836334228516e-06, 8.761882781982422e-06, 9.357929229736328e-06, 9.953975677490234e-06, 1.055002212524414e-05, 1.1146068572998047e-05, 1.1742115020751953e-05, 1.233816146850586e-05, 1.2934207916259766e-05, 1.3530254364013672e-05, 1.4126300811767578e-05, 1.4722347259521484e-05, 1.531839370727539e-05, 1.5914440155029297e-05, 1.6510486602783203e-05, 1.710653305053711e-05, 1.7702579498291016e-05, 1.8298625946044922e-05, 1.8894672393798828e-05, 1.9490718841552734e-05, 2.008676528930664e-05, 2.0682811737060547e-05, 2.1278858184814453e-05, 2.187490463256836e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 15.0, 11.0, 13.0, 27.0, 23.0, 49.0, 100.0, 194.0, 486.0, 966.0, 2924.0, 10916.0, 50079.0, 252132.0, 521887.0, 164309.0, 33173.0, 7625.0, 2110.0, 764.0, 364.0, 170.0, 85.0, 54.0, 34.0, 16.0, 15.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06231689453125, -0.0598602294921875, -0.057403564453125, -0.0549468994140625, -0.052490234375, -0.0500335693359375, -0.047576904296875, -0.0451202392578125, -0.04266357421875, -0.0402069091796875, -0.037750244140625, -0.0352935791015625, -0.0328369140625, -0.0303802490234375, -0.027923583984375, -0.0254669189453125, -0.02301025390625, -0.0205535888671875, -0.018096923828125, -0.0156402587890625, -0.01318359375, -0.0107269287109375, -0.008270263671875, -0.0058135986328125, -0.00335693359375, -0.0009002685546875, 0.001556396484375, 0.0040130615234375, 0.0064697265625, 0.0089263916015625, 0.011383056640625, 0.0138397216796875, 0.01629638671875, 0.0187530517578125, 0.021209716796875, 0.0236663818359375, 0.026123046875, 0.0285797119140625, 0.031036376953125, 0.0334930419921875, 0.03594970703125, 0.0384063720703125, 0.040863037109375, 0.0433197021484375, 0.0457763671875, 0.0482330322265625, 0.050689697265625, 0.0531463623046875, 0.05560302734375, 0.0580596923828125, 0.060516357421875, 0.0629730224609375, 0.0654296875, 0.0678863525390625, 0.070343017578125, 0.0727996826171875, 0.07525634765625, 0.0777130126953125, 0.080169677734375, 0.0826263427734375, 0.0850830078125, 0.0875396728515625, 0.089996337890625, 0.0924530029296875, 0.09490966796875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 2.0, 7.0, 7.0, 12.0, 23.0, 23.0, 23.0, 25.0, 32.0, 33.0, 50.0, 37.0, 60.0, 51.0, 58.0, 58.0, 63.0, 57.0, 66.0, 46.0, 46.0, 42.0, 34.0, 22.0, 19.0, 14.0, 11.0, 11.0, 16.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.046722412109375, -0.04535865783691406, -0.043994903564453125, -0.04263114929199219, -0.04126739501953125, -0.03990364074707031, -0.038539886474609375, -0.03717613220214844, -0.0358123779296875, -0.03444862365722656, -0.033084869384765625, -0.03172111511230469, -0.03035736083984375, -0.028993606567382812, -0.027629852294921875, -0.026266098022460938, -0.02490234375, -0.023538589477539062, -0.022174835205078125, -0.020811080932617188, -0.01944732666015625, -0.018083572387695312, -0.016719818115234375, -0.015356063842773438, -0.0139923095703125, -0.012628555297851562, -0.011264801025390625, -0.009901046752929688, -0.00853729248046875, -0.0071735382080078125, -0.005809783935546875, -0.0044460296630859375, -0.003082275390625, -0.0017185211181640625, -0.000354766845703125, 0.0010089874267578125, 0.00237274169921875, 0.0037364959716796875, 0.005100250244140625, 0.0064640045166015625, 0.0078277587890625, 0.009191513061523438, 0.010555267333984375, 0.011919021606445312, 0.01328277587890625, 0.014646530151367188, 0.016010284423828125, 0.017374038696289062, 0.01873779296875, 0.020101547241210938, 0.021465301513671875, 0.022829055786132812, 0.02419281005859375, 0.025556564331054688, 0.026920318603515625, 0.028284072875976562, 0.0296478271484375, 0.031011581420898438, 0.032375335693359375, 0.03373908996582031, 0.03510284423828125, 0.03646659851074219, 0.037830352783203125, 0.03919410705566406, 0.040557861328125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 28.0, 42.0, 80.0, 159.0, 208.0, 177.0, 135.0, 79.0, 48.0, 18.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.45541250705719, -1.4207514524459839, -1.3860903978347778, -1.3514293432235718, -1.3167684078216553, -1.2821073532104492, -1.2474462985992432, -1.212785243988037, -1.178124189376831, -1.143463134765625, -1.108802080154419, -1.074141025543213, -1.0394799709320068, -1.0048190355300903, -0.9701579809188843, -0.9354969263076782, -0.9008358716964722, -0.8661748170852661, -0.8315137624740601, -0.7968527674674988, -0.7621917128562927, -0.7275306582450867, -0.6928696632385254, -0.6582086086273193, -0.6235475540161133, -0.5888864994049072, -0.5542254447937012, -0.5195644497871399, -0.48490339517593384, -0.4502423405647278, -0.4155813157558441, -0.38092029094696045, -0.3462591767311096, -0.31159812211990356, -0.2769370973110199, -0.24227605760097504, -0.20761501789093018, -0.17295397818088531, -0.13829293847084045, -0.1036318987607956, -0.06897085905075073, -0.03430981934070587, 0.00035122036933898926, 0.03501226007938385, 0.06967329978942871, 0.10433433949947357, 0.13899537920951843, 0.1736564189195633, 0.20831745862960815, 0.24297849833965302, 0.2776395380496979, 0.31230056285858154, 0.3469616174697876, 0.38162267208099365, 0.4162836968898773, 0.450944721698761, 0.48560577630996704, 0.5202668309211731, 0.5549278259277344, 0.5895888805389404, 0.6242499351501465, 0.6589109897613525, 0.6935720443725586, 0.7282330393791199, 0.7628940939903259]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 4.0, 5.0, 12.0, 7.0, 9.0, 18.0, 16.0, 15.0, 21.0, 28.0, 22.0, 26.0, 33.0, 37.0, 43.0, 34.0, 38.0, 38.0, 32.0, 37.0, 47.0, 40.0, 46.0, 39.0, 31.0, 30.0, 37.0, 31.0, 32.0, 25.0, 22.0, 14.0, 15.0, 26.0, 16.0, 15.0, 15.0, 6.0, 7.0, 8.0, 6.0, 5.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0], "bins": [-0.516281008720398, -0.502227783203125, -0.48817455768585205, -0.4741213321685791, -0.46006810665130615, -0.4460148811340332, -0.43196165561676025, -0.4179084002971649, -0.40385517477989197, -0.389801949262619, -0.37574872374534607, -0.3616954982280731, -0.34764227271080017, -0.33358901739120483, -0.3195357918739319, -0.30548256635665894, -0.291429340839386, -0.27737611532211304, -0.2633228898048401, -0.24926966428756714, -0.235216423869133, -0.22116319835186005, -0.2071099728345871, -0.19305673241615295, -0.1790035367012024, -0.16495031118392944, -0.1508970856666565, -0.13684386014938354, -0.1227906197309494, -0.10873739421367645, -0.0946841686964035, -0.08063093572854996, -0.06657770276069641, -0.05252447351813316, -0.038471244275569916, -0.024418018758296967, -0.010364789515733719, 0.003688439726829529, 0.017741665244102478, 0.031794898211956024, 0.04584812372922897, 0.05990135297179222, 0.07395458221435547, 0.08800780773162842, 0.10206103324890137, 0.11611426621675491, 0.13016748428344727, 0.1442207247018814, 0.15827395021915436, 0.1723271757364273, 0.18638040125370026, 0.2004336416721344, 0.21448686718940735, 0.2285400927066803, 0.24259331822395325, 0.2566465437412262, 0.27069976925849915, 0.2847529947757721, 0.29880622029304504, 0.312859445810318, 0.32691267132759094, 0.3409659266471863, 0.35501915216445923, 0.3690723776817322, 0.3831256031990051]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 12.0, 13.0, 31.0, 51.0, 88.0, 162.0, 244.0, 500.0, 876.0, 1651.0, 3106.0, 5664.0, 10591.0, 19699.0, 38737.0, 79944.0, 182147.0, 447510.0, 968942.0, 1191834.0, 708654.0, 295909.0, 122571.0, 55991.0, 28014.0, 14610.0, 7643.0, 4181.0, 2208.0, 1182.0, 639.0, 367.0, 196.0, 115.0, 64.0, 41.0, 33.0, 19.0, 10.0, 3.0, 4.0, 2.0, 6.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.06622314453125, -0.06423234939575195, -0.062241554260253906, -0.06025075912475586, -0.05825996398925781, -0.056269168853759766, -0.05427837371826172, -0.05228757858276367, -0.050296783447265625, -0.04830598831176758, -0.04631519317626953, -0.044324398040771484, -0.04233360290527344, -0.04034280776977539, -0.038352012634277344, -0.0363612174987793, -0.03437042236328125, -0.0323796272277832, -0.030388832092285156, -0.02839803695678711, -0.026407241821289062, -0.024416446685791016, -0.02242565155029297, -0.020434856414794922, -0.018444061279296875, -0.016453266143798828, -0.014462471008300781, -0.012471675872802734, -0.010480880737304688, -0.00849008560180664, -0.006499290466308594, -0.004508495330810547, -0.0025177001953125, -0.0005269050598144531, 0.0014638900756835938, 0.0034546852111816406, 0.0054454803466796875, 0.007436275482177734, 0.009427070617675781, 0.011417865753173828, 0.013408660888671875, 0.015399456024169922, 0.01739025115966797, 0.019381046295166016, 0.021371841430664062, 0.02336263656616211, 0.025353431701660156, 0.027344226837158203, 0.02933502197265625, 0.0313258171081543, 0.033316612243652344, 0.03530740737915039, 0.03729820251464844, 0.039288997650146484, 0.04127979278564453, 0.04327058792114258, 0.045261383056640625, 0.04725217819213867, 0.04924297332763672, 0.051233768463134766, 0.05322456359863281, 0.05521535873413086, 0.057206153869628906, 0.05919694900512695, 0.061187744140625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 7.0, 4.0, 3.0, 5.0, 4.0, 6.0, 9.0, 8.0, 17.0, 14.0, 16.0, 11.0, 22.0, 22.0, 23.0, 31.0, 29.0, 39.0, 34.0, 34.0, 31.0, 34.0, 37.0, 43.0, 53.0, 51.0, 42.0, 36.0, 37.0, 35.0, 38.0, 23.0, 36.0, 23.0, 18.0, 19.0, 16.0, 10.0, 13.0, 14.0, 15.0, 9.0, 10.0, 5.0, 3.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.06463623046875, -0.06268692016601562, -0.06073760986328125, -0.058788299560546875, -0.0568389892578125, -0.054889678955078125, -0.05294036865234375, -0.050991058349609375, -0.049041748046875, -0.047092437744140625, -0.04514312744140625, -0.043193817138671875, -0.0412445068359375, -0.039295196533203125, -0.03734588623046875, -0.035396575927734375, -0.033447265625, -0.031497955322265625, -0.02954864501953125, -0.027599334716796875, -0.0256500244140625, -0.023700714111328125, -0.02175140380859375, -0.019802093505859375, -0.017852783203125, -0.015903472900390625, -0.01395416259765625, -0.012004852294921875, -0.0100555419921875, -0.008106231689453125, -0.00615692138671875, -0.004207611083984375, -0.00225830078125, -0.000308990478515625, 0.00164031982421875, 0.003589630126953125, 0.0055389404296875, 0.007488250732421875, 0.00943756103515625, 0.011386871337890625, 0.013336181640625, 0.015285491943359375, 0.01723480224609375, 0.019184112548828125, 0.0211334228515625, 0.023082733154296875, 0.02503204345703125, 0.026981353759765625, 0.0289306640625, 0.030879974365234375, 0.03282928466796875, 0.034778594970703125, 0.0367279052734375, 0.038677215576171875, 0.04062652587890625, 0.042575836181640625, 0.044525146484375, 0.046474456787109375, 0.04842376708984375, 0.050373077392578125, 0.0523223876953125, 0.054271697998046875, 0.05622100830078125, 0.058170318603515625, 0.06011962890625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 16.0, 22.0, 31.0, 31.0, 66.0, 89.0, 138.0, 222.0, 317.0, 495.0, 848.0, 1539.0, 2971.0, 6687.0, 15964.0, 42078.0, 117197.0, 373415.0, 1570194.0, 1519390.0, 359837.0, 113633.0, 40892.0, 15264.0, 6351.0, 2860.0, 1476.0, 809.0, 491.0, 295.0, 195.0, 143.0, 109.0, 61.0, 41.0, 27.0, 27.0, 17.0, 7.0, 9.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1109619140625, -0.10738086700439453, -0.10379981994628906, -0.1002187728881836, -0.09663772583007812, -0.09305667877197266, -0.08947563171386719, -0.08589458465576172, -0.08231353759765625, -0.07873249053955078, -0.07515144348144531, -0.07157039642333984, -0.06798934936523438, -0.0644083023071289, -0.06082725524902344, -0.05724620819091797, -0.0536651611328125, -0.05008411407470703, -0.04650306701660156, -0.042922019958496094, -0.039340972900390625, -0.035759925842285156, -0.03217887878417969, -0.02859783172607422, -0.02501678466796875, -0.02143573760986328, -0.017854690551757812, -0.014273643493652344, -0.010692596435546875, -0.007111549377441406, -0.0035305023193359375, 5.054473876953125e-05, 0.003631591796875, 0.007212638854980469, 0.010793685913085938, 0.014374732971191406, 0.017955780029296875, 0.021536827087402344, 0.025117874145507812, 0.02869892120361328, 0.03227996826171875, 0.03586101531982422, 0.03944206237792969, 0.043023109436035156, 0.046604156494140625, 0.050185203552246094, 0.05376625061035156, 0.05734729766845703, 0.0609283447265625, 0.06450939178466797, 0.06809043884277344, 0.0716714859008789, 0.07525253295898438, 0.07883358001708984, 0.08241462707519531, 0.08599567413330078, 0.08957672119140625, 0.09315776824951172, 0.09673881530761719, 0.10031986236572266, 0.10390090942382812, 0.1074819564819336, 0.11106300354003906, 0.11464405059814453, 0.11822509765625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 6.0, 15.0, 13.0, 17.0, 30.0, 48.0, 47.0, 53.0, 105.0, 98.0, 158.0, 212.0, 277.0, 410.0, 523.0, 517.0, 387.0, 323.0, 225.0, 144.0, 92.0, 84.0, 72.0, 39.0, 41.0, 30.0, 24.0, 19.0, 14.0, 11.0, 5.0, 5.0, 5.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1416015625, -0.13732337951660156, -0.13304519653320312, -0.1287670135498047, -0.12448883056640625, -0.12021064758300781, -0.11593246459960938, -0.11165428161621094, -0.1073760986328125, -0.10309791564941406, -0.09881973266601562, -0.09454154968261719, -0.09026336669921875, -0.08598518371582031, -0.08170700073242188, -0.07742881774902344, -0.073150634765625, -0.06887245178222656, -0.06459426879882812, -0.06031608581542969, -0.05603790283203125, -0.05175971984863281, -0.047481536865234375, -0.04320335388183594, -0.0389251708984375, -0.03464698791503906, -0.030368804931640625, -0.026090621948242188, -0.02181243896484375, -0.017534255981445312, -0.013256072998046875, -0.008977890014648438, -0.00469970703125, -0.0004215240478515625, 0.003856658935546875, 0.008134841918945312, 0.01241302490234375, 0.016691207885742188, 0.020969390869140625, 0.025247573852539062, 0.0295257568359375, 0.03380393981933594, 0.038082122802734375, 0.04236030578613281, 0.04663848876953125, 0.05091667175292969, 0.055194854736328125, 0.05947303771972656, 0.063751220703125, 0.06802940368652344, 0.07230758666992188, 0.07658576965332031, 0.08086395263671875, 0.08514213562011719, 0.08942031860351562, 0.09369850158691406, 0.0979766845703125, 0.10225486755371094, 0.10653305053710938, 0.11081123352050781, 0.11508941650390625, 0.11936759948730469, 0.12364578247070312, 0.12792396545410156, 0.1322021484375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 15.0, 75.0, 156.0, 297.0, 274.0, 111.0, 44.0, 14.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3617911338806152, -3.291457414627075, -3.221123695373535, -3.150789976119995, -3.080456256866455, -3.010122537612915, -2.939788818359375, -2.869455099105835, -2.799121379852295, -2.728787660598755, -2.658453941345215, -2.588120222091675, -2.5177865028381348, -2.4474527835845947, -2.3771190643310547, -2.3067853450775146, -2.2364516258239746, -2.1661179065704346, -2.0957841873168945, -2.0254504680633545, -1.9551167488098145, -1.8847830295562744, -1.8144493103027344, -1.7441155910491943, -1.6737818717956543, -1.6034481525421143, -1.5331144332885742, -1.4627807140350342, -1.3924469947814941, -1.322113275527954, -1.251779556274414, -1.181445837020874, -1.1111118793487549, -1.0407781600952148, -0.9704444408416748, -0.9001107215881348, -0.8297770023345947, -0.7594432830810547, -0.6891095638275146, -0.6187758445739746, -0.5484421253204346, -0.47810840606689453, -0.4077746868133545, -0.33744096755981445, -0.2671072483062744, -0.19677352905273438, -0.12643980979919434, -0.0561060905456543, 0.014227628707885742, 0.08456134796142578, 0.15489506721496582, 0.22522878646850586, 0.2955625057220459, 0.36589622497558594, 0.436229944229126, 0.506563663482666, 0.576897382736206, 0.6472311019897461, 0.7175648212432861, 0.7878985404968262, 0.8582322597503662, 0.9285659790039062, 0.9988996982574463, 1.0692334175109863, 1.1395671367645264]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 5.0, 12.0, 8.0, 14.0, 15.0, 10.0, 24.0, 29.0, 30.0, 21.0, 34.0, 29.0, 44.0, 43.0, 49.0, 45.0, 46.0, 44.0, 44.0, 44.0, 46.0, 39.0, 45.0, 28.0, 33.0, 33.0, 26.0, 25.0, 16.0, 23.0, 18.0, 16.0, 14.0, 14.0, 7.0, 4.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.43745726346969604, -0.4223458170890808, -0.40723440051078796, -0.3921229839324951, -0.3770115375518799, -0.36190009117126465, -0.3467886745929718, -0.33167725801467896, -0.3165658116340637, -0.3014543652534485, -0.28634294867515564, -0.2712315320968628, -0.25612008571624756, -0.24100865423679352, -0.22589722275733948, -0.21078579127788544, -0.1956743597984314, -0.18056292831897736, -0.16545149683952332, -0.15034006536006927, -0.13522863388061523, -0.1201172024011612, -0.10500577092170715, -0.08989433944225311, -0.07478290796279907, -0.05967147648334503, -0.04456004500389099, -0.02944861352443695, -0.01433718204498291, 0.0007742494344711304, 0.01588568091392517, 0.03099711239337921, 0.04610854387283325, 0.06121997535228729, 0.07633140683174133, 0.09144283831119537, 0.10655426979064941, 0.12166570127010345, 0.1367771327495575, 0.15188856422901154, 0.16699999570846558, 0.18211142718791962, 0.19722285866737366, 0.2123342901468277, 0.22744572162628174, 0.24255715310573578, 0.2576685845851898, 0.27278000116348267, 0.2878914475440979, 0.30300289392471313, 0.318114310503006, 0.33322572708129883, 0.34833717346191406, 0.3634486198425293, 0.37856003642082214, 0.393671452999115, 0.4087828993797302, 0.42389434576034546, 0.4390057623386383, 0.45411717891693115, 0.4692286252975464, 0.4843400716781616, 0.49945148825645447, 0.5145629048347473, 0.5296743512153625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 15.0, 22.0, 38.0, 72.0, 152.0, 303.0, 761.0, 1803.0, 4963.0, 13239.0, 40368.0, 120689.0, 280762.0, 325106.0, 170883.0, 58862.0, 19273.0, 6765.0, 2579.0, 1065.0, 426.0, 209.0, 96.0, 40.0, 25.0, 11.0, 9.0, 2.0, 4.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09881591796875, -0.095428466796875, -0.092041015625, -0.088653564453125, -0.08526611328125, -0.081878662109375, -0.0784912109375, -0.075103759765625, -0.07171630859375, -0.068328857421875, -0.06494140625, -0.061553955078125, -0.05816650390625, -0.054779052734375, -0.0513916015625, -0.048004150390625, -0.04461669921875, -0.041229248046875, -0.037841796875, -0.034454345703125, -0.03106689453125, -0.027679443359375, -0.0242919921875, -0.020904541015625, -0.01751708984375, -0.014129638671875, -0.0107421875, -0.007354736328125, -0.00396728515625, -0.000579833984375, 0.0028076171875, 0.006195068359375, 0.00958251953125, 0.012969970703125, 0.016357421875, 0.019744873046875, 0.02313232421875, 0.026519775390625, 0.0299072265625, 0.033294677734375, 0.03668212890625, 0.040069580078125, 0.04345703125, 0.046844482421875, 0.05023193359375, 0.053619384765625, 0.0570068359375, 0.060394287109375, 0.06378173828125, 0.067169189453125, 0.070556640625, 0.073944091796875, 0.07733154296875, 0.080718994140625, 0.0841064453125, 0.087493896484375, 0.09088134765625, 0.094268798828125, 0.09765625, 0.101043701171875, 0.10443115234375, 0.107818603515625, 0.1112060546875, 0.114593505859375, 0.11798095703125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 5.0, 10.0, 19.0, 19.0, 14.0, 18.0, 20.0, 29.0, 24.0, 30.0, 23.0, 29.0, 38.0, 36.0, 29.0, 51.0, 37.0, 41.0, 42.0, 39.0, 31.0, 40.0, 30.0, 33.0, 31.0, 37.0, 27.0, 23.0, 34.0, 21.0, 12.0, 21.0, 16.0, 14.0, 11.0, 11.0, 7.0, 5.0, 8.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061370849609375, -0.05946063995361328, -0.05755043029785156, -0.055640220642089844, -0.053730010986328125, -0.051819801330566406, -0.04990959167480469, -0.04799938201904297, -0.04608917236328125, -0.04417896270751953, -0.04226875305175781, -0.040358543395996094, -0.038448333740234375, -0.036538124084472656, -0.03462791442871094, -0.03271770477294922, -0.0308074951171875, -0.02889728546142578, -0.026987075805664062, -0.025076866149902344, -0.023166656494140625, -0.021256446838378906, -0.019346237182617188, -0.01743602752685547, -0.01552581787109375, -0.013615608215332031, -0.011705398559570312, -0.009795188903808594, -0.007884979248046875, -0.005974769592285156, -0.0040645599365234375, -0.0021543502807617188, -0.000244140625, 0.0016660690307617188, 0.0035762786865234375, 0.005486488342285156, 0.007396697998046875, 0.009306907653808594, 0.011217117309570312, 0.013127326965332031, 0.01503753662109375, 0.01694774627685547, 0.018857955932617188, 0.020768165588378906, 0.022678375244140625, 0.024588584899902344, 0.026498794555664062, 0.02840900421142578, 0.0303192138671875, 0.03222942352294922, 0.03413963317871094, 0.036049842834472656, 0.037960052490234375, 0.039870262145996094, 0.04178047180175781, 0.04369068145751953, 0.04560089111328125, 0.04751110076904297, 0.04942131042480469, 0.051331520080566406, 0.053241729736328125, 0.055151939392089844, 0.05706214904785156, 0.05897235870361328, 0.060882568359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 6.0, 4.0, 6.0, 12.0, 7.0, 16.0, 28.0, 39.0, 59.0, 100.0, 180.0, 310.0, 620.0, 1474.0, 3523.0, 9792.0, 32014.0, 116894.0, 350410.0, 359764.0, 123045.0, 33333.0, 10305.0, 3745.0, 1476.0, 628.0, 304.0, 181.0, 99.0, 64.0, 40.0, 15.0, 12.0, 11.0, 13.0, 11.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.13134765625, -0.12697219848632812, -0.12259674072265625, -0.11822128295898438, -0.1138458251953125, -0.10947036743164062, -0.10509490966796875, -0.10071945190429688, -0.096343994140625, -0.09196853637695312, -0.08759307861328125, -0.08321762084960938, -0.0788421630859375, -0.07446670532226562, -0.07009124755859375, -0.06571578979492188, -0.06134033203125, -0.056964874267578125, -0.05258941650390625, -0.048213958740234375, -0.0438385009765625, -0.039463043212890625, -0.03508758544921875, -0.030712127685546875, -0.026336669921875, -0.021961212158203125, -0.01758575439453125, -0.013210296630859375, -0.0088348388671875, -0.004459381103515625, -8.392333984375e-05, 0.004291534423828125, 0.0086669921875, 0.013042449951171875, 0.01741790771484375, 0.021793365478515625, 0.0261688232421875, 0.030544281005859375, 0.03491973876953125, 0.039295196533203125, 0.043670654296875, 0.048046112060546875, 0.05242156982421875, 0.056797027587890625, 0.0611724853515625, 0.06554794311523438, 0.06992340087890625, 0.07429885864257812, 0.07867431640625, 0.08304977416992188, 0.08742523193359375, 0.09180068969726562, 0.0961761474609375, 0.10055160522460938, 0.10492706298828125, 0.10930252075195312, 0.113677978515625, 0.11805343627929688, 0.12242889404296875, 0.12680435180664062, 0.1311798095703125, 0.13555526733398438, 0.13993072509765625, 0.14430618286132812, 0.148681640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 5.0, 6.0, 12.0, 16.0, 12.0, 9.0, 16.0, 20.0, 12.0, 25.0, 33.0, 32.0, 33.0, 30.0, 47.0, 34.0, 40.0, 47.0, 38.0, 55.0, 59.0, 49.0, 49.0, 44.0, 33.0, 37.0, 28.0, 28.0, 33.0, 23.0, 15.0, 15.0, 14.0, 10.0, 15.0, 5.0, 3.0, 2.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.2204437255859375, -0.213714599609375, -0.2069854736328125, -0.20025634765625, -0.1935272216796875, -0.186798095703125, -0.1800689697265625, -0.17333984375, -0.1666107177734375, -0.159881591796875, -0.1531524658203125, -0.14642333984375, -0.1396942138671875, -0.132965087890625, -0.1262359619140625, -0.1195068359375, -0.1127777099609375, -0.106048583984375, -0.0993194580078125, -0.09259033203125, -0.0858612060546875, -0.079132080078125, -0.0724029541015625, -0.065673828125, -0.0589447021484375, -0.052215576171875, -0.0454864501953125, -0.03875732421875, -0.0320281982421875, -0.025299072265625, -0.0185699462890625, -0.0118408203125, -0.0051116943359375, 0.001617431640625, 0.0083465576171875, 0.01507568359375, 0.0218048095703125, 0.028533935546875, 0.0352630615234375, 0.0419921875, 0.0487213134765625, 0.055450439453125, 0.0621795654296875, 0.06890869140625, 0.0756378173828125, 0.082366943359375, 0.0890960693359375, 0.0958251953125, 0.1025543212890625, 0.109283447265625, 0.1160125732421875, 0.12274169921875, 0.1294708251953125, 0.136199951171875, 0.1429290771484375, 0.149658203125, 0.1563873291015625, 0.163116455078125, 0.1698455810546875, 0.17657470703125, 0.1833038330078125, 0.190032958984375, 0.1967620849609375, 0.2034912109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 13.0, 8.0, 21.0, 28.0, 58.0, 85.0, 122.0, 229.0, 452.0, 750.0, 1346.0, 2403.0, 4616.0, 9050.0, 19051.0, 40490.0, 90230.0, 184651.0, 266941.0, 217008.0, 113153.0, 50991.0, 23342.0, 11177.0, 5600.0, 2967.0, 1702.0, 872.0, 495.0, 286.0, 161.0, 92.0, 58.0, 40.0, 13.0, 17.0, 7.0, 9.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0416259765625, -0.04045820236206055, -0.039290428161621094, -0.03812265396118164, -0.03695487976074219, -0.035787105560302734, -0.03461933135986328, -0.03345155715942383, -0.032283782958984375, -0.031116008758544922, -0.02994823455810547, -0.028780460357666016, -0.027612686157226562, -0.02644491195678711, -0.025277137756347656, -0.024109363555908203, -0.02294158935546875, -0.021773815155029297, -0.020606040954589844, -0.01943826675415039, -0.018270492553710938, -0.017102718353271484, -0.01593494415283203, -0.014767169952392578, -0.013599395751953125, -0.012431621551513672, -0.011263847351074219, -0.010096073150634766, -0.008928298950195312, -0.007760524749755859, -0.006592750549316406, -0.005424976348876953, -0.0042572021484375, -0.003089427947998047, -0.0019216537475585938, -0.0007538795471191406, 0.0004138946533203125, 0.0015816688537597656, 0.0027494430541992188, 0.003917217254638672, 0.005084991455078125, 0.006252765655517578, 0.007420539855957031, 0.008588314056396484, 0.009756088256835938, 0.01092386245727539, 0.012091636657714844, 0.013259410858154297, 0.01442718505859375, 0.015594959259033203, 0.016762733459472656, 0.01793050765991211, 0.019098281860351562, 0.020266056060791016, 0.02143383026123047, 0.022601604461669922, 0.023769378662109375, 0.024937152862548828, 0.02610492706298828, 0.027272701263427734, 0.028440475463867188, 0.02960824966430664, 0.030776023864746094, 0.03194379806518555, 0.033111572265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 13.0, 14.0, 12.0, 18.0, 20.0, 19.0, 45.0, 44.0, 47.0, 48.0, 49.0, 62.0, 74.0, 69.0, 69.0, 57.0, 51.0, 42.0, 31.0, 52.0, 24.0, 24.0, 22.0, 19.0, 15.0, 6.0, 7.0, 12.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.2993812561035156e-05, -1.2588687241077423e-05, -1.218356192111969e-05, -1.1778436601161957e-05, -1.1373311281204224e-05, -1.096818596124649e-05, -1.0563060641288757e-05, -1.0157935321331024e-05, -9.752810001373291e-06, -9.347684681415558e-06, -8.942559361457825e-06, -8.537434041500092e-06, -8.132308721542358e-06, -7.727183401584625e-06, -7.322058081626892e-06, -6.916932761669159e-06, -6.511807441711426e-06, -6.106682121753693e-06, -5.7015568017959595e-06, -5.296431481838226e-06, -4.891306161880493e-06, -4.48618084192276e-06, -4.081055521965027e-06, -3.6759302020072937e-06, -3.2708048820495605e-06, -2.8656795620918274e-06, -2.4605542421340942e-06, -2.055428922176361e-06, -1.650303602218628e-06, -1.2451782822608948e-06, -8.400529623031616e-07, -4.3492764234542847e-07, -2.9802322387695312e-08, 3.7532299757003784e-07, 7.80448317527771e-07, 1.1855736374855042e-06, 1.5906989574432373e-06, 1.9958242774009705e-06, 2.4009495973587036e-06, 2.8060749173164368e-06, 3.21120023727417e-06, 3.616325557231903e-06, 4.021450877189636e-06, 4.426576197147369e-06, 4.8317015171051025e-06, 5.236826837062836e-06, 5.641952157020569e-06, 6.047077476978302e-06, 6.452202796936035e-06, 6.857328116893768e-06, 7.2624534368515015e-06, 7.667578756809235e-06, 8.072704076766968e-06, 8.477829396724701e-06, 8.882954716682434e-06, 9.288080036640167e-06, 9.6932053565979e-06, 1.0098330676555634e-05, 1.0503455996513367e-05, 1.09085813164711e-05, 1.1313706636428833e-05, 1.1718831956386566e-05, 1.21239572763443e-05, 1.2529082596302032e-05, 1.2934207916259766e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 2.0, 5.0, 12.0, 12.0, 11.0, 19.0, 27.0, 39.0, 65.0, 100.0, 123.0, 232.0, 437.0, 823.0, 1611.0, 3301.0, 7370.0, 16391.0, 35982.0, 77572.0, 155302.0, 243021.0, 234690.0, 141499.0, 70231.0, 32109.0, 14551.0, 6612.0, 3140.0, 1464.0, 785.0, 379.0, 222.0, 133.0, 90.0, 57.0, 43.0, 29.0, 21.0, 18.0, 11.0, 3.0, 1.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.042388916015625, -0.04120922088623047, -0.04002952575683594, -0.038849830627441406, -0.037670135498046875, -0.036490440368652344, -0.03531074523925781, -0.03413105010986328, -0.03295135498046875, -0.03177165985107422, -0.030591964721679688, -0.029412269592285156, -0.028232574462890625, -0.027052879333496094, -0.025873184204101562, -0.02469348907470703, -0.0235137939453125, -0.02233409881591797, -0.021154403686523438, -0.019974708557128906, -0.018795013427734375, -0.017615318298339844, -0.016435623168945312, -0.015255928039550781, -0.01407623291015625, -0.012896537780761719, -0.011716842651367188, -0.010537147521972656, -0.009357452392578125, -0.008177757263183594, -0.0069980621337890625, -0.005818367004394531, -0.004638671875, -0.0034589767456054688, -0.0022792816162109375, -0.0010995864868164062, 8.0108642578125e-05, 0.0012598037719726562, 0.0024394989013671875, 0.0036191940307617188, 0.00479888916015625, 0.005978584289550781, 0.0071582794189453125, 0.008337974548339844, 0.009517669677734375, 0.010697364807128906, 0.011877059936523438, 0.013056755065917969, 0.0142364501953125, 0.015416145324707031, 0.016595840454101562, 0.017775535583496094, 0.018955230712890625, 0.020134925842285156, 0.021314620971679688, 0.02249431610107422, 0.02367401123046875, 0.02485370635986328, 0.026033401489257812, 0.027213096618652344, 0.028392791748046875, 0.029572486877441406, 0.030752182006835938, 0.03193187713623047, 0.033111572265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 9.0, 10.0, 15.0, 28.0, 22.0, 40.0, 48.0, 50.0, 65.0, 74.0, 78.0, 84.0, 91.0, 62.0, 66.0, 58.0, 46.0, 33.0, 43.0, 17.0, 17.0, 16.0, 8.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.074951171875, -0.07318258285522461, -0.07141399383544922, -0.06964540481567383, -0.06787681579589844, -0.06610822677612305, -0.06433963775634766, -0.06257104873657227, -0.060802459716796875, -0.059033870697021484, -0.057265281677246094, -0.0554966926574707, -0.05372810363769531, -0.05195951461791992, -0.05019092559814453, -0.04842233657836914, -0.04665374755859375, -0.04488515853881836, -0.04311656951904297, -0.04134798049926758, -0.03957939147949219, -0.0378108024597168, -0.036042213439941406, -0.034273624420166016, -0.032505035400390625, -0.030736446380615234, -0.028967857360839844, -0.027199268341064453, -0.025430679321289062, -0.023662090301513672, -0.02189350128173828, -0.02012491226196289, -0.0183563232421875, -0.01658773422241211, -0.014819145202636719, -0.013050556182861328, -0.011281967163085938, -0.009513378143310547, -0.007744789123535156, -0.005976200103759766, -0.004207611083984375, -0.0024390220642089844, -0.0006704330444335938, 0.0010981559753417969, 0.0028667449951171875, 0.004635334014892578, 0.006403923034667969, 0.00817251205444336, 0.00994110107421875, 0.01170969009399414, 0.013478279113769531, 0.015246868133544922, 0.017015457153320312, 0.018784046173095703, 0.020552635192871094, 0.022321224212646484, 0.024089813232421875, 0.025858402252197266, 0.027626991271972656, 0.029395580291748047, 0.031164169311523438, 0.03293275833129883, 0.03470134735107422, 0.03646993637084961, 0.038238525390625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 7.0, 20.0, 65.0, 261.0, 354.0, 197.0, 65.0, 19.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4630708694458008, -1.4112446308135986, -1.359418272972107, -1.3075919151306152, -1.255765676498413, -1.203939437866211, -1.1521130800247192, -1.1002867221832275, -1.0484604835510254, -0.9966341853141785, -0.9448078870773315, -0.8929815888404846, -0.8411552906036377, -0.7893289923667908, -0.7375026941299438, -0.6856763958930969, -0.63385009765625, -0.5820237994194031, -0.5301975011825562, -0.47837120294570923, -0.4265449047088623, -0.3747186064720154, -0.32289230823516846, -0.27106600999832153, -0.2192397117614746, -0.16741341352462769, -0.11558711528778076, -0.06376081705093384, -0.011934518814086914, 0.03989177942276001, 0.09171807765960693, 0.14354437589645386, 0.19537067413330078, 0.2471969723701477, 0.29902327060699463, 0.35084956884384155, 0.4026758670806885, 0.4545021653175354, 0.5063284635543823, 0.5581547617912292, 0.6099810600280762, 0.6618073582649231, 0.71363365650177, 0.7654599547386169, 0.8172862529754639, 0.8691125512123108, 0.9209388494491577, 0.9727651476860046, 1.0245914459228516, 1.0764176845550537, 1.1282440423965454, 1.180070400238037, 1.2318966388702393, 1.2837228775024414, 1.335549235343933, 1.3873755931854248, 1.439201831817627, 1.491028070449829, 1.5428544282913208, 1.5946807861328125, 1.6465070247650146, 1.6983332633972168, 1.7501596212387085, 1.8019859790802002, 1.8538122177124023]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 3.0, 8.0, 13.0, 9.0, 15.0, 15.0, 22.0, 23.0, 28.0, 31.0, 25.0, 33.0, 37.0, 35.0, 37.0, 38.0, 42.0, 47.0, 39.0, 32.0, 50.0, 40.0, 32.0, 38.0, 38.0, 31.0, 33.0, 30.0, 38.0, 29.0, 17.0, 16.0, 11.0, 9.0, 7.0, 7.0, 3.0, 8.0, 5.0, 6.0, 3.0, 0.0, 8.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.526828944683075, -0.510692834854126, -0.494556725025177, -0.478420615196228, -0.46228450536727905, -0.4461483955383301, -0.4300122857093811, -0.41387617588043213, -0.39774006605148315, -0.3816039562225342, -0.3654678463935852, -0.34933173656463623, -0.33319562673568726, -0.3170595169067383, -0.3009234070777893, -0.28478729724884033, -0.26865118741989136, -0.2525150775909424, -0.2363789677619934, -0.22024285793304443, -0.20410674810409546, -0.18797063827514648, -0.1718345284461975, -0.15569841861724854, -0.13956230878829956, -0.12342619895935059, -0.10729008913040161, -0.09115397930145264, -0.07501786947250366, -0.05888175964355469, -0.04274564981460571, -0.02660953998565674, -0.010473489761352539, 0.0056626200675964355, 0.02179872989654541, 0.037934839725494385, 0.05407094955444336, 0.07020705938339233, 0.08634316921234131, 0.10247927904129028, 0.11861538887023926, 0.13475149869918823, 0.1508876085281372, 0.16702371835708618, 0.18315982818603516, 0.19929593801498413, 0.2154320478439331, 0.23156815767288208, 0.24770426750183105, 0.26384037733078003, 0.279976487159729, 0.296112596988678, 0.31224870681762695, 0.3283848166465759, 0.3445209264755249, 0.3606570363044739, 0.37679314613342285, 0.3929292559623718, 0.4090653657913208, 0.4252014756202698, 0.44133758544921875, 0.4574736952781677, 0.4736098051071167, 0.4897459149360657, 0.5058820247650146]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 9.0, 4.0, 3.0, 10.0, 18.0, 21.0, 24.0, 30.0, 56.0, 74.0, 107.0, 197.0, 344.0, 675.0, 1326.0, 2766.0, 6573.0, 16170.0, 42554.0, 129119.0, 408932.0, 1074726.0, 1438208.0, 718799.0, 235044.0, 73527.0, 25957.0, 10413.0, 4282.0, 2010.0, 999.0, 501.0, 276.0, 188.0, 112.0, 70.0, 47.0, 26.0, 23.0, 18.0, 15.0, 15.0, 9.0, 8.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.085693359375, -0.08326339721679688, -0.08083343505859375, -0.07840347290039062, -0.0759735107421875, -0.07354354858398438, -0.07111358642578125, -0.06868362426757812, -0.066253662109375, -0.06382369995117188, -0.06139373779296875, -0.058963775634765625, -0.0565338134765625, -0.054103851318359375, -0.05167388916015625, -0.049243927001953125, -0.04681396484375, -0.044384002685546875, -0.04195404052734375, -0.039524078369140625, -0.0370941162109375, -0.034664154052734375, -0.03223419189453125, -0.029804229736328125, -0.027374267578125, -0.024944305419921875, -0.02251434326171875, -0.020084381103515625, -0.0176544189453125, -0.015224456787109375, -0.01279449462890625, -0.010364532470703125, -0.0079345703125, -0.005504608154296875, -0.00307464599609375, -0.000644683837890625, 0.0017852783203125, 0.004215240478515625, 0.00664520263671875, 0.009075164794921875, 0.011505126953125, 0.013935089111328125, 0.01636505126953125, 0.018795013427734375, 0.0212249755859375, 0.023654937744140625, 0.02608489990234375, 0.028514862060546875, 0.03094482421875, 0.033374786376953125, 0.03580474853515625, 0.038234710693359375, 0.0406646728515625, 0.043094635009765625, 0.04552459716796875, 0.047954559326171875, 0.050384521484375, 0.052814483642578125, 0.05524444580078125, 0.057674407958984375, 0.0601043701171875, 0.06253433227539062, 0.06496429443359375, 0.06739425659179688, 0.06982421875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 8.0, 3.0, 8.0, 6.0, 12.0, 19.0, 11.0, 13.0, 18.0, 8.0, 24.0, 25.0, 28.0, 27.0, 37.0, 39.0, 40.0, 44.0, 48.0, 34.0, 39.0, 41.0, 37.0, 45.0, 35.0, 33.0, 31.0, 37.0, 34.0, 37.0, 20.0, 15.0, 15.0, 21.0, 18.0, 16.0, 7.0, 17.0, 12.0, 8.0, 8.0, 8.0, 6.0, 4.0, 0.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.07281494140625, -0.07056522369384766, -0.06831550598144531, -0.06606578826904297, -0.06381607055664062, -0.06156635284423828, -0.05931663513183594, -0.057066917419433594, -0.05481719970703125, -0.052567481994628906, -0.05031776428222656, -0.04806804656982422, -0.045818328857421875, -0.04356861114501953, -0.04131889343261719, -0.039069175720214844, -0.0368194580078125, -0.034569740295410156, -0.03232002258300781, -0.03007030487060547, -0.027820587158203125, -0.02557086944580078, -0.023321151733398438, -0.021071434020996094, -0.01882171630859375, -0.016571998596191406, -0.014322280883789062, -0.012072563171386719, -0.009822845458984375, -0.007573127746582031, -0.0053234100341796875, -0.0030736923217773438, -0.000823974609375, 0.0014257431030273438, 0.0036754608154296875, 0.005925178527832031, 0.008174896240234375, 0.010424613952636719, 0.012674331665039062, 0.014924049377441406, 0.01717376708984375, 0.019423484802246094, 0.021673202514648438, 0.02392292022705078, 0.026172637939453125, 0.02842235565185547, 0.030672073364257812, 0.032921791076660156, 0.0351715087890625, 0.037421226501464844, 0.03967094421386719, 0.04192066192626953, 0.044170379638671875, 0.04642009735107422, 0.04866981506347656, 0.050919532775878906, 0.05316925048828125, 0.055418968200683594, 0.05766868591308594, 0.05991840362548828, 0.062168121337890625, 0.06441783905029297, 0.06666755676269531, 0.06891727447509766, 0.0711669921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 12.0, 15.0, 23.0, 38.0, 72.0, 140.0, 209.0, 458.0, 889.0, 2276.0, 6793.0, 26063.0, 123595.0, 923294.0, 2633868.0, 388153.0, 65760.0, 15101.0, 4476.0, 1601.0, 689.0, 314.0, 187.0, 101.0, 49.0, 30.0, 17.0, 19.0, 12.0, 10.0, 1.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1795654296875, -0.1746196746826172, -0.16967391967773438, -0.16472816467285156, -0.15978240966796875, -0.15483665466308594, -0.14989089965820312, -0.1449451446533203, -0.1399993896484375, -0.1350536346435547, -0.13010787963867188, -0.12516212463378906, -0.12021636962890625, -0.11527061462402344, -0.11032485961914062, -0.10537910461425781, -0.100433349609375, -0.09548759460449219, -0.09054183959960938, -0.08559608459472656, -0.08065032958984375, -0.07570457458496094, -0.07075881958007812, -0.06581306457519531, -0.0608673095703125, -0.05592155456542969, -0.050975799560546875, -0.04603004455566406, -0.04108428955078125, -0.03613853454589844, -0.031192779541015625, -0.026247024536132812, -0.02130126953125, -0.016355514526367188, -0.011409759521484375, -0.0064640045166015625, -0.00151824951171875, 0.0034275054931640625, 0.008373260498046875, 0.013319015502929688, 0.0182647705078125, 0.023210525512695312, 0.028156280517578125, 0.03310203552246094, 0.03804779052734375, 0.04299354553222656, 0.047939300537109375, 0.05288505554199219, 0.057830810546875, 0.06277656555175781, 0.06772232055664062, 0.07266807556152344, 0.07761383056640625, 0.08255958557128906, 0.08750534057617188, 0.09245109558105469, 0.0973968505859375, 0.10234260559082031, 0.10728836059570312, 0.11223411560058594, 0.11717987060546875, 0.12212562561035156, 0.12707138061523438, 0.1320171356201172, 0.136962890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 11.0, 14.0, 22.0, 23.0, 18.0, 31.0, 38.0, 52.0, 83.0, 110.0, 161.0, 239.0, 365.0, 408.0, 531.0, 527.0, 404.0, 300.0, 193.0, 126.0, 101.0, 73.0, 53.0, 37.0, 35.0, 27.0, 21.0, 11.0, 13.0, 3.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09765625, -0.093719482421875, -0.08978271484375, -0.085845947265625, -0.0819091796875, -0.077972412109375, -0.07403564453125, -0.070098876953125, -0.066162109375, -0.062225341796875, -0.05828857421875, -0.054351806640625, -0.0504150390625, -0.046478271484375, -0.04254150390625, -0.038604736328125, -0.03466796875, -0.030731201171875, -0.02679443359375, -0.022857666015625, -0.0189208984375, -0.014984130859375, -0.01104736328125, -0.007110595703125, -0.003173828125, 0.000762939453125, 0.00469970703125, 0.008636474609375, 0.0125732421875, 0.016510009765625, 0.02044677734375, 0.024383544921875, 0.0283203125, 0.032257080078125, 0.03619384765625, 0.040130615234375, 0.0440673828125, 0.048004150390625, 0.05194091796875, 0.055877685546875, 0.059814453125, 0.063751220703125, 0.06768798828125, 0.071624755859375, 0.0755615234375, 0.079498291015625, 0.08343505859375, 0.087371826171875, 0.09130859375, 0.095245361328125, 0.09918212890625, 0.103118896484375, 0.1070556640625, 0.110992431640625, 0.11492919921875, 0.118865966796875, 0.122802734375, 0.126739501953125, 0.13067626953125, 0.134613037109375, 0.1385498046875, 0.142486572265625, 0.14642333984375, 0.150360107421875, 0.154296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 14.0, 20.0, 38.0, 78.0, 92.0, 116.0, 152.0, 126.0, 114.0, 84.0, 65.0, 39.0, 16.0, 14.0, 9.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.0181869268417358, -0.9925392866134644, -0.9668917059898376, -0.9412440657615662, -0.9155964851379395, -0.889948844909668, -0.8643012046813965, -0.8386536240577698, -0.8130060434341431, -0.7873584032058716, -0.7617108225822449, -0.7360631823539734, -0.7104156017303467, -0.6847679615020752, -0.6591203212738037, -0.633472740650177, -0.6078251004219055, -0.582177460193634, -0.5565298795700073, -0.5308822393417358, -0.5052346587181091, -0.47958701848983765, -0.45393940806388855, -0.42829179763793945, -0.40264418721199036, -0.37699657678604126, -0.35134896636009216, -0.32570135593414307, -0.3000537157058716, -0.2744061350822449, -0.2487584948539734, -0.2231108844280243, -0.1974632740020752, -0.1718156635761261, -0.146168053150177, -0.12052042782306671, -0.09487281739711761, -0.06922520697116852, -0.04357758164405823, -0.01792997121810913, 0.007717639207839966, 0.03336525335907936, 0.059012867510318756, 0.08466048538684845, 0.11030809581279755, 0.13595570623874664, 0.16160333156585693, 0.18725094199180603, 0.21289855241775513, 0.23854616284370422, 0.2641937732696533, 0.2898414134979248, 0.3154889941215515, 0.341136634349823, 0.3667842447757721, 0.3924318552017212, 0.4180794656276703, 0.4437270760536194, 0.4693746864795685, 0.4950222969055176, 0.5206699371337891, 0.5463175177574158, 0.5719651579856873, 0.597612738609314, 0.6232603788375854]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 7.0, 7.0, 3.0, 9.0, 16.0, 15.0, 19.0, 18.0, 28.0, 25.0, 35.0, 25.0, 40.0, 40.0, 43.0, 66.0, 55.0, 47.0, 46.0, 43.0, 41.0, 41.0, 54.0, 38.0, 41.0, 32.0, 24.0, 32.0, 31.0, 18.0, 12.0, 12.0, 17.0, 6.0, 3.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5241436958312988, -0.5090140700340271, -0.49388444423675537, -0.47875481843948364, -0.4636251926422119, -0.4484955668449402, -0.43336591124534607, -0.41823628544807434, -0.4031066596508026, -0.3879770338535309, -0.37284740805625916, -0.3577177822589874, -0.3425881266593933, -0.3274585008621216, -0.31232887506484985, -0.2971992492675781, -0.2820696234703064, -0.26693999767303467, -0.25181037187576294, -0.23668073117733002, -0.2215511053800583, -0.20642147958278656, -0.19129183888435364, -0.1761622130870819, -0.16103258728981018, -0.14590296149253845, -0.13077333569526672, -0.1156436949968338, -0.10051406919956207, -0.08538444340229034, -0.07025481015443802, -0.05512517690658569, -0.039995551109313965, -0.024865921586751938, -0.009736292064189911, 0.005393337458372116, 0.020522966980934143, 0.03565259277820587, 0.0507822260260582, 0.06591185927391052, 0.08104148507118225, 0.09617111086845398, 0.1113007441163063, 0.12643037736415863, 0.14156000316143036, 0.1566896289587021, 0.171819269657135, 0.18694889545440674, 0.20207852125167847, 0.2172081470489502, 0.23233777284622192, 0.24746741354465485, 0.2625970244407654, 0.2777266502380371, 0.2928563058376312, 0.30798593163490295, 0.3231155574321747, 0.3382451832294464, 0.35337480902671814, 0.36850443482398987, 0.383634090423584, 0.3987637162208557, 0.41389334201812744, 0.42902296781539917, 0.4441525936126709]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 11.0, 13.0, 31.0, 44.0, 69.0, 136.0, 260.0, 561.0, 1209.0, 3088.0, 8227.0, 23399.0, 85583.0, 346571.0, 415748.0, 117054.0, 29958.0, 10119.0, 3811.0, 1454.0, 562.0, 291.0, 158.0, 75.0, 50.0, 29.0, 14.0, 14.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15087890625, -0.14569473266601562, -0.14051055908203125, -0.13532638549804688, -0.1301422119140625, -0.12495803833007812, -0.11977386474609375, -0.11458969116210938, -0.109405517578125, -0.10422134399414062, -0.09903717041015625, -0.09385299682617188, -0.0886688232421875, -0.08348464965820312, -0.07830047607421875, -0.07311630249023438, -0.06793212890625, -0.06274795532226562, -0.05756378173828125, -0.052379608154296875, -0.0471954345703125, -0.042011260986328125, -0.03682708740234375, -0.031642913818359375, -0.026458740234375, -0.021274566650390625, -0.01609039306640625, -0.010906219482421875, -0.0057220458984375, -0.000537872314453125, 0.00464630126953125, 0.009830474853515625, 0.0150146484375, 0.020198822021484375, 0.02538299560546875, 0.030567169189453125, 0.0357513427734375, 0.040935516357421875, 0.04611968994140625, 0.051303863525390625, 0.056488037109375, 0.061672210693359375, 0.06685638427734375, 0.07204055786132812, 0.0772247314453125, 0.08240890502929688, 0.08759307861328125, 0.09277725219726562, 0.09796142578125, 0.10314559936523438, 0.10832977294921875, 0.11351394653320312, 0.1186981201171875, 0.12388229370117188, 0.12906646728515625, 0.13425064086914062, 0.139434814453125, 0.14461898803710938, 0.14980316162109375, 0.15498733520507812, 0.1601715087890625, 0.16535568237304688, 0.17053985595703125, 0.17572402954101562, 0.180908203125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 3.0, 4.0, 10.0, 17.0, 8.0, 9.0, 16.0, 17.0, 15.0, 21.0, 27.0, 28.0, 26.0, 26.0, 36.0, 29.0, 37.0, 29.0, 40.0, 43.0, 45.0, 38.0, 39.0, 38.0, 50.0, 38.0, 37.0, 38.0, 29.0, 27.0, 35.0, 13.0, 21.0, 13.0, 18.0, 13.0, 8.0, 11.0, 9.0, 7.0, 9.0, 2.0, 8.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07025146484375, -0.06804466247558594, -0.06583786010742188, -0.06363105773925781, -0.06142425537109375, -0.05921745300292969, -0.057010650634765625, -0.05480384826660156, -0.0525970458984375, -0.05039024353027344, -0.048183441162109375, -0.04597663879394531, -0.04376983642578125, -0.04156303405761719, -0.039356231689453125, -0.03714942932128906, -0.034942626953125, -0.03273582458496094, -0.030529022216796875, -0.028322219848632812, -0.02611541748046875, -0.023908615112304688, -0.021701812744140625, -0.019495010375976562, -0.0172882080078125, -0.015081405639648438, -0.012874603271484375, -0.010667800903320312, -0.00846099853515625, -0.0062541961669921875, -0.004047393798828125, -0.0018405914306640625, 0.0003662109375, 0.0025730133056640625, 0.004779815673828125, 0.0069866180419921875, 0.00919342041015625, 0.011400222778320312, 0.013607025146484375, 0.015813827514648438, 0.0180206298828125, 0.020227432250976562, 0.022434234619140625, 0.024641036987304688, 0.02684783935546875, 0.029054641723632812, 0.031261444091796875, 0.03346824645996094, 0.035675048828125, 0.03788185119628906, 0.040088653564453125, 0.04229545593261719, 0.04450225830078125, 0.04670906066894531, 0.048915863037109375, 0.05112266540527344, 0.0533294677734375, 0.05553627014160156, 0.057743072509765625, 0.05994987487792969, 0.06215667724609375, 0.06436347961425781, 0.06657028198242188, 0.06877708435058594, 0.07098388671875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 12.0, 13.0, 16.0, 27.0, 35.0, 53.0, 110.0, 132.0, 247.0, 442.0, 783.0, 1503.0, 3004.0, 5923.0, 12502.0, 29141.0, 84162.0, 263428.0, 389729.0, 166566.0, 52456.0, 19851.0, 9011.0, 4497.0, 2216.0, 1156.0, 639.0, 293.0, 239.0, 117.0, 72.0, 51.0, 40.0, 26.0, 18.0, 12.0, 3.0, 3.0, 2.0, 4.0, 1.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.124786376953125, -0.12066650390625, -0.116546630859375, -0.1124267578125, -0.108306884765625, -0.10418701171875, -0.100067138671875, -0.095947265625, -0.091827392578125, -0.08770751953125, -0.083587646484375, -0.0794677734375, -0.075347900390625, -0.07122802734375, -0.067108154296875, -0.06298828125, -0.058868408203125, -0.05474853515625, -0.050628662109375, -0.0465087890625, -0.042388916015625, -0.03826904296875, -0.034149169921875, -0.030029296875, -0.025909423828125, -0.02178955078125, -0.017669677734375, -0.0135498046875, -0.009429931640625, -0.00531005859375, -0.001190185546875, 0.0029296875, 0.007049560546875, 0.01116943359375, 0.015289306640625, 0.0194091796875, 0.023529052734375, 0.02764892578125, 0.031768798828125, 0.035888671875, 0.040008544921875, 0.04412841796875, 0.048248291015625, 0.0523681640625, 0.056488037109375, 0.06060791015625, 0.064727783203125, 0.06884765625, 0.072967529296875, 0.07708740234375, 0.081207275390625, 0.0853271484375, 0.089447021484375, 0.09356689453125, 0.097686767578125, 0.101806640625, 0.105926513671875, 0.11004638671875, 0.114166259765625, 0.1182861328125, 0.122406005859375, 0.12652587890625, 0.130645751953125, 0.134765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 10.0, 9.0, 12.0, 11.0, 16.0, 21.0, 26.0, 29.0, 38.0, 35.0, 49.0, 37.0, 43.0, 50.0, 59.0, 59.0, 46.0, 54.0, 41.0, 44.0, 41.0, 38.0, 29.0, 37.0, 30.0, 21.0, 21.0, 14.0, 16.0, 19.0, 14.0, 5.0, 7.0, 8.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.224609375, -0.21668243408203125, -0.2087554931640625, -0.20082855224609375, -0.192901611328125, -0.18497467041015625, -0.1770477294921875, -0.16912078857421875, -0.16119384765625, -0.15326690673828125, -0.1453399658203125, -0.13741302490234375, -0.129486083984375, -0.12155914306640625, -0.1136322021484375, -0.10570526123046875, -0.0977783203125, -0.08985137939453125, -0.0819244384765625, -0.07399749755859375, -0.066070556640625, -0.05814361572265625, -0.0502166748046875, -0.04228973388671875, -0.03436279296875, -0.02643585205078125, -0.0185089111328125, -0.01058197021484375, -0.002655029296875, 0.00527191162109375, 0.0131988525390625, 0.02112579345703125, 0.029052734375, 0.03697967529296875, 0.0449066162109375, 0.05283355712890625, 0.060760498046875, 0.06868743896484375, 0.0766143798828125, 0.08454132080078125, 0.09246826171875, 0.10039520263671875, 0.1083221435546875, 0.11624908447265625, 0.124176025390625, 0.13210296630859375, 0.1400299072265625, 0.14795684814453125, 0.1558837890625, 0.16381072998046875, 0.1717376708984375, 0.17966461181640625, 0.187591552734375, 0.19551849365234375, 0.2034454345703125, 0.21137237548828125, 0.21929931640625, 0.22722625732421875, 0.2351531982421875, 0.24308013916015625, 0.251007080078125, 0.25893402099609375, 0.2668609619140625, 0.27478790283203125, 0.28271484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 15.0, 15.0, 21.0, 37.0, 63.0, 77.0, 134.0, 194.0, 358.0, 525.0, 737.0, 1244.0, 1880.0, 3006.0, 5016.0, 8043.0, 13878.0, 25436.0, 50556.0, 110948.0, 233992.0, 281047.0, 161020.0, 71570.0, 33647.0, 18107.0, 10282.0, 6241.0, 3813.0, 2337.0, 1442.0, 986.0, 632.0, 421.0, 288.0, 176.0, 126.0, 90.0, 46.0, 36.0, 18.0, 13.0, 11.0, 9.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0345458984375, -0.03343963623046875, -0.0323333740234375, -0.03122711181640625, -0.030120849609375, -0.02901458740234375, -0.0279083251953125, -0.02680206298828125, -0.02569580078125, -0.02458953857421875, -0.0234832763671875, -0.02237701416015625, -0.021270751953125, -0.02016448974609375, -0.0190582275390625, -0.01795196533203125, -0.016845703125, -0.01573944091796875, -0.0146331787109375, -0.01352691650390625, -0.012420654296875, -0.01131439208984375, -0.0102081298828125, -0.00910186767578125, -0.00799560546875, -0.00688934326171875, -0.0057830810546875, -0.00467681884765625, -0.003570556640625, -0.00246429443359375, -0.0013580322265625, -0.00025177001953125, 0.0008544921875, 0.00196075439453125, 0.0030670166015625, 0.00417327880859375, 0.005279541015625, 0.00638580322265625, 0.0074920654296875, 0.00859832763671875, 0.00970458984375, 0.01081085205078125, 0.0119171142578125, 0.01302337646484375, 0.014129638671875, 0.01523590087890625, 0.0163421630859375, 0.01744842529296875, 0.0185546875, 0.01966094970703125, 0.0207672119140625, 0.02187347412109375, 0.022979736328125, 0.02408599853515625, 0.0251922607421875, 0.02629852294921875, 0.02740478515625, 0.02851104736328125, 0.0296173095703125, 0.03072357177734375, 0.031829833984375, 0.03293609619140625, 0.0340423583984375, 0.03514862060546875, 0.0362548828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 5.0, 10.0, 10.0, 9.0, 22.0, 24.0, 22.0, 39.0, 67.0, 94.0, 92.0, 99.0, 95.0, 82.0, 85.0, 63.0, 48.0, 35.0, 21.0, 17.0, 15.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5437602996826172e-05, -1.4842487871646881e-05, -1.424737274646759e-05, -1.36522576212883e-05, -1.3057142496109009e-05, -1.2462027370929718e-05, -1.1866912245750427e-05, -1.1271797120571136e-05, -1.0676681995391846e-05, -1.0081566870212555e-05, -9.486451745033264e-06, -8.891336619853973e-06, -8.296221494674683e-06, -7.701106369495392e-06, -7.105991244316101e-06, -6.51087611913681e-06, -5.9157609939575195e-06, -5.320645868778229e-06, -4.725530743598938e-06, -4.130415618419647e-06, -3.5353004932403564e-06, -2.9401853680610657e-06, -2.345070242881775e-06, -1.7499551177024841e-06, -1.1548399925231934e-06, -5.597248673439026e-07, 3.5390257835388184e-08, 6.30505383014679e-07, 1.2256205081939697e-06, 1.8207356333732605e-06, 2.4158507585525513e-06, 3.010965883731842e-06, 3.606081008911133e-06, 4.201196134090424e-06, 4.796311259269714e-06, 5.391426384449005e-06, 5.986541509628296e-06, 6.581656634807587e-06, 7.1767717599868774e-06, 7.771886885166168e-06, 8.367002010345459e-06, 8.96211713552475e-06, 9.55723226070404e-06, 1.0152347385883331e-05, 1.0747462511062622e-05, 1.1342577636241913e-05, 1.1937692761421204e-05, 1.2532807886600494e-05, 1.3127923011779785e-05, 1.3723038136959076e-05, 1.4318153262138367e-05, 1.4913268387317657e-05, 1.5508383512496948e-05, 1.610349863767624e-05, 1.669861376285553e-05, 1.729372888803482e-05, 1.788884401321411e-05, 1.8483959138393402e-05, 1.9079074263572693e-05, 1.9674189388751984e-05, 2.0269304513931274e-05, 2.0864419639110565e-05, 2.1459534764289856e-05, 2.2054649889469147e-05, 2.2649765014648438e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 8.0, 9.0, 12.0, 14.0, 37.0, 48.0, 92.0, 186.0, 383.0, 823.0, 1720.0, 3894.0, 9033.0, 20306.0, 47786.0, 122532.0, 278443.0, 309787.0, 151562.0, 58031.0, 24335.0, 10696.0, 4774.0, 2086.0, 981.0, 435.0, 243.0, 125.0, 70.0, 37.0, 25.0, 8.0, 10.0, 8.0, 4.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03765869140625, -0.0362696647644043, -0.034880638122558594, -0.03349161148071289, -0.03210258483886719, -0.030713558197021484, -0.02932453155517578, -0.027935504913330078, -0.026546478271484375, -0.025157451629638672, -0.02376842498779297, -0.022379398345947266, -0.020990371704101562, -0.01960134506225586, -0.018212318420410156, -0.016823291778564453, -0.01543426513671875, -0.014045238494873047, -0.012656211853027344, -0.01126718521118164, -0.009878158569335938, -0.008489131927490234, -0.007100105285644531, -0.005711078643798828, -0.004322052001953125, -0.002933025360107422, -0.0015439987182617188, -0.00015497207641601562, 0.0012340545654296875, 0.0026230812072753906, 0.004012107849121094, 0.005401134490966797, 0.0067901611328125, 0.008179187774658203, 0.009568214416503906, 0.01095724105834961, 0.012346267700195312, 0.013735294342041016, 0.015124320983886719, 0.016513347625732422, 0.017902374267578125, 0.019291400909423828, 0.02068042755126953, 0.022069454193115234, 0.023458480834960938, 0.02484750747680664, 0.026236534118652344, 0.027625560760498047, 0.02901458740234375, 0.030403614044189453, 0.031792640686035156, 0.03318166732788086, 0.03457069396972656, 0.035959720611572266, 0.03734874725341797, 0.03873777389526367, 0.040126800537109375, 0.04151582717895508, 0.04290485382080078, 0.044293880462646484, 0.04568290710449219, 0.04707193374633789, 0.048460960388183594, 0.0498499870300293, 0.051239013671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 6.0, 2.0, 4.0, 8.0, 9.0, 17.0, 22.0, 24.0, 38.0, 35.0, 52.0, 49.0, 71.0, 80.0, 60.0, 72.0, 66.0, 53.0, 58.0, 49.0, 30.0, 33.0, 28.0, 18.0, 14.0, 24.0, 9.0, 11.0, 6.0, 5.0, 3.0, 5.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.045257568359375, -0.043843746185302734, -0.04242992401123047, -0.0410161018371582, -0.03960227966308594, -0.03818845748901367, -0.036774635314941406, -0.03536081314086914, -0.033946990966796875, -0.03253316879272461, -0.031119346618652344, -0.029705524444580078, -0.028291702270507812, -0.026877880096435547, -0.02546405792236328, -0.024050235748291016, -0.02263641357421875, -0.021222591400146484, -0.01980876922607422, -0.018394947052001953, -0.016981124877929688, -0.015567302703857422, -0.014153480529785156, -0.01273965835571289, -0.011325836181640625, -0.00991201400756836, -0.008498191833496094, -0.007084369659423828, -0.0056705474853515625, -0.004256725311279297, -0.0028429031372070312, -0.0014290809631347656, -1.52587890625e-05, 0.0013985633850097656, 0.0028123855590820312, 0.004226207733154297, 0.0056400299072265625, 0.007053852081298828, 0.008467674255371094, 0.00988149642944336, 0.011295318603515625, 0.01270914077758789, 0.014122962951660156, 0.015536785125732422, 0.016950607299804688, 0.018364429473876953, 0.01977825164794922, 0.021192073822021484, 0.02260589599609375, 0.024019718170166016, 0.02543354034423828, 0.026847362518310547, 0.028261184692382812, 0.029675006866455078, 0.031088829040527344, 0.03250265121459961, 0.033916473388671875, 0.03533029556274414, 0.036744117736816406, 0.03815793991088867, 0.03957176208496094, 0.0409855842590332, 0.04239940643310547, 0.043813228607177734, 0.04522705078125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 19.0, 50.0, 98.0, 166.0, 201.0, 178.0, 143.0, 70.0, 39.0, 9.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5278503894805908, -1.4943004846572876, -1.4607505798339844, -1.4272006750106812, -1.393650770187378, -1.3601009845733643, -1.326551079750061, -1.2930011749267578, -1.2594512701034546, -1.2259013652801514, -1.1923514604568481, -1.158801555633545, -1.1252517700195312, -1.091701865196228, -1.0581519603729248, -1.0246020555496216, -0.9910521507263184, -0.9575022459030151, -0.9239523410797119, -0.8904024958610535, -0.8568525910377502, -0.823302686214447, -0.7897528409957886, -0.7562029361724854, -0.7226530313491821, -0.6891031265258789, -0.6555532217025757, -0.6220033764839172, -0.588453471660614, -0.5549035668373108, -0.5213537216186523, -0.4878038167953491, -0.4542539119720459, -0.4207040071487427, -0.38715413212776184, -0.353604257106781, -0.3200543522834778, -0.28650444746017456, -0.2529545724391937, -0.2194046825170517, -0.18585479259490967, -0.15230490267276764, -0.11875501275062561, -0.08520512282848358, -0.05165523290634155, -0.018105342984199524, 0.015444546937942505, 0.048994436860084534, 0.08254432678222656, 0.11609421670436859, 0.14964410662651062, 0.18319399654865265, 0.21674388647079468, 0.2502937912940979, 0.28384366631507874, 0.31739354133605957, 0.3509434461593628, 0.384493350982666, 0.41804322600364685, 0.4515931010246277, 0.4851430058479309, 0.5186929106712341, 0.5522427558898926, 0.5857926607131958, 0.619342565536499]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 13.0, 20.0, 21.0, 18.0, 27.0, 26.0, 29.0, 37.0, 44.0, 36.0, 43.0, 43.0, 53.0, 44.0, 56.0, 49.0, 37.0, 46.0, 51.0, 38.0, 31.0, 28.0, 33.0, 23.0, 20.0, 18.0, 21.0, 21.0, 7.0, 17.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5830000638961792, -0.5650597214698792, -0.5471193194389343, -0.5291789770126343, -0.5112386345863342, -0.4932982325553894, -0.47535789012908936, -0.4574175179004669, -0.4394771456718445, -0.42153677344322205, -0.403596431016922, -0.38565605878829956, -0.3677156865596771, -0.3497753143310547, -0.33183497190475464, -0.3138945996761322, -0.29595425724983215, -0.2780138850212097, -0.26007354259490967, -0.24213317036628723, -0.2241927981376648, -0.20625244081020355, -0.1883120834827423, -0.17037171125411987, -0.15243135392665863, -0.1344909965991974, -0.11655062437057495, -0.09861026704311371, -0.08066990226507187, -0.06272953748703003, -0.04478918015956879, -0.02684880793094635, -0.008908450603485107, 0.009031912311911583, 0.026972275227308273, 0.044912636280059814, 0.06285300105810165, 0.0807933658361435, 0.09873372316360474, 0.11667409539222717, 0.13461445271968842, 0.15255481004714966, 0.1704951822757721, 0.18843553960323334, 0.20637589693069458, 0.22431626915931702, 0.24225662648677826, 0.2601969838142395, 0.27813735604286194, 0.2960777282714844, 0.3140180706977844, 0.33195844292640686, 0.3498988151550293, 0.36783915758132935, 0.3857795298099518, 0.4037199020385742, 0.42166024446487427, 0.4396006166934967, 0.45754095911979675, 0.4754813313484192, 0.4934217035770416, 0.5113620758056641, 0.5293024182319641, 0.5472427606582642, 0.565183162689209]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 12.0, 20.0, 21.0, 29.0, 53.0, 94.0, 167.0, 262.0, 476.0, 891.0, 1803.0, 3472.0, 7926.0, 18723.0, 45754.0, 114271.0, 279064.0, 599656.0, 977980.0, 1004317.0, 627732.0, 298477.0, 125389.0, 50570.0, 20235.0, 8923.0, 4029.0, 1853.0, 953.0, 515.0, 248.0, 138.0, 81.0, 51.0, 27.0, 13.0, 20.0, 9.0, 7.0, 2.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05975341796875, -0.05782794952392578, -0.05590248107910156, -0.053977012634277344, -0.052051544189453125, -0.050126075744628906, -0.04820060729980469, -0.04627513885498047, -0.04434967041015625, -0.04242420196533203, -0.04049873352050781, -0.038573265075683594, -0.036647796630859375, -0.034722328186035156, -0.03279685974121094, -0.03087139129638672, -0.0289459228515625, -0.02702045440673828, -0.025094985961914062, -0.023169517517089844, -0.021244049072265625, -0.019318580627441406, -0.017393112182617188, -0.015467643737792969, -0.01354217529296875, -0.011616706848144531, -0.009691238403320312, -0.007765769958496094, -0.005840301513671875, -0.003914833068847656, -0.0019893646240234375, -6.389617919921875e-05, 0.001861572265625, 0.0037870407104492188, 0.0057125091552734375, 0.007637977600097656, 0.009563446044921875, 0.011488914489746094, 0.013414382934570312, 0.015339851379394531, 0.01726531982421875, 0.01919078826904297, 0.021116256713867188, 0.023041725158691406, 0.024967193603515625, 0.026892662048339844, 0.028818130493164062, 0.03074359893798828, 0.0326690673828125, 0.03459453582763672, 0.03652000427246094, 0.038445472717285156, 0.040370941162109375, 0.042296409606933594, 0.04422187805175781, 0.04614734649658203, 0.04807281494140625, 0.04999828338623047, 0.05192375183105469, 0.053849220275878906, 0.055774688720703125, 0.057700157165527344, 0.05962562561035156, 0.06155109405517578, 0.0634765625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 5.0, 11.0, 7.0, 8.0, 12.0, 17.0, 16.0, 17.0, 24.0, 12.0, 27.0, 30.0, 26.0, 32.0, 28.0, 37.0, 45.0, 57.0, 56.0, 54.0, 38.0, 42.0, 36.0, 24.0, 47.0, 38.0, 24.0, 30.0, 22.0, 23.0, 31.0, 22.0, 13.0, 12.0, 17.0, 7.0, 12.0, 11.0, 4.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0791015625, -0.07668399810791016, -0.07426643371582031, -0.07184886932373047, -0.06943130493164062, -0.06701374053955078, -0.06459617614746094, -0.062178611755371094, -0.05976104736328125, -0.057343482971191406, -0.05492591857910156, -0.05250835418701172, -0.050090789794921875, -0.04767322540283203, -0.04525566101074219, -0.042838096618652344, -0.0404205322265625, -0.038002967834472656, -0.03558540344238281, -0.03316783905029297, -0.030750274658203125, -0.02833271026611328, -0.025915145874023438, -0.023497581481933594, -0.02108001708984375, -0.018662452697753906, -0.016244888305664062, -0.013827323913574219, -0.011409759521484375, -0.008992195129394531, -0.0065746307373046875, -0.004157066345214844, -0.001739501953125, 0.0006780624389648438, 0.0030956268310546875, 0.005513191223144531, 0.007930755615234375, 0.010348320007324219, 0.012765884399414062, 0.015183448791503906, 0.01760101318359375, 0.020018577575683594, 0.022436141967773438, 0.02485370635986328, 0.027271270751953125, 0.02968883514404297, 0.03210639953613281, 0.034523963928222656, 0.0369415283203125, 0.039359092712402344, 0.04177665710449219, 0.04419422149658203, 0.046611785888671875, 0.04902935028076172, 0.05144691467285156, 0.053864479064941406, 0.05628204345703125, 0.058699607849121094, 0.06111717224121094, 0.06353473663330078, 0.06595230102539062, 0.06836986541748047, 0.07078742980957031, 0.07320499420166016, 0.07562255859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 4.0, 7.0, 10.0, 19.0, 22.0, 43.0, 74.0, 120.0, 336.0, 847.0, 3084.0, 14582.0, 98381.0, 1059179.0, 2670946.0, 301412.0, 36396.0, 6313.0, 1552.0, 488.0, 201.0, 131.0, 44.0, 41.0, 17.0, 8.0, 14.0, 11.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14208984375, -0.13597869873046875, -0.1298675537109375, -0.12375640869140625, -0.117645263671875, -0.11153411865234375, -0.1054229736328125, -0.09931182861328125, -0.09320068359375, -0.08708953857421875, -0.0809783935546875, -0.07486724853515625, -0.068756103515625, -0.06264495849609375, -0.0565338134765625, -0.05042266845703125, -0.0443115234375, -0.03820037841796875, -0.0320892333984375, -0.02597808837890625, -0.019866943359375, -0.01375579833984375, -0.0076446533203125, -0.00153350830078125, 0.00457763671875, 0.01068878173828125, 0.0167999267578125, 0.02291107177734375, 0.029022216796875, 0.03513336181640625, 0.0412445068359375, 0.04735565185546875, 0.053466796875, 0.05957794189453125, 0.0656890869140625, 0.07180023193359375, 0.077911376953125, 0.08402252197265625, 0.0901336669921875, 0.09624481201171875, 0.10235595703125, 0.10846710205078125, 0.1145782470703125, 0.12068939208984375, 0.126800537109375, 0.13291168212890625, 0.1390228271484375, 0.14513397216796875, 0.1512451171875, 0.15735626220703125, 0.1634674072265625, 0.16957855224609375, 0.175689697265625, 0.18180084228515625, 0.1879119873046875, 0.19402313232421875, 0.20013427734375, 0.20624542236328125, 0.2123565673828125, 0.21846771240234375, 0.224578857421875, 0.23069000244140625, 0.2368011474609375, 0.24291229248046875, 0.2490234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 2.0, 14.0, 17.0, 43.0, 54.0, 68.0, 144.0, 200.0, 314.0, 578.0, 730.0, 710.0, 484.0, 262.0, 157.0, 106.0, 63.0, 50.0, 34.0, 14.0, 14.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.12238693237304688, -0.11586761474609375, -0.10934829711914062, -0.1028289794921875, -0.09630966186523438, -0.08979034423828125, -0.08327102661132812, -0.076751708984375, -0.07023239135742188, -0.06371307373046875, -0.057193756103515625, -0.0506744384765625, -0.044155120849609375, -0.03763580322265625, -0.031116485595703125, -0.02459716796875, -0.018077850341796875, -0.01155853271484375, -0.005039215087890625, 0.0014801025390625, 0.007999420166015625, 0.01451873779296875, 0.021038055419921875, 0.027557373046875, 0.034076690673828125, 0.04059600830078125, 0.047115325927734375, 0.0536346435546875, 0.060153961181640625, 0.06667327880859375, 0.07319259643554688, 0.0797119140625, 0.08623123168945312, 0.09275054931640625, 0.09926986694335938, 0.1057891845703125, 0.11230850219726562, 0.11882781982421875, 0.12534713745117188, 0.131866455078125, 0.13838577270507812, 0.14490509033203125, 0.15142440795898438, 0.1579437255859375, 0.16446304321289062, 0.17098236083984375, 0.17750167846679688, 0.18402099609375, 0.19054031372070312, 0.19705963134765625, 0.20357894897460938, 0.2100982666015625, 0.21661758422851562, 0.22313690185546875, 0.22965621948242188, 0.236175537109375, 0.24269485473632812, 0.24921417236328125, 0.2557334899902344, 0.2622528076171875, 0.2687721252441406, 0.27529144287109375, 0.2818107604980469, 0.288330078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 24.0, 36.0, 69.0, 115.0, 157.0, 178.0, 163.0, 100.0, 78.0, 42.0, 13.0, 5.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4230341911315918, -1.3887436389923096, -1.3544529676437378, -1.3201624155044556, -1.2858717441558838, -1.2515811920166016, -1.2172906398773193, -1.1829999685287476, -1.1487094163894653, -1.114418864250183, -1.0801281929016113, -1.045837640762329, -1.0115470886230469, -0.9772564172744751, -0.9429658651351929, -0.9086752533912659, -0.8743846416473389, -0.8400940299034119, -0.8058034181594849, -0.7715128660202026, -0.7372222542762756, -0.7029316425323486, -0.6686410903930664, -0.6343504786491394, -0.6000598669052124, -0.5657692551612854, -0.5314786434173584, -0.49718809127807617, -0.46289747953414917, -0.42860686779022217, -0.39431628584861755, -0.36002570390701294, -0.3257349729537964, -0.2914443612098694, -0.25715377926826477, -0.22286318242549896, -0.18857258558273315, -0.15428198873996735, -0.11999139189720154, -0.08570079505443573, -0.05141019821166992, -0.017119601368904114, 0.017170995473861694, 0.0514615923166275, 0.08575218915939331, 0.12004278600215912, 0.15433338284492493, 0.18862397968769073, 0.22291457653045654, 0.25720518827438354, 0.29149577021598816, 0.3257863521575928, 0.3600769639015198, 0.3943675756454468, 0.4286581575870514, 0.462948739528656, 0.497239351272583, 0.53152996301651, 0.565820574760437, 0.6001111268997192, 0.6344017386436462, 0.6686923503875732, 0.7029829025268555, 0.7372735142707825, 0.7715641260147095]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 10.0, 7.0, 8.0, 11.0, 6.0, 10.0, 18.0, 22.0, 23.0, 25.0, 25.0, 35.0, 19.0, 30.0, 45.0, 44.0, 44.0, 41.0, 36.0, 57.0, 67.0, 48.0, 44.0, 33.0, 45.0, 32.0, 35.0, 36.0, 18.0, 28.0, 24.0, 19.0, 20.0, 13.0, 8.0, 4.0, 4.0, 4.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.5732724666595459, -0.5583806037902832, -0.5434887409210205, -0.5285968780517578, -0.5137050151824951, -0.4988131523132324, -0.4839212894439697, -0.46902942657470703, -0.45413756370544434, -0.43924570083618164, -0.42435383796691895, -0.40946197509765625, -0.39457011222839355, -0.37967824935913086, -0.36478638648986816, -0.34989452362060547, -0.3350026309490204, -0.3201107680797577, -0.305218905210495, -0.2903270423412323, -0.2754351794719696, -0.2605433166027069, -0.24565143883228302, -0.23075957596302032, -0.21586771309375763, -0.20097585022449493, -0.18608398735523224, -0.17119210958480835, -0.15630024671554565, -0.14140838384628296, -0.12651652097702026, -0.11162465810775757, -0.09673279523849487, -0.08184093236923218, -0.06694906949996948, -0.05205719918012619, -0.037165336310863495, -0.0222734734416008, -0.007381603121757507, 0.007510259747505188, 0.022402122616767883, 0.03729398548603058, 0.05218585208058357, 0.06707771867513657, 0.08196958154439926, 0.09686144441366196, 0.11175331473350525, 0.12664517760276794, 0.14153704047203064, 0.15642890334129333, 0.17132076621055603, 0.18621262907981873, 0.20110449194908142, 0.21599635481834412, 0.230888232588768, 0.2457800954580307, 0.2606719732284546, 0.2755638360977173, 0.29045569896698, 0.3053475618362427, 0.32023942470550537, 0.33513128757476807, 0.35002315044403076, 0.36491501331329346, 0.37980687618255615]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 8.0, 3.0, 12.0, 13.0, 14.0, 19.0, 35.0, 43.0, 67.0, 100.0, 172.0, 253.0, 395.0, 690.0, 1235.0, 1961.0, 3538.0, 5916.0, 10722.0, 21564.0, 52332.0, 142322.0, 285459.0, 284515.0, 139946.0, 51052.0, 21175.0, 10476.0, 5839.0, 3623.0, 2093.0, 1135.0, 667.0, 386.0, 264.0, 186.0, 96.0, 69.0, 40.0, 37.0, 28.0, 18.0, 9.0, 6.0, 4.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.12109375, -0.11742305755615234, -0.11375236511230469, -0.11008167266845703, -0.10641098022460938, -0.10274028778076172, -0.09906959533691406, -0.0953989028930664, -0.09172821044921875, -0.0880575180053711, -0.08438682556152344, -0.08071613311767578, -0.07704544067382812, -0.07337474822998047, -0.06970405578613281, -0.06603336334228516, -0.0623626708984375, -0.058691978454589844, -0.05502128601074219, -0.05135059356689453, -0.047679901123046875, -0.04400920867919922, -0.04033851623535156, -0.036667823791503906, -0.03299713134765625, -0.029326438903808594, -0.025655746459960938, -0.02198505401611328, -0.018314361572265625, -0.014643669128417969, -0.010972976684570312, -0.007302284240722656, -0.003631591796875, 3.910064697265625e-05, 0.0037097930908203125, 0.007380485534667969, 0.011051177978515625, 0.014721870422363281, 0.018392562866210938, 0.022063255310058594, 0.02573394775390625, 0.029404640197753906, 0.03307533264160156, 0.03674602508544922, 0.040416717529296875, 0.04408740997314453, 0.04775810241699219, 0.051428794860839844, 0.0550994873046875, 0.058770179748535156, 0.06244087219238281, 0.06611156463623047, 0.06978225708007812, 0.07345294952392578, 0.07712364196777344, 0.0807943344116211, 0.08446502685546875, 0.0881357192993164, 0.09180641174316406, 0.09547710418701172, 0.09914779663085938, 0.10281848907470703, 0.10648918151855469, 0.11015987396240234, 0.11383056640625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 2.0, 4.0, 9.0, 10.0, 14.0, 10.0, 16.0, 17.0, 14.0, 22.0, 22.0, 22.0, 45.0, 31.0, 28.0, 36.0, 40.0, 38.0, 39.0, 38.0, 51.0, 52.0, 46.0, 49.0, 36.0, 44.0, 35.0, 28.0, 27.0, 29.0, 30.0, 28.0, 17.0, 12.0, 14.0, 9.0, 15.0, 5.0, 1.0, 6.0, 4.0, 5.0, 8.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.0970458984375, -0.09445381164550781, -0.09186172485351562, -0.08926963806152344, -0.08667755126953125, -0.08408546447753906, -0.08149337768554688, -0.07890129089355469, -0.0763092041015625, -0.07371711730957031, -0.07112503051757812, -0.06853294372558594, -0.06594085693359375, -0.06334877014160156, -0.060756683349609375, -0.05816459655761719, -0.055572509765625, -0.05298042297363281, -0.050388336181640625, -0.04779624938964844, -0.04520416259765625, -0.04261207580566406, -0.040019989013671875, -0.03742790222167969, -0.0348358154296875, -0.03224372863769531, -0.029651641845703125, -0.027059555053710938, -0.02446746826171875, -0.021875381469726562, -0.019283294677734375, -0.016691207885742188, -0.01409912109375, -0.011507034301757812, -0.008914947509765625, -0.0063228607177734375, -0.00373077392578125, -0.0011386871337890625, 0.001453399658203125, 0.0040454864501953125, 0.0066375732421875, 0.009229660034179688, 0.011821746826171875, 0.014413833618164062, 0.01700592041015625, 0.019598007202148438, 0.022190093994140625, 0.024782180786132812, 0.027374267578125, 0.029966354370117188, 0.032558441162109375, 0.03515052795410156, 0.03774261474609375, 0.04033470153808594, 0.042926788330078125, 0.04551887512207031, 0.0481109619140625, 0.05070304870605469, 0.053295135498046875, 0.05588722229003906, 0.05847930908203125, 0.06107139587402344, 0.06366348266601562, 0.06625556945800781, 0.06884765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 14.0, 6.0, 16.0, 16.0, 38.0, 54.0, 61.0, 113.0, 217.0, 444.0, 1079.0, 2435.0, 5749.0, 14822.0, 43081.0, 183488.0, 491992.0, 224954.0, 51644.0, 16868.0, 6573.0, 2672.0, 1139.0, 489.0, 226.0, 138.0, 77.0, 49.0, 34.0, 19.0, 12.0, 12.0, 2.0, 5.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.171630859375, -0.1654052734375, -0.1591796875, -0.1529541015625, -0.146728515625, -0.1405029296875, -0.13427734375, -0.1280517578125, -0.121826171875, -0.1156005859375, -0.109375, -0.1031494140625, -0.096923828125, -0.0906982421875, -0.08447265625, -0.0782470703125, -0.072021484375, -0.0657958984375, -0.0595703125, -0.0533447265625, -0.047119140625, -0.0408935546875, -0.03466796875, -0.0284423828125, -0.022216796875, -0.0159912109375, -0.009765625, -0.0035400390625, 0.002685546875, 0.0089111328125, 0.01513671875, 0.0213623046875, 0.027587890625, 0.0338134765625, 0.0400390625, 0.0462646484375, 0.052490234375, 0.0587158203125, 0.06494140625, 0.0711669921875, 0.077392578125, 0.0836181640625, 0.08984375, 0.0960693359375, 0.102294921875, 0.1085205078125, 0.11474609375, 0.1209716796875, 0.127197265625, 0.1334228515625, 0.1396484375, 0.1458740234375, 0.152099609375, 0.1583251953125, 0.16455078125, 0.1707763671875, 0.177001953125, 0.1832275390625, 0.189453125, 0.1956787109375, 0.201904296875, 0.2081298828125, 0.21435546875, 0.2205810546875, 0.226806640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 2.0, 5.0, 9.0, 7.0, 12.0, 7.0, 20.0, 16.0, 25.0, 23.0, 28.0, 31.0, 32.0, 40.0, 37.0, 35.0, 35.0, 51.0, 40.0, 41.0, 57.0, 47.0, 46.0, 39.0, 45.0, 44.0, 29.0, 15.0, 21.0, 26.0, 26.0, 24.0, 12.0, 18.0, 9.0, 9.0, 5.0, 6.0, 8.0, 8.0, 3.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2489013671875, -0.24129676818847656, -0.23369216918945312, -0.2260875701904297, -0.21848297119140625, -0.2108783721923828, -0.20327377319335938, -0.19566917419433594, -0.1880645751953125, -0.18045997619628906, -0.17285537719726562, -0.1652507781982422, -0.15764617919921875, -0.1500415802001953, -0.14243698120117188, -0.13483238220214844, -0.127227783203125, -0.11962318420410156, -0.11201858520507812, -0.10441398620605469, -0.09680938720703125, -0.08920478820800781, -0.08160018920898438, -0.07399559020996094, -0.0663909912109375, -0.05878639221191406, -0.051181793212890625, -0.04357719421386719, -0.03597259521484375, -0.028367996215820312, -0.020763397216796875, -0.013158798217773438, -0.00555419921875, 0.0020503997802734375, 0.009654998779296875, 0.017259597778320312, 0.02486419677734375, 0.03246879577636719, 0.040073394775390625, 0.04767799377441406, 0.0552825927734375, 0.06288719177246094, 0.07049179077148438, 0.07809638977050781, 0.08570098876953125, 0.09330558776855469, 0.10091018676757812, 0.10851478576660156, 0.116119384765625, 0.12372398376464844, 0.13132858276367188, 0.1389331817626953, 0.14653778076171875, 0.1541423797607422, 0.16174697875976562, 0.16935157775878906, 0.1769561767578125, 0.18456077575683594, 0.19216537475585938, 0.1997699737548828, 0.20737457275390625, 0.2149791717529297, 0.22258377075195312, 0.23018836975097656, 0.23779296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 10.0, 11.0, 17.0, 31.0, 51.0, 77.0, 122.0, 205.0, 422.0, 662.0, 1382.0, 2260.0, 4401.0, 7696.0, 14093.0, 27671.0, 64560.0, 183192.0, 368363.0, 226191.0, 78963.0, 32355.0, 16214.0, 8721.0, 4872.0, 2648.0, 1513.0, 807.0, 479.0, 240.0, 129.0, 90.0, 38.0, 27.0, 15.0, 12.0, 11.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.049468994140625, -0.047951698303222656, -0.04643440246582031, -0.04491710662841797, -0.043399810791015625, -0.04188251495361328, -0.04036521911621094, -0.038847923278808594, -0.03733062744140625, -0.035813331604003906, -0.03429603576660156, -0.03277873992919922, -0.031261444091796875, -0.02974414825439453, -0.028226852416992188, -0.026709556579589844, -0.0251922607421875, -0.023674964904785156, -0.022157669067382812, -0.02064037322998047, -0.019123077392578125, -0.01760578155517578, -0.016088485717773438, -0.014571189880371094, -0.01305389404296875, -0.011536598205566406, -0.010019302368164062, -0.008502006530761719, -0.006984710693359375, -0.005467414855957031, -0.0039501190185546875, -0.0024328231811523438, -0.00091552734375, 0.0006017684936523438, 0.0021190643310546875, 0.0036363601684570312, 0.005153656005859375, 0.006670951843261719, 0.008188247680664062, 0.009705543518066406, 0.01122283935546875, 0.012740135192871094, 0.014257431030273438, 0.01577472686767578, 0.017292022705078125, 0.01880931854248047, 0.020326614379882812, 0.021843910217285156, 0.0233612060546875, 0.024878501892089844, 0.026395797729492188, 0.02791309356689453, 0.029430389404296875, 0.03094768524169922, 0.03246498107910156, 0.033982276916503906, 0.03549957275390625, 0.037016868591308594, 0.03853416442871094, 0.04005146026611328, 0.041568756103515625, 0.04308605194091797, 0.04460334777832031, 0.046120643615722656, 0.047637939453125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 2.0, 2.0, 10.0, 9.0, 11.0, 10.0, 16.0, 12.0, 22.0, 41.0, 33.0, 61.0, 80.0, 92.0, 106.0, 87.0, 82.0, 78.0, 53.0, 46.0, 44.0, 26.0, 15.0, 10.0, 11.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.823902130126953e-05, -1.7630867660045624e-05, -1.7022714018821716e-05, -1.641456037759781e-05, -1.58064067363739e-05, -1.5198253095149994e-05, -1.4590099453926086e-05, -1.3981945812702179e-05, -1.3373792171478271e-05, -1.2765638530254364e-05, -1.2157484889030457e-05, -1.1549331247806549e-05, -1.0941177606582642e-05, -1.0333023965358734e-05, -9.724870324134827e-06, -9.11671668291092e-06, -8.508563041687012e-06, -7.900409400463104e-06, -7.292255759239197e-06, -6.684102118015289e-06, -6.075948476791382e-06, -5.467794835567474e-06, -4.859641194343567e-06, -4.2514875531196594e-06, -3.643333911895752e-06, -3.0351802706718445e-06, -2.427026629447937e-06, -1.8188729882240295e-06, -1.210719347000122e-06, -6.025657057762146e-07, 5.587935447692871e-09, 6.137415766716003e-07, 1.2218952178955078e-06, 1.8300488591194153e-06, 2.4382025003433228e-06, 3.0463561415672302e-06, 3.6545097827911377e-06, 4.262663424015045e-06, 4.870817065238953e-06, 5.47897070646286e-06, 6.087124347686768e-06, 6.695277988910675e-06, 7.3034316301345825e-06, 7.91158527135849e-06, 8.519738912582397e-06, 9.127892553806305e-06, 9.736046195030212e-06, 1.034419983625412e-05, 1.0952353477478027e-05, 1.1560507118701935e-05, 1.2168660759925842e-05, 1.277681440114975e-05, 1.3384968042373657e-05, 1.3993121683597565e-05, 1.4601275324821472e-05, 1.520942896604538e-05, 1.5817582607269287e-05, 1.6425736248493195e-05, 1.7033889889717102e-05, 1.764204353094101e-05, 1.8250197172164917e-05, 1.8858350813388824e-05, 1.9466504454612732e-05, 2.007465809583664e-05, 2.0682811737060547e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 5.0, 11.0, 13.0, 8.0, 17.0, 26.0, 32.0, 57.0, 75.0, 124.0, 203.0, 353.0, 598.0, 1230.0, 2256.0, 4457.0, 8705.0, 16886.0, 35025.0, 78431.0, 179793.0, 292891.0, 229586.0, 106014.0, 46432.0, 22220.0, 11199.0, 5583.0, 2836.0, 1494.0, 827.0, 472.0, 259.0, 152.0, 89.0, 49.0, 42.0, 25.0, 17.0, 19.0, 10.0, 7.0, 4.0, 7.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04248046875, -0.041219234466552734, -0.03995800018310547, -0.0386967658996582, -0.03743553161621094, -0.03617429733276367, -0.034913063049316406, -0.03365182876586914, -0.032390594482421875, -0.03112936019897461, -0.029868125915527344, -0.028606891632080078, -0.027345657348632812, -0.026084423065185547, -0.02482318878173828, -0.023561954498291016, -0.02230072021484375, -0.021039485931396484, -0.01977825164794922, -0.018517017364501953, -0.017255783081054688, -0.015994548797607422, -0.014733314514160156, -0.01347208023071289, -0.012210845947265625, -0.01094961166381836, -0.009688377380371094, -0.008427143096923828, -0.0071659088134765625, -0.005904674530029297, -0.004643440246582031, -0.0033822059631347656, -0.0021209716796875, -0.0008597373962402344, 0.00040149688720703125, 0.0016627311706542969, 0.0029239654541015625, 0.004185199737548828, 0.005446434020996094, 0.006707668304443359, 0.007968902587890625, 0.00923013687133789, 0.010491371154785156, 0.011752605438232422, 0.013013839721679688, 0.014275074005126953, 0.015536308288574219, 0.016797542572021484, 0.01805877685546875, 0.019320011138916016, 0.02058124542236328, 0.021842479705810547, 0.023103713989257812, 0.024364948272705078, 0.025626182556152344, 0.02688741683959961, 0.028148651123046875, 0.02940988540649414, 0.030671119689941406, 0.03193235397338867, 0.03319358825683594, 0.0344548225402832, 0.03571605682373047, 0.036977291107177734, 0.038238525390625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 7.0, 12.0, 9.0, 7.0, 12.0, 14.0, 22.0, 31.0, 32.0, 44.0, 44.0, 61.0, 69.0, 79.0, 79.0, 76.0, 69.0, 67.0, 57.0, 35.0, 32.0, 32.0, 17.0, 20.0, 11.0, 10.0, 7.0, 10.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0633544921875, -0.061719417572021484, -0.06008434295654297, -0.05844926834106445, -0.05681419372558594, -0.05517911911010742, -0.053544044494628906, -0.05190896987915039, -0.050273895263671875, -0.04863882064819336, -0.047003746032714844, -0.04536867141723633, -0.04373359680175781, -0.0420985221862793, -0.04046344757080078, -0.038828372955322266, -0.03719329833984375, -0.035558223724365234, -0.03392314910888672, -0.0322880744934082, -0.030652999877929688, -0.029017925262451172, -0.027382850646972656, -0.02574777603149414, -0.024112701416015625, -0.02247762680053711, -0.020842552185058594, -0.019207477569580078, -0.017572402954101562, -0.015937328338623047, -0.014302253723144531, -0.012667179107666016, -0.0110321044921875, -0.009397029876708984, -0.007761955261230469, -0.006126880645751953, -0.0044918060302734375, -0.002856731414794922, -0.0012216567993164062, 0.0004134178161621094, 0.002048492431640625, 0.0036835670471191406, 0.005318641662597656, 0.006953716278076172, 0.008588790893554688, 0.010223865509033203, 0.011858940124511719, 0.013494014739990234, 0.01512908935546875, 0.016764163970947266, 0.01839923858642578, 0.020034313201904297, 0.021669387817382812, 0.023304462432861328, 0.024939537048339844, 0.02657461166381836, 0.028209686279296875, 0.02984476089477539, 0.031479835510253906, 0.03311491012573242, 0.03474998474121094, 0.03638505935668945, 0.03802013397216797, 0.039655208587646484, 0.041290283203125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 14.0, 16.0, 42.0, 77.0, 137.0, 193.0, 197.0, 166.0, 76.0, 35.0, 16.0, 7.0, 4.0, 5.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4243934154510498, -1.3868799209594727, -1.349366545677185, -1.311853051185608, -1.2743396759033203, -1.2368261814117432, -1.199312686920166, -1.1617991924285889, -1.1242858171463013, -1.0867723226547241, -1.0492589473724365, -1.0117454528808594, -0.974232017993927, -0.9367185831069946, -0.8992050886154175, -0.8616916537284851, -0.8241782188415527, -0.7866647839546204, -0.749151349067688, -0.7116378545761108, -0.6741244196891785, -0.6366109848022461, -0.599097490310669, -0.5615840554237366, -0.5240706205368042, -0.4865571856498718, -0.44904372096061707, -0.4115302562713623, -0.37401682138442993, -0.33650338649749756, -0.2989899218082428, -0.26147645711898804, -0.22396314144134521, -0.18644969165325165, -0.14893624186515808, -0.11142279207706451, -0.07390934228897095, -0.03639589250087738, 0.0011175572872161865, 0.03863102197647095, 0.07614445686340332, 0.11365790665149689, 0.15117135643959045, 0.18868480622768402, 0.2261982560157776, 0.26371169090270996, 0.3012251555919647, 0.3387386202812195, 0.37625205516815186, 0.41376549005508423, 0.451278954744339, 0.48879241943359375, 0.5263058543205261, 0.5638192892074585, 0.6013327836990356, 0.638846218585968, 0.6763596534729004, 0.7138730883598328, 0.7513865232467651, 0.7889000177383423, 0.8264134526252747, 0.863926887512207, 0.9014403820037842, 0.9389538168907166, 0.9764672517776489]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 6.0, 4.0, 7.0, 7.0, 8.0, 8.0, 15.0, 12.0, 29.0, 22.0, 29.0, 14.0, 30.0, 24.0, 23.0, 40.0, 37.0, 42.0, 33.0, 46.0, 46.0, 39.0, 41.0, 31.0, 35.0, 44.0, 38.0, 37.0, 27.0, 34.0, 19.0, 27.0, 22.0, 27.0, 20.0, 11.0, 5.0, 10.0, 17.0, 8.0, 5.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.4886553883552551, -0.4730220139026642, -0.45738863945007324, -0.4417552351951599, -0.42612186074256897, -0.410488486289978, -0.3948551118373871, -0.37922173738479614, -0.3635883331298828, -0.34795495867729187, -0.3323215842247009, -0.3166881799697876, -0.30105480551719666, -0.2854214310646057, -0.26978805661201477, -0.25415468215942383, -0.23852130770683289, -0.22288793325424194, -0.2072545439004898, -0.19162116944789886, -0.17598778009414673, -0.1603544056415558, -0.14472103118896484, -0.1290876567363739, -0.11345426738262177, -0.09782088547945023, -0.08218750357627869, -0.06655412912368774, -0.050920747220516205, -0.035287365317344666, -0.019653990864753723, -0.004020608961582184, 0.011612772941589355, 0.027246152982115746, 0.042879533022642136, 0.058512911200523376, 0.07414629310369492, 0.08977967500686646, 0.1054130494594574, 0.12104643136262894, 0.13667981326580048, 0.15231318771839142, 0.16794657707214355, 0.1835799515247345, 0.19921332597732544, 0.21484671533107758, 0.23048008978366852, 0.24611347913742065, 0.2617468535900116, 0.27738022804260254, 0.2930136024951935, 0.3086469769477844, 0.32428038120269775, 0.3399137556552887, 0.35554713010787964, 0.3711805045604706, 0.3868138790130615, 0.40244725346565247, 0.4180806279182434, 0.43371403217315674, 0.4493474066257477, 0.4649807810783386, 0.48061415553092957, 0.4962475299835205, 0.5118809342384338]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 20.0, 13.0, 25.0, 42.0, 117.0, 217.0, 479.0, 977.0, 2388.0, 6276.0, 18899.0, 64388.0, 233756.0, 734585.0, 1384374.0, 1117316.0, 449770.0, 129086.0, 34489.0, 10552.0, 3704.0, 1515.0, 675.0, 325.0, 137.0, 64.0, 35.0, 28.0, 11.0, 6.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062255859375, -0.059393882751464844, -0.05653190612792969, -0.05366992950439453, -0.050807952880859375, -0.04794597625732422, -0.04508399963378906, -0.042222023010253906, -0.03936004638671875, -0.036498069763183594, -0.03363609313964844, -0.03077411651611328, -0.027912139892578125, -0.02505016326904297, -0.022188186645507812, -0.019326210021972656, -0.0164642333984375, -0.013602256774902344, -0.010740280151367188, -0.007878303527832031, -0.005016326904296875, -0.0021543502807617188, 0.0007076263427734375, 0.0035696029663085938, 0.00643157958984375, 0.009293556213378906, 0.012155532836914062, 0.015017509460449219, 0.017879486083984375, 0.02074146270751953, 0.023603439331054688, 0.026465415954589844, 0.029327392578125, 0.032189369201660156, 0.03505134582519531, 0.03791332244873047, 0.040775299072265625, 0.04363727569580078, 0.04649925231933594, 0.049361228942871094, 0.05222320556640625, 0.055085182189941406, 0.05794715881347656, 0.06080913543701172, 0.06367111206054688, 0.06653308868408203, 0.06939506530761719, 0.07225704193115234, 0.0751190185546875, 0.07798099517822266, 0.08084297180175781, 0.08370494842529297, 0.08656692504882812, 0.08942890167236328, 0.09229087829589844, 0.0951528549194336, 0.09801483154296875, 0.1008768081665039, 0.10373878479003906, 0.10660076141357422, 0.10946273803710938, 0.11232471466064453, 0.11518669128417969, 0.11804866790771484, 0.12091064453125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 2.0, 4.0, 6.0, 10.0, 8.0, 11.0, 20.0, 21.0, 17.0, 15.0, 16.0, 25.0, 30.0, 36.0, 29.0, 35.0, 35.0, 39.0, 35.0, 54.0, 36.0, 45.0, 47.0, 37.0, 44.0, 32.0, 32.0, 40.0, 37.0, 23.0, 27.0, 23.0, 16.0, 28.0, 20.0, 11.0, 5.0, 17.0, 7.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07659912109375, -0.0741567611694336, -0.07171440124511719, -0.06927204132080078, -0.06682968139648438, -0.06438732147216797, -0.06194496154785156, -0.059502601623535156, -0.05706024169921875, -0.054617881774902344, -0.05217552185058594, -0.04973316192626953, -0.047290802001953125, -0.04484844207763672, -0.04240608215332031, -0.039963722229003906, -0.0375213623046875, -0.035079002380371094, -0.03263664245605469, -0.03019428253173828, -0.027751922607421875, -0.02530956268310547, -0.022867202758789062, -0.020424842834472656, -0.01798248291015625, -0.015540122985839844, -0.013097763061523438, -0.010655403137207031, -0.008213043212890625, -0.005770683288574219, -0.0033283233642578125, -0.0008859634399414062, 0.001556396484375, 0.003998756408691406, 0.0064411163330078125, 0.008883476257324219, 0.011325836181640625, 0.013768196105957031, 0.016210556030273438, 0.018652915954589844, 0.02109527587890625, 0.023537635803222656, 0.025979995727539062, 0.02842235565185547, 0.030864715576171875, 0.03330707550048828, 0.03574943542480469, 0.038191795349121094, 0.0406341552734375, 0.043076515197753906, 0.04551887512207031, 0.04796123504638672, 0.050403594970703125, 0.05284595489501953, 0.05528831481933594, 0.057730674743652344, 0.06017303466796875, 0.06261539459228516, 0.06505775451660156, 0.06750011444091797, 0.06994247436523438, 0.07238483428955078, 0.07482719421386719, 0.0772695541381836, 0.0797119140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 10.0, 24.0, 33.0, 61.0, 93.0, 219.0, 429.0, 898.0, 2139.0, 5714.0, 16074.0, 52621.0, 203724.0, 972199.0, 2094644.0, 646256.0, 141131.0, 38251.0, 12105.0, 4315.0, 1767.0, 769.0, 350.0, 213.0, 97.0, 50.0, 39.0, 21.0, 13.0, 6.0, 10.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1507568359375, -0.1469278335571289, -0.1430988311767578, -0.13926982879638672, -0.13544082641601562, -0.13161182403564453, -0.12778282165527344, -0.12395381927490234, -0.12012481689453125, -0.11629581451416016, -0.11246681213378906, -0.10863780975341797, -0.10480880737304688, -0.10097980499267578, -0.09715080261230469, -0.0933218002319336, -0.0894927978515625, -0.0856637954711914, -0.08183479309082031, -0.07800579071044922, -0.07417678833007812, -0.07034778594970703, -0.06651878356933594, -0.06268978118896484, -0.05886077880859375, -0.055031776428222656, -0.05120277404785156, -0.04737377166748047, -0.043544769287109375, -0.03971576690673828, -0.03588676452636719, -0.032057762145996094, -0.028228759765625, -0.024399757385253906, -0.020570755004882812, -0.01674175262451172, -0.012912750244140625, -0.009083747863769531, -0.0052547454833984375, -0.0014257431030273438, 0.00240325927734375, 0.006232261657714844, 0.010061264038085938, 0.013890266418457031, 0.017719268798828125, 0.02154827117919922, 0.025377273559570312, 0.029206275939941406, 0.0330352783203125, 0.036864280700683594, 0.04069328308105469, 0.04452228546142578, 0.048351287841796875, 0.05218029022216797, 0.05600929260253906, 0.059838294982910156, 0.06366729736328125, 0.06749629974365234, 0.07132530212402344, 0.07515430450439453, 0.07898330688476562, 0.08281230926513672, 0.08664131164550781, 0.0904703140258789, 0.09429931640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 9.0, 10.0, 15.0, 21.0, 26.0, 33.0, 39.0, 52.0, 76.0, 104.0, 127.0, 154.0, 228.0, 272.0, 330.0, 372.0, 396.0, 385.0, 318.0, 254.0, 210.0, 148.0, 101.0, 88.0, 68.0, 54.0, 42.0, 22.0, 30.0, 18.0, 19.0, 12.0, 7.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.11474609375, -0.11117839813232422, -0.10761070251464844, -0.10404300689697266, -0.10047531127929688, -0.0969076156616211, -0.09333992004394531, -0.08977222442626953, -0.08620452880859375, -0.08263683319091797, -0.07906913757324219, -0.0755014419555664, -0.07193374633789062, -0.06836605072021484, -0.06479835510253906, -0.06123065948486328, -0.0576629638671875, -0.05409526824951172, -0.05052757263183594, -0.046959877014160156, -0.043392181396484375, -0.039824485778808594, -0.03625679016113281, -0.03268909454345703, -0.02912139892578125, -0.02555370330810547, -0.021986007690429688, -0.018418312072753906, -0.014850616455078125, -0.011282920837402344, -0.0077152252197265625, -0.004147529602050781, -0.000579833984375, 0.0029878616333007812, 0.0065555572509765625, 0.010123252868652344, 0.013690948486328125, 0.017258644104003906, 0.020826339721679688, 0.02439403533935547, 0.02796173095703125, 0.03152942657470703, 0.03509712219238281, 0.038664817810058594, 0.042232513427734375, 0.045800209045410156, 0.04936790466308594, 0.05293560028076172, 0.0565032958984375, 0.06007099151611328, 0.06363868713378906, 0.06720638275146484, 0.07077407836914062, 0.0743417739868164, 0.07790946960449219, 0.08147716522216797, 0.08504486083984375, 0.08861255645751953, 0.09218025207519531, 0.0957479476928711, 0.09931564331054688, 0.10288333892822266, 0.10645103454589844, 0.11001873016357422, 0.11358642578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 12.0, 16.0, 36.0, 73.0, 105.0, 159.0, 170.0, 148.0, 132.0, 65.0, 31.0, 20.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7154151201248169, -0.6804477572441101, -0.6454803943634033, -0.6105130314826965, -0.5755456686019897, -0.540578305721283, -0.5056109428405762, -0.4706435799598694, -0.4356762170791626, -0.4007088541984558, -0.365741491317749, -0.33077412843704224, -0.29580676555633545, -0.26083940267562866, -0.22587203979492188, -0.1909046769142151, -0.1559373140335083, -0.12096995115280151, -0.08600258827209473, -0.05103522539138794, -0.016067862510681152, 0.018899500370025635, 0.05386686325073242, 0.08883422613143921, 0.123801589012146, 0.15876895189285278, 0.19373631477355957, 0.22870367765426636, 0.26367104053497314, 0.29863840341567993, 0.3336057662963867, 0.3685731291770935, 0.40354037284851074, 0.43850773572921753, 0.4734750986099243, 0.5084424614906311, 0.5434098243713379, 0.5783771872520447, 0.6133445501327515, 0.6483119130134583, 0.683279275894165, 0.7182466387748718, 0.7532140016555786, 0.7881813645362854, 0.8231487274169922, 0.858116090297699, 0.8930834531784058, 0.9280508160591125, 0.9630181789398193, 0.9979855418205261, 1.032952904701233, 1.067920207977295, 1.1028876304626465, 1.137855052947998, 1.17282235622406, 1.207789659500122, 1.2427570819854736, 1.2777245044708252, 1.3126918077468872, 1.3476591110229492, 1.3826265335083008, 1.4175939559936523, 1.4525612592697144, 1.4875285625457764, 1.522495985031128]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 13.0, 13.0, 9.0, 10.0, 14.0, 16.0, 24.0, 31.0, 30.0, 40.0, 39.0, 35.0, 47.0, 36.0, 38.0, 33.0, 40.0, 46.0, 57.0, 53.0, 50.0, 37.0, 39.0, 45.0, 32.0, 23.0, 37.0, 28.0, 16.0, 18.0, 7.0, 13.0, 7.0, 6.0, 9.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45728325843811035, -0.4416397213935852, -0.42599615454673767, -0.41035258769989014, -0.394709050655365, -0.37906551361083984, -0.3634219467639923, -0.3477783799171448, -0.33213484287261963, -0.3164913058280945, -0.30084773898124695, -0.2852041721343994, -0.26956063508987427, -0.2539170980453491, -0.2382735311985016, -0.22262997925281525, -0.2069864273071289, -0.19134287536144257, -0.17569932341575623, -0.16005577147006989, -0.14441221952438354, -0.1287686675786972, -0.11312511563301086, -0.09748156368732452, -0.08183801174163818, -0.06619445979595184, -0.0505509078502655, -0.03490735590457916, -0.019263803958892822, -0.003620252013206482, 0.012023299932479858, 0.0276668518781662, 0.04331040382385254, 0.05895395576953888, 0.07459750771522522, 0.09024105966091156, 0.1058846116065979, 0.12152816355228424, 0.13717171549797058, 0.15281526744365692, 0.16845881938934326, 0.1841023713350296, 0.19974592328071594, 0.21538947522640228, 0.23103302717208862, 0.24667657911777496, 0.2623201310634613, 0.27796369791030884, 0.293607234954834, 0.30925077199935913, 0.32489433884620667, 0.3405379056930542, 0.35618144273757935, 0.3718249797821045, 0.387468546628952, 0.40311211347579956, 0.4187556505203247, 0.43439918756484985, 0.4500427544116974, 0.4656863212585449, 0.48132985830307007, 0.4969733953475952, 0.5126169919967651, 0.5282605290412903, 0.5439040660858154]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 7.0, 11.0, 14.0, 24.0, 36.0, 59.0, 85.0, 154.0, 197.0, 326.0, 599.0, 944.0, 1586.0, 2816.0, 5512.0, 12665.0, 38045.0, 126855.0, 318396.0, 332078.0, 139708.0, 41374.0, 14057.0, 5945.0, 3002.0, 1561.0, 931.0, 573.0, 371.0, 229.0, 126.0, 87.0, 55.0, 48.0, 36.0, 15.0, 11.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135498046875, -0.13139724731445312, -0.12729644775390625, -0.12319564819335938, -0.1190948486328125, -0.11499404907226562, -0.11089324951171875, -0.10679244995117188, -0.102691650390625, -0.09859085083007812, -0.09449005126953125, -0.09038925170898438, -0.0862884521484375, -0.08218765258789062, -0.07808685302734375, -0.07398605346679688, -0.06988525390625, -0.06578445434570312, -0.06168365478515625, -0.057582855224609375, -0.0534820556640625, -0.049381256103515625, -0.04528045654296875, -0.041179656982421875, -0.037078857421875, -0.032978057861328125, -0.02887725830078125, -0.024776458740234375, -0.0206756591796875, -0.016574859619140625, -0.01247406005859375, -0.008373260498046875, -0.0042724609375, -0.000171661376953125, 0.00392913818359375, 0.008029937744140625, 0.0121307373046875, 0.016231536865234375, 0.02033233642578125, 0.024433135986328125, 0.028533935546875, 0.032634735107421875, 0.03673553466796875, 0.040836334228515625, 0.0449371337890625, 0.049037933349609375, 0.05313873291015625, 0.057239532470703125, 0.06134033203125, 0.06544113159179688, 0.06954193115234375, 0.07364273071289062, 0.0777435302734375, 0.08184432983398438, 0.08594512939453125, 0.09004592895507812, 0.094146728515625, 0.09824752807617188, 0.10234832763671875, 0.10644912719726562, 0.1105499267578125, 0.11465072631835938, 0.11875152587890625, 0.12285232543945312, 0.126953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 2.0, 5.0, 9.0, 10.0, 17.0, 14.0, 17.0, 12.0, 22.0, 30.0, 28.0, 31.0, 49.0, 33.0, 41.0, 44.0, 47.0, 43.0, 39.0, 56.0, 58.0, 45.0, 45.0, 36.0, 33.0, 34.0, 25.0, 23.0, 22.0, 23.0, 17.0, 12.0, 14.0, 12.0, 5.0, 5.0, 8.0, 5.0, 8.0, 6.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.083251953125, -0.08035564422607422, -0.07745933532714844, -0.07456302642822266, -0.07166671752929688, -0.0687704086303711, -0.06587409973144531, -0.06297779083251953, -0.06008148193359375, -0.05718517303466797, -0.05428886413574219, -0.051392555236816406, -0.048496246337890625, -0.045599937438964844, -0.04270362854003906, -0.03980731964111328, -0.0369110107421875, -0.03401470184326172, -0.031118392944335938, -0.028222084045410156, -0.025325775146484375, -0.022429466247558594, -0.019533157348632812, -0.01663684844970703, -0.01374053955078125, -0.010844230651855469, -0.007947921752929688, -0.005051612854003906, -0.002155303955078125, 0.0007410049438476562, 0.0036373138427734375, 0.006533622741699219, 0.009429931640625, 0.012326240539550781, 0.015222549438476562, 0.018118858337402344, 0.021015167236328125, 0.023911476135253906, 0.026807785034179688, 0.02970409393310547, 0.03260040283203125, 0.03549671173095703, 0.03839302062988281, 0.041289329528808594, 0.044185638427734375, 0.047081947326660156, 0.04997825622558594, 0.05287456512451172, 0.0557708740234375, 0.05866718292236328, 0.06156349182128906, 0.06445980072021484, 0.06735610961914062, 0.0702524185180664, 0.07314872741699219, 0.07604503631591797, 0.07894134521484375, 0.08183765411376953, 0.08473396301269531, 0.0876302719116211, 0.09052658081054688, 0.09342288970947266, 0.09631919860839844, 0.09921550750732422, 0.10211181640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 9.0, 10.0, 21.0, 23.0, 30.0, 53.0, 87.0, 132.0, 250.0, 430.0, 750.0, 1391.0, 2482.0, 4827.0, 9743.0, 21180.0, 51930.0, 139783.0, 288164.0, 290019.0, 141890.0, 53294.0, 21454.0, 9955.0, 4967.0, 2534.0, 1352.0, 728.0, 399.0, 246.0, 164.0, 79.0, 55.0, 40.0, 14.0, 15.0, 10.0, 12.0, 5.0, 6.0, 5.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1146240234375, -0.11104297637939453, -0.10746192932128906, -0.1038808822631836, -0.10029983520507812, -0.09671878814697266, -0.09313774108886719, -0.08955669403076172, -0.08597564697265625, -0.08239459991455078, -0.07881355285644531, -0.07523250579833984, -0.07165145874023438, -0.0680704116821289, -0.06448936462402344, -0.06090831756591797, -0.0573272705078125, -0.05374622344970703, -0.05016517639160156, -0.046584129333496094, -0.043003082275390625, -0.039422035217285156, -0.03584098815917969, -0.03225994110107422, -0.02867889404296875, -0.02509784698486328, -0.021516799926757812, -0.017935752868652344, -0.014354705810546875, -0.010773658752441406, -0.0071926116943359375, -0.0036115646362304688, -3.0517578125e-05, 0.0035505294799804688, 0.0071315765380859375, 0.010712623596191406, 0.014293670654296875, 0.017874717712402344, 0.021455764770507812, 0.02503681182861328, 0.02861785888671875, 0.03219890594482422, 0.03577995300292969, 0.039361000061035156, 0.042942047119140625, 0.046523094177246094, 0.05010414123535156, 0.05368518829345703, 0.0572662353515625, 0.06084728240966797, 0.06442832946777344, 0.0680093765258789, 0.07159042358398438, 0.07517147064208984, 0.07875251770019531, 0.08233356475830078, 0.08591461181640625, 0.08949565887451172, 0.09307670593261719, 0.09665775299072266, 0.10023880004882812, 0.1038198471069336, 0.10740089416503906, 0.11098194122314453, 0.11456298828125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 2.0, 5.0, 7.0, 4.0, 13.0, 9.0, 13.0, 11.0, 13.0, 22.0, 25.0, 25.0, 29.0, 21.0, 36.0, 29.0, 40.0, 44.0, 46.0, 32.0, 37.0, 42.0, 39.0, 47.0, 35.0, 56.0, 36.0, 35.0, 39.0, 30.0, 26.0, 22.0, 26.0, 22.0, 12.0, 13.0, 11.0, 7.0, 10.0, 11.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.220947265625, -0.21349334716796875, -0.2060394287109375, -0.19858551025390625, -0.191131591796875, -0.18367767333984375, -0.1762237548828125, -0.16876983642578125, -0.16131591796875, -0.15386199951171875, -0.1464080810546875, -0.13895416259765625, -0.131500244140625, -0.12404632568359375, -0.1165924072265625, -0.10913848876953125, -0.1016845703125, -0.09423065185546875, -0.0867767333984375, -0.07932281494140625, -0.071868896484375, -0.06441497802734375, -0.0569610595703125, -0.04950714111328125, -0.04205322265625, -0.03459930419921875, -0.0271453857421875, -0.01969146728515625, -0.012237548828125, -0.00478363037109375, 0.0026702880859375, 0.01012420654296875, 0.017578125, 0.02503204345703125, 0.0324859619140625, 0.03993988037109375, 0.047393798828125, 0.05484771728515625, 0.0623016357421875, 0.06975555419921875, 0.07720947265625, 0.08466339111328125, 0.0921173095703125, 0.09957122802734375, 0.107025146484375, 0.11447906494140625, 0.1219329833984375, 0.12938690185546875, 0.1368408203125, 0.14429473876953125, 0.1517486572265625, 0.15920257568359375, 0.166656494140625, 0.17411041259765625, 0.1815643310546875, 0.18901824951171875, 0.19647216796875, 0.20392608642578125, 0.2113800048828125, 0.21883392333984375, 0.226287841796875, 0.23374176025390625, 0.2411956787109375, 0.24864959716796875, 0.256103515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 12.0, 22.0, 27.0, 37.0, 72.0, 124.0, 200.0, 320.0, 498.0, 851.0, 1340.0, 2402.0, 4255.0, 7593.0, 14982.0, 32337.0, 80106.0, 199789.0, 324221.0, 219406.0, 89285.0, 35528.0, 16292.0, 8121.0, 4385.0, 2544.0, 1508.0, 861.0, 528.0, 343.0, 201.0, 134.0, 86.0, 56.0, 31.0, 20.0, 10.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0283660888671875, -0.027256250381469727, -0.026146411895751953, -0.02503657341003418, -0.023926734924316406, -0.022816896438598633, -0.02170705795288086, -0.020597219467163086, -0.019487380981445312, -0.01837754249572754, -0.017267704010009766, -0.016157865524291992, -0.015048027038574219, -0.013938188552856445, -0.012828350067138672, -0.011718511581420898, -0.010608673095703125, -0.009498834609985352, -0.008388996124267578, -0.007279157638549805, -0.006169319152832031, -0.005059480667114258, -0.003949642181396484, -0.002839803695678711, -0.0017299652099609375, -0.0006201267242431641, 0.0004897117614746094, 0.0015995502471923828, 0.0027093887329101562, 0.0038192272186279297, 0.004929065704345703, 0.0060389041900634766, 0.00714874267578125, 0.008258581161499023, 0.009368419647216797, 0.01047825813293457, 0.011588096618652344, 0.012697935104370117, 0.01380777359008789, 0.014917612075805664, 0.016027450561523438, 0.01713728904724121, 0.018247127532958984, 0.019356966018676758, 0.02046680450439453, 0.021576642990112305, 0.022686481475830078, 0.02379631996154785, 0.024906158447265625, 0.0260159969329834, 0.027125835418701172, 0.028235673904418945, 0.02934551239013672, 0.030455350875854492, 0.031565189361572266, 0.03267502784729004, 0.03378486633300781, 0.034894704818725586, 0.03600454330444336, 0.03711438179016113, 0.038224220275878906, 0.03933405876159668, 0.04044389724731445, 0.04155373573303223, 0.04266357421875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 7.0, 19.0, 19.0, 23.0, 30.0, 43.0, 45.0, 61.0, 80.0, 85.0, 85.0, 72.0, 90.0, 77.0, 72.0, 41.0, 31.0, 29.0, 21.0, 22.0, 9.0, 9.0, 4.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6570091247558594e-05, -1.6014091670513153e-05, -1.5458092093467712e-05, -1.4902092516422272e-05, -1.4346092939376831e-05, -1.379009336233139e-05, -1.323409378528595e-05, -1.2678094208240509e-05, -1.2122094631195068e-05, -1.1566095054149628e-05, -1.1010095477104187e-05, -1.0454095900058746e-05, -9.898096323013306e-06, -9.342096745967865e-06, -8.786097168922424e-06, -8.230097591876984e-06, -7.674098014831543e-06, -7.118098437786102e-06, -6.562098860740662e-06, -6.006099283695221e-06, -5.45009970664978e-06, -4.89410012960434e-06, -4.338100552558899e-06, -3.7821009755134583e-06, -3.2261013984680176e-06, -2.670101821422577e-06, -2.1141022443771362e-06, -1.5581026673316956e-06, -1.0021030902862549e-06, -4.461035132408142e-07, 1.0989606380462646e-07, 6.658956408500671e-07, 1.2218952178955078e-06, 1.7778947949409485e-06, 2.333894371986389e-06, 2.88989394903183e-06, 3.4458935260772705e-06, 4.001893103122711e-06, 4.557892680168152e-06, 5.1138922572135925e-06, 5.669891834259033e-06, 6.225891411304474e-06, 6.7818909883499146e-06, 7.337890565395355e-06, 7.893890142440796e-06, 8.449889719486237e-06, 9.005889296531677e-06, 9.561888873577118e-06, 1.0117888450622559e-05, 1.0673888027668e-05, 1.122988760471344e-05, 1.178588718175888e-05, 1.2341886758804321e-05, 1.2897886335849762e-05, 1.3453885912895203e-05, 1.4009885489940643e-05, 1.4565885066986084e-05, 1.5121884644031525e-05, 1.5677884221076965e-05, 1.6233883798122406e-05, 1.6789883375167847e-05, 1.7345882952213287e-05, 1.7901882529258728e-05, 1.845788210630417e-05, 1.901388168334961e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 10.0, 8.0, 6.0, 20.0, 29.0, 38.0, 66.0, 98.0, 155.0, 281.0, 477.0, 899.0, 1764.0, 3522.0, 7327.0, 15131.0, 32356.0, 72411.0, 158080.0, 264937.0, 245450.0, 133001.0, 60159.0, 26947.0, 12828.0, 6134.0, 3031.0, 1526.0, 775.0, 464.0, 234.0, 143.0, 75.0, 56.0, 44.0, 18.0, 20.0, 7.0, 10.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.03582763671875, -0.03480052947998047, -0.03377342224121094, -0.032746315002441406, -0.031719207763671875, -0.030692100524902344, -0.029664993286132812, -0.02863788604736328, -0.02761077880859375, -0.02658367156982422, -0.025556564331054688, -0.024529457092285156, -0.023502349853515625, -0.022475242614746094, -0.021448135375976562, -0.02042102813720703, -0.0193939208984375, -0.01836681365966797, -0.017339706420898438, -0.016312599182128906, -0.015285491943359375, -0.014258384704589844, -0.013231277465820312, -0.012204170227050781, -0.01117706298828125, -0.010149955749511719, -0.009122848510742188, -0.008095741271972656, -0.007068634033203125, -0.006041526794433594, -0.0050144195556640625, -0.003987312316894531, -0.002960205078125, -0.0019330978393554688, -0.0009059906005859375, 0.00012111663818359375, 0.001148223876953125, 0.0021753311157226562, 0.0032024383544921875, 0.004229545593261719, 0.00525665283203125, 0.006283760070800781, 0.0073108673095703125, 0.008337974548339844, 0.009365081787109375, 0.010392189025878906, 0.011419296264648438, 0.012446403503417969, 0.0134735107421875, 0.014500617980957031, 0.015527725219726562, 0.016554832458496094, 0.017581939697265625, 0.018609046936035156, 0.019636154174804688, 0.02066326141357422, 0.02169036865234375, 0.02271747589111328, 0.023744583129882812, 0.024771690368652344, 0.025798797607421875, 0.026825904846191406, 0.027853012084960938, 0.02888011932373047, 0.0299072265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 6.0, 6.0, 8.0, 4.0, 7.0, 8.0, 14.0, 11.0, 7.0, 17.0, 20.0, 21.0, 30.0, 35.0, 36.0, 38.0, 51.0, 62.0, 41.0, 65.0, 48.0, 58.0, 64.0, 50.0, 36.0, 40.0, 44.0, 26.0, 26.0, 26.0, 26.0, 14.0, 12.0, 9.0, 7.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03668212890625, -0.03542137145996094, -0.034160614013671875, -0.03289985656738281, -0.03163909912109375, -0.030378341674804688, -0.029117584228515625, -0.027856826782226562, -0.0265960693359375, -0.025335311889648438, -0.024074554443359375, -0.022813796997070312, -0.02155303955078125, -0.020292282104492188, -0.019031524658203125, -0.017770767211914062, -0.016510009765625, -0.015249252319335938, -0.013988494873046875, -0.012727737426757812, -0.01146697998046875, -0.010206222534179688, -0.008945465087890625, -0.0076847076416015625, -0.0064239501953125, -0.0051631927490234375, -0.003902435302734375, -0.0026416778564453125, -0.00138092041015625, -0.0001201629638671875, 0.001140594482421875, 0.0024013519287109375, 0.003662109375, 0.0049228668212890625, 0.006183624267578125, 0.0074443817138671875, 0.00870513916015625, 0.009965896606445312, 0.011226654052734375, 0.012487411499023438, 0.0137481689453125, 0.015008926391601562, 0.016269683837890625, 0.017530441284179688, 0.01879119873046875, 0.020051956176757812, 0.021312713623046875, 0.022573471069335938, 0.023834228515625, 0.025094985961914062, 0.026355743408203125, 0.027616500854492188, 0.02887725830078125, 0.030138015747070312, 0.031398773193359375, 0.03265953063964844, 0.0339202880859375, 0.03518104553222656, 0.036441802978515625, 0.03770256042480469, 0.03896331787109375, 0.04022407531738281, 0.041484832763671875, 0.04274559020996094, 0.04400634765625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 12.0, 15.0, 24.0, 62.0, 164.0, 226.0, 225.0, 143.0, 61.0, 34.0, 8.0, 8.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1912773847579956, -1.150343656539917, -1.1094098091125488, -1.0684760808944702, -1.0275423526763916, -0.986608624458313, -0.9456748366355896, -0.9047410488128662, -0.8638073205947876, -0.822873592376709, -0.7819398045539856, -0.7410060167312622, -0.7000722885131836, -0.659138560295105, -0.6182047724723816, -0.5772709846496582, -0.5363372564315796, -0.4954034984111786, -0.4544697403907776, -0.4135359823703766, -0.3726022243499756, -0.3316684663295746, -0.2907347083091736, -0.24980095028877258, -0.20886719226837158, -0.16793343424797058, -0.12699967622756958, -0.08606591820716858, -0.04513216018676758, -0.004198402166366577, 0.036735355854034424, 0.07766911387443542, 0.11860299110412598, 0.15953674912452698, 0.20047050714492798, 0.24140426516532898, 0.28233802318573, 0.323271781206131, 0.364205539226532, 0.405139297246933, 0.446073055267334, 0.487006813287735, 0.527940571308136, 0.5688743591308594, 0.609808087348938, 0.6507418155670166, 0.69167560338974, 0.7326093912124634, 0.773543119430542, 0.8144768476486206, 0.855410635471344, 0.8963444232940674, 0.937278151512146, 0.9782118797302246, 1.0191457271575928, 1.0600794553756714, 1.10101318359375, 1.1419469118118286, 1.1828806400299072, 1.2238144874572754, 1.264748215675354, 1.3056819438934326, 1.3466157913208008, 1.3875495195388794, 1.428483247756958]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 11.0, 10.0, 7.0, 22.0, 13.0, 17.0, 24.0, 25.0, 38.0, 39.0, 35.0, 24.0, 47.0, 41.0, 50.0, 53.0, 50.0, 52.0, 45.0, 59.0, 49.0, 47.0, 45.0, 34.0, 21.0, 23.0, 32.0, 18.0, 13.0, 13.0, 8.0, 10.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6935819387435913, -0.6730813980102539, -0.6525807976722717, -0.6320801973342896, -0.6115796566009521, -0.5910791158676147, -0.5705785155296326, -0.5500779151916504, -0.529577374458313, -0.5090768337249756, -0.4885762333869934, -0.4680756628513336, -0.44757509231567383, -0.42707452178001404, -0.40657395124435425, -0.38607338070869446, -0.36557281017303467, -0.3450722396373749, -0.3245716691017151, -0.3040710985660553, -0.2835705280303955, -0.2630699574947357, -0.24256938695907593, -0.22206881642341614, -0.20156824588775635, -0.18106767535209656, -0.16056710481643677, -0.14006653428077698, -0.11956596374511719, -0.0990653932094574, -0.07856482267379761, -0.05806425213813782, -0.0375637412071228, -0.017063170671463013, 0.0034373998641967773, 0.023937970399856567, 0.04443854093551636, 0.06493911147117615, 0.08543968200683594, 0.10594025254249573, 0.12644082307815552, 0.1469413936138153, 0.1674419641494751, 0.1879425346851349, 0.20844310522079468, 0.22894367575645447, 0.24944424629211426, 0.26994481682777405, 0.29044538736343384, 0.31094595789909363, 0.3314465284347534, 0.3519470989704132, 0.372447669506073, 0.3929482400417328, 0.4134488105773926, 0.43394938111305237, 0.45444995164871216, 0.47495052218437195, 0.49545109272003174, 0.5159516334533691, 0.5364522337913513, 0.5569528341293335, 0.5774533748626709, 0.5979539155960083, 0.6184545159339905]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 6.0, 8.0, 11.0, 11.0, 17.0, 21.0, 37.0, 64.0, 83.0, 112.0, 180.0, 285.0, 498.0, 832.0, 1463.0, 2776.0, 5288.0, 10847.0, 23047.0, 53215.0, 127617.0, 305597.0, 634084.0, 984984.0, 953203.0, 593662.0, 285448.0, 120421.0, 49509.0, 21170.0, 9716.0, 4601.0, 2408.0, 1341.0, 690.0, 394.0, 235.0, 144.0, 89.0, 56.0, 48.0, 23.0, 14.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-0.07244873046875, -0.07043123245239258, -0.06841373443603516, -0.06639623641967773, -0.06437873840332031, -0.06236124038696289, -0.06034374237060547, -0.05832624435424805, -0.056308746337890625, -0.0542912483215332, -0.05227375030517578, -0.05025625228881836, -0.04823875427246094, -0.046221256256103516, -0.044203758239746094, -0.04218626022338867, -0.04016876220703125, -0.03815126419067383, -0.036133766174316406, -0.034116268157958984, -0.03209877014160156, -0.03008127212524414, -0.02806377410888672, -0.026046276092529297, -0.024028778076171875, -0.022011280059814453, -0.01999378204345703, -0.01797628402709961, -0.015958786010742188, -0.013941287994384766, -0.011923789978027344, -0.009906291961669922, -0.0078887939453125, -0.005871295928955078, -0.0038537979125976562, -0.0018362998962402344, 0.0001811981201171875, 0.0021986961364746094, 0.004216194152832031, 0.006233692169189453, 0.008251190185546875, 0.010268688201904297, 0.012286186218261719, 0.01430368423461914, 0.016321182250976562, 0.018338680267333984, 0.020356178283691406, 0.022373676300048828, 0.02439117431640625, 0.026408672332763672, 0.028426170349121094, 0.030443668365478516, 0.03246116638183594, 0.03447866439819336, 0.03649616241455078, 0.0385136604309082, 0.040531158447265625, 0.04254865646362305, 0.04456615447998047, 0.04658365249633789, 0.04860115051269531, 0.050618648529052734, 0.052636146545410156, 0.05465364456176758, 0.056671142578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 4.0, 13.0, 8.0, 8.0, 13.0, 14.0, 19.0, 19.0, 17.0, 22.0, 29.0, 30.0, 36.0, 35.0, 39.0, 37.0, 39.0, 54.0, 47.0, 50.0, 47.0, 53.0, 44.0, 42.0, 37.0, 45.0, 31.0, 20.0, 21.0, 20.0, 24.0, 17.0, 12.0, 18.0, 10.0, 9.0, 1.0, 6.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.084228515625, -0.08170890808105469, -0.07918930053710938, -0.07666969299316406, -0.07415008544921875, -0.07163047790527344, -0.06911087036132812, -0.06659126281738281, -0.0640716552734375, -0.06155204772949219, -0.059032440185546875, -0.05651283264160156, -0.05399322509765625, -0.05147361755371094, -0.048954010009765625, -0.04643440246582031, -0.043914794921875, -0.04139518737792969, -0.038875579833984375, -0.03635597229003906, -0.03383636474609375, -0.03131675720214844, -0.028797149658203125, -0.026277542114257812, -0.0237579345703125, -0.021238327026367188, -0.018718719482421875, -0.016199111938476562, -0.01367950439453125, -0.011159896850585938, -0.008640289306640625, -0.0061206817626953125, -0.00360107421875, -0.0010814666748046875, 0.001438140869140625, 0.0039577484130859375, 0.00647735595703125, 0.008996963500976562, 0.011516571044921875, 0.014036178588867188, 0.0165557861328125, 0.019075393676757812, 0.021595001220703125, 0.024114608764648438, 0.02663421630859375, 0.029153823852539062, 0.031673431396484375, 0.03419303894042969, 0.036712646484375, 0.03923225402832031, 0.041751861572265625, 0.04427146911621094, 0.04679107666015625, 0.04931068420410156, 0.051830291748046875, 0.05434989929199219, 0.0568695068359375, 0.05938911437988281, 0.061908721923828125, 0.06442832946777344, 0.06694793701171875, 0.06946754455566406, 0.07198715209960938, 0.07450675964355469, 0.0770263671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 3.0, 12.0, 18.0, 38.0, 66.0, 131.0, 209.0, 476.0, 1137.0, 3225.0, 11349.0, 53841.0, 432900.0, 2896172.0, 697317.0, 76164.0, 14768.0, 3920.0, 1426.0, 584.0, 237.0, 113.0, 83.0, 43.0, 20.0, 13.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.201904296875, -0.19623184204101562, -0.19055938720703125, -0.18488693237304688, -0.1792144775390625, -0.17354202270507812, -0.16786956787109375, -0.16219711303710938, -0.156524658203125, -0.15085220336914062, -0.14517974853515625, -0.13950729370117188, -0.1338348388671875, -0.12816238403320312, -0.12248992919921875, -0.11681747436523438, -0.11114501953125, -0.10547256469726562, -0.09980010986328125, -0.09412765502929688, -0.0884552001953125, -0.08278274536132812, -0.07711029052734375, -0.07143783569335938, -0.065765380859375, -0.060092926025390625, -0.05442047119140625, -0.048748016357421875, -0.0430755615234375, -0.037403106689453125, -0.03173065185546875, -0.026058197021484375, -0.0203857421875, -0.014713287353515625, -0.00904083251953125, -0.003368377685546875, 0.0023040771484375, 0.007976531982421875, 0.01364898681640625, 0.019321441650390625, 0.024993896484375, 0.030666351318359375, 0.03633880615234375, 0.042011260986328125, 0.0476837158203125, 0.053356170654296875, 0.05902862548828125, 0.06470108032226562, 0.07037353515625, 0.07604598999023438, 0.08171844482421875, 0.08739089965820312, 0.0930633544921875, 0.09873580932617188, 0.10440826416015625, 0.11008071899414062, 0.115753173828125, 0.12142562866210938, 0.12709808349609375, 0.13277053833007812, 0.1384429931640625, 0.14411544799804688, 0.14978790283203125, 0.15546035766601562, 0.1611328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 7.0, 13.0, 10.0, 32.0, 37.0, 58.0, 87.0, 148.0, 228.0, 339.0, 514.0, 646.0, 622.0, 453.0, 287.0, 197.0, 117.0, 94.0, 55.0, 30.0, 32.0, 22.0, 11.0, 8.0, 6.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1861572265625, -0.1806507110595703, -0.17514419555664062, -0.16963768005371094, -0.16413116455078125, -0.15862464904785156, -0.15311813354492188, -0.1476116180419922, -0.1421051025390625, -0.1365985870361328, -0.13109207153320312, -0.12558555603027344, -0.12007904052734375, -0.11457252502441406, -0.10906600952148438, -0.10355949401855469, -0.098052978515625, -0.09254646301269531, -0.08703994750976562, -0.08153343200683594, -0.07602691650390625, -0.07052040100097656, -0.06501388549804688, -0.05950736999511719, -0.0540008544921875, -0.04849433898925781, -0.042987823486328125, -0.03748130798339844, -0.03197479248046875, -0.026468276977539062, -0.020961761474609375, -0.015455245971679688, -0.00994873046875, -0.0044422149658203125, 0.001064300537109375, 0.0065708160400390625, 0.01207733154296875, 0.017583847045898438, 0.023090362548828125, 0.028596878051757812, 0.0341033935546875, 0.03960990905761719, 0.045116424560546875, 0.05062294006347656, 0.05612945556640625, 0.06163597106933594, 0.06714248657226562, 0.07264900207519531, 0.078155517578125, 0.08366203308105469, 0.08916854858398438, 0.09467506408691406, 0.10018157958984375, 0.10568809509277344, 0.11119461059570312, 0.11670112609863281, 0.1222076416015625, 0.1277141571044922, 0.13322067260742188, 0.13872718811035156, 0.14423370361328125, 0.14974021911621094, 0.15524673461914062, 0.1607532501220703, 0.166259765625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 8.0, 17.0, 28.0, 49.0, 110.0, 157.0, 178.0, 172.0, 115.0, 72.0, 45.0, 20.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0852274894714355, -1.0457690954208374, -1.0063108205795288, -0.9668524265289307, -0.9273940920829773, -0.8879357576370239, -0.8484773635864258, -0.8090190291404724, -0.769560694694519, -0.7301023602485657, -0.6906439661979675, -0.6511856317520142, -0.6117272973060608, -0.5722689628601074, -0.5328105688095093, -0.4933522343635559, -0.45389384031295776, -0.414435476064682, -0.37497714161872864, -0.3355187773704529, -0.2960604429244995, -0.25660207867622375, -0.217143714427948, -0.17768537998199463, -0.13822701573371887, -0.09876866638660431, -0.05931030958890915, -0.01985195279121399, 0.019606396555900574, 0.05906474590301514, 0.0985231101512909, 0.13798144459724426, 0.17743980884552002, 0.21689815819263458, 0.25635650753974915, 0.2958148717880249, 0.33527320623397827, 0.37473157048225403, 0.4141899347305298, 0.45364826917648315, 0.4931066334247589, 0.5325649976730347, 0.572023332118988, 0.6114816665649414, 0.6509400606155396, 0.6903983950614929, 0.7298567295074463, 0.7693151235580444, 0.8087734580039978, 0.8482317924499512, 0.8876901865005493, 0.9271485209465027, 0.966606855392456, 1.0060652494430542, 1.0455236434936523, 1.084981918334961, 1.124440312385559, 1.1638987064361572, 1.2033569812774658, 1.242815375328064, 1.282273769378662, 1.3217320442199707, 1.3611904382705688, 1.400648832321167, 1.4401071071624756]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 6.0, 7.0, 14.0, 18.0, 15.0, 36.0, 28.0, 31.0, 29.0, 25.0, 37.0, 45.0, 36.0, 40.0, 38.0, 32.0, 44.0, 47.0, 45.0, 40.0, 48.0, 46.0, 40.0, 29.0, 31.0, 29.0, 22.0, 23.0, 26.0, 14.0, 17.0, 11.0, 12.0, 6.0, 3.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.48263466358184814, -0.4694255590438843, -0.4562164545059204, -0.44300737977027893, -0.42979827523231506, -0.4165891706943512, -0.4033800959587097, -0.39017099142074585, -0.376961886882782, -0.3637527823448181, -0.35054367780685425, -0.33733460307121277, -0.3241254985332489, -0.31091639399528503, -0.29770731925964355, -0.2844982147216797, -0.2712891101837158, -0.25808000564575195, -0.24487091600894928, -0.2316618263721466, -0.21845272183418274, -0.20524361729621887, -0.1920345276594162, -0.17882543802261353, -0.16561633348464966, -0.1524072289466858, -0.13919813930988312, -0.12598904967308044, -0.11277994513511658, -0.0995708480477333, -0.08636175096035004, -0.07315265387296677, -0.059943556785583496, -0.046734459698200226, -0.033525362610816956, -0.020316265523433685, -0.007107168436050415, 0.006101928651332855, 0.019311025738716125, 0.032520122826099396, 0.045729219913482666, 0.058938317000865936, 0.0721474140882492, 0.08535651117563248, 0.09856560826301575, 0.11177470535039902, 0.12498380243778229, 0.13819289207458496, 0.15140199661254883, 0.1646111011505127, 0.17782019078731537, 0.19102928042411804, 0.2042383849620819, 0.21744748950004578, 0.23065657913684845, 0.24386566877365112, 0.257074773311615, 0.27028387784957886, 0.2834929823875427, 0.2967020571231842, 0.30991116166114807, 0.32312026619911194, 0.3363293409347534, 0.3495384454727173, 0.36274755001068115]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 5.0, 9.0, 14.0, 19.0, 30.0, 41.0, 53.0, 79.0, 95.0, 152.0, 217.0, 368.0, 609.0, 924.0, 1695.0, 2878.0, 5045.0, 9119.0, 16546.0, 30240.0, 55005.0, 94044.0, 145743.0, 183626.0, 178149.0, 133529.0, 83279.0, 47349.0, 26341.0, 14495.0, 8101.0, 4350.0, 2578.0, 1459.0, 837.0, 559.0, 340.0, 200.0, 132.0, 90.0, 72.0, 42.0, 29.0, 16.0, 16.0, 11.0, 7.0, 7.0, 4.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0654296875, -0.06337738037109375, -0.0613250732421875, -0.05927276611328125, -0.057220458984375, -0.05516815185546875, -0.0531158447265625, -0.05106353759765625, -0.04901123046875, -0.04695892333984375, -0.0449066162109375, -0.04285430908203125, -0.040802001953125, -0.03874969482421875, -0.0366973876953125, -0.03464508056640625, -0.0325927734375, -0.03054046630859375, -0.0284881591796875, -0.02643585205078125, -0.024383544921875, -0.02233123779296875, -0.0202789306640625, -0.01822662353515625, -0.01617431640625, -0.01412200927734375, -0.0120697021484375, -0.01001739501953125, -0.007965087890625, -0.00591278076171875, -0.0038604736328125, -0.00180816650390625, 0.000244140625, 0.00229644775390625, 0.0043487548828125, 0.00640106201171875, 0.008453369140625, 0.01050567626953125, 0.0125579833984375, 0.01461029052734375, 0.01666259765625, 0.01871490478515625, 0.0207672119140625, 0.02281951904296875, 0.024871826171875, 0.02692413330078125, 0.0289764404296875, 0.03102874755859375, 0.0330810546875, 0.03513336181640625, 0.0371856689453125, 0.03923797607421875, 0.041290283203125, 0.04334259033203125, 0.0453948974609375, 0.04744720458984375, 0.04949951171875, 0.05155181884765625, 0.0536041259765625, 0.05565643310546875, 0.057708740234375, 0.05976104736328125, 0.0618133544921875, 0.06386566162109375, 0.06591796875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 2.0, 7.0, 10.0, 15.0, 24.0, 20.0, 18.0, 26.0, 22.0, 34.0, 28.0, 54.0, 49.0, 56.0, 38.0, 58.0, 53.0, 46.0, 45.0, 45.0, 47.0, 41.0, 51.0, 32.0, 31.0, 28.0, 17.0, 10.0, 17.0, 13.0, 10.0, 10.0, 6.0, 10.0, 4.0, 4.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09368896484375, -0.09053230285644531, -0.08737564086914062, -0.08421897888183594, -0.08106231689453125, -0.07790565490722656, -0.07474899291992188, -0.07159233093261719, -0.0684356689453125, -0.06527900695800781, -0.062122344970703125, -0.05896568298339844, -0.05580902099609375, -0.05265235900878906, -0.049495697021484375, -0.04633903503417969, -0.043182373046875, -0.04002571105957031, -0.036869049072265625, -0.03371238708496094, -0.03055572509765625, -0.027399063110351562, -0.024242401123046875, -0.021085739135742188, -0.0179290771484375, -0.014772415161132812, -0.011615753173828125, -0.008459091186523438, -0.00530242919921875, -0.0021457672119140625, 0.001010894775390625, 0.0041675567626953125, 0.00732421875, 0.010480880737304688, 0.013637542724609375, 0.016794204711914062, 0.01995086669921875, 0.023107528686523438, 0.026264190673828125, 0.029420852661132812, 0.0325775146484375, 0.03573417663574219, 0.038890838623046875, 0.04204750061035156, 0.04520416259765625, 0.04836082458496094, 0.051517486572265625, 0.05467414855957031, 0.057830810546875, 0.06098747253417969, 0.06414413452148438, 0.06730079650878906, 0.07045745849609375, 0.07361412048339844, 0.07677078247070312, 0.07992744445800781, 0.0830841064453125, 0.08624076843261719, 0.08939743041992188, 0.09255409240722656, 0.09571075439453125, 0.09886741638183594, 0.10202407836914062, 0.10518074035644531, 0.10833740234375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 11.0, 21.0, 32.0, 22.0, 41.0, 49.0, 110.0, 188.0, 241.0, 424.0, 827.0, 1456.0, 2663.0, 4890.0, 9677.0, 18661.0, 37638.0, 72459.0, 133107.0, 207941.0, 236409.0, 149370.0, 84106.0, 42934.0, 21782.0, 10992.0, 5739.0, 3011.0, 1581.0, 896.0, 501.0, 304.0, 155.0, 108.0, 62.0, 53.0, 31.0, 20.0, 9.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.069091796875, -0.0666341781616211, -0.06417655944824219, -0.06171894073486328, -0.059261322021484375, -0.05680370330810547, -0.05434608459472656, -0.051888465881347656, -0.04943084716796875, -0.046973228454589844, -0.04451560974121094, -0.04205799102783203, -0.039600372314453125, -0.03714275360107422, -0.03468513488769531, -0.032227516174316406, -0.0297698974609375, -0.027312278747558594, -0.024854660034179688, -0.02239704132080078, -0.019939422607421875, -0.01748180389404297, -0.015024185180664062, -0.012566566467285156, -0.01010894775390625, -0.007651329040527344, -0.0051937103271484375, -0.0027360916137695312, -0.000278472900390625, 0.0021791458129882812, 0.0046367645263671875, 0.007094383239746094, 0.009552001953125, 0.012009620666503906, 0.014467239379882812, 0.01692485809326172, 0.019382476806640625, 0.02184009552001953, 0.024297714233398438, 0.026755332946777344, 0.02921295166015625, 0.031670570373535156, 0.03412818908691406, 0.03658580780029297, 0.039043426513671875, 0.04150104522705078, 0.04395866394042969, 0.046416282653808594, 0.0488739013671875, 0.051331520080566406, 0.05378913879394531, 0.05624675750732422, 0.058704376220703125, 0.06116199493408203, 0.06361961364746094, 0.06607723236083984, 0.06853485107421875, 0.07099246978759766, 0.07345008850097656, 0.07590770721435547, 0.07836532592773438, 0.08082294464111328, 0.08328056335449219, 0.0857381820678711, 0.08819580078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 11.0, 10.0, 10.0, 9.0, 9.0, 18.0, 13.0, 29.0, 27.0, 28.0, 47.0, 32.0, 37.0, 46.0, 57.0, 51.0, 54.0, 60.0, 43.0, 44.0, 58.0, 45.0, 42.0, 43.0, 24.0, 26.0, 33.0, 23.0, 12.0, 15.0, 10.0, 15.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.328857421875, -0.32010650634765625, -0.3113555908203125, -0.30260467529296875, -0.293853759765625, -0.28510284423828125, -0.2763519287109375, -0.26760101318359375, -0.25885009765625, -0.25009918212890625, -0.2413482666015625, -0.23259735107421875, -0.223846435546875, -0.21509552001953125, -0.2063446044921875, -0.19759368896484375, -0.1888427734375, -0.18009185791015625, -0.1713409423828125, -0.16259002685546875, -0.153839111328125, -0.14508819580078125, -0.1363372802734375, -0.12758636474609375, -0.11883544921875, -0.11008453369140625, -0.1013336181640625, -0.09258270263671875, -0.083831787109375, -0.07508087158203125, -0.0663299560546875, -0.05757904052734375, -0.048828125, -0.04007720947265625, -0.0313262939453125, -0.02257537841796875, -0.013824462890625, -0.00507354736328125, 0.0036773681640625, 0.01242828369140625, 0.02117919921875, 0.02993011474609375, 0.0386810302734375, 0.04743194580078125, 0.056182861328125, 0.06493377685546875, 0.0736846923828125, 0.08243560791015625, 0.0911865234375, 0.09993743896484375, 0.1086883544921875, 0.11743927001953125, 0.126190185546875, 0.13494110107421875, 0.1436920166015625, 0.15244293212890625, 0.16119384765625, 0.16994476318359375, 0.1786956787109375, 0.18744659423828125, 0.196197509765625, 0.20494842529296875, 0.2136993408203125, 0.22245025634765625, 0.231201171875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 9.0, 15.0, 19.0, 25.0, 49.0, 94.0, 140.0, 232.0, 319.0, 598.0, 974.0, 1792.0, 3437.0, 6500.0, 12872.0, 24868.0, 47668.0, 88968.0, 154008.0, 241748.0, 197339.0, 123474.0, 68167.0, 36026.0, 18622.0, 9652.0, 4907.0, 2576.0, 1445.0, 806.0, 444.0, 256.0, 184.0, 109.0, 73.0, 44.0, 29.0, 25.0, 13.0, 8.0, 10.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0169219970703125, -0.016353845596313477, -0.015785694122314453, -0.01521754264831543, -0.014649391174316406, -0.014081239700317383, -0.01351308822631836, -0.012944936752319336, -0.012376785278320312, -0.011808633804321289, -0.011240482330322266, -0.010672330856323242, -0.010104179382324219, -0.009536027908325195, -0.008967876434326172, -0.008399724960327148, -0.007831573486328125, -0.0072634220123291016, -0.006695270538330078, -0.006127119064331055, -0.005558967590332031, -0.004990816116333008, -0.004422664642333984, -0.003854513168334961, -0.0032863616943359375, -0.002718210220336914, -0.0021500587463378906, -0.0015819072723388672, -0.0010137557983398438, -0.0004456043243408203, 0.00012254714965820312, 0.0006906986236572266, 0.00125885009765625, 0.0018270015716552734, 0.002395153045654297, 0.0029633045196533203, 0.0035314559936523438, 0.004099607467651367, 0.004667758941650391, 0.005235910415649414, 0.0058040618896484375, 0.006372213363647461, 0.006940364837646484, 0.007508516311645508, 0.008076667785644531, 0.008644819259643555, 0.009212970733642578, 0.009781122207641602, 0.010349273681640625, 0.010917425155639648, 0.011485576629638672, 0.012053728103637695, 0.012621879577636719, 0.013190031051635742, 0.013758182525634766, 0.014326333999633789, 0.014894485473632812, 0.015462636947631836, 0.01603078842163086, 0.016598939895629883, 0.017167091369628906, 0.01773524284362793, 0.018303394317626953, 0.018871545791625977, 0.019439697265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 9.0, 2.0, 8.0, 10.0, 6.0, 12.0, 12.0, 17.0, 16.0, 23.0, 19.0, 34.0, 32.0, 25.0, 27.0, 31.0, 46.0, 52.0, 64.0, 49.0, 49.0, 46.0, 45.0, 33.0, 43.0, 37.0, 33.0, 43.0, 26.0, 28.0, 14.0, 15.0, 18.0, 16.0, 11.0, 13.0, 8.0, 5.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.0728836059570312e-05, -1.043267548084259e-05, -1.0136514902114868e-05, -9.840354323387146e-06, -9.544193744659424e-06, -9.248033165931702e-06, -8.95187258720398e-06, -8.655712008476257e-06, -8.359551429748535e-06, -8.063390851020813e-06, -7.76723027229309e-06, -7.471069693565369e-06, -7.1749091148376465e-06, -6.878748536109924e-06, -6.582587957382202e-06, -6.28642737865448e-06, -5.990266799926758e-06, -5.694106221199036e-06, -5.3979456424713135e-06, -5.101785063743591e-06, -4.805624485015869e-06, -4.509463906288147e-06, -4.213303327560425e-06, -3.917142748832703e-06, -3.6209821701049805e-06, -3.3248215913772583e-06, -3.028661012649536e-06, -2.732500433921814e-06, -2.436339855194092e-06, -2.1401792764663696e-06, -1.8440186977386475e-06, -1.5478581190109253e-06, -1.2516975402832031e-06, -9.55536961555481e-07, -6.593763828277588e-07, -3.632158041000366e-07, -6.705522537231445e-08, 2.2910535335540771e-07, 5.252659320831299e-07, 8.21426510810852e-07, 1.1175870895385742e-06, 1.4137476682662964e-06, 1.7099082469940186e-06, 2.0060688257217407e-06, 2.302229404449463e-06, 2.598389983177185e-06, 2.8945505619049072e-06, 3.1907111406326294e-06, 3.4868717193603516e-06, 3.7830322980880737e-06, 4.079192876815796e-06, 4.375353455543518e-06, 4.67151403427124e-06, 4.967674612998962e-06, 5.2638351917266846e-06, 5.559995770454407e-06, 5.856156349182129e-06, 6.152316927909851e-06, 6.448477506637573e-06, 6.744638085365295e-06, 7.040798664093018e-06, 7.33695924282074e-06, 7.633119821548462e-06, 7.929280400276184e-06, 8.225440979003906e-06]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 7.0, 9.0, 14.0, 10.0, 19.0, 41.0, 51.0, 85.0, 119.0, 239.0, 350.0, 558.0, 898.0, 1574.0, 2774.0, 4848.0, 8457.0, 15236.0, 28629.0, 51307.0, 90607.0, 145030.0, 214628.0, 183814.0, 126859.0, 76168.0, 43119.0, 23416.0, 12833.0, 7172.0, 4010.0, 2314.0, 1297.0, 732.0, 497.0, 283.0, 192.0, 107.0, 82.0, 50.0, 34.0, 22.0, 20.0, 9.0, 7.0, 12.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0172882080078125, -0.016727685928344727, -0.016167163848876953, -0.01560664176940918, -0.015046119689941406, -0.014485597610473633, -0.01392507553100586, -0.013364553451538086, -0.012804031372070312, -0.012243509292602539, -0.011682987213134766, -0.011122465133666992, -0.010561943054199219, -0.010001420974731445, -0.009440898895263672, -0.008880376815795898, -0.008319854736328125, -0.0077593326568603516, -0.007198810577392578, -0.006638288497924805, -0.006077766418457031, -0.005517244338989258, -0.004956722259521484, -0.004396200180053711, -0.0038356781005859375, -0.003275156021118164, -0.0027146339416503906, -0.002154111862182617, -0.0015935897827148438, -0.0010330677032470703, -0.0004725456237792969, 8.797645568847656e-05, 0.00064849853515625, 0.0012090206146240234, 0.0017695426940917969, 0.0023300647735595703, 0.0028905868530273438, 0.003451108932495117, 0.004011631011962891, 0.004572153091430664, 0.0051326751708984375, 0.005693197250366211, 0.006253719329833984, 0.006814241409301758, 0.007374763488769531, 0.007935285568237305, 0.008495807647705078, 0.009056329727172852, 0.009616851806640625, 0.010177373886108398, 0.010737895965576172, 0.011298418045043945, 0.011858940124511719, 0.012419462203979492, 0.012979984283447266, 0.013540506362915039, 0.014101028442382812, 0.014661550521850586, 0.01522207260131836, 0.015782594680786133, 0.016343116760253906, 0.01690363883972168, 0.017464160919189453, 0.018024682998657227, 0.018585205078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 3.0, 7.0, 1.0, 5.0, 7.0, 6.0, 12.0, 16.0, 18.0, 20.0, 21.0, 29.0, 35.0, 35.0, 45.0, 52.0, 38.0, 45.0, 57.0, 49.0, 50.0, 42.0, 44.0, 52.0, 39.0, 41.0, 29.0, 34.0, 30.0, 22.0, 20.0, 12.0, 13.0, 11.0, 16.0, 11.0, 5.0, 10.0, 4.0, 2.0, 1.0, 3.0, 5.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0311737060546875, -0.030230045318603516, -0.02928638458251953, -0.028342723846435547, -0.027399063110351562, -0.026455402374267578, -0.025511741638183594, -0.02456808090209961, -0.023624420166015625, -0.02268075942993164, -0.021737098693847656, -0.020793437957763672, -0.019849777221679688, -0.018906116485595703, -0.01796245574951172, -0.017018795013427734, -0.01607513427734375, -0.015131473541259766, -0.014187812805175781, -0.013244152069091797, -0.012300491333007812, -0.011356830596923828, -0.010413169860839844, -0.00946950912475586, -0.008525848388671875, -0.007582187652587891, -0.006638526916503906, -0.005694866180419922, -0.0047512054443359375, -0.003807544708251953, -0.0028638839721679688, -0.0019202232360839844, -0.0009765625, -3.2901763916015625e-05, 0.0009107589721679688, 0.0018544197082519531, 0.0027980804443359375, 0.003741741180419922, 0.004685401916503906, 0.005629062652587891, 0.006572723388671875, 0.007516384124755859, 0.008460044860839844, 0.009403705596923828, 0.010347366333007812, 0.011291027069091797, 0.012234687805175781, 0.013178348541259766, 0.01412200927734375, 0.015065670013427734, 0.01600933074951172, 0.016952991485595703, 0.017896652221679688, 0.018840312957763672, 0.019783973693847656, 0.02072763442993164, 0.021671295166015625, 0.02261495590209961, 0.023558616638183594, 0.024502277374267578, 0.025445938110351562, 0.026389598846435547, 0.02733325958251953, 0.028276920318603516, 0.0292205810546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 18.0, 20.0, 44.0, 72.0, 89.0, 116.0, 149.0, 156.0, 105.0, 93.0, 50.0, 35.0, 12.0, 9.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0282689332962036, -1.005516529083252, -0.9827641844749451, -0.9600118398666382, -0.9372594952583313, -0.9145071506500244, -0.8917547464370728, -0.8690024018287659, -0.846250057220459, -0.8234977126121521, -0.8007453083992004, -0.7779929637908936, -0.7552406191825867, -0.7324882745742798, -0.7097358703613281, -0.6869835257530212, -0.6642311811447144, -0.6414788365364075, -0.6187264323234558, -0.5959740877151489, -0.573221743106842, -0.5504693984985352, -0.5277169942855835, -0.5049646496772766, -0.48221224546432495, -0.4594598710536957, -0.4367075264453888, -0.4139551520347595, -0.39120280742645264, -0.36845043301582336, -0.3456980586051941, -0.3229457139968872, -0.30019333958625793, -0.27744096517562866, -0.2546886205673218, -0.2319362461566925, -0.20918390154838562, -0.18643152713775635, -0.16367916762828827, -0.1409268081188202, -0.11817444860935211, -0.09542208909988403, -0.07266972959041595, -0.04991736263036728, -0.0271650031208992, -0.004412643611431122, 0.018339723348617554, 0.04109208285808563, 0.06384444236755371, 0.08659680187702179, 0.10934916138648987, 0.13210153579711914, 0.15485388040542603, 0.1776062548160553, 0.20035861432552338, 0.22311097383499146, 0.24586333334445953, 0.2686156928539276, 0.2913680672645569, 0.31412041187286377, 0.33687278628349304, 0.3596251308917999, 0.3823775053024292, 0.4051298499107361, 0.42788222432136536]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 4.0, 7.0, 15.0, 11.0, 24.0, 21.0, 20.0, 32.0, 28.0, 28.0, 33.0, 36.0, 37.0, 49.0, 47.0, 55.0, 52.0, 56.0, 46.0, 56.0, 28.0, 46.0, 36.0, 41.0, 43.0, 24.0, 31.0, 23.0, 11.0, 10.0, 14.0, 9.0, 4.0, 6.0, 7.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7194504141807556, -0.6988180875778198, -0.678185760974884, -0.6575534343719482, -0.6369211077690125, -0.6162887811660767, -0.5956564545631409, -0.5750241279602051, -0.5543918013572693, -0.5337594747543335, -0.5131271481513977, -0.4924948215484619, -0.4718624949455261, -0.45123016834259033, -0.43059784173965454, -0.40996551513671875, -0.38933318853378296, -0.36870086193084717, -0.3480685353279114, -0.3274362087249756, -0.3068038821220398, -0.286171555519104, -0.2655392289161682, -0.24490690231323242, -0.22427457571029663, -0.20364224910736084, -0.18300992250442505, -0.16237759590148926, -0.14174526929855347, -0.12111294269561768, -0.10048061609268188, -0.0798482894897461, -0.0592159628868103, -0.03858363628387451, -0.01795130968093872, 0.0026810169219970703, 0.02331334352493286, 0.04394567012786865, 0.06457799673080444, 0.08521032333374023, 0.10584264993667603, 0.12647497653961182, 0.1471073031425476, 0.1677396297454834, 0.1883719563484192, 0.20900428295135498, 0.22963660955429077, 0.25026893615722656, 0.27090126276016235, 0.29153358936309814, 0.31216591596603394, 0.3327982425689697, 0.3534305691719055, 0.3740628957748413, 0.3946952223777771, 0.4153275489807129, 0.4359598755836487, 0.4565922021865845, 0.47722452878952026, 0.49785685539245605, 0.5184891819953918, 0.5391215085983276, 0.5597538352012634, 0.5803861618041992, 0.601018488407135]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 17.0, 18.0, 21.0, 35.0, 56.0, 81.0, 137.0, 205.0, 378.0, 671.0, 1187.0, 2269.0, 4569.0, 10077.0, 24645.0, 62124.0, 155652.0, 350430.0, 635717.0, 853271.0, 844392.0, 623481.0, 356575.0, 161065.0, 63784.0, 24327.0, 9877.0, 4393.0, 2125.0, 1081.0, 596.0, 383.0, 240.0, 151.0, 93.0, 56.0, 30.0, 26.0, 18.0, 12.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05841064453125, -0.056396484375, -0.05438232421875, -0.0523681640625, -0.05035400390625, -0.04833984375, -0.04632568359375, -0.0443115234375, -0.04229736328125, -0.040283203125, -0.03826904296875, -0.0362548828125, -0.03424072265625, -0.0322265625, -0.03021240234375, -0.0281982421875, -0.02618408203125, -0.024169921875, -0.02215576171875, -0.0201416015625, -0.01812744140625, -0.01611328125, -0.01409912109375, -0.0120849609375, -0.01007080078125, -0.008056640625, -0.00604248046875, -0.0040283203125, -0.00201416015625, 0.0, 0.00201416015625, 0.0040283203125, 0.00604248046875, 0.008056640625, 0.01007080078125, 0.0120849609375, 0.01409912109375, 0.01611328125, 0.01812744140625, 0.0201416015625, 0.02215576171875, 0.024169921875, 0.02618408203125, 0.0281982421875, 0.03021240234375, 0.0322265625, 0.03424072265625, 0.0362548828125, 0.03826904296875, 0.040283203125, 0.04229736328125, 0.0443115234375, 0.04632568359375, 0.04833984375, 0.05035400390625, 0.0523681640625, 0.05438232421875, 0.056396484375, 0.05841064453125, 0.0604248046875, 0.06243896484375, 0.064453125, 0.06646728515625, 0.0684814453125, 0.07049560546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 7.0, 11.0, 9.0, 13.0, 18.0, 15.0, 15.0, 29.0, 31.0, 27.0, 24.0, 25.0, 32.0, 34.0, 33.0, 38.0, 49.0, 40.0, 47.0, 39.0, 29.0, 41.0, 47.0, 33.0, 40.0, 54.0, 28.0, 38.0, 20.0, 26.0, 20.0, 18.0, 18.0, 12.0, 8.0, 4.0, 5.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.08013916015625, -0.07768726348876953, -0.07523536682128906, -0.0727834701538086, -0.07033157348632812, -0.06787967681884766, -0.06542778015136719, -0.06297588348388672, -0.06052398681640625, -0.05807209014892578, -0.05562019348144531, -0.053168296813964844, -0.050716400146484375, -0.048264503479003906, -0.04581260681152344, -0.04336071014404297, -0.0409088134765625, -0.03845691680908203, -0.03600502014160156, -0.033553123474121094, -0.031101226806640625, -0.028649330139160156, -0.026197433471679688, -0.02374553680419922, -0.02129364013671875, -0.01884174346923828, -0.016389846801757812, -0.013937950134277344, -0.011486053466796875, -0.009034156799316406, -0.0065822601318359375, -0.004130363464355469, -0.001678466796875, 0.0007734298706054688, 0.0032253265380859375, 0.005677223205566406, 0.008129119873046875, 0.010581016540527344, 0.013032913208007812, 0.015484809875488281, 0.01793670654296875, 0.02038860321044922, 0.022840499877929688, 0.025292396545410156, 0.027744293212890625, 0.030196189880371094, 0.03264808654785156, 0.03509998321533203, 0.0375518798828125, 0.04000377655029297, 0.04245567321777344, 0.044907569885253906, 0.047359466552734375, 0.049811363220214844, 0.05226325988769531, 0.05471515655517578, 0.05716705322265625, 0.05961894989013672, 0.06207084655761719, 0.06452274322509766, 0.06697463989257812, 0.0694265365600586, 0.07187843322753906, 0.07433032989501953, 0.0767822265625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 7.0, 17.0, 15.0, 28.0, 40.0, 43.0, 88.0, 98.0, 177.0, 230.0, 446.0, 735.0, 1470.0, 3264.0, 9176.0, 40608.0, 314330.0, 2697042.0, 1002407.0, 96816.0, 17536.0, 4994.0, 2026.0, 1006.0, 588.0, 372.0, 204.0, 157.0, 121.0, 62.0, 45.0, 40.0, 21.0, 22.0, 12.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15185546875, -0.14657020568847656, -0.14128494262695312, -0.1359996795654297, -0.13071441650390625, -0.1254291534423828, -0.12014389038085938, -0.11485862731933594, -0.1095733642578125, -0.10428810119628906, -0.09900283813476562, -0.09371757507324219, -0.08843231201171875, -0.08314704895019531, -0.07786178588867188, -0.07257652282714844, -0.067291259765625, -0.06200599670410156, -0.056720733642578125, -0.05143547058105469, -0.04615020751953125, -0.04086494445800781, -0.035579681396484375, -0.030294418334960938, -0.0250091552734375, -0.019723892211914062, -0.014438629150390625, -0.009153366088867188, -0.00386810302734375, 0.0014171600341796875, 0.006702423095703125, 0.011987686157226562, 0.01727294921875, 0.022558212280273438, 0.027843475341796875, 0.03312873840332031, 0.03841400146484375, 0.04369926452636719, 0.048984527587890625, 0.05426979064941406, 0.0595550537109375, 0.06484031677246094, 0.07012557983398438, 0.07541084289550781, 0.08069610595703125, 0.08598136901855469, 0.09126663208007812, 0.09655189514160156, 0.101837158203125, 0.10712242126464844, 0.11240768432617188, 0.11769294738769531, 0.12297821044921875, 0.1282634735107422, 0.13354873657226562, 0.13883399963378906, 0.1441192626953125, 0.14940452575683594, 0.15468978881835938, 0.1599750518798828, 0.16526031494140625, 0.1705455780029297, 0.17583084106445312, 0.18111610412597656, 0.1864013671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 2.0, 6.0, 5.0, 6.0, 9.0, 19.0, 18.0, 21.0, 33.0, 55.0, 77.0, 100.0, 138.0, 180.0, 251.0, 298.0, 352.0, 427.0, 416.0, 403.0, 321.0, 249.0, 189.0, 135.0, 108.0, 75.0, 48.0, 34.0, 29.0, 18.0, 10.0, 12.0, 10.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17333984375, -0.16812515258789062, -0.16291046142578125, -0.15769577026367188, -0.1524810791015625, -0.14726638793945312, -0.14205169677734375, -0.13683700561523438, -0.131622314453125, -0.12640762329101562, -0.12119293212890625, -0.11597824096679688, -0.1107635498046875, -0.10554885864257812, -0.10033416748046875, -0.09511947631835938, -0.08990478515625, -0.08469009399414062, -0.07947540283203125, -0.07426071166992188, -0.0690460205078125, -0.06383132934570312, -0.05861663818359375, -0.053401947021484375, -0.048187255859375, -0.042972564697265625, -0.03775787353515625, -0.032543182373046875, -0.0273284912109375, -0.022113800048828125, -0.01689910888671875, -0.011684417724609375, -0.0064697265625, -0.001255035400390625, 0.00395965576171875, 0.009174346923828125, 0.0143890380859375, 0.019603729248046875, 0.02481842041015625, 0.030033111572265625, 0.035247802734375, 0.040462493896484375, 0.04567718505859375, 0.050891876220703125, 0.0561065673828125, 0.061321258544921875, 0.06653594970703125, 0.07175064086914062, 0.07696533203125, 0.08218002319335938, 0.08739471435546875, 0.09260940551757812, 0.0978240966796875, 0.10303878784179688, 0.10825347900390625, 0.11346817016601562, 0.118682861328125, 0.12389755249023438, 0.12911224365234375, 0.13432693481445312, 0.1395416259765625, 0.14475631713867188, 0.14997100830078125, 0.15518569946289062, 0.160400390625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 4.0, 4.0, 9.0, 19.0, 15.0, 27.0, 50.0, 60.0, 74.0, 82.0, 102.0, 107.0, 88.0, 97.0, 73.0, 50.0, 42.0, 17.0, 16.0, 19.0, 15.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0907734632492065, -1.0485775470733643, -1.0063815116882324, -0.9641855359077454, -0.9219895601272583, -0.8797935843467712, -0.8375976085662842, -0.7954016327857971, -0.7532056570053101, -0.711009681224823, -0.6688137054443359, -0.6266177296638489, -0.5844217538833618, -0.5422257781028748, -0.5000298023223877, -0.45783382654190063, -0.4156378507614136, -0.3734418749809265, -0.33124589920043945, -0.2890499234199524, -0.24685394763946533, -0.20465797185897827, -0.1624619960784912, -0.12026602029800415, -0.07807004451751709, -0.03587406873703003, 0.006321907043457031, 0.04851788282394409, 0.09071385860443115, 0.1329098343849182, 0.17510581016540527, 0.21730178594589233, 0.25949788093566895, 0.301693856716156, 0.34388983249664307, 0.3860858082771301, 0.4282817840576172, 0.47047775983810425, 0.5126737356185913, 0.5548697113990784, 0.5970656871795654, 0.6392616629600525, 0.6814576387405396, 0.7236536145210266, 0.7658495903015137, 0.8080455660820007, 0.8502415418624878, 0.8924375176429749, 0.9346334934234619, 0.976829469203949, 1.019025444984436, 1.0612213611602783, 1.1034173965454102, 1.145613431930542, 1.1878093481063843, 1.2300052642822266, 1.2722012996673584, 1.3143973350524902, 1.3565932512283325, 1.3987891674041748, 1.4409852027893066, 1.4831812381744385, 1.5253771543502808, 1.567573070526123, 1.6097691059112549]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 5.0, 9.0, 9.0, 22.0, 17.0, 28.0, 35.0, 34.0, 43.0, 55.0, 44.0, 55.0, 69.0, 52.0, 69.0, 54.0, 49.0, 57.0, 46.0, 50.0, 37.0, 29.0, 36.0, 27.0, 25.0, 12.0, 10.0, 5.0, 8.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0028741359710693, -0.9743561148643494, -0.9458381533622742, -0.9173201322555542, -0.8888021111488342, -0.8602840900421143, -0.8317661285400391, -0.8032481074333191, -0.7747300863265991, -0.7462120652198792, -0.717694103717804, -0.689176082611084, -0.660658061504364, -0.632140040397644, -0.6036220788955688, -0.5751040577888489, -0.5465860962867737, -0.5180680751800537, -0.48955008387565613, -0.46103209257125854, -0.4325140714645386, -0.403996080160141, -0.3754780888557434, -0.34696006774902344, -0.31844207644462585, -0.28992408514022827, -0.2614060640335083, -0.23288807272911072, -0.20437006652355194, -0.17585206031799316, -0.14733406901359558, -0.1188160628080368, -0.09029799699783325, -0.061779994517564774, -0.033261992037296295, -0.004743993282318115, 0.02377401292324066, 0.05229201912879944, 0.08081001043319702, 0.1093280166387558, 0.13784602284431458, 0.16636402904987335, 0.19488203525543213, 0.2234000265598297, 0.2519180178642273, 0.28043603897094727, 0.30895403027534485, 0.33747202157974243, 0.3659900426864624, 0.39450803399086, 0.42302605509757996, 0.45154404640197754, 0.4800620675086975, 0.5085800886154175, 0.5370980501174927, 0.5656160712242126, 0.5941340923309326, 0.6226521134376526, 0.6511700749397278, 0.6796880960464478, 0.7082061171531677, 0.7367241382598877, 0.7652420997619629, 0.7937601208686829, 0.8222780823707581]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 16.0, 22.0, 35.0, 36.0, 52.0, 106.0, 153.0, 229.0, 399.0, 717.0, 1345.0, 2747.0, 6250.0, 16368.0, 49779.0, 184742.0, 481328.0, 216186.0, 57029.0, 17919.0, 6792.0, 2984.0, 1412.0, 767.0, 453.0, 275.0, 145.0, 88.0, 62.0, 37.0, 25.0, 20.0, 13.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.12373828887939453, -0.12015724182128906, -0.1165761947631836, -0.11299514770507812, -0.10941410064697266, -0.10583305358886719, -0.10225200653076172, -0.09867095947265625, -0.09508991241455078, -0.09150886535644531, -0.08792781829833984, -0.08434677124023438, -0.0807657241821289, -0.07718467712402344, -0.07360363006591797, -0.0700225830078125, -0.06644153594970703, -0.06286048889160156, -0.059279441833496094, -0.055698394775390625, -0.052117347717285156, -0.04853630065917969, -0.04495525360107422, -0.04137420654296875, -0.03779315948486328, -0.03421211242675781, -0.030631065368652344, -0.027050018310546875, -0.023468971252441406, -0.019887924194335938, -0.01630687713623047, -0.012725830078125, -0.009144783020019531, -0.0055637359619140625, -0.0019826889038085938, 0.001598358154296875, 0.005179405212402344, 0.008760452270507812, 0.012341499328613281, 0.01592254638671875, 0.01950359344482422, 0.023084640502929688, 0.026665687561035156, 0.030246734619140625, 0.033827781677246094, 0.03740882873535156, 0.04098987579345703, 0.0445709228515625, 0.04815196990966797, 0.05173301696777344, 0.055314064025878906, 0.058895111083984375, 0.062476158142089844, 0.06605720520019531, 0.06963825225830078, 0.07321929931640625, 0.07680034637451172, 0.08038139343261719, 0.08396244049072266, 0.08754348754882812, 0.0911245346069336, 0.09470558166503906, 0.09828662872314453, 0.10186767578125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 4.0, 2.0, 2.0, 7.0, 2.0, 4.0, 10.0, 21.0, 13.0, 15.0, 22.0, 24.0, 30.0, 22.0, 31.0, 40.0, 41.0, 41.0, 38.0, 59.0, 62.0, 55.0, 47.0, 49.0, 47.0, 61.0, 44.0, 30.0, 43.0, 25.0, 19.0, 19.0, 17.0, 15.0, 15.0, 6.0, 6.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12493896484375, -0.12124156951904297, -0.11754417419433594, -0.1138467788696289, -0.11014938354492188, -0.10645198822021484, -0.10275459289550781, -0.09905719757080078, -0.09535980224609375, -0.09166240692138672, -0.08796501159667969, -0.08426761627197266, -0.08057022094726562, -0.0768728256225586, -0.07317543029785156, -0.06947803497314453, -0.0657806396484375, -0.06208324432373047, -0.05838584899902344, -0.054688453674316406, -0.050991058349609375, -0.047293663024902344, -0.04359626770019531, -0.03989887237548828, -0.03620147705078125, -0.03250408172607422, -0.028806686401367188, -0.025109291076660156, -0.021411895751953125, -0.017714500427246094, -0.014017105102539062, -0.010319709777832031, -0.006622314453125, -0.0029249191284179688, 0.0007724761962890625, 0.004469871520996094, 0.008167266845703125, 0.011864662170410156, 0.015562057495117188, 0.01925945281982422, 0.02295684814453125, 0.02665424346923828, 0.030351638793945312, 0.034049034118652344, 0.037746429443359375, 0.041443824768066406, 0.04514122009277344, 0.04883861541748047, 0.0525360107421875, 0.05623340606689453, 0.05993080139160156, 0.0636281967163086, 0.06732559204101562, 0.07102298736572266, 0.07472038269042969, 0.07841777801513672, 0.08211517333984375, 0.08581256866455078, 0.08950996398925781, 0.09320735931396484, 0.09690475463867188, 0.1006021499633789, 0.10429954528808594, 0.10799694061279297, 0.1116943359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 5.0, 11.0, 24.0, 28.0, 54.0, 84.0, 127.0, 244.0, 425.0, 841.0, 1755.0, 4290.0, 12424.0, 41357.0, 171434.0, 558907.0, 189180.0, 44940.0, 13498.0, 4826.0, 2017.0, 969.0, 465.0, 259.0, 129.0, 86.0, 58.0, 38.0, 22.0, 18.0, 9.0, 11.0, 4.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09112548828125, -0.08823585510253906, -0.08534622192382812, -0.08245658874511719, -0.07956695556640625, -0.07667732238769531, -0.07378768920898438, -0.07089805603027344, -0.0680084228515625, -0.06511878967285156, -0.062229156494140625, -0.05933952331542969, -0.05644989013671875, -0.05356025695800781, -0.050670623779296875, -0.04778099060058594, -0.044891357421875, -0.04200172424316406, -0.039112091064453125, -0.03622245788574219, -0.03333282470703125, -0.030443191528320312, -0.027553558349609375, -0.024663925170898438, -0.0217742919921875, -0.018884658813476562, -0.015995025634765625, -0.013105392456054688, -0.01021575927734375, -0.0073261260986328125, -0.004436492919921875, -0.0015468597412109375, 0.0013427734375, 0.0042324066162109375, 0.007122039794921875, 0.010011672973632812, 0.01290130615234375, 0.015790939331054688, 0.018680572509765625, 0.021570205688476562, 0.0244598388671875, 0.027349472045898438, 0.030239105224609375, 0.03312873840332031, 0.03601837158203125, 0.03890800476074219, 0.041797637939453125, 0.04468727111816406, 0.047576904296875, 0.05046653747558594, 0.053356170654296875, 0.05624580383300781, 0.05913543701171875, 0.06202507019042969, 0.06491470336914062, 0.06780433654785156, 0.0706939697265625, 0.07358360290527344, 0.07647323608398438, 0.07936286926269531, 0.08225250244140625, 0.08514213562011719, 0.08803176879882812, 0.09092140197753906, 0.09381103515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 5.0, 11.0, 8.0, 20.0, 18.0, 23.0, 28.0, 33.0, 44.0, 48.0, 53.0, 68.0, 72.0, 71.0, 85.0, 63.0, 64.0, 59.0, 39.0, 41.0, 24.0, 24.0, 29.0, 14.0, 12.0, 8.0, 7.0, 6.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.34521484375, -0.3358421325683594, -0.32646942138671875, -0.3170967102050781, -0.3077239990234375, -0.2983512878417969, -0.28897857666015625, -0.2796058654785156, -0.270233154296875, -0.2608604431152344, -0.25148773193359375, -0.24211502075195312, -0.2327423095703125, -0.22336959838867188, -0.21399688720703125, -0.20462417602539062, -0.19525146484375, -0.18587875366210938, -0.17650604248046875, -0.16713333129882812, -0.1577606201171875, -0.14838790893554688, -0.13901519775390625, -0.12964248657226562, -0.120269775390625, -0.11089706420898438, -0.10152435302734375, -0.09215164184570312, -0.0827789306640625, -0.07340621948242188, -0.06403350830078125, -0.054660797119140625, -0.0452880859375, -0.035915374755859375, -0.02654266357421875, -0.017169952392578125, -0.0077972412109375, 0.001575469970703125, 0.01094818115234375, 0.020320892333984375, 0.029693603515625, 0.039066314697265625, 0.04843902587890625, 0.057811737060546875, 0.0671844482421875, 0.07655715942382812, 0.08592987060546875, 0.09530258178710938, 0.10467529296875, 0.11404800415039062, 0.12342071533203125, 0.13279342651367188, 0.1421661376953125, 0.15153884887695312, 0.16091156005859375, 0.17028427124023438, 0.179656982421875, 0.18902969360351562, 0.19840240478515625, 0.20777511596679688, 0.2171478271484375, 0.22652053833007812, 0.23589324951171875, 0.24526596069335938, 0.254638671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 4.0, 11.0, 9.0, 12.0, 18.0, 24.0, 46.0, 45.0, 78.0, 162.0, 259.0, 510.0, 1133.0, 4464.0, 37822.0, 667974.0, 311798.0, 19216.0, 2955.0, 930.0, 390.0, 197.0, 153.0, 104.0, 52.0, 49.0, 35.0, 28.0, 19.0, 3.0, 10.0, 6.0, 3.0, 6.0, 5.0, 2.0, 8.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03643798828125, -0.03525733947753906, -0.034076690673828125, -0.03289604187011719, -0.03171539306640625, -0.030534744262695312, -0.029354095458984375, -0.028173446655273438, -0.0269927978515625, -0.025812149047851562, -0.024631500244140625, -0.023450851440429688, -0.02227020263671875, -0.021089553833007812, -0.019908905029296875, -0.018728256225585938, -0.017547607421875, -0.016366958618164062, -0.015186309814453125, -0.014005661010742188, -0.01282501220703125, -0.011644363403320312, -0.010463714599609375, -0.009283065795898438, -0.0081024169921875, -0.0069217681884765625, -0.005741119384765625, -0.0045604705810546875, -0.00337982177734375, -0.0021991729736328125, -0.001018524169921875, 0.0001621246337890625, 0.0013427734375, 0.0025234222412109375, 0.003704071044921875, 0.0048847198486328125, 0.00606536865234375, 0.0072460174560546875, 0.008426666259765625, 0.009607315063476562, 0.0107879638671875, 0.011968612670898438, 0.013149261474609375, 0.014329910278320312, 0.01551055908203125, 0.016691207885742188, 0.017871856689453125, 0.019052505493164062, 0.020233154296875, 0.021413803100585938, 0.022594451904296875, 0.023775100708007812, 0.02495574951171875, 0.026136398315429688, 0.027317047119140625, 0.028497695922851562, 0.0296783447265625, 0.030858993530273438, 0.032039642333984375, 0.03322029113769531, 0.03440093994140625, 0.03558158874511719, 0.036762237548828125, 0.03794288635253906, 0.03912353515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 8.0, 6.0, 9.0, 7.0, 13.0, 19.0, 16.0, 17.0, 28.0, 33.0, 29.0, 27.0, 55.0, 55.0, 60.0, 52.0, 63.0, 79.0, 40.0, 50.0, 71.0, 44.0, 27.0, 36.0, 34.0, 20.0, 10.0, 13.0, 14.0, 11.0, 5.0, 4.0, 6.0, 2.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-7.092952728271484e-06, -6.870366632938385e-06, -6.647780537605286e-06, -6.425194442272186e-06, -6.202608346939087e-06, -5.9800222516059875e-06, -5.757436156272888e-06, -5.534850060939789e-06, -5.3122639656066895e-06, -5.08967787027359e-06, -4.867091774940491e-06, -4.644505679607391e-06, -4.421919584274292e-06, -4.199333488941193e-06, -3.976747393608093e-06, -3.754161298274994e-06, -3.5315752029418945e-06, -3.308989107608795e-06, -3.086403012275696e-06, -2.8638169169425964e-06, -2.641230821609497e-06, -2.4186447262763977e-06, -2.1960586309432983e-06, -1.973472535610199e-06, -1.7508864402770996e-06, -1.5283003449440002e-06, -1.3057142496109009e-06, -1.0831281542778015e-06, -8.605420589447021e-07, -6.379559636116028e-07, -4.153698682785034e-07, -1.9278377294540405e-07, 2.9802322387695312e-08, 2.523884177207947e-07, 4.7497451305389404e-07, 6.975606083869934e-07, 9.201467037200928e-07, 1.1427327990531921e-06, 1.3653188943862915e-06, 1.5879049897193909e-06, 1.8104910850524902e-06, 2.0330771803855896e-06, 2.255663275718689e-06, 2.4782493710517883e-06, 2.7008354663848877e-06, 2.923421561717987e-06, 3.1460076570510864e-06, 3.368593752384186e-06, 3.591179847717285e-06, 3.8137659430503845e-06, 4.036352038383484e-06, 4.258938133716583e-06, 4.481524229049683e-06, 4.704110324382782e-06, 4.926696419715881e-06, 5.149282515048981e-06, 5.37186861038208e-06, 5.5944547057151794e-06, 5.817040801048279e-06, 6.039626896381378e-06, 6.2622129917144775e-06, 6.484799087047577e-06, 6.707385182380676e-06, 6.929971277713776e-06, 7.152557373046875e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 7.0, 10.0, 15.0, 21.0, 25.0, 33.0, 41.0, 83.0, 117.0, 156.0, 233.0, 429.0, 981.0, 2803.0, 11980.0, 73585.0, 589086.0, 316985.0, 40605.0, 7426.0, 1981.0, 792.0, 349.0, 240.0, 173.0, 113.0, 61.0, 57.0, 45.0, 26.0, 21.0, 22.0, 8.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03497314453125, -0.033997535705566406, -0.03302192687988281, -0.03204631805419922, -0.031070709228515625, -0.03009510040283203, -0.029119491577148438, -0.028143882751464844, -0.02716827392578125, -0.026192665100097656, -0.025217056274414062, -0.02424144744873047, -0.023265838623046875, -0.02229022979736328, -0.021314620971679688, -0.020339012145996094, -0.0193634033203125, -0.018387794494628906, -0.017412185668945312, -0.01643657684326172, -0.015460968017578125, -0.014485359191894531, -0.013509750366210938, -0.012534141540527344, -0.01155853271484375, -0.010582923889160156, -0.009607315063476562, -0.008631706237792969, -0.007656097412109375, -0.006680488586425781, -0.0057048797607421875, -0.004729270935058594, -0.003753662109375, -0.0027780532836914062, -0.0018024444580078125, -0.0008268356323242188, 0.000148773193359375, 0.0011243820190429688, 0.0020999908447265625, 0.0030755996704101562, 0.00405120849609375, 0.005026817321777344, 0.0060024261474609375, 0.006978034973144531, 0.007953643798828125, 0.008929252624511719, 0.009904861450195312, 0.010880470275878906, 0.0118560791015625, 0.012831687927246094, 0.013807296752929688, 0.014782905578613281, 0.015758514404296875, 0.01673412322998047, 0.017709732055664062, 0.018685340881347656, 0.01966094970703125, 0.020636558532714844, 0.021612167358398438, 0.02258777618408203, 0.023563385009765625, 0.02453899383544922, 0.025514602661132812, 0.026490211486816406, 0.0274658203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 18.0, 36.0, 63.0, 93.0, 139.0, 154.0, 167.0, 122.0, 76.0, 58.0, 21.0, 16.0, 13.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07470703125, -0.07283258438110352, -0.07095813751220703, -0.06908369064331055, -0.06720924377441406, -0.06533479690551758, -0.0634603500366211, -0.06158590316772461, -0.059711456298828125, -0.05783700942993164, -0.055962562561035156, -0.05408811569213867, -0.05221366882324219, -0.0503392219543457, -0.04846477508544922, -0.046590328216552734, -0.04471588134765625, -0.042841434478759766, -0.04096698760986328, -0.0390925407409668, -0.03721809387207031, -0.03534364700317383, -0.033469200134277344, -0.03159475326538086, -0.029720306396484375, -0.02784585952758789, -0.025971412658691406, -0.024096965789794922, -0.022222518920898438, -0.020348072052001953, -0.01847362518310547, -0.016599178314208984, -0.0147247314453125, -0.012850284576416016, -0.010975837707519531, -0.009101390838623047, -0.0072269439697265625, -0.005352497100830078, -0.0034780502319335938, -0.0016036033630371094, 0.000270843505859375, 0.0021452903747558594, 0.004019737243652344, 0.005894184112548828, 0.0077686309814453125, 0.009643077850341797, 0.011517524719238281, 0.013391971588134766, 0.01526641845703125, 0.017140865325927734, 0.01901531219482422, 0.020889759063720703, 0.022764205932617188, 0.024638652801513672, 0.026513099670410156, 0.02838754653930664, 0.030261993408203125, 0.03213644027709961, 0.034010887145996094, 0.03588533401489258, 0.03775978088378906, 0.03963422775268555, 0.04150867462158203, 0.043383121490478516, 0.045257568359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 1.0, 5.0, 6.0, 8.0, 11.0, 19.0, 23.0, 29.0, 53.0, 83.0, 107.0, 160.0, 163.0, 110.0, 81.0, 39.0, 28.0, 25.0, 13.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8822153210639954, -0.8621003031730652, -0.8419852256774902, -0.8218702077865601, -0.8017551898956299, -0.7816401720046997, -0.7615251541137695, -0.7414100766181946, -0.7212950587272644, -0.7011800408363342, -0.6810649633407593, -0.6609499454498291, -0.6408349275588989, -0.6207199096679688, -0.6006048917770386, -0.5804898142814636, -0.5603747963905334, -0.5402597784996033, -0.5201447010040283, -0.5000296831130981, -0.47991466522216797, -0.4597996473312378, -0.43968459963798523, -0.41956955194473267, -0.3994545340538025, -0.3793395161628723, -0.35922446846961975, -0.3391094207763672, -0.318994402885437, -0.29887938499450684, -0.2787643373012543, -0.2586492896080017, -0.23853430151939392, -0.21841926872730255, -0.19830423593521118, -0.1781892031431198, -0.15807417035102844, -0.13795913755893707, -0.1178441047668457, -0.09772907197475433, -0.07761403918266296, -0.057499006390571594, -0.037383973598480225, -0.017268940806388855, 0.0028460919857025146, 0.022961124777793884, 0.043076157569885254, 0.06319119036197662, 0.083306223154068, 0.10342125594615936, 0.12353628873825073, 0.1436513215303421, 0.16376635432243347, 0.18388138711452484, 0.2039964199066162, 0.22411145269870758, 0.24422648549079895, 0.2643415331840515, 0.2844565510749817, 0.30457156896591187, 0.32468661665916443, 0.344801664352417, 0.36491668224334717, 0.38503170013427734, 0.4051467478275299]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 20.0, 25.0, 45.0, 49.0, 62.0, 74.0, 92.0, 159.0, 134.0, 76.0, 68.0, 65.0, 35.0, 37.0, 20.0, 17.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-1.9915807247161865, -1.9508219957351685, -1.91006338596344, -1.8693046569824219, -1.8285460472106934, -1.7877873182296753, -1.7470287084579468, -1.7062699794769287, -1.6655113697052002, -1.6247526407241821, -1.5839940309524536, -1.5432353019714355, -1.502476692199707, -1.461717963218689, -1.4209593534469604, -1.3802006244659424, -1.3394418954849243, -1.2986831665039062, -1.2579245567321777, -1.2171658277511597, -1.1764072179794312, -1.135648488998413, -1.0948898792266846, -1.0541311502456665, -1.0133724212646484, -0.9726137518882751, -0.9318550825119019, -0.8910964131355286, -0.8503377437591553, -0.8095790147781372, -0.7688203454017639, -0.7280616760253906, -0.6873030066490173, -0.646544337272644, -0.6057856678962708, -0.5650269985198975, -0.5242682695388794, -0.4835096299648285, -0.4427509307861328, -0.4019922614097595, -0.36123359203338623, -0.32047492265701294, -0.27971625328063965, -0.23895755410194397, -0.19819888472557068, -0.1574402153491974, -0.1166815310716629, -0.07592284679412842, -0.03516417741775513, 0.005594499409198761, 0.04635317623615265, 0.08711185306310654, 0.12787052989006042, 0.16862919926643372, 0.2093878835439682, 0.2501465678215027, 0.290905237197876, 0.33166390657424927, 0.37242257595062256, 0.41318127512931824, 0.45393994450569153, 0.4946986138820648, 0.5354573130607605, 0.5762159824371338, 0.6169746518135071]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 7.0, 14.0, 9.0, 23.0, 28.0, 36.0, 48.0, 71.0, 371.0, 158.0, 57.0, 59.0, 33.0, 23.0, 10.0, 17.0, 13.0, 10.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.32177734375, -0.3144245147705078, -0.3070716857910156, -0.29971885681152344, -0.29236602783203125, -0.28501319885253906, -0.2776603698730469, -0.2703075408935547, -0.2629547119140625, -0.2556018829345703, -0.24824905395507812, -0.24089622497558594, -0.23354339599609375, -0.22619056701660156, -0.21883773803710938, -0.2114849090576172, -0.204132080078125, -0.1967792510986328, -0.18942642211914062, -0.18207359313964844, -0.17472076416015625, -0.16736793518066406, -0.16001510620117188, -0.1526622772216797, -0.1453094482421875, -0.1379566192626953, -0.13060379028320312, -0.12325096130371094, -0.11589813232421875, -0.10854530334472656, -0.10119247436523438, -0.09383964538574219, -0.08648681640625, -0.07913398742675781, -0.07178115844726562, -0.06442832946777344, -0.05707550048828125, -0.04972267150878906, -0.042369842529296875, -0.03501701354980469, -0.0276641845703125, -0.020311355590820312, -0.012958526611328125, -0.0056056976318359375, 0.00174713134765625, 0.009099960327148438, 0.016452789306640625, 0.023805618286132812, 0.031158447265625, 0.03851127624511719, 0.045864105224609375, 0.05321693420410156, 0.06056976318359375, 0.06792259216308594, 0.07527542114257812, 0.08262825012207031, 0.0899810791015625, 0.09733390808105469, 0.10468673706054688, 0.11203956604003906, 0.11939239501953125, 0.12674522399902344, 0.13409805297851562, 0.1414508819580078, 0.1488037109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 2.0, 5.0, 3.0, 9.0, 9.0, 11.0, 15.0, 18.0, 17.0, 39.0, 44.0, 67.0, 107.0, 142.0, 229.0, 404.0, 884.0, 2164.0, 6294.0, 28903.0, 8287369.0, 49596.0, 7760.0, 2496.0, 940.0, 405.0, 238.0, 146.0, 101.0, 49.0, 39.0, 27.0, 12.0, 11.0, 12.0, 3.0, 8.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.46612322330474854, -0.45372939109802246, -0.441335529088974, -0.4289416968822479, -0.41654783487319946, -0.4041540026664734, -0.3917601406574249, -0.37936630845069885, -0.3669724464416504, -0.3545786142349243, -0.34218475222587585, -0.3297909200191498, -0.3173970580101013, -0.30500322580337524, -0.2926093637943268, -0.2802155315876007, -0.26782166957855225, -0.25542783737182617, -0.2430339753627777, -0.23064012825489044, -0.21824628114700317, -0.2058524340391159, -0.19345858693122864, -0.18106475472450256, -0.1686709225177765, -0.15627707540988922, -0.14388322830200195, -0.13148938119411469, -0.11909553408622742, -0.10670168697834015, -0.09430784732103348, -0.08191400021314621, -0.06952014565467834, -0.05712629854679108, -0.04473245143890381, -0.03233860805630684, -0.01994476094841957, -0.007550913840532303, 0.004842929542064667, 0.017236776649951935, 0.029630623757839203, 0.04202447086572647, 0.05441831797361374, 0.06681215763092041, 0.07920600473880768, 0.09159985184669495, 0.10399369895458221, 0.11638754606246948, 0.12878139317035675, 0.14117524027824402, 0.1535690873861313, 0.16596293449401855, 0.17835678160190582, 0.1907506287097931, 0.20314446091651917, 0.21553832292556763, 0.2279321551322937, 0.24032600224018097, 0.25271984934806824, 0.2651136815547943, 0.2775075435638428, 0.28990137577056885, 0.3022952377796173, 0.3146890699863434, 0.32708293199539185]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 7.0, 1.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 2.0, 6.0, 2.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5263785719871521, -0.5044112205505371, -0.4824438691139221, -0.4604765474796295, -0.4385091960430145, -0.41654184460639954, -0.39457452297210693, -0.37260717153549194, -0.35063982009887695, -0.32867246866226196, -0.306705117225647, -0.28473779559135437, -0.2627704441547394, -0.2408030927181244, -0.2188357561826706, -0.1968684196472168, -0.1749010682106018, -0.15293371677398682, -0.13096638023853302, -0.10899903625249863, -0.08703169226646423, -0.06506434828042984, -0.04309700429439545, -0.02112966775894165, 0.0008376836776733398, 0.022805027663707733, 0.044772371649742126, 0.06673971563577652, 0.08870705962181091, 0.1106744036078453, 0.1326417475938797, 0.1546090841293335, 0.1765763759613037, 0.1985437273979187, 0.2205110639333725, 0.2424784004688263, 0.2644457519054413, 0.2864131033420563, 0.3083804249763489, 0.33034777641296387, 0.35231512784957886, 0.37428247928619385, 0.39624983072280884, 0.41821715235710144, 0.44018450379371643, 0.4621518552303314, 0.484119176864624, 0.506086528301239, 0.528053879737854, 0.550021231174469, 0.571988582611084, 0.593955934047699, 0.615923285484314, 0.6378905773162842, 0.6598579287528992, 0.6818252801895142, 0.7037926316261292, 0.7257599830627441, 0.7477273344993591, 0.7696946859359741, 0.7916619777679443, 0.8136293292045593, 0.8355966806411743, 0.8575640320777893, 0.8795313835144043]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 13.0, 6.0, 26.0, 27.0, 33.0, 44.0, 48.0, 60.0, 62.0, 76.0, 88.0, 85.0, 68.0, 74.0, 48.0, 55.0, 62.0, 22.0, 35.0, 19.0, 9.0, 7.0, 9.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1063232421875, -0.10365676879882812, -0.10099029541015625, -0.09832382202148438, -0.0956573486328125, -0.09299087524414062, -0.09032440185546875, -0.08765792846679688, -0.084991455078125, -0.08232498168945312, -0.07965850830078125, -0.07699203491210938, -0.0743255615234375, -0.07165908813476562, -0.06899261474609375, -0.06632614135742188, -0.06365966796875, -0.060993194580078125, -0.05832672119140625, -0.055660247802734375, -0.0529937744140625, -0.050327301025390625, -0.04766082763671875, -0.044994354248046875, -0.042327880859375, -0.039661407470703125, -0.03699493408203125, -0.034328460693359375, -0.0316619873046875, -0.028995513916015625, -0.02632904052734375, -0.023662567138671875, -0.02099609375, -0.018329620361328125, -0.01566314697265625, -0.012996673583984375, -0.0103302001953125, -0.007663726806640625, -0.00499725341796875, -0.002330780029296875, 0.000335693359375, 0.003002166748046875, 0.00566864013671875, 0.008335113525390625, 0.0110015869140625, 0.013668060302734375, 0.01633453369140625, 0.019001007080078125, 0.02166748046875, 0.024333953857421875, 0.02700042724609375, 0.029666900634765625, 0.0323333740234375, 0.034999847412109375, 0.03766632080078125, 0.040332794189453125, 0.042999267578125, 0.045665740966796875, 0.04833221435546875, 0.050998687744140625, 0.0536651611328125, 0.056331634521484375, 0.05899810791015625, 0.061664581298828125, 0.0643310546875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 3.0, 3.0, 3.0, 19.0, 8.0, 19.0, 16.0, 36.0, 44.0, 57.0, 81.0, 133.0, 237.0, 380.0, 715.0, 1444.0, 2792.0, 5808.0, 12963.0, 34562.0, 129702.0, 227963.0, 67847.0, 21796.0, 9016.0, 4078.0, 2018.0, 1086.0, 551.0, 318.0, 182.0, 115.0, 82.0, 53.0, 30.0, 27.0, 22.0, 12.0, 16.0, 5.0, 6.0, 5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.181671142578125, -1.14263916015625, -1.103607177734375, -1.0645751953125, -1.025543212890625, -0.98651123046875, -0.947479248046875, -0.908447265625, -0.869415283203125, -0.83038330078125, -0.791351318359375, -0.7523193359375, -0.713287353515625, -0.67425537109375, -0.635223388671875, -0.59619140625, -0.557159423828125, -0.51812744140625, -0.479095458984375, -0.4400634765625, -0.401031494140625, -0.36199951171875, -0.322967529296875, -0.283935546875, -0.244903564453125, -0.20587158203125, -0.166839599609375, -0.1278076171875, -0.088775634765625, -0.04974365234375, -0.010711669921875, 0.0283203125, 0.067352294921875, 0.10638427734375, 0.145416259765625, 0.1844482421875, 0.223480224609375, 0.26251220703125, 0.301544189453125, 0.340576171875, 0.379608154296875, 0.41864013671875, 0.457672119140625, 0.4967041015625, 0.535736083984375, 0.57476806640625, 0.613800048828125, 0.65283203125, 0.691864013671875, 0.73089599609375, 0.769927978515625, 0.8089599609375, 0.847991943359375, 0.88702392578125, 0.926055908203125, 0.965087890625, 1.004119873046875, 1.04315185546875, 1.082183837890625, 1.1212158203125, 1.160247802734375, 1.19927978515625, 1.238311767578125, 1.27734375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 3.0, 5.0, 9.0, 9.0, 12.0, 9.0, 26.0, 18.0, 17.0, 29.0, 27.0, 33.0, 37.0, 32.0, 44.0, 46.0, 40.0, 55.0, 53.0, 56.0, 57.0, 53.0, 46.0, 48.0, 43.0, 36.0, 30.0, 24.0, 19.0, 14.0, 16.0, 10.0, 6.0, 12.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0997314453125, -0.0966501235961914, -0.09356880187988281, -0.09048748016357422, -0.08740615844726562, -0.08432483673095703, -0.08124351501464844, -0.07816219329833984, -0.07508087158203125, -0.07199954986572266, -0.06891822814941406, -0.06583690643310547, -0.06275558471679688, -0.05967426300048828, -0.05659294128417969, -0.053511619567871094, -0.0504302978515625, -0.047348976135253906, -0.04426765441894531, -0.04118633270263672, -0.038105010986328125, -0.03502368927001953, -0.03194236755371094, -0.028861045837402344, -0.02577972412109375, -0.022698402404785156, -0.019617080688476562, -0.01653575897216797, -0.013454437255859375, -0.010373115539550781, -0.0072917938232421875, -0.004210472106933594, -0.001129150390625, 0.0019521713256835938, 0.0050334930419921875, 0.008114814758300781, 0.011196136474609375, 0.014277458190917969, 0.017358779907226562, 0.020440101623535156, 0.02352142333984375, 0.026602745056152344, 0.029684066772460938, 0.03276538848876953, 0.035846710205078125, 0.03892803192138672, 0.04200935363769531, 0.045090675354003906, 0.0481719970703125, 0.051253318786621094, 0.05433464050292969, 0.05741596221923828, 0.060497283935546875, 0.06357860565185547, 0.06665992736816406, 0.06974124908447266, 0.07282257080078125, 0.07590389251708984, 0.07898521423339844, 0.08206653594970703, 0.08514785766601562, 0.08822917938232422, 0.09131050109863281, 0.0943918228149414, 0.09747314453125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 9.0, 11.0, 14.0, 32.0, 42.0, 55.0, 77.0, 66.0, 48.0, 32.0, 32.0, 16.0, 11.0, 7.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3021215796470642, -0.29052022099494934, -0.2789188623428345, -0.2673175036907196, -0.25571614503860474, -0.24411478638648987, -0.232513427734375, -0.22091206908226013, -0.20931071043014526, -0.1977093517780304, -0.18610799312591553, -0.17450663447380066, -0.1629052758216858, -0.15130391716957092, -0.13970255851745605, -0.1281011998653412, -0.11649984121322632, -0.10489848256111145, -0.09329712390899658, -0.08169576525688171, -0.07009440660476685, -0.05849304795265198, -0.04689168930053711, -0.03529033064842224, -0.023688971996307373, -0.012087613344192505, -0.0004862546920776367, 0.011115103960037231, 0.0227164626121521, 0.03431782126426697, 0.045919179916381836, 0.057520538568496704, 0.06912189722061157, 0.08072325587272644, 0.09232461452484131, 0.10392597317695618, 0.11552733182907104, 0.1271286904811859, 0.13873004913330078, 0.15033140778541565, 0.16193276643753052, 0.17353412508964539, 0.18513548374176025, 0.19673684239387512, 0.20833820104599, 0.21993955969810486, 0.23154091835021973, 0.2431422770023346, 0.25474363565444946, 0.26634499430656433, 0.2779463529586792, 0.28954771161079407, 0.30114907026290894, 0.3127504289150238, 0.32435178756713867, 0.33595314621925354, 0.3475545048713684, 0.3591558635234833, 0.37075722217559814, 0.382358580827713, 0.3939599394798279, 0.40556129813194275, 0.4171626567840576, 0.4287640154361725, 0.44036537408828735]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 6.0, 8.0, 8.0, 6.0, 2.0, 4.0, 7.0, 14.0, 16.0, 60.0, 107.0, 83.0, 35.0, 17.0, 9.0, 14.0, 9.0, 9.0, 8.0, 10.0, 4.0, 8.0, 3.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3772903084754944, -0.3655451238155365, -0.3537999391555786, -0.3420547544956207, -0.33030956983566284, -0.31856435537338257, -0.30681920051574707, -0.2950739860534668, -0.2833288013935089, -0.271583616733551, -0.25983843207359314, -0.24809324741363525, -0.23634804785251617, -0.2246028631925583, -0.2128576785326004, -0.20111247897148132, -0.18936730921268463, -0.17762212455272675, -0.16587693989276886, -0.15413174033164978, -0.1423865556716919, -0.130641371011734, -0.11889618635177612, -0.10715099424123764, -0.09540580958127975, -0.08366062492132187, -0.07191543281078339, -0.0601702481508255, -0.048425059765577316, -0.03667987138032913, -0.024934686720371246, -0.013189494609832764, -0.001444309949874878, 0.010300877504050732, 0.02204606495797634, 0.033791251480579376, 0.04553643986582756, 0.057281628251075745, 0.06902681291103363, 0.08077200502157211, 0.09251718968153, 0.10426237434148788, 0.11600756645202637, 0.12775275111198425, 0.13949793577194214, 0.15124312043190002, 0.1629883050918579, 0.174733504652977, 0.18647868931293488, 0.19822387397289276, 0.20996905863285065, 0.22171425819396973, 0.2334594428539276, 0.2452046275138855, 0.2569498121738434, 0.26869499683380127, 0.28044018149375916, 0.29218536615371704, 0.3039305508136749, 0.3156757354736328, 0.3274209201335907, 0.3391661047935486, 0.35091131925582886, 0.36265650391578674, 0.37440168857574463]}, "eval/loss": 2.2451658248901367, "eval/bleu": 2.3052062590891975e-13, "eval/runtime": 2533.9805, "eval/samples_per_second": 5.825, "eval/steps_per_second": 0.728} \ No newline at end of file +{"train/loss": 2.1087, "train/learning_rate": 2.5321100917431195e-06, "train/epoch": 2.78, "train/global_step": 4500, "_runtime": 64806, "_timestamp": 1651837074, "_step": 4508, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 9.0, 34.0, 94.0, 154.0, 239.0, 209.0, 147.0, 81.0, 30.0, 12.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8217853903770447, -0.729047417640686, -0.6363095045089722, -0.5435715317726135, -0.45083358883857727, -0.358095645904541, -0.2653576731681824, -0.1726197600364685, -0.07988178730010986, 0.012856163084506989, 0.10559411346912384, 0.1983320713043213, 0.29107001423835754, 0.3838079571723938, 0.47654592990875244, 0.5692838430404663, 0.662021815776825, 0.7547597885131836, 0.8474977016448975, 0.9402356743812561, 1.0329736471176147, 1.1257115602493286, 1.218449592590332, 1.311187505722046, 1.4039254188537598, 1.4966633319854736, 1.589401364326477, 1.682139277458191, 1.7748771905899048, 1.8676152229309082, 1.960353136062622, 2.053091049194336, 2.14582896232605, 2.2385668754577637, 2.3313047885894775, 2.4240427017211914, 2.5167808532714844, 2.6095187664031982, 2.702256679534912, 2.794994592666626, 2.88773250579834, 2.9804704189300537, 3.0732083320617676, 3.1659464836120605, 3.2586843967437744, 3.3514223098754883, 3.444160223007202, 3.536898136138916, 3.629636287689209, 3.722374200820923, 3.8151121139526367, 3.9078502655029297, 4.0005879402160645, 4.093326091766357, 4.186063766479492, 4.278801918029785, 4.37153959274292, 4.464277744293213, 4.557015419006348, 4.649753570556641, 4.742491245269775, 4.835229396820068, 4.927967071533203, 5.020705223083496, 5.113443374633789]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 0.0, 9.0, 9.0, 2.0, 19.0, 9.0, 12.0, 19.0, 22.0, 27.0, 25.0, 26.0, 25.0, 38.0, 38.0, 44.0, 41.0, 46.0, 35.0, 30.0, 47.0, 42.0, 44.0, 53.0, 39.0, 39.0, 28.0, 24.0, 33.0, 25.0, 23.0, 23.0, 23.0, 14.0, 15.0, 9.0, 9.0, 8.0, 4.0, 8.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.0925257205963135, -1.0581175088882446, -1.0237091779708862, -0.9893009066581726, -0.954892635345459, -0.9204844236373901, -0.8860761523246765, -0.8516678810119629, -0.8172596096992493, -0.7828513383865356, -0.748443067073822, -0.7140347957611084, -0.6796265840530396, -0.6452182531356812, -0.6108100414276123, -0.5764017701148987, -0.5419934988021851, -0.5075852274894714, -0.4731769561767578, -0.4387687146663666, -0.40436044335365295, -0.36995217204093933, -0.3355439305305481, -0.3011356592178345, -0.26672738790512085, -0.23231911659240723, -0.1979108601808548, -0.16350260376930237, -0.12909433245658875, -0.09468606114387512, -0.06027780473232269, -0.025869548320770264, 0.00853884220123291, 0.042947106063365936, 0.07735536992549896, 0.11176363378763199, 0.14617189764976501, 0.18058016896247864, 0.21498842537403107, 0.2493966817855835, 0.2838049530982971, 0.31821322441101074, 0.35262149572372437, 0.3870297372341156, 0.4214380085468292, 0.45584627985954285, 0.4902545213699341, 0.5246627926826477, 0.5590710639953613, 0.593479335308075, 0.6278876066207886, 0.6622958779335022, 0.6967041492462158, 0.7311123609542847, 0.7655206322669983, 0.7999289035797119, 0.8343371748924255, 0.8687454462051392, 0.9031537175178528, 0.9375619888305664, 0.9719702005386353, 1.0063785314559937, 1.0407867431640625, 1.075195074081421, 1.1096032857894897]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 9.0, 10.0, 15.0, 18.0, 29.0, 35.0, 53.0, 67.0, 145.0, 215.0, 303.0, 548.0, 939.0, 1710.0, 3439.0, 7546.0, 18600.0, 48104.0, 124902.0, 318078.0, 695103.0, 1154959.0, 965323.0, 504647.0, 217527.0, 81714.0, 29320.0, 11114.0, 4692.0, 2238.0, 1179.0, 637.0, 393.0, 227.0, 148.0, 89.0, 63.0, 42.0, 28.0, 23.0, 18.0, 10.0, 6.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.37890625, -1.334075927734375, -1.28924560546875, -1.244415283203125, -1.1995849609375, -1.154754638671875, -1.10992431640625, -1.065093994140625, -1.020263671875, -0.975433349609375, -0.93060302734375, -0.885772705078125, -0.8409423828125, -0.796112060546875, -0.75128173828125, -0.706451416015625, -0.66162109375, -0.616790771484375, -0.57196044921875, -0.527130126953125, -0.4822998046875, -0.437469482421875, -0.39263916015625, -0.347808837890625, -0.302978515625, -0.258148193359375, -0.21331787109375, -0.168487548828125, -0.1236572265625, -0.078826904296875, -0.03399658203125, 0.010833740234375, 0.0556640625, 0.100494384765625, 0.14532470703125, 0.190155029296875, 0.2349853515625, 0.279815673828125, 0.32464599609375, 0.369476318359375, 0.414306640625, 0.459136962890625, 0.50396728515625, 0.548797607421875, 0.5936279296875, 0.638458251953125, 0.68328857421875, 0.728118896484375, 0.77294921875, 0.817779541015625, 0.86260986328125, 0.907440185546875, 0.9522705078125, 0.997100830078125, 1.04193115234375, 1.086761474609375, 1.131591796875, 1.176422119140625, 1.22125244140625, 1.266082763671875, 1.3109130859375, 1.355743408203125, 1.40057373046875, 1.445404052734375, 1.490234375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 5.0, 5.0, 5.0, 11.0, 18.0, 16.0, 24.0, 13.0, 29.0, 28.0, 17.0, 24.0, 30.0, 35.0, 47.0, 48.0, 49.0, 45.0, 38.0, 42.0, 52.0, 33.0, 50.0, 38.0, 38.0, 39.0, 36.0, 24.0, 25.0, 26.0, 19.0, 25.0, 19.0, 12.0, 2.0, 10.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.681640625, -1.6260528564453125, -1.570465087890625, -1.5148773193359375, -1.45928955078125, -1.4037017822265625, -1.348114013671875, -1.2925262451171875, -1.2369384765625, -1.1813507080078125, -1.125762939453125, -1.0701751708984375, -1.01458740234375, -0.9589996337890625, -0.903411865234375, -0.8478240966796875, -0.792236328125, -0.7366485595703125, -0.681060791015625, -0.6254730224609375, -0.56988525390625, -0.5142974853515625, -0.458709716796875, -0.4031219482421875, -0.3475341796875, -0.2919464111328125, -0.236358642578125, -0.1807708740234375, -0.12518310546875, -0.0695953369140625, -0.014007568359375, 0.0415802001953125, 0.09716796875, 0.1527557373046875, 0.208343505859375, 0.2639312744140625, 0.31951904296875, 0.3751068115234375, 0.430694580078125, 0.4862823486328125, 0.5418701171875, 0.5974578857421875, 0.653045654296875, 0.7086334228515625, 0.76422119140625, 0.8198089599609375, 0.875396728515625, 0.9309844970703125, 0.986572265625, 1.0421600341796875, 1.097747802734375, 1.1533355712890625, 1.20892333984375, 1.2645111083984375, 1.320098876953125, 1.3756866455078125, 1.4312744140625, 1.4868621826171875, 1.542449951171875, 1.5980377197265625, 1.65362548828125, 1.7092132568359375, 1.764801025390625, 1.8203887939453125, 1.8759765625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 6.0, 8.0, 7.0, 7.0, 9.0, 23.0, 25.0, 43.0, 42.0, 77.0, 97.0, 172.0, 236.0, 440.0, 1072.0, 61745.0, 4126660.0, 2103.0, 551.0, 345.0, 195.0, 120.0, 71.0, 59.0, 39.0, 22.0, 21.0, 23.0, 13.0, 15.0, 3.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.784423828125, -18.16259765625, -17.540771484375, -16.9189453125, -16.297119140625, -15.67529296875, -15.053466796875, -14.431640625, -13.809814453125, -13.18798828125, -12.566162109375, -11.9443359375, -11.322509765625, -10.70068359375, -10.078857421875, -9.45703125, -8.835205078125, -8.21337890625, -7.591552734375, -6.9697265625, -6.347900390625, -5.72607421875, -5.104248046875, -4.482421875, -3.860595703125, -3.23876953125, -2.616943359375, -1.9951171875, -1.373291015625, -0.75146484375, -0.129638671875, 0.4921875, 1.114013671875, 1.73583984375, 2.357666015625, 2.9794921875, 3.601318359375, 4.22314453125, 4.844970703125, 5.466796875, 6.088623046875, 6.71044921875, 7.332275390625, 7.9541015625, 8.575927734375, 9.19775390625, 9.819580078125, 10.44140625, 11.063232421875, 11.68505859375, 12.306884765625, 12.9287109375, 13.550537109375, 14.17236328125, 14.794189453125, 15.416015625, 16.037841796875, 16.65966796875, 17.281494140625, 17.9033203125, 18.525146484375, 19.14697265625, 19.768798828125, 20.390625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 5.0, 9.0, 4.0, 10.0, 14.0, 22.0, 30.0, 34.0, 33.0, 52.0, 76.0, 127.0, 129.0, 228.0, 295.0, 403.0, 508.0, 550.0, 412.0, 295.0, 235.0, 160.0, 104.0, 82.0, 55.0, 44.0, 30.0, 32.0, 21.0, 11.0, 8.0, 13.0, 11.0, 3.0, 6.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65478515625, -0.6330032348632812, -0.6112213134765625, -0.5894393920898438, -0.567657470703125, -0.5458755493164062, -0.5240936279296875, -0.5023117065429688, -0.48052978515625, -0.45874786376953125, -0.4369659423828125, -0.41518402099609375, -0.393402099609375, -0.37162017822265625, -0.3498382568359375, -0.32805633544921875, -0.3062744140625, -0.28449249267578125, -0.2627105712890625, -0.24092864990234375, -0.219146728515625, -0.19736480712890625, -0.1755828857421875, -0.15380096435546875, -0.13201904296875, -0.11023712158203125, -0.0884552001953125, -0.06667327880859375, -0.044891357421875, -0.02310943603515625, -0.0013275146484375, 0.02045440673828125, 0.042236328125, 0.06401824951171875, 0.0858001708984375, 0.10758209228515625, 0.129364013671875, 0.15114593505859375, 0.1729278564453125, 0.19470977783203125, 0.21649169921875, 0.23827362060546875, 0.2600555419921875, 0.28183746337890625, 0.303619384765625, 0.32540130615234375, 0.3471832275390625, 0.36896514892578125, 0.3907470703125, 0.41252899169921875, 0.4343109130859375, 0.45609283447265625, 0.477874755859375, 0.49965667724609375, 0.5214385986328125, 0.5432205200195312, 0.56500244140625, 0.5867843627929688, 0.6085662841796875, 0.6303482055664062, 0.652130126953125, 0.6739120483398438, 0.6956939697265625, 0.7174758911132812, 0.7392578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 19.0, 17.0, 21.0, 26.0, 41.0, 46.0, 50.0, 58.0, 94.0, 95.0, 89.0, 94.0, 66.0, 54.0, 45.0, 39.0, 35.0, 24.0, 17.0, 17.0, 13.0, 14.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6731536388397217, -2.592991590499878, -2.512829542160034, -2.4326672554016113, -2.3525052070617676, -2.272343158721924, -2.19218111038208, -2.1120190620422363, -2.0318570137023926, -1.9516949653625488, -1.8715327978134155, -1.7913707494735718, -1.711208701133728, -1.6310465335845947, -1.550884485244751, -1.4707224369049072, -1.390560269355774, -1.3103982210159302, -1.2302360534667969, -1.1500740051269531, -1.0699119567871094, -0.9897498488426208, -0.9095877408981323, -0.8294256925582886, -0.7492635846138, -0.6691014766693115, -0.5889394283294678, -0.5087773203849792, -0.4286152422428131, -0.348453164100647, -0.26829105615615845, -0.1881290078163147, -0.10796689987182617, -0.027804814279079437, 0.0523572713136673, 0.13251936435699463, 0.21268144249916077, 0.2928435206413269, 0.37300562858581543, 0.4531676769256592, 0.5333297848701477, 0.6134918928146362, 0.69365394115448, 0.7738160490989685, 0.853978157043457, 0.9341402053833008, 1.0143022537231445, 1.0944643020629883, 1.1746264696121216, 1.2547885179519653, 1.3349506855010986, 1.4151127338409424, 1.4952747821807861, 1.5754368305206299, 1.6555989980697632, 1.735761046409607, 1.8159232139587402, 1.896085262298584, 1.9762474298477173, 2.0564093589782715, 2.1365716457366943, 2.216733694076538, 2.296895742416382, 2.3770577907562256, 2.4572198390960693]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 0.0, 4.0, 8.0, 8.0, 6.0, 10.0, 14.0, 17.0, 20.0, 16.0, 25.0, 27.0, 27.0, 29.0, 31.0, 29.0, 35.0, 43.0, 47.0, 43.0, 42.0, 31.0, 53.0, 41.0, 30.0, 37.0, 32.0, 48.0, 30.0, 32.0, 35.0, 23.0, 28.0, 13.0, 23.0, 7.0, 13.0, 9.0, 4.0, 7.0, 3.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4387236833572388, -1.3873543739318848, -1.3359849452972412, -1.2846155166625977, -1.2332462072372437, -1.1818768978118896, -1.130507469177246, -1.0791380405426025, -1.0277687311172485, -0.9763993620872498, -0.925029993057251, -0.8736606240272522, -0.8222912549972534, -0.7709218859672546, -0.7195525169372559, -0.6681831479072571, -0.6168137788772583, -0.5654444098472595, -0.5140750408172607, -0.46270567178726196, -0.4113363027572632, -0.3599669337272644, -0.3085975646972656, -0.25722819566726685, -0.20585882663726807, -0.1544894576072693, -0.10312008857727051, -0.05175071954727173, -0.0003813505172729492, 0.05098801851272583, 0.10235738754272461, 0.1537267565727234, 0.20509624481201172, 0.2564656138420105, 0.3078349828720093, 0.35920435190200806, 0.41057372093200684, 0.4619430899620056, 0.5133124589920044, 0.5646818280220032, 0.616051197052002, 0.6674205660820007, 0.7187899351119995, 0.7701593041419983, 0.8215286731719971, 0.8728980422019958, 0.9242674112319946, 0.9756367802619934, 1.0270061492919922, 1.0783755779266357, 1.1297448873519897, 1.1811141967773438, 1.2324836254119873, 1.2838530540466309, 1.3352223634719849, 1.3865916728973389, 1.4379611015319824, 1.489330530166626, 1.54069983959198, 1.592069149017334, 1.6434385776519775, 1.694808006286621, 1.746177315711975, 1.797546625137329, 1.8489160537719727]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 17.0, 16.0, 25.0, 33.0, 44.0, 72.0, 127.0, 206.0, 300.0, 509.0, 731.0, 1249.0, 1955.0, 3265.0, 5578.0, 10015.0, 18648.0, 35958.0, 70655.0, 142496.0, 259405.0, 239750.0, 125016.0, 62475.0, 31764.0, 16750.0, 8809.0, 5047.0, 2851.0, 1772.0, 1092.0, 710.0, 411.0, 289.0, 205.0, 118.0, 62.0, 48.0, 25.0, 15.0, 10.0, 15.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.471923828125, -0.4550132751464844, -0.43810272216796875, -0.4211921691894531, -0.4042816162109375, -0.3873710632324219, -0.37046051025390625, -0.3535499572753906, -0.336639404296875, -0.3197288513183594, -0.30281829833984375, -0.2859077453613281, -0.2689971923828125, -0.2520866394042969, -0.23517608642578125, -0.21826553344726562, -0.20135498046875, -0.18444442749023438, -0.16753387451171875, -0.15062332153320312, -0.1337127685546875, -0.11680221557617188, -0.09989166259765625, -0.08298110961914062, -0.066070556640625, -0.049160003662109375, -0.03224945068359375, -0.015338897705078125, 0.0015716552734375, 0.018482208251953125, 0.03539276123046875, 0.052303314208984375, 0.0692138671875, 0.08612442016601562, 0.10303497314453125, 0.11994552612304688, 0.1368560791015625, 0.15376663208007812, 0.17067718505859375, 0.18758773803710938, 0.204498291015625, 0.22140884399414062, 0.23831939697265625, 0.2552299499511719, 0.2721405029296875, 0.2890510559082031, 0.30596160888671875, 0.3228721618652344, 0.33978271484375, 0.3566932678222656, 0.37360382080078125, 0.3905143737792969, 0.4074249267578125, 0.4243354797363281, 0.44124603271484375, 0.4581565856933594, 0.475067138671875, 0.4919776916503906, 0.5088882446289062, 0.5257987976074219, 0.5427093505859375, 0.5596199035644531, 0.5765304565429688, 0.5934410095214844, 0.6103515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 14.0, 2.0, 13.0, 9.0, 9.0, 16.0, 22.0, 32.0, 21.0, 35.0, 27.0, 29.0, 25.0, 29.0, 38.0, 36.0, 43.0, 48.0, 39.0, 38.0, 42.0, 49.0, 37.0, 41.0, 36.0, 25.0, 42.0, 23.0, 25.0, 17.0, 25.0, 15.0, 15.0, 9.0, 9.0, 7.0, 7.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0], "bins": [-1.2109375, -1.1737518310546875, -1.136566162109375, -1.0993804931640625, -1.06219482421875, -1.0250091552734375, -0.987823486328125, -0.9506378173828125, -0.9134521484375, -0.8762664794921875, -0.839080810546875, -0.8018951416015625, -0.76470947265625, -0.7275238037109375, -0.690338134765625, -0.6531524658203125, -0.615966796875, -0.5787811279296875, -0.541595458984375, -0.5044097900390625, -0.46722412109375, -0.4300384521484375, -0.392852783203125, -0.3556671142578125, -0.3184814453125, -0.2812957763671875, -0.244110107421875, -0.2069244384765625, -0.16973876953125, -0.1325531005859375, -0.095367431640625, -0.0581817626953125, -0.02099609375, 0.0161895751953125, 0.053375244140625, 0.0905609130859375, 0.12774658203125, 0.1649322509765625, 0.202117919921875, 0.2393035888671875, 0.2764892578125, 0.3136749267578125, 0.350860595703125, 0.3880462646484375, 0.42523193359375, 0.4624176025390625, 0.499603271484375, 0.5367889404296875, 0.573974609375, 0.6111602783203125, 0.648345947265625, 0.6855316162109375, 0.72271728515625, 0.7599029541015625, 0.797088623046875, 0.8342742919921875, 0.8714599609375, 0.9086456298828125, 0.945831298828125, 0.9830169677734375, 1.02020263671875, 1.0573883056640625, 1.094573974609375, 1.1317596435546875, 1.1689453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 8.0, 4.0, 13.0, 16.0, 31.0, 37.0, 50.0, 69.0, 97.0, 213.0, 285.0, 505.0, 905.0, 1959.0, 4144.0, 9575.0, 25353.0, 74726.0, 252957.0, 436301.0, 160774.0, 49404.0, 17503.0, 7080.0, 3159.0, 1459.0, 791.0, 430.0, 267.0, 159.0, 84.0, 55.0, 34.0, 30.0, 16.0, 15.0, 9.0, 8.0, 8.0, 3.0, 4.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.9814453125, -0.950103759765625, -0.91876220703125, -0.887420654296875, -0.8560791015625, -0.824737548828125, -0.79339599609375, -0.762054443359375, -0.730712890625, -0.699371337890625, -0.66802978515625, -0.636688232421875, -0.6053466796875, -0.574005126953125, -0.54266357421875, -0.511322021484375, -0.47998046875, -0.448638916015625, -0.41729736328125, -0.385955810546875, -0.3546142578125, -0.323272705078125, -0.29193115234375, -0.260589599609375, -0.229248046875, -0.197906494140625, -0.16656494140625, -0.135223388671875, -0.1038818359375, -0.072540283203125, -0.04119873046875, -0.009857177734375, 0.021484375, 0.052825927734375, 0.08416748046875, 0.115509033203125, 0.1468505859375, 0.178192138671875, 0.20953369140625, 0.240875244140625, 0.272216796875, 0.303558349609375, 0.33489990234375, 0.366241455078125, 0.3975830078125, 0.428924560546875, 0.46026611328125, 0.491607666015625, 0.52294921875, 0.554290771484375, 0.58563232421875, 0.616973876953125, 0.6483154296875, 0.679656982421875, 0.71099853515625, 0.742340087890625, 0.773681640625, 0.805023193359375, 0.83636474609375, 0.867706298828125, 0.8990478515625, 0.930389404296875, 0.96173095703125, 0.993072509765625, 1.0244140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 12.0, 13.0, 20.0, 25.0, 24.0, 28.0, 34.0, 43.0, 54.0, 38.0, 43.0, 50.0, 52.0, 47.0, 51.0, 44.0, 47.0, 46.0, 47.0, 43.0, 40.0, 25.0, 33.0, 26.0, 12.0, 15.0, 18.0, 16.0, 13.0, 3.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.673828125, -3.578887939453125, -3.48394775390625, -3.389007568359375, -3.2940673828125, -3.199127197265625, -3.10418701171875, -3.009246826171875, -2.914306640625, -2.819366455078125, -2.72442626953125, -2.629486083984375, -2.5345458984375, -2.439605712890625, -2.34466552734375, -2.249725341796875, -2.15478515625, -2.059844970703125, -1.96490478515625, -1.869964599609375, -1.7750244140625, -1.680084228515625, -1.58514404296875, -1.490203857421875, -1.395263671875, -1.300323486328125, -1.20538330078125, -1.110443115234375, -1.0155029296875, -0.920562744140625, -0.82562255859375, -0.730682373046875, -0.6357421875, -0.540802001953125, -0.44586181640625, -0.350921630859375, -0.2559814453125, -0.161041259765625, -0.06610107421875, 0.028839111328125, 0.123779296875, 0.218719482421875, 0.31365966796875, 0.408599853515625, 0.5035400390625, 0.598480224609375, 0.69342041015625, 0.788360595703125, 0.88330078125, 0.978240966796875, 1.07318115234375, 1.168121337890625, 1.2630615234375, 1.358001708984375, 1.45294189453125, 1.547882080078125, 1.642822265625, 1.737762451171875, 1.83270263671875, 1.927642822265625, 2.0225830078125, 2.117523193359375, 2.21246337890625, 2.307403564453125, 2.40234375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 9.0, 16.0, 33.0, 33.0, 34.0, 51.0, 102.0, 149.0, 207.0, 311.0, 504.0, 808.0, 1340.0, 2283.0, 4178.0, 8639.0, 19248.0, 52689.0, 206021.0, 516008.0, 158288.0, 44057.0, 16669.0, 7646.0, 3885.0, 2122.0, 1158.0, 768.0, 425.0, 307.0, 168.0, 129.0, 76.0, 64.0, 48.0, 23.0, 17.0, 12.0, 8.0, 10.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.382080078125, -0.37029266357421875, -0.3585052490234375, -0.34671783447265625, -0.334930419921875, -0.32314300537109375, -0.3113555908203125, -0.29956817626953125, -0.28778076171875, -0.27599334716796875, -0.2642059326171875, -0.25241851806640625, -0.240631103515625, -0.22884368896484375, -0.2170562744140625, -0.20526885986328125, -0.1934814453125, -0.18169403076171875, -0.1699066162109375, -0.15811920166015625, -0.146331787109375, -0.13454437255859375, -0.1227569580078125, -0.11096954345703125, -0.09918212890625, -0.08739471435546875, -0.0756072998046875, -0.06381988525390625, -0.052032470703125, -0.04024505615234375, -0.0284576416015625, -0.01667022705078125, -0.0048828125, 0.00690460205078125, 0.0186920166015625, 0.03047943115234375, 0.042266845703125, 0.05405426025390625, 0.0658416748046875, 0.07762908935546875, 0.08941650390625, 0.10120391845703125, 0.1129913330078125, 0.12477874755859375, 0.136566162109375, 0.14835357666015625, 0.1601409912109375, 0.17192840576171875, 0.1837158203125, 0.19550323486328125, 0.2072906494140625, 0.21907806396484375, 0.230865478515625, 0.24265289306640625, 0.2544403076171875, 0.26622772216796875, 0.27801513671875, 0.28980255126953125, 0.3015899658203125, 0.31337738037109375, 0.325164794921875, 0.33695220947265625, 0.3487396240234375, 0.36052703857421875, 0.372314453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 14.0, 7.0, 20.0, 25.0, 52.0, 67.0, 141.0, 200.0, 185.0, 108.0, 62.0, 30.0, 24.0, 8.0, 10.0, 4.0, 4.0, 6.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028824806213378906, -0.0002788752317428589, -0.0002695024013519287, -0.00026012957096099854, -0.00025075674057006836, -0.00024138391017913818, -0.000232011079788208, -0.00022263824939727783, -0.00021326541900634766, -0.00020389258861541748, -0.0001945197582244873, -0.00018514692783355713, -0.00017577409744262695, -0.00016640126705169678, -0.0001570284366607666, -0.00014765560626983643, -0.00013828277587890625, -0.00012890994548797607, -0.0001195371150970459, -0.00011016428470611572, -0.00010079145431518555, -9.141862392425537e-05, -8.20457935333252e-05, -7.267296314239502e-05, -6.330013275146484e-05, -5.392730236053467e-05, -4.455447196960449e-05, -3.5181641578674316e-05, -2.580881118774414e-05, -1.6435980796813965e-05, -7.063150405883789e-06, 2.3096799850463867e-06, 1.1682510375976562e-05, 2.1055340766906738e-05, 3.0428171157836914e-05, 3.980100154876709e-05, 4.9173831939697266e-05, 5.854666233062744e-05, 6.791949272155762e-05, 7.729232311248779e-05, 8.666515350341797e-05, 9.603798389434814e-05, 0.00010541081428527832, 0.0001147836446762085, 0.00012415647506713867, 0.00013352930545806885, 0.00014290213584899902, 0.0001522749662399292, 0.00016164779663085938, 0.00017102062702178955, 0.00018039345741271973, 0.0001897662878036499, 0.00019913911819458008, 0.00020851194858551025, 0.00021788477897644043, 0.0002272576093673706, 0.00023663043975830078, 0.00024600327014923096, 0.00025537610054016113, 0.0002647489309310913, 0.0002741217613220215, 0.00028349459171295166, 0.00029286742210388184, 0.000302240252494812, 0.0003116130828857422]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 1.0, 9.0, 5.0, 11.0, 15.0, 15.0, 23.0, 27.0, 27.0, 42.0, 55.0, 86.0, 142.0, 385.0, 1614.0, 10400.0, 163638.0, 826780.0, 39564.0, 4281.0, 839.0, 244.0, 103.0, 56.0, 53.0, 34.0, 26.0, 22.0, 12.0, 9.0, 11.0, 3.0, 3.0, 5.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2373046875, -1.2032012939453125, -1.169097900390625, -1.1349945068359375, -1.10089111328125, -1.0667877197265625, -1.032684326171875, -0.9985809326171875, -0.9644775390625, -0.9303741455078125, -0.896270751953125, -0.8621673583984375, -0.82806396484375, -0.7939605712890625, -0.759857177734375, -0.7257537841796875, -0.691650390625, -0.6575469970703125, -0.623443603515625, -0.5893402099609375, -0.55523681640625, -0.5211334228515625, -0.487030029296875, -0.4529266357421875, -0.4188232421875, -0.3847198486328125, -0.350616455078125, -0.3165130615234375, -0.28240966796875, -0.2483062744140625, -0.214202880859375, -0.1800994873046875, -0.14599609375, -0.1118927001953125, -0.077789306640625, -0.0436859130859375, -0.00958251953125, 0.0245208740234375, 0.058624267578125, 0.0927276611328125, 0.1268310546875, 0.1609344482421875, 0.195037841796875, 0.2291412353515625, 0.26324462890625, 0.2973480224609375, 0.331451416015625, 0.3655548095703125, 0.399658203125, 0.4337615966796875, 0.467864990234375, 0.5019683837890625, 0.53607177734375, 0.5701751708984375, 0.604278564453125, 0.6383819580078125, 0.6724853515625, 0.7065887451171875, 0.740692138671875, 0.7747955322265625, 0.80889892578125, 0.8430023193359375, 0.877105712890625, 0.9112091064453125, 0.9453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 7.0, 11.0, 12.0, 10.0, 11.0, 13.0, 21.0, 30.0, 27.0, 42.0, 41.0, 92.0, 76.0, 93.0, 112.0, 77.0, 67.0, 60.0, 41.0, 30.0, 25.0, 13.0, 14.0, 18.0, 10.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1322021484375, -0.12841510772705078, -0.12462806701660156, -0.12084102630615234, -0.11705398559570312, -0.1132669448852539, -0.10947990417480469, -0.10569286346435547, -0.10190582275390625, -0.09811878204345703, -0.09433174133300781, -0.0905447006225586, -0.08675765991210938, -0.08297061920166016, -0.07918357849121094, -0.07539653778076172, -0.0716094970703125, -0.06782245635986328, -0.06403541564941406, -0.060248374938964844, -0.056461334228515625, -0.052674293518066406, -0.04888725280761719, -0.04510021209716797, -0.04131317138671875, -0.03752613067626953, -0.03373908996582031, -0.029952049255371094, -0.026165008544921875, -0.022377967834472656, -0.018590927124023438, -0.014803886413574219, -0.011016845703125, -0.007229804992675781, -0.0034427642822265625, 0.00034427642822265625, 0.004131317138671875, 0.007918357849121094, 0.011705398559570312, 0.015492439270019531, 0.01927947998046875, 0.02306652069091797, 0.026853561401367188, 0.030640602111816406, 0.034427642822265625, 0.038214683532714844, 0.04200172424316406, 0.04578876495361328, 0.0495758056640625, 0.05336284637451172, 0.05714988708496094, 0.060936927795410156, 0.06472396850585938, 0.0685110092163086, 0.07229804992675781, 0.07608509063720703, 0.07987213134765625, 0.08365917205810547, 0.08744621276855469, 0.0912332534790039, 0.09502029418945312, 0.09880733489990234, 0.10259437561035156, 0.10638141632080078, 0.11016845703125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 10.0, 13.0, 31.0, 39.0, 59.0, 68.0, 108.0, 144.0, 121.0, 128.0, 93.0, 73.0, 45.0, 18.0, 19.0, 16.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.001615524291992, -3.910857915878296, -3.8201003074645996, -3.729342460632324, -3.638584852218628, -3.5478272438049316, -3.4570696353912354, -3.366312026977539, -3.2755544185638428, -3.1847968101501465, -3.09403920173645, -3.003281593322754, -2.9125237464904785, -2.8217661380767822, -2.731008529663086, -2.6402509212493896, -2.5494933128356934, -2.458735704421997, -2.367978096008301, -2.2772202491760254, -2.186462640762329, -2.095705032348633, -2.0049474239349365, -1.9141898155212402, -1.8234319686889648, -1.7326743602752686, -1.6419166326522827, -1.5511590242385864, -1.4604014158248901, -1.3696436882019043, -1.278886079788208, -1.1881284713745117, -1.0973708629608154, -1.0066132545471191, -0.9158555865287781, -0.825097918510437, -0.7343403100967407, -0.6435826420783997, -0.5528249740600586, -0.4620673656463623, -0.37130969762802124, -0.28055205941200256, -0.1897944062948227, -0.09903675317764282, -0.008279114961624146, 0.08247852325439453, 0.1732361912727356, 0.2639937996864319, 0.35475146770477295, 0.4455091059207916, 0.5362667441368103, 0.6270244121551514, 0.7177820205688477, 0.8085396885871887, 0.8992973566055298, 0.9900549650192261, 1.080812692642212, 1.1715703010559082, 1.262328028678894, 1.3530856370925903, 1.4438432455062866, 1.5346009731292725, 1.6253585815429688, 1.716116189956665, 1.8068737983703613]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 7.0, 7.0, 8.0, 15.0, 12.0, 21.0, 17.0, 24.0, 24.0, 25.0, 28.0, 36.0, 35.0, 30.0, 32.0, 54.0, 41.0, 47.0, 33.0, 42.0, 52.0, 36.0, 36.0, 36.0, 40.0, 55.0, 32.0, 29.0, 27.0, 20.0, 15.0, 16.0, 9.0, 11.0, 6.0, 7.0, 5.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1570268869400024, -1.1179341077804565, -1.078841209411621, -1.0397484302520752, -1.0006556510925293, -0.9615628123283386, -0.922469973564148, -0.883377194404602, -0.8442843556404114, -0.8051915168762207, -0.7660987377166748, -0.7270058989524841, -0.6879130601882935, -0.6488202810287476, -0.6097274422645569, -0.5706346035003662, -0.5315418243408203, -0.492449015378952, -0.45335620641708374, -0.41426336765289307, -0.3751705586910248, -0.3360777497291565, -0.2969849109649658, -0.25789210200309753, -0.21879929304122925, -0.17970648407936096, -0.14061366021633148, -0.1015208438038826, -0.062428027391433716, -0.02333521842956543, 0.01575760543346405, 0.05485042929649353, 0.09394311904907227, 0.13303592801094055, 0.17212875187397003, 0.2112215757369995, 0.2503143846988678, 0.2894071936607361, 0.32850003242492676, 0.36759284138679504, 0.40668565034866333, 0.4457784593105316, 0.4848712682723999, 0.5239641070365906, 0.5630569458007812, 0.6021497249603271, 0.6412425637245178, 0.6803354024887085, 0.7194281816482544, 0.7585210204124451, 0.797613799571991, 0.8367066383361816, 0.8757994174957275, 0.9148922562599182, 0.9539850950241089, 0.9930778741836548, 1.0321707725524902, 1.0712635517120361, 1.1103564500808716, 1.1494492292404175, 1.1885420083999634, 1.2276349067687988, 1.2667276859283447, 1.3058204650878906, 1.3449132442474365]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 8.0, 12.0, 24.0, 35.0, 34.0, 68.0, 67.0, 115.0, 168.0, 236.0, 400.0, 534.0, 826.0, 1382.0, 2176.0, 3665.0, 6446.0, 11789.0, 21956.0, 41567.0, 79803.0, 144908.0, 217768.0, 212119.0, 139219.0, 76003.0, 39293.0, 21277.0, 11207.0, 6048.0, 3550.0, 2053.0, 1279.0, 803.0, 536.0, 378.0, 240.0, 184.0, 108.0, 67.0, 72.0, 33.0, 21.0, 22.0, 14.0, 12.0, 8.0, 8.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.5070838928222656, -0.49121856689453125, -0.4753532409667969, -0.4594879150390625, -0.4436225891113281, -0.42775726318359375, -0.4118919372558594, -0.396026611328125, -0.3801612854003906, -0.36429595947265625, -0.3484306335449219, -0.3325653076171875, -0.3166999816894531, -0.30083465576171875, -0.2849693298339844, -0.26910400390625, -0.2532386779785156, -0.23737335205078125, -0.22150802612304688, -0.2056427001953125, -0.18977737426757812, -0.17391204833984375, -0.15804672241210938, -0.142181396484375, -0.12631607055664062, -0.11045074462890625, -0.09458541870117188, -0.0787200927734375, -0.06285476684570312, -0.04698944091796875, -0.031124114990234375, -0.0152587890625, 0.000606536865234375, 0.01647186279296875, 0.032337188720703125, 0.0482025146484375, 0.06406784057617188, 0.07993316650390625, 0.09579849243164062, 0.111663818359375, 0.12752914428710938, 0.14339447021484375, 0.15925979614257812, 0.1751251220703125, 0.19099044799804688, 0.20685577392578125, 0.22272109985351562, 0.23858642578125, 0.2544517517089844, 0.27031707763671875, 0.2861824035644531, 0.3020477294921875, 0.3179130554199219, 0.33377838134765625, 0.3496437072753906, 0.365509033203125, 0.3813743591308594, 0.39723968505859375, 0.4131050109863281, 0.4289703369140625, 0.4448356628417969, 0.46070098876953125, 0.4765663146972656, 0.492431640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 5.0, 12.0, 11.0, 14.0, 16.0, 19.0, 19.0, 26.0, 34.0, 26.0, 29.0, 42.0, 44.0, 52.0, 40.0, 66.0, 45.0, 66.0, 39.0, 49.0, 33.0, 34.0, 39.0, 33.0, 30.0, 30.0, 26.0, 20.0, 14.0, 16.0, 18.0, 16.0, 9.0, 3.0, 8.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8984375, -9.5850830078125, -9.271728515625, -8.9583740234375, -8.64501953125, -8.3316650390625, -8.018310546875, -7.7049560546875, -7.3916015625, -7.0782470703125, -6.764892578125, -6.4515380859375, -6.13818359375, -5.8248291015625, -5.511474609375, -5.1981201171875, -4.884765625, -4.5714111328125, -4.258056640625, -3.9447021484375, -3.63134765625, -3.3179931640625, -3.004638671875, -2.6912841796875, -2.3779296875, -2.0645751953125, -1.751220703125, -1.4378662109375, -1.12451171875, -0.8111572265625, -0.497802734375, -0.1844482421875, 0.12890625, 0.4422607421875, 0.755615234375, 1.0689697265625, 1.38232421875, 1.6956787109375, 2.009033203125, 2.3223876953125, 2.6357421875, 2.9490966796875, 3.262451171875, 3.5758056640625, 3.88916015625, 4.2025146484375, 4.515869140625, 4.8292236328125, 5.142578125, 5.4559326171875, 5.769287109375, 6.0826416015625, 6.39599609375, 6.7093505859375, 7.022705078125, 7.3360595703125, 7.6494140625, 7.9627685546875, 8.276123046875, 8.5894775390625, 8.90283203125, 9.2161865234375, 9.529541015625, 9.8428955078125, 10.15625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 1.0, 5.0, 6.0, 8.0, 10.0, 11.0, 16.0, 29.0, 28.0, 29.0, 51.0, 56.0, 71.0, 90.0, 137.0, 206.0, 252.0, 458.0, 935.0, 5275.0, 306446.0, 719950.0, 11745.0, 1222.0, 533.0, 279.0, 185.0, 136.0, 84.0, 81.0, 44.0, 41.0, 33.0, 26.0, 24.0, 8.0, 12.0, 7.0, 6.0, 6.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.83984375, -3.7203369140625, -3.600830078125, -3.4813232421875, -3.36181640625, -3.2423095703125, -3.122802734375, -3.0032958984375, -2.8837890625, -2.7642822265625, -2.644775390625, -2.5252685546875, -2.40576171875, -2.2862548828125, -2.166748046875, -2.0472412109375, -1.927734375, -1.8082275390625, -1.688720703125, -1.5692138671875, -1.44970703125, -1.3302001953125, -1.210693359375, -1.0911865234375, -0.9716796875, -0.8521728515625, -0.732666015625, -0.6131591796875, -0.49365234375, -0.3741455078125, -0.254638671875, -0.1351318359375, -0.015625, 0.1038818359375, 0.223388671875, 0.3428955078125, 0.46240234375, 0.5819091796875, 0.701416015625, 0.8209228515625, 0.9404296875, 1.0599365234375, 1.179443359375, 1.2989501953125, 1.41845703125, 1.5379638671875, 1.657470703125, 1.7769775390625, 1.896484375, 2.0159912109375, 2.135498046875, 2.2550048828125, 2.37451171875, 2.4940185546875, 2.613525390625, 2.7330322265625, 2.8525390625, 2.9720458984375, 3.091552734375, 3.2110595703125, 3.33056640625, 3.4500732421875, 3.569580078125, 3.6890869140625, 3.80859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 5.0, 6.0, 8.0, 14.0, 19.0, 8.0, 22.0, 13.0, 22.0, 29.0, 25.0, 35.0, 46.0, 35.0, 38.0, 35.0, 48.0, 42.0, 54.0, 53.0, 47.0, 44.0, 46.0, 50.0, 24.0, 46.0, 28.0, 21.0, 30.0, 21.0, 10.0, 14.0, 16.0, 11.0, 7.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.83203125, -7.55230712890625, -7.2725830078125, -6.99285888671875, -6.713134765625, -6.43341064453125, -6.1536865234375, -5.87396240234375, -5.59423828125, -5.31451416015625, -5.0347900390625, -4.75506591796875, -4.475341796875, -4.19561767578125, -3.9158935546875, -3.63616943359375, -3.3564453125, -3.07672119140625, -2.7969970703125, -2.51727294921875, -2.237548828125, -1.95782470703125, -1.6781005859375, -1.39837646484375, -1.11865234375, -0.83892822265625, -0.5592041015625, -0.27947998046875, 0.000244140625, 0.27996826171875, 0.5596923828125, 0.83941650390625, 1.119140625, 1.39886474609375, 1.6785888671875, 1.95831298828125, 2.238037109375, 2.51776123046875, 2.7974853515625, 3.07720947265625, 3.35693359375, 3.63665771484375, 3.9163818359375, 4.19610595703125, 4.475830078125, 4.75555419921875, 5.0352783203125, 5.31500244140625, 5.5947265625, 5.87445068359375, 6.1541748046875, 6.43389892578125, 6.713623046875, 6.99334716796875, 7.2730712890625, 7.55279541015625, 7.83251953125, 8.11224365234375, 8.3919677734375, 8.67169189453125, 8.951416015625, 9.23114013671875, 9.5108642578125, 9.79058837890625, 10.0703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 1.0, 8.0, 9.0, 15.0, 35.0, 42.0, 39.0, 77.0, 116.0, 244.0, 524.0, 1510.0, 6504.0, 92715.0, 907955.0, 32851.0, 3906.0, 1100.0, 410.0, 184.0, 119.0, 64.0, 48.0, 29.0, 21.0, 10.0, 8.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.6166839599609375, -0.595672607421875, -0.5746612548828125, -0.55364990234375, -0.5326385498046875, -0.511627197265625, -0.4906158447265625, -0.4696044921875, -0.4485931396484375, -0.427581787109375, -0.4065704345703125, -0.38555908203125, -0.3645477294921875, -0.343536376953125, -0.3225250244140625, -0.301513671875, -0.2805023193359375, -0.259490966796875, -0.2384796142578125, -0.21746826171875, -0.1964569091796875, -0.175445556640625, -0.1544342041015625, -0.1334228515625, -0.1124114990234375, -0.091400146484375, -0.0703887939453125, -0.04937744140625, -0.0283660888671875, -0.007354736328125, 0.0136566162109375, 0.03466796875, 0.0556793212890625, 0.076690673828125, 0.0977020263671875, 0.11871337890625, 0.1397247314453125, 0.160736083984375, 0.1817474365234375, 0.2027587890625, 0.2237701416015625, 0.244781494140625, 0.2657928466796875, 0.28680419921875, 0.3078155517578125, 0.328826904296875, 0.3498382568359375, 0.370849609375, 0.3918609619140625, 0.412872314453125, 0.4338836669921875, 0.45489501953125, 0.4759063720703125, 0.496917724609375, 0.5179290771484375, 0.5389404296875, 0.5599517822265625, 0.580963134765625, 0.6019744873046875, 0.62298583984375, 0.6439971923828125, 0.665008544921875, 0.6860198974609375, 0.70703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 9.0, 12.0, 15.0, 28.0, 17.0, 49.0, 67.0, 104.0, 158.0, 169.0, 133.0, 70.0, 45.0, 38.0, 27.0, 16.0, 8.0, 10.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.595518112182617e-05, -4.413537681102753e-05, -4.231557250022888e-05, -4.049576818943024e-05, -3.867596387863159e-05, -3.685615956783295e-05, -3.50363552570343e-05, -3.321655094623566e-05, -3.139674663543701e-05, -2.9576942324638367e-05, -2.775713801383972e-05, -2.5937333703041077e-05, -2.411752939224243e-05, -2.2297725081443787e-05, -2.047792077064514e-05, -1.8658116459846497e-05, -1.683831214904785e-05, -1.5018507838249207e-05, -1.3198703527450562e-05, -1.1378899216651917e-05, -9.559094905853271e-06, -7.739290595054626e-06, -5.9194862842559814e-06, -4.0996819734573364e-06, -2.2798776626586914e-06, -4.600733518600464e-07, 1.3597309589385986e-06, 3.1795352697372437e-06, 4.999339580535889e-06, 6.819143891334534e-06, 8.638948202133179e-06, 1.0458752512931824e-05, 1.2278556823730469e-05, 1.4098361134529114e-05, 1.591816544532776e-05, 1.7737969756126404e-05, 1.955777406692505e-05, 2.1377578377723694e-05, 2.319738268852234e-05, 2.5017186999320984e-05, 2.683699131011963e-05, 2.8656795620918274e-05, 3.047659993171692e-05, 3.2296404242515564e-05, 3.411620855331421e-05, 3.5936012864112854e-05, 3.77558171749115e-05, 3.9575621485710144e-05, 4.139542579650879e-05, 4.3215230107307434e-05, 4.503503441810608e-05, 4.6854838728904724e-05, 4.867464303970337e-05, 5.0494447350502014e-05, 5.231425166130066e-05, 5.4134055972099304e-05, 5.595386028289795e-05, 5.7773664593696594e-05, 5.959346890449524e-05, 6.141327321529388e-05, 6.323307752609253e-05, 6.505288183689117e-05, 6.687268614768982e-05, 6.869249045848846e-05, 7.051229476928711e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 13.0, 17.0, 14.0, 29.0, 38.0, 45.0, 82.0, 201.0, 447.0, 1742.0, 10270.0, 181548.0, 818256.0, 30852.0, 3626.0, 803.0, 285.0, 101.0, 59.0, 30.0, 20.0, 20.0, 17.0, 11.0, 4.0, 9.0, 3.0, 0.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.480712890625, -0.4623832702636719, -0.44405364990234375, -0.4257240295410156, -0.4073944091796875, -0.3890647888183594, -0.37073516845703125, -0.3524055480957031, -0.334075927734375, -0.3157463073730469, -0.29741668701171875, -0.2790870666503906, -0.2607574462890625, -0.24242782592773438, -0.22409820556640625, -0.20576858520507812, -0.18743896484375, -0.16910934448242188, -0.15077972412109375, -0.13245010375976562, -0.1141204833984375, -0.09579086303710938, -0.07746124267578125, -0.059131622314453125, -0.040802001953125, -0.022472381591796875, -0.00414276123046875, 0.014186859130859375, 0.0325164794921875, 0.050846099853515625, 0.06917572021484375, 0.08750534057617188, 0.1058349609375, 0.12416458129882812, 0.14249420166015625, 0.16082382202148438, 0.1791534423828125, 0.19748306274414062, 0.21581268310546875, 0.23414230346679688, 0.252471923828125, 0.2708015441894531, 0.28913116455078125, 0.3074607849121094, 0.3257904052734375, 0.3441200256347656, 0.36244964599609375, 0.3807792663574219, 0.39910888671875, 0.4174385070800781, 0.43576812744140625, 0.4540977478027344, 0.4724273681640625, 0.4907569885253906, 0.5090866088867188, 0.5274162292480469, 0.545745849609375, 0.5640754699707031, 0.5824050903320312, 0.6007347106933594, 0.6190643310546875, 0.6373939514160156, 0.6557235717773438, 0.6740531921386719, 0.6923828125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 9.0, 13.0, 19.0, 19.0, 23.0, 20.0, 37.0, 45.0, 69.0, 100.0, 137.0, 141.0, 91.0, 59.0, 43.0, 34.0, 27.0, 18.0, 23.0, 16.0, 10.0, 9.0, 9.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10498046875, -0.10107803344726562, -0.09717559814453125, -0.09327316284179688, -0.0893707275390625, -0.08546829223632812, -0.08156585693359375, -0.07766342163085938, -0.073760986328125, -0.06985855102539062, -0.06595611572265625, -0.062053680419921875, -0.0581512451171875, -0.054248809814453125, -0.05034637451171875, -0.046443939208984375, -0.04254150390625, -0.038639068603515625, -0.03473663330078125, -0.030834197998046875, -0.0269317626953125, -0.023029327392578125, -0.01912689208984375, -0.015224456787109375, -0.011322021484375, -0.007419586181640625, -0.00351715087890625, 0.000385284423828125, 0.0042877197265625, 0.008190155029296875, 0.01209259033203125, 0.015995025634765625, 0.0198974609375, 0.023799896240234375, 0.02770233154296875, 0.031604766845703125, 0.0355072021484375, 0.039409637451171875, 0.04331207275390625, 0.047214508056640625, 0.051116943359375, 0.055019378662109375, 0.05892181396484375, 0.06282424926757812, 0.0667266845703125, 0.07062911987304688, 0.07453155517578125, 0.07843399047851562, 0.08233642578125, 0.08623886108398438, 0.09014129638671875, 0.09404373168945312, 0.0979461669921875, 0.10184860229492188, 0.10575103759765625, 0.10965347290039062, 0.113555908203125, 0.11745834350585938, 0.12136077880859375, 0.12526321411132812, 0.1291656494140625, 0.13306808471679688, 0.13697052001953125, 0.14087295532226562, 0.144775390625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 255.0, 739.0, 22.0], "bins": [-82.84195709228516, -81.51062774658203, -80.1792984008789, -78.84796905517578, -77.51663970947266, -76.18531036376953, -74.8539810180664, -73.52265167236328, -72.19132232666016, -70.85999298095703, -69.5286636352539, -68.19733428955078, -66.86600494384766, -65.53467559814453, -64.2033462524414, -62.87201690673828, -61.54069137573242, -60.2093620300293, -58.87803268432617, -57.54670333862305, -56.21537399291992, -54.8840446472168, -53.55271530151367, -52.22138977050781, -50.89006042480469, -49.55873107910156, -48.22740173339844, -46.89607238769531, -45.56474304199219, -44.23341369628906, -42.90208435058594, -41.57075500488281, -40.23942947387695, -38.90810012817383, -37.5767707824707, -36.24544143676758, -34.91411209106445, -33.58278274536133, -32.2514533996582, -30.92012596130371, -29.588796615600586, -28.25746726989746, -26.926137924194336, -25.59480857849121, -24.26348114013672, -22.932151794433594, -21.60082244873047, -20.269493103027344, -18.93816375732422, -17.606834411621094, -16.27550506591797, -14.94417667388916, -13.612847328186035, -12.28151798248291, -10.950189590454102, -9.618860244750977, -8.287530899047852, -6.956201553344727, -5.62487268447876, -4.293543815612793, -2.962214469909668, -1.630885124206543, -0.29955625534057617, 1.0317726135253906, 2.3631019592285156]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 7.0, 6.0, 7.0, 8.0, 8.0, 9.0, 15.0, 15.0, 31.0, 29.0, 18.0, 33.0, 27.0, 23.0, 35.0, 36.0, 33.0, 32.0, 41.0, 36.0, 36.0, 42.0, 39.0, 41.0, 37.0, 38.0, 37.0, 33.0, 34.0, 30.0, 27.0, 36.0, 20.0, 23.0, 11.0, 17.0, 14.0, 9.0, 2.0, 4.0, 3.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.697251319885254, -12.286035537719727, -11.8748197555542, -11.463603973388672, -11.052389144897461, -10.641173362731934, -10.229957580566406, -9.818741798400879, -9.407526016235352, -8.996310234069824, -8.585094451904297, -8.173879623413086, -7.7626633644104, -7.351448059082031, -6.940232276916504, -6.529016494750977, -6.117801189422607, -5.70658540725708, -5.295370101928711, -4.884154319763184, -4.472938537597656, -4.061722755432129, -3.6505074501037598, -3.2392916679382324, -2.828076124191284, -2.416860580444336, -2.0056447982788086, -1.5944292545318604, -1.1832135915756226, -0.7719979286193848, -0.3607823848724365, 0.05043339729309082, 0.46164894104003906, 0.8728646039962769, 1.2840802669525146, 1.695295810699463, 2.1065115928649902, 2.5177271366119385, 2.9289426803588867, 3.340158462524414, 3.7513740062713623, 4.1625895500183105, 4.573805332183838, 4.985020637512207, 5.396236419677734, 5.807452201843262, 6.218667984008789, 6.629883766174316, 7.0410990715026855, 7.452314853668213, 7.863530158996582, 8.27474594116211, 8.685961723327637, 9.097177505493164, 9.508392333984375, 9.919609069824219, 10.33082389831543, 10.742039680480957, 11.153255462646484, 11.564470291137695, 11.975686073303223, 12.38690185546875, 12.798117637634277, 13.209333419799805, 13.620549201965332]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 3.0, 7.0, 5.0, 24.0, 18.0, 28.0, 31.0, 38.0, 48.0, 70.0, 116.0, 249.0, 940.0, 6163.0, 88824.0, 1813766.0, 2159990.0, 114777.0, 7349.0, 1154.0, 282.0, 112.0, 70.0, 42.0, 34.0, 23.0, 22.0, 19.0, 15.0, 20.0, 4.0, 6.0, 6.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.28515625, -4.166259765625, -4.04736328125, -3.928466796875, -3.8095703125, -3.690673828125, -3.57177734375, -3.452880859375, -3.333984375, -3.215087890625, -3.09619140625, -2.977294921875, -2.8583984375, -2.739501953125, -2.62060546875, -2.501708984375, -2.3828125, -2.263916015625, -2.14501953125, -2.026123046875, -1.9072265625, -1.788330078125, -1.66943359375, -1.550537109375, -1.431640625, -1.312744140625, -1.19384765625, -1.074951171875, -0.9560546875, -0.837158203125, -0.71826171875, -0.599365234375, -0.48046875, -0.361572265625, -0.24267578125, -0.123779296875, -0.0048828125, 0.114013671875, 0.23291015625, 0.351806640625, 0.470703125, 0.589599609375, 0.70849609375, 0.827392578125, 0.9462890625, 1.065185546875, 1.18408203125, 1.302978515625, 1.421875, 1.540771484375, 1.65966796875, 1.778564453125, 1.8974609375, 2.016357421875, 2.13525390625, 2.254150390625, 2.373046875, 2.491943359375, 2.61083984375, 2.729736328125, 2.8486328125, 2.967529296875, 3.08642578125, 3.205322265625, 3.32421875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 14.0, 12.0, 14.0, 14.0, 15.0, 33.0, 35.0, 36.0, 42.0, 38.0, 42.0, 55.0, 47.0, 44.0, 57.0, 48.0, 43.0, 50.0, 45.0, 34.0, 47.0, 31.0, 25.0, 33.0, 24.0, 25.0, 19.0, 13.0, 7.0, 10.0, 9.0, 3.0, 2.0, 6.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.767578125, -1.713775634765625, -1.65997314453125, -1.606170654296875, -1.5523681640625, -1.498565673828125, -1.44476318359375, -1.390960693359375, -1.337158203125, -1.283355712890625, -1.22955322265625, -1.175750732421875, -1.1219482421875, -1.068145751953125, -1.01434326171875, -0.960540771484375, -0.90673828125, -0.852935791015625, -0.79913330078125, -0.745330810546875, -0.6915283203125, -0.637725830078125, -0.58392333984375, -0.530120849609375, -0.476318359375, -0.422515869140625, -0.36871337890625, -0.314910888671875, -0.2611083984375, -0.207305908203125, -0.15350341796875, -0.099700927734375, -0.0458984375, 0.007904052734375, 0.06170654296875, 0.115509033203125, 0.1693115234375, 0.223114013671875, 0.27691650390625, 0.330718994140625, 0.384521484375, 0.438323974609375, 0.49212646484375, 0.545928955078125, 0.5997314453125, 0.653533935546875, 0.70733642578125, 0.761138916015625, 0.81494140625, 0.868743896484375, 0.92254638671875, 0.976348876953125, 1.0301513671875, 1.083953857421875, 1.13775634765625, 1.191558837890625, 1.245361328125, 1.299163818359375, 1.35296630859375, 1.406768798828125, 1.4605712890625, 1.514373779296875, 1.56817626953125, 1.621978759765625, 1.67578125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 4.0, 4.0, 8.0, 16.0, 16.0, 35.0, 134.0, 6988.0, 4186645.0, 260.0, 74.0, 22.0, 15.0, 10.0, 10.0, 10.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.1875, -75.16259765625, -73.1376953125, -71.11279296875, -69.087890625, -67.06298828125, -65.0380859375, -63.01318359375, -60.98828125, -58.96337890625, -56.9384765625, -54.91357421875, -52.888671875, -50.86376953125, -48.8388671875, -46.81396484375, -44.7890625, -42.76416015625, -40.7392578125, -38.71435546875, -36.689453125, -34.66455078125, -32.6396484375, -30.61474609375, -28.58984375, -26.56494140625, -24.5400390625, -22.51513671875, -20.490234375, -18.46533203125, -16.4404296875, -14.41552734375, -12.390625, -10.36572265625, -8.3408203125, -6.31591796875, -4.291015625, -2.26611328125, -0.2412109375, 1.78369140625, 3.80859375, 5.83349609375, 7.8583984375, 9.88330078125, 11.908203125, 13.93310546875, 15.9580078125, 17.98291015625, 20.0078125, 22.03271484375, 24.0576171875, 26.08251953125, 28.107421875, 30.13232421875, 32.1572265625, 34.18212890625, 36.20703125, 38.23193359375, 40.2568359375, 42.28173828125, 44.306640625, 46.33154296875, 48.3564453125, 50.38134765625, 52.40625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 12.0, 17.0, 21.0, 19.0, 37.0, 63.0, 91.0, 153.0, 236.0, 296.0, 470.0, 620.0, 599.0, 480.0, 296.0, 221.0, 144.0, 104.0, 49.0, 41.0, 31.0, 20.0, 16.0, 9.0, 6.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55126953125, -0.527191162109375, -0.50311279296875, -0.479034423828125, -0.4549560546875, -0.430877685546875, -0.40679931640625, -0.382720947265625, -0.358642578125, -0.334564208984375, -0.31048583984375, -0.286407470703125, -0.2623291015625, -0.238250732421875, -0.21417236328125, -0.190093994140625, -0.166015625, -0.141937255859375, -0.11785888671875, -0.093780517578125, -0.0697021484375, -0.045623779296875, -0.02154541015625, 0.002532958984375, 0.026611328125, 0.050689697265625, 0.07476806640625, 0.098846435546875, 0.1229248046875, 0.147003173828125, 0.17108154296875, 0.195159912109375, 0.21923828125, 0.243316650390625, 0.26739501953125, 0.291473388671875, 0.3155517578125, 0.339630126953125, 0.36370849609375, 0.387786865234375, 0.411865234375, 0.435943603515625, 0.46002197265625, 0.484100341796875, 0.5081787109375, 0.532257080078125, 0.55633544921875, 0.580413818359375, 0.6044921875, 0.628570556640625, 0.65264892578125, 0.676727294921875, 0.7008056640625, 0.724884033203125, 0.74896240234375, 0.773040771484375, 0.797119140625, 0.821197509765625, 0.84527587890625, 0.869354248046875, 0.8934326171875, 0.917510986328125, 0.94158935546875, 0.965667724609375, 0.98974609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 11.0, 20.0, 34.0, 81.0, 92.0, 180.0, 176.0, 155.0, 96.0, 68.0, 42.0, 23.0, 13.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.36844539642334, -6.221563339233398, -6.074681282043457, -5.927798748016357, -5.780916690826416, -5.634034633636475, -5.487152099609375, -5.340270042419434, -5.193387985229492, -5.046505928039551, -4.899623870849609, -4.75274133682251, -4.605859279632568, -4.458977222442627, -4.312094688415527, -4.165212631225586, -4.0183305740356445, -3.871448516845703, -3.7245662212371826, -3.577683925628662, -3.4308018684387207, -3.2839198112487793, -3.137037515640259, -2.9901552200317383, -2.843273162841797, -2.6963911056518555, -2.549508810043335, -2.4026265144348145, -2.255744457244873, -2.1088624000549316, -1.9619801044464111, -1.8150979280471802, -1.6682162284851074, -1.5213340520858765, -1.3744518756866455, -1.2275696992874146, -1.0806875228881836, -0.9338053464889526, -0.7869231700897217, -0.6400409936904907, -0.49315881729125977, -0.3462766408920288, -0.19939446449279785, -0.052512288093566895, 0.09436988830566406, 0.24125206470489502, 0.388134241104126, 0.5350164175033569, 0.6818985939025879, 0.8287807703018188, 0.9756629467010498, 1.1225451231002808, 1.2694272994995117, 1.4163094758987427, 1.5631916522979736, 1.7100738286972046, 1.8569560050964355, 2.003838062286377, 2.1507203578948975, 2.297602653503418, 2.4444847106933594, 2.591366767883301, 2.7382490634918213, 2.885131359100342, 3.032013416290283]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 11.0, 8.0, 12.0, 19.0, 9.0, 13.0, 23.0, 20.0, 22.0, 24.0, 26.0, 37.0, 37.0, 29.0, 31.0, 43.0, 48.0, 54.0, 35.0, 43.0, 45.0, 45.0, 39.0, 30.0, 34.0, 35.0, 34.0, 22.0, 16.0, 20.0, 23.0, 22.0, 15.0, 12.0, 12.0, 7.0, 10.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.6271095275878906, -1.5789276361465454, -1.5307457447052002, -1.482563853263855, -1.4343819618225098, -1.386200189590454, -1.3380181789398193, -1.2898364067077637, -1.2416545152664185, -1.1934726238250732, -1.145290732383728, -1.0971088409423828, -1.0489269495010376, -1.0007450580596924, -0.9525632262229919, -0.9043813943862915, -0.8561994433403015, -0.8080175518989563, -0.7598356604576111, -0.7116538286209106, -0.6634719371795654, -0.6152900457382202, -0.567108154296875, -0.5189262628555298, -0.47074440121650696, -0.42256250977516174, -0.3743806481361389, -0.3261987566947937, -0.2780168652534485, -0.22983500361442566, -0.18165311217308044, -0.13347125053405762, -0.0852893590927124, -0.03710747882723808, 0.011074401438236237, 0.059256285429000854, 0.10743816196918488, 0.1556200385093689, 0.2038019299507141, 0.25198379158973694, 0.30016568303108215, 0.34834757447242737, 0.3965294361114502, 0.4447113275527954, 0.4928932189941406, 0.5410751104354858, 0.589257001876831, 0.6374388337135315, 0.6856207251548767, 0.7338026165962219, 0.7819845080375671, 0.8301663398742676, 0.8783482313156128, 0.926530122756958, 0.9747120141983032, 1.0228939056396484, 1.0710757970809937, 1.1192576885223389, 1.167439579963684, 1.2156214714050293, 1.2638033628463745, 1.3119852542877197, 1.3601670265197754, 1.4083489179611206, 1.4565308094024658]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 16.0, 19.0, 39.0, 61.0, 111.0, 162.0, 232.0, 388.0, 552.0, 852.0, 1405.0, 2312.0, 3796.0, 7427.0, 14584.0, 32584.0, 77644.0, 177770.0, 304392.0, 231519.0, 106457.0, 44893.0, 19716.0, 9253.0, 4917.0, 2794.0, 1721.0, 1082.0, 660.0, 394.0, 257.0, 192.0, 111.0, 79.0, 51.0, 32.0, 24.0, 14.0, 12.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.63671875, -0.6183624267578125, -0.600006103515625, -0.5816497802734375, -0.56329345703125, -0.5449371337890625, -0.526580810546875, -0.5082244873046875, -0.4898681640625, -0.4715118408203125, -0.453155517578125, -0.4347991943359375, -0.41644287109375, -0.3980865478515625, -0.379730224609375, -0.3613739013671875, -0.343017578125, -0.3246612548828125, -0.306304931640625, -0.2879486083984375, -0.26959228515625, -0.2512359619140625, -0.232879638671875, -0.2145233154296875, -0.1961669921875, -0.1778106689453125, -0.159454345703125, -0.1410980224609375, -0.12274169921875, -0.1043853759765625, -0.086029052734375, -0.0676727294921875, -0.04931640625, -0.0309600830078125, -0.012603759765625, 0.0057525634765625, 0.02410888671875, 0.0424652099609375, 0.060821533203125, 0.0791778564453125, 0.0975341796875, 0.1158905029296875, 0.134246826171875, 0.1526031494140625, 0.17095947265625, 0.1893157958984375, 0.207672119140625, 0.2260284423828125, 0.244384765625, 0.2627410888671875, 0.281097412109375, 0.2994537353515625, 0.31781005859375, 0.3361663818359375, 0.354522705078125, 0.3728790283203125, 0.3912353515625, 0.4095916748046875, 0.427947998046875, 0.4463043212890625, 0.46466064453125, 0.4830169677734375, 0.501373291015625, 0.5197296142578125, 0.5380859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 4.0, 4.0, 11.0, 5.0, 7.0, 9.0, 14.0, 23.0, 27.0, 27.0, 29.0, 33.0, 38.0, 33.0, 48.0, 43.0, 37.0, 50.0, 53.0, 62.0, 47.0, 51.0, 41.0, 40.0, 33.0, 21.0, 24.0, 32.0, 23.0, 24.0, 21.0, 23.0, 12.0, 11.0, 14.0, 5.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99755859375, -0.9617233276367188, -0.9258880615234375, -0.8900527954101562, -0.854217529296875, -0.8183822631835938, -0.7825469970703125, -0.7467117309570312, -0.71087646484375, -0.6750411987304688, -0.6392059326171875, -0.6033706665039062, -0.567535400390625, -0.5317001342773438, -0.4958648681640625, -0.46002960205078125, -0.4241943359375, -0.38835906982421875, -0.3525238037109375, -0.31668853759765625, -0.280853271484375, -0.24501800537109375, -0.2091827392578125, -0.17334747314453125, -0.13751220703125, -0.10167694091796875, -0.0658416748046875, -0.03000640869140625, 0.005828857421875, 0.04166412353515625, 0.0774993896484375, 0.11333465576171875, 0.149169921875, 0.18500518798828125, 0.2208404541015625, 0.25667572021484375, 0.292510986328125, 0.32834625244140625, 0.3641815185546875, 0.40001678466796875, 0.43585205078125, 0.47168731689453125, 0.5075225830078125, 0.5433578491210938, 0.579193115234375, 0.6150283813476562, 0.6508636474609375, 0.6866989135742188, 0.7225341796875, 0.7583694458007812, 0.7942047119140625, 0.8300399780273438, 0.865875244140625, 0.9017105102539062, 0.9375457763671875, 0.9733810424804688, 1.00921630859375, 1.0450515747070312, 1.0808868408203125, 1.1167221069335938, 1.152557373046875, 1.1883926391601562, 1.2242279052734375, 1.2600631713867188, 1.2958984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 10.0, 6.0, 17.0, 20.0, 31.0, 38.0, 63.0, 89.0, 133.0, 219.0, 347.0, 649.0, 1148.0, 2473.0, 5946.0, 14993.0, 41968.0, 123265.0, 314465.0, 332316.0, 135350.0, 46240.0, 16458.0, 6457.0, 2829.0, 1317.0, 690.0, 350.0, 210.0, 148.0, 96.0, 52.0, 39.0, 28.0, 24.0, 15.0, 11.0, 15.0, 10.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7841796875, -0.7589187622070312, -0.7336578369140625, -0.7083969116210938, -0.683135986328125, -0.6578750610351562, -0.6326141357421875, -0.6073532104492188, -0.58209228515625, -0.5568313598632812, -0.5315704345703125, -0.5063095092773438, -0.481048583984375, -0.45578765869140625, -0.4305267333984375, -0.40526580810546875, -0.3800048828125, -0.35474395751953125, -0.3294830322265625, -0.30422210693359375, -0.278961181640625, -0.25370025634765625, -0.2284393310546875, -0.20317840576171875, -0.17791748046875, -0.15265655517578125, -0.1273956298828125, -0.10213470458984375, -0.076873779296875, -0.05161285400390625, -0.0263519287109375, -0.00109100341796875, 0.024169921875, 0.04943084716796875, 0.0746917724609375, 0.09995269775390625, 0.125213623046875, 0.15047454833984375, 0.1757354736328125, 0.20099639892578125, 0.22625732421875, 0.25151824951171875, 0.2767791748046875, 0.30204010009765625, 0.327301025390625, 0.35256195068359375, 0.3778228759765625, 0.40308380126953125, 0.4283447265625, 0.45360565185546875, 0.4788665771484375, 0.5041275024414062, 0.529388427734375, 0.5546493530273438, 0.5799102783203125, 0.6051712036132812, 0.63043212890625, 0.6556930541992188, 0.6809539794921875, 0.7062149047851562, 0.731475830078125, 0.7567367553710938, 0.7819976806640625, 0.8072586059570312, 0.83251953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 4.0, 6.0, 10.0, 8.0, 13.0, 15.0, 21.0, 27.0, 35.0, 35.0, 34.0, 40.0, 62.0, 60.0, 64.0, 52.0, 74.0, 58.0, 59.0, 69.0, 38.0, 40.0, 29.0, 35.0, 24.0, 20.0, 16.0, 11.0, 8.0, 8.0, 11.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4375, -2.353179931640625, -2.26885986328125, -2.184539794921875, -2.1002197265625, -2.015899658203125, -1.93157958984375, -1.847259521484375, -1.762939453125, -1.678619384765625, -1.59429931640625, -1.509979248046875, -1.4256591796875, -1.341339111328125, -1.25701904296875, -1.172698974609375, -1.08837890625, -1.004058837890625, -0.91973876953125, -0.835418701171875, -0.7510986328125, -0.666778564453125, -0.58245849609375, -0.498138427734375, -0.413818359375, -0.329498291015625, -0.24517822265625, -0.160858154296875, -0.0765380859375, 0.007781982421875, 0.09210205078125, 0.176422119140625, 0.2607421875, 0.345062255859375, 0.42938232421875, 0.513702392578125, 0.5980224609375, 0.682342529296875, 0.76666259765625, 0.850982666015625, 0.935302734375, 1.019622802734375, 1.10394287109375, 1.188262939453125, 1.2725830078125, 1.356903076171875, 1.44122314453125, 1.525543212890625, 1.60986328125, 1.694183349609375, 1.77850341796875, 1.862823486328125, 1.9471435546875, 2.031463623046875, 2.11578369140625, 2.200103759765625, 2.284423828125, 2.368743896484375, 2.45306396484375, 2.537384033203125, 2.6217041015625, 2.706024169921875, 2.79034423828125, 2.874664306640625, 2.958984375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 5.0, 18.0, 14.0, 25.0, 35.0, 100.0, 120.0, 206.0, 407.0, 955.0, 2055.0, 5649.0, 20990.0, 130160.0, 633284.0, 211929.0, 30213.0, 7669.0, 2577.0, 1041.0, 474.0, 266.0, 139.0, 82.0, 38.0, 38.0, 17.0, 15.0, 5.0, 8.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.436767578125, -0.42377471923828125, -0.4107818603515625, -0.39778900146484375, -0.384796142578125, -0.37180328369140625, -0.3588104248046875, -0.34581756591796875, -0.33282470703125, -0.31983184814453125, -0.3068389892578125, -0.29384613037109375, -0.280853271484375, -0.26786041259765625, -0.2548675537109375, -0.24187469482421875, -0.2288818359375, -0.21588897705078125, -0.2028961181640625, -0.18990325927734375, -0.176910400390625, -0.16391754150390625, -0.1509246826171875, -0.13793182373046875, -0.12493896484375, -0.11194610595703125, -0.0989532470703125, -0.08596038818359375, -0.072967529296875, -0.05997467041015625, -0.0469818115234375, -0.03398895263671875, -0.02099609375, -0.00800323486328125, 0.0049896240234375, 0.01798248291015625, 0.030975341796875, 0.04396820068359375, 0.0569610595703125, 0.06995391845703125, 0.08294677734375, 0.09593963623046875, 0.1089324951171875, 0.12192535400390625, 0.134918212890625, 0.14791107177734375, 0.1609039306640625, 0.17389678955078125, 0.1868896484375, 0.19988250732421875, 0.2128753662109375, 0.22586822509765625, 0.238861083984375, 0.25185394287109375, 0.2648468017578125, 0.27783966064453125, 0.29083251953125, 0.30382537841796875, 0.3168182373046875, 0.32981109619140625, 0.342803955078125, 0.35579681396484375, 0.3687896728515625, 0.38178253173828125, 0.394775390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 7.0, 3.0, 7.0, 7.0, 17.0, 16.0, 22.0, 49.0, 31.0, 60.0, 66.0, 69.0, 88.0, 114.0, 94.0, 79.0, 62.0, 43.0, 36.0, 25.0, 22.0, 22.0, 12.0, 9.0, 5.0, 5.0, 5.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.00016450881958007812, -0.00016052182763814926, -0.0001565348356962204, -0.00015254784375429153, -0.00014856085181236267, -0.0001445738598704338, -0.00014058686792850494, -0.00013659987598657608, -0.00013261288404464722, -0.00012862589210271835, -0.0001246389001607895, -0.00012065190821886063, -0.00011666491627693176, -0.0001126779243350029, -0.00010869093239307404, -0.00010470394045114517, -0.00010071694850921631, -9.672995656728745e-05, -9.274296462535858e-05, -8.875597268342972e-05, -8.476898074150085e-05, -8.078198879957199e-05, -7.679499685764313e-05, -7.280800491571426e-05, -6.88210129737854e-05, -6.483402103185654e-05, -6.084702908992767e-05, -5.686003714799881e-05, -5.2873045206069946e-05, -4.888605326414108e-05, -4.489906132221222e-05, -4.0912069380283356e-05, -3.692507743835449e-05, -3.293808549642563e-05, -2.8951093554496765e-05, -2.49641016125679e-05, -2.0977109670639038e-05, -1.6990117728710175e-05, -1.3003125786781311e-05, -9.016133844852448e-06, -5.029141902923584e-06, -1.0421499609947205e-06, 2.944841980934143e-06, 6.931833922863007e-06, 1.091882586479187e-05, 1.4905817806720734e-05, 1.8892809748649597e-05, 2.287980169057846e-05, 2.6866793632507324e-05, 3.085378557443619e-05, 3.484077751636505e-05, 3.8827769458293915e-05, 4.281476140022278e-05, 4.680175334215164e-05, 5.0788745284080505e-05, 5.477573722600937e-05, 5.876272916793823e-05, 6.27497211098671e-05, 6.673671305179596e-05, 7.072370499372482e-05, 7.471069693565369e-05, 7.869768887758255e-05, 8.268468081951141e-05, 8.667167276144028e-05, 9.065866470336914e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 5.0, 10.0, 9.0, 8.0, 10.0, 21.0, 25.0, 32.0, 49.0, 64.0, 103.0, 275.0, 570.0, 2220.0, 25364.0, 949885.0, 65091.0, 3404.0, 777.0, 252.0, 132.0, 88.0, 38.0, 29.0, 30.0, 13.0, 14.0, 8.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.990234375, -0.954376220703125, -0.91851806640625, -0.882659912109375, -0.8468017578125, -0.810943603515625, -0.77508544921875, -0.739227294921875, -0.703369140625, -0.667510986328125, -0.63165283203125, -0.595794677734375, -0.5599365234375, -0.524078369140625, -0.48822021484375, -0.452362060546875, -0.41650390625, -0.380645751953125, -0.34478759765625, -0.308929443359375, -0.2730712890625, -0.237213134765625, -0.20135498046875, -0.165496826171875, -0.129638671875, -0.093780517578125, -0.05792236328125, -0.022064208984375, 0.0137939453125, 0.049652099609375, 0.08551025390625, 0.121368408203125, 0.1572265625, 0.193084716796875, 0.22894287109375, 0.264801025390625, 0.3006591796875, 0.336517333984375, 0.37237548828125, 0.408233642578125, 0.444091796875, 0.479949951171875, 0.51580810546875, 0.551666259765625, 0.5875244140625, 0.623382568359375, 0.65924072265625, 0.695098876953125, 0.73095703125, 0.766815185546875, 0.80267333984375, 0.838531494140625, 0.8743896484375, 0.910247802734375, 0.94610595703125, 0.981964111328125, 1.017822265625, 1.053680419921875, 1.08953857421875, 1.125396728515625, 1.1612548828125, 1.197113037109375, 1.23297119140625, 1.268829345703125, 1.3046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 2.0, 0.0, 5.0, 3.0, 6.0, 14.0, 14.0, 23.0, 30.0, 37.0, 67.0, 98.0, 104.0, 141.0, 118.0, 99.0, 84.0, 52.0, 30.0, 23.0, 22.0, 9.0, 6.0, 5.0, 6.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1363525390625, -0.1317577362060547, -0.12716293334960938, -0.12256813049316406, -0.11797332763671875, -0.11337852478027344, -0.10878372192382812, -0.10418891906738281, -0.0995941162109375, -0.09499931335449219, -0.09040451049804688, -0.08580970764160156, -0.08121490478515625, -0.07662010192871094, -0.07202529907226562, -0.06743049621582031, -0.062835693359375, -0.05824089050292969, -0.053646087646484375, -0.04905128479003906, -0.04445648193359375, -0.03986167907714844, -0.035266876220703125, -0.030672073364257812, -0.0260772705078125, -0.021482467651367188, -0.016887664794921875, -0.012292861938476562, -0.00769805908203125, -0.0031032562255859375, 0.001491546630859375, 0.0060863494873046875, 0.01068115234375, 0.015275955200195312, 0.019870758056640625, 0.024465560913085938, 0.02906036376953125, 0.03365516662597656, 0.038249969482421875, 0.04284477233886719, 0.0474395751953125, 0.05203437805175781, 0.056629180908203125, 0.06122398376464844, 0.06581878662109375, 0.07041358947753906, 0.07500839233398438, 0.07960319519042969, 0.084197998046875, 0.08879280090332031, 0.09338760375976562, 0.09798240661621094, 0.10257720947265625, 0.10717201232910156, 0.11176681518554688, 0.11636161804199219, 0.1209564208984375, 0.1255512237548828, 0.13014602661132812, 0.13474082946777344, 0.13933563232421875, 0.14393043518066406, 0.14852523803710938, 0.1531200408935547, 0.15771484375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 5.0, 4.0, 9.0, 17.0, 28.0, 42.0, 61.0, 72.0, 119.0, 134.0, 119.0, 116.0, 102.0, 55.0, 33.0, 32.0, 24.0, 11.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9822492599487305, -1.9182709455490112, -1.854292631149292, -1.7903143167495728, -1.7263360023498535, -1.6623578071594238, -1.5983794927597046, -1.5344011783599854, -1.4704228639602661, -1.4064445495605469, -1.3424662351608276, -1.2784879207611084, -1.2145097255706787, -1.15053129196167, -1.0865530967712402, -1.022574782371521, -0.9585964679718018, -0.8946181535720825, -0.8306398391723633, -0.7666615843772888, -0.7026832699775696, -0.6387049555778503, -0.5747267007827759, -0.5107483863830566, -0.4467700719833374, -0.38279175758361816, -0.3188134729862213, -0.25483518838882446, -0.19085687398910522, -0.126878559589386, -0.06290027499198914, 0.0010780096054077148, 0.06505608558654785, 0.1290343850851059, 0.19301268458366394, 0.2569909691810608, 0.32096928358078003, 0.38494759798049927, 0.4489258825778961, 0.512904167175293, 0.5768824815750122, 0.6408607959747314, 0.7048391103744507, 0.7688173651695251, 0.8327956795692444, 0.8967739939689636, 0.9607522487640381, 1.0247305631637573, 1.0887088775634766, 1.1526871919631958, 1.216665506362915, 1.2806438207626343, 1.3446221351623535, 1.4086003303527832, 1.4725786447525024, 1.5365569591522217, 1.600535273551941, 1.6645135879516602, 1.7284919023513794, 1.7924702167510986, 1.8564484119415283, 1.920426845550537, 1.9844050407409668, 2.0483832359313965, 2.1123616695404053]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 2.0, 9.0, 18.0, 20.0, 16.0, 16.0, 20.0, 32.0, 35.0, 21.0, 35.0, 46.0, 47.0, 50.0, 50.0, 59.0, 57.0, 39.0, 56.0, 55.0, 32.0, 35.0, 35.0, 34.0, 23.0, 28.0, 27.0, 23.0, 13.0, 17.0, 12.0, 9.0, 8.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1759898662567139, -1.1387073993682861, -1.1014249324798584, -1.0641424655914307, -1.026859998703003, -0.98957759141922, -0.952295184135437, -0.9150127172470093, -0.8777302503585815, -0.8404477834701538, -0.8031653165817261, -0.7658829092979431, -0.7286004424095154, -0.6913179755210876, -0.6540355682373047, -0.616753101348877, -0.5794706344604492, -0.5421881675720215, -0.5049057006835938, -0.4676232933998108, -0.43034082651138306, -0.3930583596229553, -0.35577592253685, -0.31849348545074463, -0.2812110185623169, -0.24392856657505035, -0.2066461145877838, -0.16936366260051727, -0.13208121061325073, -0.09479875862598419, -0.05751630663871765, -0.020233869552612305, 0.01704871654510498, 0.05433116853237152, 0.09161362051963806, 0.1288960725069046, 0.16617852449417114, 0.20346097648143768, 0.24074342846870422, 0.27802586555480957, 0.3153083324432373, 0.35259079933166504, 0.3898732364177704, 0.42715567350387573, 0.46443814039230347, 0.5017206072807312, 0.5390030145645142, 0.5762854814529419, 0.6135679483413696, 0.6508504152297974, 0.6881328821182251, 0.7254152894020081, 0.7626977562904358, 0.7999802231788635, 0.8372626304626465, 0.8745450973510742, 0.911827564239502, 0.9491100311279297, 0.9863924980163574, 1.0236749649047852, 1.060957431793213, 1.098239779472351, 1.1355222463607788, 1.1728047132492065, 1.2100871801376343]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 7.0, 13.0, 16.0, 18.0, 28.0, 52.0, 77.0, 124.0, 202.0, 384.0, 726.0, 1361.0, 2875.0, 6326.0, 14451.0, 32629.0, 79518.0, 277237.0, 427895.0, 122237.0, 45929.0, 19843.0, 8807.0, 3956.0, 1862.0, 870.0, 451.0, 244.0, 139.0, 83.0, 73.0, 32.0, 25.0, 21.0, 15.0, 6.0, 4.0, 6.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82568359375, -0.79833984375, -0.77099609375, -0.74365234375, -0.71630859375, -0.68896484375, -0.66162109375, -0.63427734375, -0.60693359375, -0.57958984375, -0.55224609375, -0.52490234375, -0.49755859375, -0.47021484375, -0.44287109375, -0.41552734375, -0.38818359375, -0.36083984375, -0.33349609375, -0.30615234375, -0.27880859375, -0.25146484375, -0.22412109375, -0.19677734375, -0.16943359375, -0.14208984375, -0.11474609375, -0.08740234375, -0.06005859375, -0.03271484375, -0.00537109375, 0.02197265625, 0.04931640625, 0.07666015625, 0.10400390625, 0.13134765625, 0.15869140625, 0.18603515625, 0.21337890625, 0.24072265625, 0.26806640625, 0.29541015625, 0.32275390625, 0.35009765625, 0.37744140625, 0.40478515625, 0.43212890625, 0.45947265625, 0.48681640625, 0.51416015625, 0.54150390625, 0.56884765625, 0.59619140625, 0.62353515625, 0.65087890625, 0.67822265625, 0.70556640625, 0.73291015625, 0.76025390625, 0.78759765625, 0.81494140625, 0.84228515625, 0.86962890625, 0.89697265625, 0.92431640625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 10.0, 9.0, 7.0, 13.0, 15.0, 17.0, 24.0, 22.0, 22.0, 24.0, 25.0, 19.0, 28.0, 36.0, 39.0, 44.0, 42.0, 47.0, 39.0, 32.0, 34.0, 39.0, 36.0, 46.0, 42.0, 27.0, 32.0, 25.0, 31.0, 25.0, 17.0, 21.0, 25.0, 16.0, 9.0, 12.0, 10.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.306640625, -3.200286865234375, -3.09393310546875, -2.987579345703125, -2.8812255859375, -2.774871826171875, -2.66851806640625, -2.562164306640625, -2.455810546875, -2.349456787109375, -2.24310302734375, -2.136749267578125, -2.0303955078125, -1.924041748046875, -1.81768798828125, -1.711334228515625, -1.60498046875, -1.498626708984375, -1.39227294921875, -1.285919189453125, -1.1795654296875, -1.073211669921875, -0.96685791015625, -0.860504150390625, -0.754150390625, -0.647796630859375, -0.54144287109375, -0.435089111328125, -0.3287353515625, -0.222381591796875, -0.11602783203125, -0.009674072265625, 0.0966796875, 0.203033447265625, 0.30938720703125, 0.415740966796875, 0.5220947265625, 0.628448486328125, 0.73480224609375, 0.841156005859375, 0.947509765625, 1.053863525390625, 1.16021728515625, 1.266571044921875, 1.3729248046875, 1.479278564453125, 1.58563232421875, 1.691986083984375, 1.79833984375, 1.904693603515625, 2.01104736328125, 2.117401123046875, 2.2237548828125, 2.330108642578125, 2.43646240234375, 2.542816162109375, 2.649169921875, 2.755523681640625, 2.86187744140625, 2.968231201171875, 3.0745849609375, 3.180938720703125, 3.28729248046875, 3.393646240234375, 3.5]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 9.0, 10.0, 7.0, 16.0, 16.0, 26.0, 36.0, 48.0, 52.0, 61.0, 86.0, 193.0, 773.0, 1040413.0, 6058.0, 279.0, 129.0, 89.0, 77.0, 51.0, 34.0, 24.0, 16.0, 15.0, 10.0, 8.0, 9.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.78125, -18.2830810546875, -17.784912109375, -17.2867431640625, -16.78857421875, -16.2904052734375, -15.792236328125, -15.2940673828125, -14.7958984375, -14.2977294921875, -13.799560546875, -13.3013916015625, -12.80322265625, -12.3050537109375, -11.806884765625, -11.3087158203125, -10.810546875, -10.3123779296875, -9.814208984375, -9.3160400390625, -8.81787109375, -8.3197021484375, -7.821533203125, -7.3233642578125, -6.8251953125, -6.3270263671875, -5.828857421875, -5.3306884765625, -4.83251953125, -4.3343505859375, -3.836181640625, -3.3380126953125, -2.83984375, -2.3416748046875, -1.843505859375, -1.3453369140625, -0.84716796875, -0.3489990234375, 0.149169921875, 0.6473388671875, 1.1455078125, 1.6436767578125, 2.141845703125, 2.6400146484375, 3.13818359375, 3.6363525390625, 4.134521484375, 4.6326904296875, 5.130859375, 5.6290283203125, 6.127197265625, 6.6253662109375, 7.12353515625, 7.6217041015625, 8.119873046875, 8.6180419921875, 9.1162109375, 9.6143798828125, 10.112548828125, 10.6107177734375, 11.10888671875, 11.6070556640625, 12.105224609375, 12.6033935546875, 13.1015625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 10.0, 8.0, 7.0, 18.0, 15.0, 23.0, 34.0, 33.0, 44.0, 50.0, 53.0, 63.0, 61.0, 93.0, 68.0, 69.0, 69.0, 56.0, 58.0, 48.0, 30.0, 22.0, 16.0, 17.0, 10.0, 7.0, 10.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.51953125, -7.32012939453125, -7.1207275390625, -6.92132568359375, -6.721923828125, -6.52252197265625, -6.3231201171875, -6.12371826171875, -5.92431640625, -5.72491455078125, -5.5255126953125, -5.32611083984375, -5.126708984375, -4.92730712890625, -4.7279052734375, -4.52850341796875, -4.3291015625, -4.12969970703125, -3.9302978515625, -3.73089599609375, -3.531494140625, -3.33209228515625, -3.1326904296875, -2.93328857421875, -2.73388671875, -2.53448486328125, -2.3350830078125, -2.13568115234375, -1.936279296875, -1.73687744140625, -1.5374755859375, -1.33807373046875, -1.138671875, -0.93927001953125, -0.7398681640625, -0.54046630859375, -0.341064453125, -0.14166259765625, 0.0577392578125, 0.25714111328125, 0.45654296875, 0.65594482421875, 0.8553466796875, 1.05474853515625, 1.254150390625, 1.45355224609375, 1.6529541015625, 1.85235595703125, 2.0517578125, 2.25115966796875, 2.4505615234375, 2.64996337890625, 2.849365234375, 3.04876708984375, 3.2481689453125, 3.44757080078125, 3.64697265625, 3.84637451171875, 4.0457763671875, 4.24517822265625, 4.444580078125, 4.64398193359375, 4.8433837890625, 5.04278564453125, 5.2421875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 7.0, 8.0, 9.0, 15.0, 11.0, 17.0, 23.0, 38.0, 40.0, 89.0, 129.0, 313.0, 1367.0, 11140.0, 504673.0, 516947.0, 11554.0, 1458.0, 349.0, 115.0, 60.0, 47.0, 37.0, 28.0, 18.0, 12.0, 11.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0771484375, -1.0424041748046875, -1.007659912109375, -0.9729156494140625, -0.93817138671875, -0.9034271240234375, -0.868682861328125, -0.8339385986328125, -0.7991943359375, -0.7644500732421875, -0.729705810546875, -0.6949615478515625, -0.66021728515625, -0.6254730224609375, -0.590728759765625, -0.5559844970703125, -0.521240234375, -0.4864959716796875, -0.451751708984375, -0.4170074462890625, -0.38226318359375, -0.3475189208984375, -0.312774658203125, -0.2780303955078125, -0.2432861328125, -0.2085418701171875, -0.173797607421875, -0.1390533447265625, -0.10430908203125, -0.0695648193359375, -0.034820556640625, -7.62939453125e-05, 0.03466796875, 0.0694122314453125, 0.104156494140625, 0.1389007568359375, 0.17364501953125, 0.2083892822265625, 0.243133544921875, 0.2778778076171875, 0.3126220703125, 0.3473663330078125, 0.382110595703125, 0.4168548583984375, 0.45159912109375, 0.4863433837890625, 0.521087646484375, 0.5558319091796875, 0.590576171875, 0.6253204345703125, 0.660064697265625, 0.6948089599609375, 0.72955322265625, 0.7642974853515625, 0.799041748046875, 0.8337860107421875, 0.8685302734375, 0.9032745361328125, 0.938018798828125, 0.9727630615234375, 1.00750732421875, 1.0422515869140625, 1.076995849609375, 1.1117401123046875, 1.146484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 16.0, 14.0, 29.0, 37.0, 73.0, 81.0, 141.0, 186.0, 143.0, 78.0, 41.0, 38.0, 32.0, 19.0, 17.0, 6.0, 2.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.921457290649414e-05, -7.621478289365768e-05, -7.321499288082123e-05, -7.021520286798477e-05, -6.721541285514832e-05, -6.421562284231186e-05, -6.12158328294754e-05, -5.8216042816638947e-05, -5.521625280380249e-05, -5.2216462790966034e-05, -4.921667277812958e-05, -4.621688276529312e-05, -4.3217092752456665e-05, -4.021730273962021e-05, -3.721751272678375e-05, -3.4217722713947296e-05, -3.121793270111084e-05, -2.8218142688274384e-05, -2.5218352675437927e-05, -2.221856266260147e-05, -1.9218772649765015e-05, -1.621898263692856e-05, -1.3219192624092102e-05, -1.0219402611255646e-05, -7.2196125984191895e-06, -4.219822585582733e-06, -1.2200325727462769e-06, 1.7797574400901794e-06, 4.779547452926636e-06, 7.779337465763092e-06, 1.0779127478599548e-05, 1.3778917491436005e-05, 1.677870750427246e-05, 1.9778497517108917e-05, 2.2778287529945374e-05, 2.577807754278183e-05, 2.8777867555618286e-05, 3.177765756845474e-05, 3.47774475812912e-05, 3.7777237594127655e-05, 4.077702760696411e-05, 4.377681761980057e-05, 4.6776607632637024e-05, 4.977639764547348e-05, 5.2776187658309937e-05, 5.577597767114639e-05, 5.877576768398285e-05, 6.17755576968193e-05, 6.477534770965576e-05, 6.777513772249222e-05, 7.077492773532867e-05, 7.377471774816513e-05, 7.677450776100159e-05, 7.977429777383804e-05, 8.27740877866745e-05, 8.577387779951096e-05, 8.877366781234741e-05, 9.177345782518387e-05, 9.477324783802032e-05, 9.777303785085678e-05, 0.00010077282786369324, 0.0001037726178765297, 0.00010677240788936615, 0.0001097721979022026, 0.00011277198791503906]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 12.0, 10.0, 13.0, 18.0, 24.0, 31.0, 46.0, 93.0, 167.0, 445.0, 1883.0, 15786.0, 702911.0, 314505.0, 10332.0, 1509.0, 375.0, 150.0, 74.0, 44.0, 28.0, 18.0, 12.0, 5.0, 9.0, 5.0, 8.0, 3.0, 9.0, 3.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.22265625, -1.1886138916015625, -1.154571533203125, -1.1205291748046875, -1.08648681640625, -1.0524444580078125, -1.018402099609375, -0.9843597412109375, -0.9503173828125, -0.9162750244140625, -0.882232666015625, -0.8481903076171875, -0.81414794921875, -0.7801055908203125, -0.746063232421875, -0.7120208740234375, -0.677978515625, -0.6439361572265625, -0.609893798828125, -0.5758514404296875, -0.54180908203125, -0.5077667236328125, -0.473724365234375, -0.4396820068359375, -0.4056396484375, -0.3715972900390625, -0.337554931640625, -0.3035125732421875, -0.26947021484375, -0.2354278564453125, -0.201385498046875, -0.1673431396484375, -0.13330078125, -0.0992584228515625, -0.065216064453125, -0.0311737060546875, 0.00286865234375, 0.0369110107421875, 0.070953369140625, 0.1049957275390625, 0.1390380859375, 0.1730804443359375, 0.207122802734375, 0.2411651611328125, 0.27520751953125, 0.3092498779296875, 0.343292236328125, 0.3773345947265625, 0.411376953125, 0.4454193115234375, 0.479461669921875, 0.5135040283203125, 0.54754638671875, 0.5815887451171875, 0.615631103515625, 0.6496734619140625, 0.6837158203125, 0.7177581787109375, 0.751800537109375, 0.7858428955078125, 0.81988525390625, 0.8539276123046875, 0.887969970703125, 0.9220123291015625, 0.9560546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 8.0, 6.0, 8.0, 4.0, 5.0, 1.0, 9.0, 7.0, 11.0, 14.0, 19.0, 35.0, 37.0, 57.0, 67.0, 75.0, 110.0, 116.0, 96.0, 65.0, 45.0, 56.0, 34.0, 19.0, 27.0, 17.0, 8.0, 4.0, 5.0, 5.0, 7.0, 5.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.161865234375, -0.1571216583251953, -0.15237808227539062, -0.14763450622558594, -0.14289093017578125, -0.13814735412597656, -0.13340377807617188, -0.1286602020263672, -0.1239166259765625, -0.11917304992675781, -0.11442947387695312, -0.10968589782714844, -0.10494232177734375, -0.10019874572753906, -0.09545516967773438, -0.09071159362792969, -0.085968017578125, -0.08122444152832031, -0.07648086547851562, -0.07173728942871094, -0.06699371337890625, -0.06225013732910156, -0.057506561279296875, -0.05276298522949219, -0.0480194091796875, -0.04327583312988281, -0.038532257080078125, -0.03378868103027344, -0.02904510498046875, -0.024301528930664062, -0.019557952880859375, -0.014814376831054688, -0.01007080078125, -0.0053272247314453125, -0.000583648681640625, 0.0041599273681640625, 0.00890350341796875, 0.013647079467773438, 0.018390655517578125, 0.023134231567382812, 0.0278778076171875, 0.03262138366699219, 0.037364959716796875, 0.04210853576660156, 0.04685211181640625, 0.05159568786621094, 0.056339263916015625, 0.06108283996582031, 0.065826416015625, 0.07056999206542969, 0.07531356811523438, 0.08005714416503906, 0.08480072021484375, 0.08954429626464844, 0.09428787231445312, 0.09903144836425781, 0.1037750244140625, 0.10851860046386719, 0.11326217651367188, 0.11800575256347656, 0.12274932861328125, 0.12749290466308594, 0.13223648071289062, 0.1369800567626953, 0.1417236328125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 5.0, 30.0, 113.0, 322.0, 341.0, 141.0, 43.0, 13.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.34256935119629, -19.966489791870117, -19.590410232543945, -19.214330673217773, -18.8382511138916, -18.462173461914062, -18.08609390258789, -17.71001434326172, -17.333934783935547, -16.957855224609375, -16.581775665283203, -16.20569610595703, -15.829617500305176, -15.453537940979004, -15.077458381652832, -14.70137882232666, -14.325299263000488, -13.949219703674316, -13.573140144348145, -13.197061538696289, -12.820981979370117, -12.444902420043945, -12.068822860717773, -11.692743301391602, -11.31666374206543, -10.940584182739258, -10.564504623413086, -10.188425064086914, -9.812346458435059, -9.436266899108887, -9.060187339782715, -8.684107780456543, -8.308029174804688, -7.931949615478516, -7.555870532989502, -7.17979097366333, -6.803711891174316, -6.4276323318481445, -6.051552772521973, -5.675473213195801, -5.299394607543945, -4.923315048217773, -4.54723596572876, -4.171156406402588, -3.795077085494995, -3.4189977645874023, -3.0429182052612305, -2.6668388843536377, -2.290759325027466, -1.914680004119873, -1.5386005640029907, -1.1625211238861084, -0.7864418029785156, -0.41036248207092285, -0.03428292274475098, 0.3417963981628418, 0.7178757190704346, 1.0939550399780273, 1.4700344800949097, 1.846113920211792, 2.2221932411193848, 2.5982725620269775, 2.9743521213531494, 3.350431442260742, 3.726510763168335]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 4.0, 6.0, 9.0, 11.0, 6.0, 12.0, 12.0, 19.0, 16.0, 16.0, 17.0, 21.0, 28.0, 33.0, 29.0, 41.0, 44.0, 32.0, 36.0, 44.0, 26.0, 44.0, 56.0, 40.0, 43.0, 35.0, 42.0, 39.0, 30.0, 22.0, 30.0, 22.0, 23.0, 17.0, 23.0, 13.0, 11.0, 4.0, 9.0, 8.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.362370491027832, -5.197085857391357, -5.031801223754883, -4.86651611328125, -4.701231479644775, -4.535946846008301, -4.370662212371826, -4.205377578735352, -4.040092468261719, -3.874807834625244, -3.7095229625701904, -3.544238328933716, -3.378953456878662, -3.2136688232421875, -3.048384189605713, -2.8830995559692383, -2.7178149223327637, -2.552530288696289, -2.3872454166412354, -2.2219607830047607, -2.056675910949707, -1.8913912773132324, -1.7261066436767578, -1.5608218908309937, -1.3955371379852295, -1.2302523851394653, -1.0649676322937012, -0.8996829986572266, -0.7343982458114624, -0.5691134929656982, -0.40382879972457886, -0.23854410648345947, -0.07325983047485352, 0.09202489256858826, 0.25730961561203003, 0.4225943386554718, 0.5878790616989136, 0.7531638145446777, 0.9184485077857971, 1.0837332010269165, 1.2490179538726807, 1.4143027067184448, 1.579587459564209, 1.7448720932006836, 1.9101568460464478, 2.075441598892212, 2.2407262325286865, 2.4060111045837402, 2.571295738220215, 2.7365803718566895, 2.901865243911743, 3.0671498775482178, 3.2324347496032715, 3.397719383239746, 3.5630040168762207, 3.7282886505126953, 3.893573522567749, 4.058858394622803, 4.224143028259277, 4.389427661895752, 4.554712295532227, 4.719997406005859, 4.885282039642334, 5.050566673278809, 5.215851306915283]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 2.0, 3.0, 3.0, 6.0, 10.0, 12.0, 12.0, 9.0, 11.0, 21.0, 12.0, 22.0, 26.0, 27.0, 33.0, 34.0, 46.0, 85.0, 152.0, 309.0, 949.0, 4164.0, 29239.0, 485510.0, 2824249.0, 791599.0, 50141.0, 5556.0, 1206.0, 344.0, 160.0, 75.0, 44.0, 38.0, 22.0, 23.0, 20.0, 19.0, 10.0, 14.0, 8.0, 18.0, 13.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.119140625, -3.0234375, -2.927734375, -2.83203125, -2.736328125, -2.640625, -2.544921875, -2.44921875, -2.353515625, -2.2578125, -2.162109375, -2.06640625, -1.970703125, -1.875, -1.779296875, -1.68359375, -1.587890625, -1.4921875, -1.396484375, -1.30078125, -1.205078125, -1.109375, -1.013671875, -0.91796875, -0.822265625, -0.7265625, -0.630859375, -0.53515625, -0.439453125, -0.34375, -0.248046875, -0.15234375, -0.056640625, 0.0390625, 0.134765625, 0.23046875, 0.326171875, 0.421875, 0.517578125, 0.61328125, 0.708984375, 0.8046875, 0.900390625, 0.99609375, 1.091796875, 1.1875, 1.283203125, 1.37890625, 1.474609375, 1.5703125, 1.666015625, 1.76171875, 1.857421875, 1.953125, 2.048828125, 2.14453125, 2.240234375, 2.3359375, 2.431640625, 2.52734375, 2.623046875, 2.71875, 2.814453125, 2.91015625, 3.005859375]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 6.0, 10.0, 14.0, 11.0, 20.0, 20.0, 24.0, 24.0, 29.0, 41.0, 46.0, 35.0, 44.0, 45.0, 57.0, 47.0, 40.0, 52.0, 50.0, 51.0, 28.0, 37.0, 37.0, 42.0, 31.0, 20.0, 26.0, 22.0, 14.0, 11.0, 15.0, 8.0, 7.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2978515625, -1.2531890869140625, -1.208526611328125, -1.1638641357421875, -1.11920166015625, -1.0745391845703125, -1.029876708984375, -0.9852142333984375, -0.9405517578125, -0.8958892822265625, -0.851226806640625, -0.8065643310546875, -0.76190185546875, -0.7172393798828125, -0.672576904296875, -0.6279144287109375, -0.583251953125, -0.5385894775390625, -0.493927001953125, -0.4492645263671875, -0.40460205078125, -0.3599395751953125, -0.315277099609375, -0.2706146240234375, -0.2259521484375, -0.1812896728515625, -0.136627197265625, -0.0919647216796875, -0.04730224609375, -0.0026397705078125, 0.042022705078125, 0.0866851806640625, 0.13134765625, 0.1760101318359375, 0.220672607421875, 0.2653350830078125, 0.30999755859375, 0.3546600341796875, 0.399322509765625, 0.4439849853515625, 0.4886474609375, 0.5333099365234375, 0.577972412109375, 0.6226348876953125, 0.66729736328125, 0.7119598388671875, 0.756622314453125, 0.8012847900390625, 0.845947265625, 0.8906097412109375, 0.935272216796875, 0.9799346923828125, 1.02459716796875, 1.0692596435546875, 1.113922119140625, 1.1585845947265625, 1.2032470703125, 1.2479095458984375, 1.292572021484375, 1.3372344970703125, 1.38189697265625, 1.4265594482421875, 1.471221923828125, 1.5158843994140625, 1.560546875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 4.0, 9.0, 10.0, 17.0, 23.0, 26.0, 55.0, 67.0, 118.0, 170.0, 277.0, 468.0, 1491.0, 179840.0, 4006209.0, 3962.0, 621.0, 329.0, 176.0, 108.0, 105.0, 60.0, 36.0, 24.0, 23.0, 17.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.46875, -11.1231689453125, -10.777587890625, -10.4320068359375, -10.08642578125, -9.7408447265625, -9.395263671875, -9.0496826171875, -8.7041015625, -8.3585205078125, -8.012939453125, -7.6673583984375, -7.32177734375, -6.9761962890625, -6.630615234375, -6.2850341796875, -5.939453125, -5.5938720703125, -5.248291015625, -4.9027099609375, -4.55712890625, -4.2115478515625, -3.865966796875, -3.5203857421875, -3.1748046875, -2.8292236328125, -2.483642578125, -2.1380615234375, -1.79248046875, -1.4468994140625, -1.101318359375, -0.7557373046875, -0.41015625, -0.0645751953125, 0.281005859375, 0.6265869140625, 0.97216796875, 1.3177490234375, 1.663330078125, 2.0089111328125, 2.3544921875, 2.7000732421875, 3.045654296875, 3.3912353515625, 3.73681640625, 4.0823974609375, 4.427978515625, 4.7735595703125, 5.119140625, 5.4647216796875, 5.810302734375, 6.1558837890625, 6.50146484375, 6.8470458984375, 7.192626953125, 7.5382080078125, 7.8837890625, 8.2293701171875, 8.574951171875, 8.9205322265625, 9.26611328125, 9.6116943359375, 9.957275390625, 10.3028564453125, 10.6484375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 11.0, 15.0, 16.0, 27.0, 34.0, 40.0, 55.0, 75.0, 93.0, 132.0, 243.0, 286.0, 403.0, 475.0, 498.0, 408.0, 341.0, 251.0, 194.0, 123.0, 78.0, 50.0, 56.0, 36.0, 19.0, 21.0, 25.0, 13.0, 7.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.69091796875, -0.6723518371582031, -0.6537857055664062, -0.6352195739746094, -0.6166534423828125, -0.5980873107910156, -0.5795211791992188, -0.5609550476074219, -0.542388916015625, -0.5238227844238281, -0.5052566528320312, -0.4866905212402344, -0.4681243896484375, -0.4495582580566406, -0.43099212646484375, -0.4124259948730469, -0.39385986328125, -0.3752937316894531, -0.35672760009765625, -0.3381614685058594, -0.3195953369140625, -0.3010292053222656, -0.28246307373046875, -0.2638969421386719, -0.245330810546875, -0.22676467895507812, -0.20819854736328125, -0.18963241577148438, -0.1710662841796875, -0.15250015258789062, -0.13393402099609375, -0.11536788940429688, -0.0968017578125, -0.07823562622070312, -0.05966949462890625, -0.041103363037109375, -0.0225372314453125, -0.003971099853515625, 0.01459503173828125, 0.033161163330078125, 0.051727294921875, 0.07029342651367188, 0.08885955810546875, 0.10742568969726562, 0.1259918212890625, 0.14455795288085938, 0.16312408447265625, 0.18169021606445312, 0.20025634765625, 0.21882247924804688, 0.23738861083984375, 0.2559547424316406, 0.2745208740234375, 0.2930870056152344, 0.31165313720703125, 0.3302192687988281, 0.348785400390625, 0.3673515319824219, 0.38591766357421875, 0.4044837951660156, 0.4230499267578125, 0.4416160583496094, 0.46018218994140625, 0.4787483215332031, 0.497314453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 8.0, 6.0, 17.0, 32.0, 48.0, 96.0, 108.0, 109.0, 147.0, 128.0, 94.0, 77.0, 47.0, 37.0, 23.0, 11.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.035017967224121, -3.9271116256713867, -3.8192055225372314, -3.711299419403076, -3.603393077850342, -3.4954867362976074, -3.387580633163452, -3.279674530029297, -3.1717681884765625, -3.063861846923828, -2.955955743789673, -2.8480496406555176, -2.740143299102783, -2.632236957550049, -2.5243308544158936, -2.4164247512817383, -2.308518409729004, -2.2006120681762695, -2.0927059650421143, -1.9847997426986694, -1.8768935203552246, -1.7689872980117798, -1.661081075668335, -1.5531748533248901, -1.4452686309814453, -1.3373624086380005, -1.2294561862945557, -1.1215499639511108, -1.013643741607666, -0.9057375192642212, -0.7978312969207764, -0.6899250745773315, -0.5820190906524658, -0.474112868309021, -0.36620664596557617, -0.25830042362213135, -0.15039420127868652, -0.0424879789352417, 0.06541824340820312, 0.17332446575164795, 0.2812306880950928, 0.3891369104385376, 0.4970431327819824, 0.6049493551254272, 0.7128555774688721, 0.8207617998123169, 0.9286680221557617, 1.0365742444992065, 1.1444804668426514, 1.2523866891860962, 1.360292911529541, 1.4681991338729858, 1.5761053562164307, 1.6840115785598755, 1.7919178009033203, 1.8998240232467651, 2.00773024559021, 2.1156363487243652, 2.2235426902770996, 2.331449031829834, 2.4393551349639893, 2.5472612380981445, 2.655167579650879, 2.7630739212036133, 2.8709800243377686]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 8.0, 9.0, 4.0, 12.0, 16.0, 7.0, 17.0, 20.0, 14.0, 20.0, 27.0, 31.0, 34.0, 40.0, 40.0, 34.0, 55.0, 46.0, 36.0, 47.0, 39.0, 31.0, 43.0, 35.0, 37.0, 31.0, 41.0, 29.0, 26.0, 26.0, 26.0, 19.0, 13.0, 16.0, 15.0, 10.0, 9.0, 5.0, 6.0, 3.0, 8.0, 3.0, 0.0, 2.0, 3.0, 3.0], "bins": [-1.569925308227539, -1.5279452800750732, -1.485965371131897, -1.4439853429794312, -1.4020054340362549, -1.360025405883789, -1.3180453777313232, -1.2760653495788574, -1.2340854406356812, -1.1921054124832153, -1.150125503540039, -1.1081454753875732, -1.0661654472351074, -1.0241855382919312, -0.9822055101394653, -0.9402255415916443, -0.8982455730438232, -0.8562656044960022, -0.8142856359481812, -0.7723056077957153, -0.7303256392478943, -0.6883456707000732, -0.6463656425476074, -0.6043856739997864, -0.5624057054519653, -0.5204257369041443, -0.47844573855400085, -0.4364657402038574, -0.3944857716560364, -0.35250580310821533, -0.3105258047580719, -0.26854580640792847, -0.22656595706939697, -0.18458597362041473, -0.1426059901714325, -0.10062600672245026, -0.05864602327346802, -0.01666603982448578, 0.02531394362449646, 0.06729394197463989, 0.10927391052246094, 0.15125389397144318, 0.19323387742042542, 0.23521386086940765, 0.2771938443183899, 0.31917381286621094, 0.36115381121635437, 0.4031338095664978, 0.44511377811431885, 0.4870937466621399, 0.5290737152099609, 0.5710537433624268, 0.6130337119102478, 0.6550136804580688, 0.6969937086105347, 0.7389736771583557, 0.7809536457061768, 0.8229336142539978, 0.8649135828018188, 0.9068936109542847, 0.9488735795021057, 0.9908535480499268, 1.0328335762023926, 1.0748136043548584, 1.1167935132980347]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 7.0, 19.0, 13.0, 31.0, 37.0, 65.0, 86.0, 168.0, 269.0, 563.0, 1151.0, 2755.0, 7836.0, 24588.0, 80604.0, 242409.0, 381412.0, 207698.0, 67246.0, 20421.0, 6598.0, 2449.0, 1024.0, 430.0, 250.0, 161.0, 77.0, 50.0, 33.0, 32.0, 18.0, 10.0, 15.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7861328125, -0.7639389038085938, -0.7417449951171875, -0.7195510864257812, -0.697357177734375, -0.6751632690429688, -0.6529693603515625, -0.6307754516601562, -0.60858154296875, -0.5863876342773438, -0.5641937255859375, -0.5419998168945312, -0.519805908203125, -0.49761199951171875, -0.4754180908203125, -0.45322418212890625, -0.4310302734375, -0.40883636474609375, -0.3866424560546875, -0.36444854736328125, -0.342254638671875, -0.32006072998046875, -0.2978668212890625, -0.27567291259765625, -0.25347900390625, -0.23128509521484375, -0.2090911865234375, -0.18689727783203125, -0.164703369140625, -0.14250946044921875, -0.1203155517578125, -0.09812164306640625, -0.075927734375, -0.05373382568359375, -0.0315399169921875, -0.00934600830078125, 0.012847900390625, 0.03504180908203125, 0.0572357177734375, 0.07942962646484375, 0.10162353515625, 0.12381744384765625, 0.1460113525390625, 0.16820526123046875, 0.190399169921875, 0.21259307861328125, 0.2347869873046875, 0.25698089599609375, 0.2791748046875, 0.30136871337890625, 0.3235626220703125, 0.34575653076171875, 0.367950439453125, 0.39014434814453125, 0.4123382568359375, 0.43453216552734375, 0.45672607421875, 0.47891998291015625, 0.5011138916015625, 0.5233078002929688, 0.545501708984375, 0.5676956176757812, 0.5898895263671875, 0.6120834350585938, 0.63427734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 8.0, 2.0, 5.0, 8.0, 7.0, 14.0, 17.0, 21.0, 14.0, 21.0, 26.0, 33.0, 47.0, 41.0, 47.0, 56.0, 63.0, 38.0, 41.0, 54.0, 44.0, 42.0, 35.0, 43.0, 41.0, 36.0, 30.0, 26.0, 27.0, 19.0, 18.0, 17.0, 12.0, 11.0, 11.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.013671875, -0.9859085083007812, -0.9581451416015625, -0.9303817749023438, -0.902618408203125, -0.8748550415039062, -0.8470916748046875, -0.8193283081054688, -0.79156494140625, -0.7638015747070312, -0.7360382080078125, -0.7082748413085938, -0.680511474609375, -0.6527481079101562, -0.6249847412109375, -0.5972213745117188, -0.5694580078125, -0.5416946411132812, -0.5139312744140625, -0.48616790771484375, -0.458404541015625, -0.43064117431640625, -0.4028778076171875, -0.37511444091796875, -0.34735107421875, -0.31958770751953125, -0.2918243408203125, -0.26406097412109375, -0.236297607421875, -0.20853424072265625, -0.1807708740234375, -0.15300750732421875, -0.125244140625, -0.09748077392578125, -0.0697174072265625, -0.04195404052734375, -0.014190673828125, 0.01357269287109375, 0.0413360595703125, 0.06909942626953125, 0.09686279296875, 0.12462615966796875, 0.1523895263671875, 0.18015289306640625, 0.207916259765625, 0.23567962646484375, 0.2634429931640625, 0.29120635986328125, 0.3189697265625, 0.34673309326171875, 0.3744964599609375, 0.40225982666015625, 0.430023193359375, 0.45778656005859375, 0.4855499267578125, 0.5133132934570312, 0.54107666015625, 0.5688400268554688, 0.5966033935546875, 0.6243667602539062, 0.652130126953125, 0.6798934936523438, 0.7076568603515625, 0.7354202270507812, 0.76318359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 8.0, 13.0, 15.0, 14.0, 29.0, 31.0, 52.0, 72.0, 96.0, 173.0, 265.0, 460.0, 1003.0, 2153.0, 5183.0, 14365.0, 43989.0, 138464.0, 319191.0, 318180.0, 137338.0, 43961.0, 14123.0, 4998.0, 2134.0, 984.0, 477.0, 275.0, 167.0, 115.0, 78.0, 48.0, 27.0, 25.0, 15.0, 10.0, 7.0, 9.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.7490234375, -0.72930908203125, -0.7095947265625, -0.68988037109375, -0.670166015625, -0.65045166015625, -0.6307373046875, -0.61102294921875, -0.59130859375, -0.57159423828125, -0.5518798828125, -0.53216552734375, -0.512451171875, -0.49273681640625, -0.4730224609375, -0.45330810546875, -0.43359375, -0.41387939453125, -0.3941650390625, -0.37445068359375, -0.354736328125, -0.33502197265625, -0.3153076171875, -0.29559326171875, -0.27587890625, -0.25616455078125, -0.2364501953125, -0.21673583984375, -0.197021484375, -0.17730712890625, -0.1575927734375, -0.13787841796875, -0.1181640625, -0.09844970703125, -0.0787353515625, -0.05902099609375, -0.039306640625, -0.01959228515625, 0.0001220703125, 0.01983642578125, 0.03955078125, 0.05926513671875, 0.0789794921875, 0.09869384765625, 0.118408203125, 0.13812255859375, 0.1578369140625, 0.17755126953125, 0.197265625, 0.21697998046875, 0.2366943359375, 0.25640869140625, 0.276123046875, 0.29583740234375, 0.3155517578125, 0.33526611328125, 0.35498046875, 0.37469482421875, 0.3944091796875, 0.41412353515625, 0.433837890625, 0.45355224609375, 0.4732666015625, 0.49298095703125, 0.5126953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 8.0, 8.0, 8.0, 21.0, 25.0, 41.0, 28.0, 55.0, 37.0, 49.0, 62.0, 81.0, 52.0, 72.0, 79.0, 69.0, 68.0, 46.0, 38.0, 31.0, 30.0, 21.0, 23.0, 7.0, 14.0, 9.0, 5.0, 2.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9189453125, -1.8480682373046875, -1.777191162109375, -1.7063140869140625, -1.63543701171875, -1.5645599365234375, -1.493682861328125, -1.4228057861328125, -1.3519287109375, -1.2810516357421875, -1.210174560546875, -1.1392974853515625, -1.06842041015625, -0.9975433349609375, -0.926666259765625, -0.8557891845703125, -0.784912109375, -0.7140350341796875, -0.643157958984375, -0.5722808837890625, -0.50140380859375, -0.4305267333984375, -0.359649658203125, -0.2887725830078125, -0.2178955078125, -0.1470184326171875, -0.076141357421875, -0.0052642822265625, 0.06561279296875, 0.1364898681640625, 0.207366943359375, 0.2782440185546875, 0.34912109375, 0.4199981689453125, 0.490875244140625, 0.5617523193359375, 0.63262939453125, 0.7035064697265625, 0.774383544921875, 0.8452606201171875, 0.9161376953125, 0.9870147705078125, 1.057891845703125, 1.1287689208984375, 1.19964599609375, 1.2705230712890625, 1.341400146484375, 1.4122772216796875, 1.483154296875, 1.5540313720703125, 1.624908447265625, 1.6957855224609375, 1.76666259765625, 1.8375396728515625, 1.908416748046875, 1.9792938232421875, 2.0501708984375, 2.1210479736328125, 2.191925048828125, 2.2628021240234375, 2.33367919921875, 2.4045562744140625, 2.475433349609375, 2.5463104248046875, 2.6171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 8.0, 3.0, 10.0, 14.0, 20.0, 32.0, 38.0, 60.0, 77.0, 129.0, 174.0, 281.0, 542.0, 907.0, 1872.0, 3705.0, 8324.0, 20843.0, 64162.0, 215219.0, 414478.0, 216262.0, 64113.0, 21084.0, 8274.0, 3734.0, 1845.0, 974.0, 526.0, 286.0, 188.0, 108.0, 87.0, 63.0, 31.0, 25.0, 17.0, 13.0, 7.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2337646484375, -0.22657203674316406, -0.21937942504882812, -0.2121868133544922, -0.20499420166015625, -0.1978015899658203, -0.19060897827148438, -0.18341636657714844, -0.1762237548828125, -0.16903114318847656, -0.16183853149414062, -0.1546459197998047, -0.14745330810546875, -0.1402606964111328, -0.13306808471679688, -0.12587547302246094, -0.118682861328125, -0.11149024963378906, -0.10429763793945312, -0.09710502624511719, -0.08991241455078125, -0.08271980285644531, -0.07552719116210938, -0.06833457946777344, -0.0611419677734375, -0.05394935607910156, -0.046756744384765625, -0.03956413269042969, -0.03237152099609375, -0.025178909301757812, -0.017986297607421875, -0.010793685913085938, -0.00360107421875, 0.0035915374755859375, 0.010784149169921875, 0.017976760864257812, 0.02516937255859375, 0.03236198425292969, 0.039554595947265625, 0.04674720764160156, 0.0539398193359375, 0.06113243103027344, 0.06832504272460938, 0.07551765441894531, 0.08271026611328125, 0.08990287780761719, 0.09709548950195312, 0.10428810119628906, 0.111480712890625, 0.11867332458496094, 0.12586593627929688, 0.1330585479736328, 0.14025115966796875, 0.1474437713623047, 0.15463638305664062, 0.16182899475097656, 0.1690216064453125, 0.17621421813964844, 0.18340682983398438, 0.1905994415283203, 0.19779205322265625, 0.2049846649169922, 0.21217727661132812, 0.21936988830566406, 0.2265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 10.0, 7.0, 15.0, 24.0, 31.0, 87.0, 74.0, 107.0, 135.0, 121.0, 133.0, 94.0, 67.0, 28.0, 22.0, 14.0, 12.0, 6.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002570152282714844, -0.00025132112205028534, -0.0002456270158290863, -0.00023993290960788727, -0.00023423880338668823, -0.0002285446971654892, -0.00022285059094429016, -0.00021715648472309113, -0.0002114623785018921, -0.00020576827228069305, -0.00020007416605949402, -0.00019438005983829498, -0.00018868595361709595, -0.0001829918473958969, -0.00017729774117469788, -0.00017160363495349884, -0.0001659095287322998, -0.00016021542251110077, -0.00015452131628990173, -0.0001488272100687027, -0.00014313310384750366, -0.00013743899762630463, -0.0001317448914051056, -0.00012605078518390656, -0.00012035667896270752, -0.00011466257274150848, -0.00010896846652030945, -0.00010327436029911041, -9.758025407791138e-05, -9.188614785671234e-05, -8.61920416355133e-05, -8.049793541431427e-05, -7.480382919311523e-05, -6.91097229719162e-05, -6.341561675071716e-05, -5.772151052951813e-05, -5.202740430831909e-05, -4.6333298087120056e-05, -4.063919186592102e-05, -3.4945085644721985e-05, -2.925097942352295e-05, -2.3556873202323914e-05, -1.7862766981124878e-05, -1.2168660759925842e-05, -6.474554538726807e-06, -7.80448317527771e-07, 4.913657903671265e-06, 1.06077641248703e-05, 1.6301870346069336e-05, 2.199597656726837e-05, 2.7690082788467407e-05, 3.338418900966644e-05, 3.907829523086548e-05, 4.4772401452064514e-05, 5.046650767326355e-05, 5.6160613894462585e-05, 6.185472011566162e-05, 6.754882633686066e-05, 7.324293255805969e-05, 7.893703877925873e-05, 8.463114500045776e-05, 9.03252512216568e-05, 9.601935744285583e-05, 0.00010171346366405487, 0.0001074075698852539]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 1.0, 6.0, 1.0, 6.0, 9.0, 22.0, 28.0, 30.0, 37.0, 65.0, 125.0, 184.0, 393.0, 990.0, 3313.0, 17108.0, 176050.0, 711297.0, 121323.0, 13258.0, 2702.0, 840.0, 339.0, 155.0, 83.0, 57.0, 38.0, 20.0, 18.0, 13.0, 10.0, 7.0, 5.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5029296875, -0.487884521484375, -0.47283935546875, -0.457794189453125, -0.4427490234375, -0.427703857421875, -0.41265869140625, -0.397613525390625, -0.382568359375, -0.367523193359375, -0.35247802734375, -0.337432861328125, -0.3223876953125, -0.307342529296875, -0.29229736328125, -0.277252197265625, -0.26220703125, -0.247161865234375, -0.23211669921875, -0.217071533203125, -0.2020263671875, -0.186981201171875, -0.17193603515625, -0.156890869140625, -0.141845703125, -0.126800537109375, -0.11175537109375, -0.096710205078125, -0.0816650390625, -0.066619873046875, -0.05157470703125, -0.036529541015625, -0.021484375, -0.006439208984375, 0.00860595703125, 0.023651123046875, 0.0386962890625, 0.053741455078125, 0.06878662109375, 0.083831787109375, 0.098876953125, 0.113922119140625, 0.12896728515625, 0.144012451171875, 0.1590576171875, 0.174102783203125, 0.18914794921875, 0.204193115234375, 0.21923828125, 0.234283447265625, 0.24932861328125, 0.264373779296875, 0.2794189453125, 0.294464111328125, 0.30950927734375, 0.324554443359375, 0.339599609375, 0.354644775390625, 0.36968994140625, 0.384735107421875, 0.3997802734375, 0.414825439453125, 0.42987060546875, 0.444915771484375, 0.4599609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 6.0, 4.0, 4.0, 5.0, 9.0, 5.0, 18.0, 11.0, 23.0, 26.0, 33.0, 36.0, 54.0, 56.0, 63.0, 71.0, 67.0, 65.0, 78.0, 57.0, 65.0, 56.0, 41.0, 34.0, 24.0, 21.0, 17.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061370849609375, -0.05948448181152344, -0.057598114013671875, -0.05571174621582031, -0.05382537841796875, -0.05193901062011719, -0.050052642822265625, -0.04816627502441406, -0.0462799072265625, -0.04439353942871094, -0.042507171630859375, -0.04062080383300781, -0.03873443603515625, -0.03684806823730469, -0.034961700439453125, -0.03307533264160156, -0.03118896484375, -0.029302597045898438, -0.027416229248046875, -0.025529861450195312, -0.02364349365234375, -0.021757125854492188, -0.019870758056640625, -0.017984390258789062, -0.0160980224609375, -0.014211654663085938, -0.012325286865234375, -0.010438919067382812, -0.00855255126953125, -0.0066661834716796875, -0.004779815673828125, -0.0028934478759765625, -0.001007080078125, 0.0008792877197265625, 0.002765655517578125, 0.0046520233154296875, 0.00653839111328125, 0.008424758911132812, 0.010311126708984375, 0.012197494506835938, 0.0140838623046875, 0.015970230102539062, 0.017856597900390625, 0.019742965698242188, 0.02162933349609375, 0.023515701293945312, 0.025402069091796875, 0.027288436889648438, 0.0291748046875, 0.031061172485351562, 0.032947540283203125, 0.03483390808105469, 0.03672027587890625, 0.03860664367675781, 0.040493011474609375, 0.04237937927246094, 0.0442657470703125, 0.04615211486816406, 0.048038482666015625, 0.04992485046386719, 0.05181121826171875, 0.05369758605957031, 0.055583953857421875, 0.05747032165527344, 0.059356689453125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 15.0, 13.0, 39.0, 81.0, 82.0, 110.0, 115.0, 142.0, 123.0, 81.0, 62.0, 38.0, 29.0, 18.0, 18.0, 6.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0483486652374268, -1.98997163772583, -1.931594729423523, -1.8732177019119263, -1.8148406744003296, -1.7564637660980225, -1.6980867385864258, -1.639709711074829, -1.5813326835632324, -1.5229556560516357, -1.4645787477493286, -1.406201720237732, -1.3478246927261353, -1.2894477844238281, -1.2310707569122314, -1.1726937294006348, -1.1143168210983276, -1.055939793586731, -0.997562825679779, -0.9391858577728271, -0.8808088302612305, -0.8224318623542786, -0.7640548944473267, -0.70567786693573, -0.6473008990287781, -0.5889239311218262, -0.5305469036102295, -0.4721699357032776, -0.4137929379940033, -0.355415940284729, -0.2970389723777771, -0.2386619746685028, -0.18028485774993896, -0.12190786749124527, -0.06353087723255157, -0.0051538944244384766, 0.053223103284835815, 0.11160010099411011, 0.169977068901062, 0.2283540666103363, 0.2867310643196106, 0.3451080620288849, 0.4034850597381592, 0.4618620276451111, 0.520238995552063, 0.5786160230636597, 0.6369929909706116, 0.6953699588775635, 0.7537469863891602, 0.8121239542961121, 0.8705009818077087, 0.9288779497146606, 0.9872549772262573, 1.0456318855285645, 1.1040089130401611, 1.1623859405517578, 1.2207629680633545, 1.2791399955749512, 1.3375169038772583, 1.395893931388855, 1.4542709589004517, 1.5126478672027588, 1.5710248947143555, 1.6294019222259521, 1.6877788305282593]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 12.0, 7.0, 12.0, 6.0, 16.0, 14.0, 10.0, 13.0, 15.0, 15.0, 27.0, 34.0, 44.0, 41.0, 48.0, 38.0, 57.0, 45.0, 31.0, 55.0, 33.0, 21.0, 53.0, 37.0, 34.0, 36.0, 30.0, 35.0, 29.0, 20.0, 25.0, 22.0, 14.0, 16.0, 4.0, 9.0, 9.0, 9.0, 8.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8311824202537537, -0.8067749738693237, -0.7823675274848938, -0.7579600811004639, -0.7335526347160339, -0.709145188331604, -0.6847377419471741, -0.6603302955627441, -0.6359228491783142, -0.6115154027938843, -0.5871079564094543, -0.5627005100250244, -0.5382930636405945, -0.5138856172561646, -0.4894781708717346, -0.4650707244873047, -0.44066324830055237, -0.41625580191612244, -0.3918483555316925, -0.3674409091472626, -0.34303346276283264, -0.3186260163784027, -0.2942185401916504, -0.26981109380722046, -0.24540366232395172, -0.2209962159395218, -0.19658876955509186, -0.17218130826950073, -0.1477738618850708, -0.12336642295122147, -0.09895896911621094, -0.074551522731781, -0.050144076347351074, -0.025736628100275993, -0.0013291798532009125, 0.023078270256519318, 0.04748571664094925, 0.07189316302537918, 0.09630061686038971, 0.12070806324481964, 0.14511550962924957, 0.1695229560136795, 0.19393040239810944, 0.21833786368370056, 0.2427453100681305, 0.2671527564525604, 0.29156020283699036, 0.3159676492214203, 0.3403750956058502, 0.36478254199028015, 0.3891899883747101, 0.41359743475914, 0.43800488114356995, 0.4624123275279999, 0.4868198037147522, 0.5112272500991821, 0.5356346964836121, 0.560042142868042, 0.5844495892524719, 0.6088570356369019, 0.6332644820213318, 0.6576719284057617, 0.6820793747901917, 0.7064868211746216, 0.7308942675590515]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 6.0, 8.0, 6.0, 17.0, 16.0, 26.0, 30.0, 45.0, 59.0, 93.0, 164.0, 263.0, 477.0, 917.0, 1967.0, 4225.0, 9298.0, 21263.0, 51639.0, 139694.0, 479150.0, 215024.0, 72435.0, 28822.0, 12243.0, 5367.0, 2493.0, 1273.0, 650.0, 334.0, 205.0, 98.0, 80.0, 34.0, 33.0, 34.0, 17.0, 11.0, 10.0, 8.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.7646484375, -0.740509033203125, -0.71636962890625, -0.692230224609375, -0.6680908203125, -0.643951416015625, -0.61981201171875, -0.595672607421875, -0.571533203125, -0.547393798828125, -0.52325439453125, -0.499114990234375, -0.4749755859375, -0.450836181640625, -0.42669677734375, -0.402557373046875, -0.37841796875, -0.354278564453125, -0.33013916015625, -0.305999755859375, -0.2818603515625, -0.257720947265625, -0.23358154296875, -0.209442138671875, -0.185302734375, -0.161163330078125, -0.13702392578125, -0.112884521484375, -0.0887451171875, -0.064605712890625, -0.04046630859375, -0.016326904296875, 0.0078125, 0.031951904296875, 0.05609130859375, 0.080230712890625, 0.1043701171875, 0.128509521484375, 0.15264892578125, 0.176788330078125, 0.200927734375, 0.225067138671875, 0.24920654296875, 0.273345947265625, 0.2974853515625, 0.321624755859375, 0.34576416015625, 0.369903564453125, 0.39404296875, 0.418182373046875, 0.44232177734375, 0.466461181640625, 0.4906005859375, 0.514739990234375, 0.53887939453125, 0.563018798828125, 0.587158203125, 0.611297607421875, 0.63543701171875, 0.659576416015625, 0.6837158203125, 0.707855224609375, 0.73199462890625, 0.756134033203125, 0.7802734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 4.0, 3.0, 9.0, 11.0, 5.0, 14.0, 7.0, 13.0, 23.0, 20.0, 21.0, 26.0, 21.0, 40.0, 31.0, 43.0, 43.0, 47.0, 40.0, 42.0, 48.0, 36.0, 44.0, 41.0, 33.0, 35.0, 31.0, 23.0, 33.0, 26.0, 33.0, 17.0, 17.0, 14.0, 19.0, 12.0, 13.0, 13.0, 10.0, 4.0, 5.0, 2.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.791015625, -1.7405242919921875, -1.690032958984375, -1.6395416259765625, -1.58905029296875, -1.5385589599609375, -1.488067626953125, -1.4375762939453125, -1.3870849609375, -1.3365936279296875, -1.286102294921875, -1.2356109619140625, -1.18511962890625, -1.1346282958984375, -1.084136962890625, -1.0336456298828125, -0.983154296875, -0.9326629638671875, -0.882171630859375, -0.8316802978515625, -0.78118896484375, -0.7306976318359375, -0.680206298828125, -0.6297149658203125, -0.5792236328125, -0.5287322998046875, -0.478240966796875, -0.4277496337890625, -0.37725830078125, -0.3267669677734375, -0.276275634765625, -0.2257843017578125, -0.17529296875, -0.1248016357421875, -0.074310302734375, -0.0238189697265625, 0.02667236328125, 0.0771636962890625, 0.127655029296875, 0.1781463623046875, 0.2286376953125, 0.2791290283203125, 0.329620361328125, 0.3801116943359375, 0.43060302734375, 0.4810943603515625, 0.531585693359375, 0.5820770263671875, 0.632568359375, 0.6830596923828125, 0.733551025390625, 0.7840423583984375, 0.83453369140625, 0.8850250244140625, 0.935516357421875, 0.9860076904296875, 1.0364990234375, 1.0869903564453125, 1.137481689453125, 1.1879730224609375, 1.23846435546875, 1.2889556884765625, 1.339447021484375, 1.3899383544921875, 1.4404296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 2.0, 6.0, 6.0, 7.0, 7.0, 13.0, 14.0, 10.0, 17.0, 22.0, 27.0, 35.0, 31.0, 37.0, 57.0, 85.0, 115.0, 411.0, 87717.0, 958613.0, 762.0, 165.0, 86.0, 58.0, 33.0, 38.0, 29.0, 35.0, 20.0, 18.0, 18.0, 18.0, 10.0, 7.0, 7.0, 9.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8671875, -8.5823974609375, -8.297607421875, -8.0128173828125, -7.72802734375, -7.4432373046875, -7.158447265625, -6.8736572265625, -6.5888671875, -6.3040771484375, -6.019287109375, -5.7344970703125, -5.44970703125, -5.1649169921875, -4.880126953125, -4.5953369140625, -4.310546875, -4.0257568359375, -3.740966796875, -3.4561767578125, -3.17138671875, -2.8865966796875, -2.601806640625, -2.3170166015625, -2.0322265625, -1.7474365234375, -1.462646484375, -1.1778564453125, -0.89306640625, -0.6082763671875, -0.323486328125, -0.0386962890625, 0.24609375, 0.5308837890625, 0.815673828125, 1.1004638671875, 1.38525390625, 1.6700439453125, 1.954833984375, 2.2396240234375, 2.5244140625, 2.8092041015625, 3.093994140625, 3.3787841796875, 3.66357421875, 3.9483642578125, 4.233154296875, 4.5179443359375, 4.802734375, 5.0875244140625, 5.372314453125, 5.6571044921875, 5.94189453125, 6.2266845703125, 6.511474609375, 6.7962646484375, 7.0810546875, 7.3658447265625, 7.650634765625, 7.9354248046875, 8.22021484375, 8.5050048828125, 8.789794921875, 9.0745849609375, 9.359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 6.0, 7.0, 5.0, 8.0, 11.0, 17.0, 18.0, 19.0, 26.0, 38.0, 28.0, 34.0, 37.0, 39.0, 49.0, 49.0, 43.0, 52.0, 57.0, 55.0, 51.0, 46.0, 45.0, 30.0, 32.0, 33.0, 36.0, 22.0, 20.0, 18.0, 12.0, 8.0, 16.0, 11.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.076171875, -2.01123046875, -1.9462890625, -1.88134765625, -1.81640625, -1.75146484375, -1.6865234375, -1.62158203125, -1.556640625, -1.49169921875, -1.4267578125, -1.36181640625, -1.296875, -1.23193359375, -1.1669921875, -1.10205078125, -1.037109375, -0.97216796875, -0.9072265625, -0.84228515625, -0.77734375, -0.71240234375, -0.6474609375, -0.58251953125, -0.517578125, -0.45263671875, -0.3876953125, -0.32275390625, -0.2578125, -0.19287109375, -0.1279296875, -0.06298828125, 0.001953125, 0.06689453125, 0.1318359375, 0.19677734375, 0.26171875, 0.32666015625, 0.3916015625, 0.45654296875, 0.521484375, 0.58642578125, 0.6513671875, 0.71630859375, 0.78125, 0.84619140625, 0.9111328125, 0.97607421875, 1.041015625, 1.10595703125, 1.1708984375, 1.23583984375, 1.30078125, 1.36572265625, 1.4306640625, 1.49560546875, 1.560546875, 1.62548828125, 1.6904296875, 1.75537109375, 1.8203125, 1.88525390625, 1.9501953125, 2.01513671875, 2.080078125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 5.0, 12.0, 25.0, 29.0, 40.0, 77.0, 277.0, 920.0, 8631.0, 936777.0, 98358.0, 2655.0, 422.0, 138.0, 68.0, 34.0, 23.0, 17.0, 9.0, 6.0, 12.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3203125, -1.272796630859375, -1.22528076171875, -1.177764892578125, -1.1302490234375, -1.082733154296875, -1.03521728515625, -0.987701416015625, -0.940185546875, -0.892669677734375, -0.84515380859375, -0.797637939453125, -0.7501220703125, -0.702606201171875, -0.65509033203125, -0.607574462890625, -0.56005859375, -0.512542724609375, -0.46502685546875, -0.417510986328125, -0.3699951171875, -0.322479248046875, -0.27496337890625, -0.227447509765625, -0.179931640625, -0.132415771484375, -0.08489990234375, -0.037384033203125, 0.0101318359375, 0.057647705078125, 0.10516357421875, 0.152679443359375, 0.2001953125, 0.247711181640625, 0.29522705078125, 0.342742919921875, 0.3902587890625, 0.437774658203125, 0.48529052734375, 0.532806396484375, 0.580322265625, 0.627838134765625, 0.67535400390625, 0.722869873046875, 0.7703857421875, 0.817901611328125, 0.86541748046875, 0.912933349609375, 0.96044921875, 1.007965087890625, 1.05548095703125, 1.102996826171875, 1.1505126953125, 1.198028564453125, 1.24554443359375, 1.293060302734375, 1.340576171875, 1.388092041015625, 1.43560791015625, 1.483123779296875, 1.5306396484375, 1.578155517578125, 1.62567138671875, 1.673187255859375, 1.720703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 11.0, 13.0, 39.0, 58.0, 106.0, 219.0, 263.0, 122.0, 67.0, 22.0, 23.0, 14.0, 13.0, 8.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.130073547363281e-05, -7.778778672218323e-05, -7.427483797073364e-05, -7.076188921928406e-05, -6.724894046783447e-05, -6.373599171638489e-05, -6.02230429649353e-05, -5.671009421348572e-05, -5.319714546203613e-05, -4.968419671058655e-05, -4.617124795913696e-05, -4.265829920768738e-05, -3.914535045623779e-05, -3.563240170478821e-05, -3.211945295333862e-05, -2.8606504201889038e-05, -2.5093555450439453e-05, -2.1580606698989868e-05, -1.8067657947540283e-05, -1.4554709196090698e-05, -1.1041760444641113e-05, -7.528811693191528e-06, -4.015862941741943e-06, -5.029141902923584e-07, 3.0100345611572266e-06, 6.5229833126068115e-06, 1.0035932064056396e-05, 1.3548880815505981e-05, 1.7061829566955566e-05, 2.057477831840515e-05, 2.4087727069854736e-05, 2.760067582130432e-05, 3.1113624572753906e-05, 3.462657332420349e-05, 3.8139522075653076e-05, 4.165247082710266e-05, 4.5165419578552246e-05, 4.867836833000183e-05, 5.2191317081451416e-05, 5.5704265832901e-05, 5.9217214584350586e-05, 6.273016333580017e-05, 6.624311208724976e-05, 6.975606083869934e-05, 7.326900959014893e-05, 7.678195834159851e-05, 8.02949070930481e-05, 8.380785584449768e-05, 8.732080459594727e-05, 9.083375334739685e-05, 9.434670209884644e-05, 9.785965085029602e-05, 0.0001013725996017456, 0.00010488554835319519, 0.00010839849710464478, 0.00011191144585609436, 0.00011542439460754395, 0.00011893734335899353, 0.00012245029211044312, 0.0001259632408618927, 0.00012947618961334229, 0.00013298913836479187, 0.00013650208711624146, 0.00014001503586769104, 0.00014352798461914062]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 5.0, 9.0, 14.0, 17.0, 30.0, 47.0, 109.0, 262.0, 759.0, 3097.0, 28242.0, 914627.0, 93270.0, 6088.0, 1252.0, 386.0, 155.0, 62.0, 34.0, 30.0, 13.0, 8.0, 11.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96484375, -0.9323272705078125, -0.899810791015625, -0.8672943115234375, -0.83477783203125, -0.8022613525390625, -0.769744873046875, -0.7372283935546875, -0.7047119140625, -0.6721954345703125, -0.639678955078125, -0.6071624755859375, -0.57464599609375, -0.5421295166015625, -0.509613037109375, -0.4770965576171875, -0.444580078125, -0.4120635986328125, -0.379547119140625, -0.3470306396484375, -0.31451416015625, -0.2819976806640625, -0.249481201171875, -0.2169647216796875, -0.1844482421875, -0.1519317626953125, -0.119415283203125, -0.0868988037109375, -0.05438232421875, -0.0218658447265625, 0.010650634765625, 0.0431671142578125, 0.07568359375, 0.1082000732421875, 0.140716552734375, 0.1732330322265625, 0.20574951171875, 0.2382659912109375, 0.270782470703125, 0.3032989501953125, 0.3358154296875, 0.3683319091796875, 0.400848388671875, 0.4333648681640625, 0.46588134765625, 0.4983978271484375, 0.530914306640625, 0.5634307861328125, 0.595947265625, 0.6284637451171875, 0.660980224609375, 0.6934967041015625, 0.72601318359375, 0.7585296630859375, 0.791046142578125, 0.8235626220703125, 0.8560791015625, 0.8885955810546875, 0.921112060546875, 0.9536285400390625, 0.98614501953125, 1.0186614990234375, 1.051177978515625, 1.0836944580078125, 1.1162109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 9.0, 16.0, 29.0, 19.0, 79.0, 154.0, 316.0, 173.0, 63.0, 48.0, 20.0, 15.0, 16.0, 11.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.309814453125, -0.2993621826171875, -0.288909912109375, -0.2784576416015625, -0.26800537109375, -0.2575531005859375, -0.247100830078125, -0.2366485595703125, -0.2261962890625, -0.2157440185546875, -0.205291748046875, -0.1948394775390625, -0.18438720703125, -0.1739349365234375, -0.163482666015625, -0.1530303955078125, -0.142578125, -0.1321258544921875, -0.121673583984375, -0.1112213134765625, -0.10076904296875, -0.0903167724609375, -0.079864501953125, -0.0694122314453125, -0.0589599609375, -0.0485076904296875, -0.038055419921875, -0.0276031494140625, -0.01715087890625, -0.0066986083984375, 0.003753662109375, 0.0142059326171875, 0.024658203125, 0.0351104736328125, 0.045562744140625, 0.0560150146484375, 0.06646728515625, 0.0769195556640625, 0.087371826171875, 0.0978240966796875, 0.1082763671875, 0.1187286376953125, 0.129180908203125, 0.1396331787109375, 0.15008544921875, 0.1605377197265625, 0.170989990234375, 0.1814422607421875, 0.19189453125, 0.2023468017578125, 0.212799072265625, 0.2232513427734375, 0.23370361328125, 0.2441558837890625, 0.254608154296875, 0.2650604248046875, 0.2755126953125, 0.2859649658203125, 0.296417236328125, 0.3068695068359375, 0.31732177734375, 0.3277740478515625, 0.338226318359375, 0.3486785888671875, 0.359130859375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 8.0, 42.0, 197.0, 384.0, 290.0, 69.0, 15.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.681331634521484, -21.291372299194336, -20.901411056518555, -20.511451721191406, -20.121490478515625, -19.731531143188477, -19.341569900512695, -18.951610565185547, -18.561649322509766, -18.171689987182617, -17.781728744506836, -17.391769409179688, -17.001808166503906, -16.611848831176758, -16.221887588500977, -15.831928253173828, -15.441967964172363, -15.052007675170898, -14.662047386169434, -14.272087097167969, -13.882126808166504, -13.492166519165039, -13.10220718383789, -12.71224594116211, -12.322286605834961, -11.932326316833496, -11.542366027832031, -11.152405738830566, -10.762445449829102, -10.372485160827637, -9.982524871826172, -9.592565536499023, -9.202604293823242, -8.812644004821777, -8.422683715820312, -8.032723426818848, -7.642763137817383, -7.252802848815918, -6.862843036651611, -6.4728827476501465, -6.082921981811523, -5.692961692810059, -5.303001403808594, -4.913041114807129, -4.523080825805664, -4.133120536804199, -3.7431607246398926, -3.3532004356384277, -2.963240385055542, -2.573280096054077, -2.1833200454711914, -1.7933597564697266, -1.4033994674682617, -1.0134391784667969, -0.6234791278839111, -0.2335188388824463, 0.15644145011901855, 0.5464016795158386, 0.9363619089126587, 1.326322078704834, 1.7162823677062988, 2.1062426567077637, 2.4962027072906494, 2.8861629962921143, 3.276123285293579]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 7.0, 4.0, 7.0, 5.0, 7.0, 17.0, 16.0, 21.0, 26.0, 24.0, 20.0, 26.0, 29.0, 25.0, 35.0, 33.0, 32.0, 34.0, 28.0, 33.0, 47.0, 46.0, 46.0, 39.0, 48.0, 37.0, 31.0, 34.0, 23.0, 41.0, 27.0, 22.0, 18.0, 17.0, 11.0, 16.0, 12.0, 6.0, 13.0, 4.0, 8.0, 10.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0], "bins": [-2.9436018466949463, -2.8690743446350098, -2.7945470809936523, -2.720019817352295, -2.6454923152923584, -2.570964813232422, -2.4964375495910645, -2.421910285949707, -2.3473827838897705, -2.272855281829834, -2.1983280181884766, -2.123800754547119, -2.0492732524871826, -1.9747458696365356, -1.9002184867858887, -1.8256911039352417, -1.7511637210845947, -1.6766363382339478, -1.6021089553833008, -1.5275815725326538, -1.4530541896820068, -1.3785268068313599, -1.303999423980713, -1.229472041130066, -1.154944658279419, -1.080417275428772, -1.005889892578125, -0.931362509727478, -0.856835126876831, -0.7823077440261841, -0.7077803611755371, -0.6332529783248901, -0.5587254762649536, -0.48419809341430664, -0.40967071056365967, -0.3351433277130127, -0.2606159448623657, -0.18608856201171875, -0.11156117916107178, -0.037033796310424805, 0.03749358654022217, 0.11202096939086914, 0.1865483522415161, 0.2610757350921631, 0.33560311794281006, 0.41013050079345703, 0.484657883644104, 0.559185266494751, 0.633712649345398, 0.7082400321960449, 0.7827674150466919, 0.8572947978973389, 0.9318221807479858, 1.0063495635986328, 1.0808769464492798, 1.1554043292999268, 1.2299317121505737, 1.3044590950012207, 1.3789864778518677, 1.4535138607025146, 1.5280412435531616, 1.6025686264038086, 1.6770960092544556, 1.7516233921051025, 1.8261507749557495]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 7.0, 7.0, 11.0, 17.0, 34.0, 49.0, 73.0, 101.0, 205.0, 400.0, 801.0, 2060.0, 6292.0, 24952.0, 155174.0, 1007214.0, 2138552.0, 716245.0, 111892.0, 21589.0, 5462.0, 1764.0, 716.0, 288.0, 146.0, 93.0, 57.0, 26.0, 21.0, 9.0, 10.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.33203125, -2.2743072509765625, -2.216583251953125, -2.1588592529296875, -2.10113525390625, -2.0434112548828125, -1.985687255859375, -1.9279632568359375, -1.8702392578125, -1.8125152587890625, -1.754791259765625, -1.6970672607421875, -1.63934326171875, -1.5816192626953125, -1.523895263671875, -1.4661712646484375, -1.408447265625, -1.3507232666015625, -1.292999267578125, -1.2352752685546875, -1.17755126953125, -1.1198272705078125, -1.062103271484375, -1.0043792724609375, -0.9466552734375, -0.8889312744140625, -0.831207275390625, -0.7734832763671875, -0.71575927734375, -0.6580352783203125, -0.600311279296875, -0.5425872802734375, -0.48486328125, -0.4271392822265625, -0.369415283203125, -0.3116912841796875, -0.25396728515625, -0.1962432861328125, -0.138519287109375, -0.0807952880859375, -0.0230712890625, 0.0346527099609375, 0.092376708984375, 0.1501007080078125, 0.20782470703125, 0.2655487060546875, 0.323272705078125, 0.3809967041015625, 0.438720703125, 0.4964447021484375, 0.554168701171875, 0.6118927001953125, 0.66961669921875, 0.7273406982421875, 0.785064697265625, 0.8427886962890625, 0.9005126953125, 0.9582366943359375, 1.015960693359375, 1.0736846923828125, 1.13140869140625, 1.1891326904296875, 1.246856689453125, 1.3045806884765625, 1.3623046875]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 18.0, 16.0, 14.0, 26.0, 24.0, 25.0, 21.0, 48.0, 43.0, 41.0, 44.0, 46.0, 46.0, 57.0, 51.0, 63.0, 58.0, 36.0, 40.0, 42.0, 37.0, 36.0, 26.0, 25.0, 19.0, 13.0, 11.0, 16.0, 5.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4306640625, -1.3869781494140625, -1.343292236328125, -1.2996063232421875, -1.25592041015625, -1.2122344970703125, -1.168548583984375, -1.1248626708984375, -1.0811767578125, -1.0374908447265625, -0.993804931640625, -0.9501190185546875, -0.90643310546875, -0.8627471923828125, -0.819061279296875, -0.7753753662109375, -0.731689453125, -0.6880035400390625, -0.644317626953125, -0.6006317138671875, -0.55694580078125, -0.5132598876953125, -0.469573974609375, -0.4258880615234375, -0.3822021484375, -0.3385162353515625, -0.294830322265625, -0.2511444091796875, -0.20745849609375, -0.1637725830078125, -0.120086669921875, -0.0764007568359375, -0.03271484375, 0.0109710693359375, 0.054656982421875, 0.0983428955078125, 0.14202880859375, 0.1857147216796875, 0.229400634765625, 0.2730865478515625, 0.3167724609375, 0.3604583740234375, 0.404144287109375, 0.4478302001953125, 0.49151611328125, 0.5352020263671875, 0.578887939453125, 0.6225738525390625, 0.666259765625, 0.7099456787109375, 0.753631591796875, 0.7973175048828125, 0.84100341796875, 0.8846893310546875, 0.928375244140625, 0.9720611572265625, 1.0157470703125, 1.0594329833984375, 1.103118896484375, 1.1468048095703125, 1.19049072265625, 1.2341766357421875, 1.277862548828125, 1.3215484619140625, 1.365234375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 6.0, 10.0, 11.0, 12.0, 12.0, 25.0, 46.0, 49.0, 80.0, 114.0, 247.0, 516.0, 1970.0, 12255.0, 590468.0, 3546778.0, 36671.0, 3470.0, 778.0, 275.0, 162.0, 102.0, 65.0, 42.0, 28.0, 22.0, 20.0, 9.0, 9.0, 7.0, 6.0, 7.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.23150634765625, -4.0958251953125, -3.96014404296875, -3.824462890625, -3.68878173828125, -3.5531005859375, -3.41741943359375, -3.28173828125, -3.14605712890625, -3.0103759765625, -2.87469482421875, -2.739013671875, -2.60333251953125, -2.4676513671875, -2.33197021484375, -2.1962890625, -2.06060791015625, -1.9249267578125, -1.78924560546875, -1.653564453125, -1.51788330078125, -1.3822021484375, -1.24652099609375, -1.11083984375, -0.97515869140625, -0.8394775390625, -0.70379638671875, -0.568115234375, -0.43243408203125, -0.2967529296875, -0.16107177734375, -0.025390625, 0.11029052734375, 0.2459716796875, 0.38165283203125, 0.517333984375, 0.65301513671875, 0.7886962890625, 0.92437744140625, 1.06005859375, 1.19573974609375, 1.3314208984375, 1.46710205078125, 1.602783203125, 1.73846435546875, 1.8741455078125, 2.00982666015625, 2.1455078125, 2.28118896484375, 2.4168701171875, 2.55255126953125, 2.688232421875, 2.82391357421875, 2.9595947265625, 3.09527587890625, 3.23095703125, 3.36663818359375, 3.5023193359375, 3.63800048828125, 3.773681640625, 3.90936279296875, 4.0450439453125, 4.18072509765625, 4.31640625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 1.0, 11.0, 6.0, 15.0, 11.0, 12.0, 34.0, 45.0, 46.0, 81.0, 108.0, 187.0, 233.0, 387.0, 525.0, 586.0, 558.0, 401.0, 292.0, 181.0, 115.0, 70.0, 39.0, 38.0, 24.0, 21.0, 9.0, 13.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.64990234375, -0.6299285888671875, -0.609954833984375, -0.5899810791015625, -0.57000732421875, -0.5500335693359375, -0.530059814453125, -0.5100860595703125, -0.4901123046875, -0.4701385498046875, -0.450164794921875, -0.4301910400390625, -0.41021728515625, -0.3902435302734375, -0.370269775390625, -0.3502960205078125, -0.330322265625, -0.3103485107421875, -0.290374755859375, -0.2704010009765625, -0.25042724609375, -0.2304534912109375, -0.210479736328125, -0.1905059814453125, -0.1705322265625, -0.1505584716796875, -0.130584716796875, -0.1106109619140625, -0.09063720703125, -0.0706634521484375, -0.050689697265625, -0.0307159423828125, -0.0107421875, 0.0092315673828125, 0.029205322265625, 0.0491790771484375, 0.06915283203125, 0.0891265869140625, 0.109100341796875, 0.1290740966796875, 0.1490478515625, 0.1690216064453125, 0.188995361328125, 0.2089691162109375, 0.22894287109375, 0.2489166259765625, 0.268890380859375, 0.2888641357421875, 0.308837890625, 0.3288116455078125, 0.348785400390625, 0.3687591552734375, 0.38873291015625, 0.4087066650390625, 0.428680419921875, 0.4486541748046875, 0.4686279296875, 0.4886016845703125, 0.508575439453125, 0.5285491943359375, 0.54852294921875, 0.5684967041015625, 0.588470458984375, 0.6084442138671875, 0.62841796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 6.0, 16.0, 18.0, 24.0, 47.0, 63.0, 83.0, 121.0, 134.0, 121.0, 110.0, 90.0, 64.0, 35.0, 29.0, 14.0, 13.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.809737205505371, -2.7159247398376465, -2.622112274169922, -2.5282998085021973, -2.4344875812530518, -2.340675115585327, -2.2468626499176025, -2.153050184249878, -2.0592379570007324, -1.9654254913330078, -1.8716131448745728, -1.7778006792068481, -1.683988332748413, -1.5901758670806885, -1.4963634014129639, -1.4025509357452393, -1.3087384700775146, -1.21492600440979, -1.121113657951355, -1.0273011922836304, -0.9334887862205505, -0.8396763801574707, -0.7458639144897461, -0.6520515084266663, -0.5582391023635864, -0.4644266963005066, -0.37061426043510437, -0.27680182456970215, -0.18298941850662231, -0.08917701244354248, 0.004635453224182129, 0.09844785928726196, 0.1922605037689209, 0.28607290983200073, 0.37988534569740295, 0.4736977815628052, 0.567510187625885, 0.6613225936889648, 0.7551350593566895, 0.8489474654197693, 0.9427598714828491, 1.0365723371505737, 1.1303846836090088, 1.2241971492767334, 1.318009614944458, 1.411821961402893, 1.5056344270706177, 1.5994467735290527, 1.6932592391967773, 1.787071704864502, 1.880884051322937, 1.9746965169906616, 2.0685088634490967, 2.1623213291168213, 2.256133794784546, 2.3499462604522705, 2.443758487701416, 2.5375709533691406, 2.6313834190368652, 2.72519588470459, 2.8190081119537354, 2.91282057762146, 3.0066330432891846, 3.100445508956909, 3.194257974624634]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 7.0, 2.0, 10.0, 3.0, 9.0, 7.0, 11.0, 14.0, 13.0, 10.0, 18.0, 15.0, 25.0, 28.0, 36.0, 24.0, 40.0, 33.0, 34.0, 40.0, 42.0, 43.0, 40.0, 43.0, 33.0, 46.0, 28.0, 36.0, 33.0, 48.0, 39.0, 26.0, 31.0, 15.0, 20.0, 13.0, 15.0, 16.0, 6.0, 8.0, 10.0, 3.0, 8.0, 8.0, 2.0, 6.0, 0.0, 3.0, 1.0, 1.0, 3.0], "bins": [-1.2898352146148682, -1.252617359161377, -1.2153996229171753, -1.178181767463684, -1.1409639120101929, -1.1037461757659912, -1.0665283203125, -1.0293104648590088, -0.9920926690101624, -0.9548748731613159, -0.9176570177078247, -0.8804392218589783, -0.8432214260101318, -0.8060035705566406, -0.7687857747077942, -0.7315679788589478, -0.6943501234054565, -0.6571323275566101, -0.6199144721031189, -0.5826966762542725, -0.5454788208007812, -0.5082610249519348, -0.4710432291030884, -0.43382540345191956, -0.39660757780075073, -0.3593897521495819, -0.3221719264984131, -0.28495413064956665, -0.24773630499839783, -0.210518479347229, -0.17330066859722137, -0.13608285784721375, -0.09886491298675537, -0.061647094786167145, -0.02442927658557892, 0.012788541615009308, 0.050006359815597534, 0.08722418546676636, 0.12444199621677399, 0.16165980696678162, 0.19887763261795044, 0.23609545826911926, 0.2733132839202881, 0.3105310797691345, 0.34774890542030334, 0.38496673107147217, 0.4221845269203186, 0.4594023525714874, 0.49662017822265625, 0.5338379740715027, 0.5710558295249939, 0.6082736253738403, 0.6454914808273315, 0.682709276676178, 0.7199270725250244, 0.7571449279785156, 0.7943627238273621, 0.8315805196762085, 0.8687983751296997, 0.9060161709785461, 0.9432339668273926, 0.9804518222808838, 1.017669677734375, 1.0548874139785767, 1.0921052694320679]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 18.0, 15.0, 33.0, 37.0, 105.0, 171.0, 334.0, 964.0, 2925.0, 11639.0, 61414.0, 388248.0, 482786.0, 80044.0, 14669.0, 3377.0, 1041.0, 385.0, 155.0, 79.0, 52.0, 34.0, 9.0, 10.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.19140625, -1.1623992919921875, -1.133392333984375, -1.1043853759765625, -1.07537841796875, -1.0463714599609375, -1.017364501953125, -0.9883575439453125, -0.9593505859375, -0.9303436279296875, -0.901336669921875, -0.8723297119140625, -0.84332275390625, -0.8143157958984375, -0.785308837890625, -0.7563018798828125, -0.727294921875, -0.6982879638671875, -0.669281005859375, -0.6402740478515625, -0.61126708984375, -0.5822601318359375, -0.553253173828125, -0.5242462158203125, -0.4952392578125, -0.4662322998046875, -0.437225341796875, -0.4082183837890625, -0.37921142578125, -0.3502044677734375, -0.321197509765625, -0.2921905517578125, -0.26318359375, -0.2341766357421875, -0.205169677734375, -0.1761627197265625, -0.14715576171875, -0.1181488037109375, -0.089141845703125, -0.0601348876953125, -0.0311279296875, -0.0021209716796875, 0.026885986328125, 0.0558929443359375, 0.08489990234375, 0.1139068603515625, 0.142913818359375, 0.1719207763671875, 0.200927734375, 0.2299346923828125, 0.258941650390625, 0.2879486083984375, 0.31695556640625, 0.3459625244140625, 0.374969482421875, 0.4039764404296875, 0.4329833984375, 0.4619903564453125, 0.490997314453125, 0.5200042724609375, 0.54901123046875, 0.5780181884765625, 0.607025146484375, 0.6360321044921875, 0.6650390625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 9.0, 11.0, 7.0, 10.0, 9.0, 21.0, 23.0, 23.0, 33.0, 27.0, 46.0, 54.0, 51.0, 64.0, 53.0, 57.0, 68.0, 51.0, 57.0, 43.0, 61.0, 44.0, 34.0, 38.0, 21.0, 16.0, 18.0, 11.0, 8.0, 8.0, 6.0, 9.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.181640625, -1.151092529296875, -1.12054443359375, -1.089996337890625, -1.0594482421875, -1.028900146484375, -0.99835205078125, -0.967803955078125, -0.937255859375, -0.906707763671875, -0.87615966796875, -0.845611572265625, -0.8150634765625, -0.784515380859375, -0.75396728515625, -0.723419189453125, -0.69287109375, -0.662322998046875, -0.63177490234375, -0.601226806640625, -0.5706787109375, -0.540130615234375, -0.50958251953125, -0.479034423828125, -0.448486328125, -0.417938232421875, -0.38739013671875, -0.356842041015625, -0.3262939453125, -0.295745849609375, -0.26519775390625, -0.234649658203125, -0.2041015625, -0.173553466796875, -0.14300537109375, -0.112457275390625, -0.0819091796875, -0.051361083984375, -0.02081298828125, 0.009735107421875, 0.040283203125, 0.070831298828125, 0.10137939453125, 0.131927490234375, 0.1624755859375, 0.193023681640625, 0.22357177734375, 0.254119873046875, 0.28466796875, 0.315216064453125, 0.34576416015625, 0.376312255859375, 0.4068603515625, 0.437408447265625, 0.46795654296875, 0.498504638671875, 0.529052734375, 0.559600830078125, 0.59014892578125, 0.620697021484375, 0.6512451171875, 0.681793212890625, 0.71234130859375, 0.742889404296875, 0.7734375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 7.0, 9.0, 11.0, 13.0, 21.0, 28.0, 28.0, 49.0, 63.0, 87.0, 147.0, 211.0, 362.0, 631.0, 1149.0, 2302.0, 4955.0, 11537.0, 27506.0, 69143.0, 175107.0, 338799.0, 245990.0, 101106.0, 39664.0, 16264.0, 6826.0, 3085.0, 1423.0, 813.0, 425.0, 252.0, 166.0, 114.0, 82.0, 50.0, 40.0, 17.0, 16.0, 21.0, 15.0, 2.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.461181640625, -0.4478912353515625, -0.434600830078125, -0.4213104248046875, -0.40802001953125, -0.3947296142578125, -0.381439208984375, -0.3681488037109375, -0.3548583984375, -0.3415679931640625, -0.328277587890625, -0.3149871826171875, -0.30169677734375, -0.2884063720703125, -0.275115966796875, -0.2618255615234375, -0.24853515625, -0.2352447509765625, -0.221954345703125, -0.2086639404296875, -0.19537353515625, -0.1820831298828125, -0.168792724609375, -0.1555023193359375, -0.1422119140625, -0.1289215087890625, -0.115631103515625, -0.1023406982421875, -0.08905029296875, -0.0757598876953125, -0.062469482421875, -0.0491790771484375, -0.035888671875, -0.0225982666015625, -0.009307861328125, 0.0039825439453125, 0.01727294921875, 0.0305633544921875, 0.043853759765625, 0.0571441650390625, 0.0704345703125, 0.0837249755859375, 0.097015380859375, 0.1103057861328125, 0.12359619140625, 0.1368865966796875, 0.150177001953125, 0.1634674072265625, 0.1767578125, 0.1900482177734375, 0.203338623046875, 0.2166290283203125, 0.22991943359375, 0.2432098388671875, 0.256500244140625, 0.2697906494140625, 0.2830810546875, 0.2963714599609375, 0.309661865234375, 0.3229522705078125, 0.33624267578125, 0.3495330810546875, 0.362823486328125, 0.3761138916015625, 0.389404296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 4.0, 6.0, 13.0, 12.0, 9.0, 20.0, 14.0, 22.0, 19.0, 37.0, 28.0, 40.0, 40.0, 38.0, 37.0, 51.0, 48.0, 46.0, 51.0, 54.0, 46.0, 58.0, 46.0, 38.0, 28.0, 27.0, 32.0, 26.0, 22.0, 15.0, 8.0, 10.0, 9.0, 8.0, 10.0, 7.0, 5.0, 3.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.638671875, -1.5912322998046875, -1.543792724609375, -1.4963531494140625, -1.44891357421875, -1.4014739990234375, -1.354034423828125, -1.3065948486328125, -1.2591552734375, -1.2117156982421875, -1.164276123046875, -1.1168365478515625, -1.06939697265625, -1.0219573974609375, -0.974517822265625, -0.9270782470703125, -0.879638671875, -0.8321990966796875, -0.784759521484375, -0.7373199462890625, -0.68988037109375, -0.6424407958984375, -0.595001220703125, -0.5475616455078125, -0.5001220703125, -0.4526824951171875, -0.405242919921875, -0.3578033447265625, -0.31036376953125, -0.2629241943359375, -0.215484619140625, -0.1680450439453125, -0.12060546875, -0.0731658935546875, -0.025726318359375, 0.0217132568359375, 0.06915283203125, 0.1165924072265625, 0.164031982421875, 0.2114715576171875, 0.2589111328125, 0.3063507080078125, 0.353790283203125, 0.4012298583984375, 0.44866943359375, 0.4961090087890625, 0.543548583984375, 0.5909881591796875, 0.638427734375, 0.6858673095703125, 0.733306884765625, 0.7807464599609375, 0.82818603515625, 0.8756256103515625, 0.923065185546875, 0.9705047607421875, 1.0179443359375, 1.0653839111328125, 1.112823486328125, 1.1602630615234375, 1.20770263671875, 1.2551422119140625, 1.302581787109375, 1.3500213623046875, 1.3974609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 6.0, 10.0, 12.0, 24.0, 20.0, 31.0, 52.0, 72.0, 107.0, 153.0, 266.0, 364.0, 683.0, 1093.0, 1869.0, 3596.0, 6711.0, 13939.0, 31665.0, 88997.0, 279339.0, 384240.0, 147632.0, 48323.0, 19441.0, 9073.0, 4629.0, 2490.0, 1387.0, 861.0, 505.0, 310.0, 224.0, 138.0, 95.0, 60.0, 37.0, 23.0, 26.0, 12.0, 4.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.192626953125, -0.1866474151611328, -0.18066787719726562, -0.17468833923339844, -0.16870880126953125, -0.16272926330566406, -0.15674972534179688, -0.1507701873779297, -0.1447906494140625, -0.1388111114501953, -0.13283157348632812, -0.12685203552246094, -0.12087249755859375, -0.11489295959472656, -0.10891342163085938, -0.10293388366699219, -0.096954345703125, -0.09097480773925781, -0.08499526977539062, -0.07901573181152344, -0.07303619384765625, -0.06705665588378906, -0.061077117919921875, -0.05509757995605469, -0.0491180419921875, -0.04313850402832031, -0.037158966064453125, -0.031179428100585938, -0.02519989013671875, -0.019220352172851562, -0.013240814208984375, -0.0072612762451171875, -0.00128173828125, 0.0046977996826171875, 0.010677337646484375, 0.016656875610351562, 0.02263641357421875, 0.028615951538085938, 0.034595489501953125, 0.04057502746582031, 0.0465545654296875, 0.05253410339355469, 0.058513641357421875, 0.06449317932128906, 0.07047271728515625, 0.07645225524902344, 0.08243179321289062, 0.08841133117675781, 0.094390869140625, 0.10037040710449219, 0.10634994506835938, 0.11232948303222656, 0.11830902099609375, 0.12428855895996094, 0.13026809692382812, 0.1362476348876953, 0.1422271728515625, 0.1482067108154297, 0.15418624877929688, 0.16016578674316406, 0.16614532470703125, 0.17212486267089844, 0.17810440063476562, 0.1840839385986328, 0.1900634765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 14.0, 15.0, 41.0, 36.0, 64.0, 108.0, 157.0, 169.0, 143.0, 84.0, 52.0, 31.0, 29.0, 14.0, 9.0, 11.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00015306472778320312, -0.0001476295292377472, -0.00014219433069229126, -0.00013675913214683533, -0.0001313239336013794, -0.00012588873505592346, -0.00012045353651046753, -0.0001150183379650116, -0.00010958313941955566, -0.00010414794087409973, -9.87127423286438e-05, -9.327754378318787e-05, -8.784234523773193e-05, -8.2407146692276e-05, -7.697194814682007e-05, -7.153674960136414e-05, -6.61015510559082e-05, -6.066635251045227e-05, -5.523115396499634e-05, -4.9795955419540405e-05, -4.436075687408447e-05, -3.892555832862854e-05, -3.349035978317261e-05, -2.8055161237716675e-05, -2.2619962692260742e-05, -1.718476414680481e-05, -1.1749565601348877e-05, -6.314367055892944e-06, -8.791685104370117e-07, 4.556030035018921e-06, 9.991228580474854e-06, 1.5426427125930786e-05, 2.086162567138672e-05, 2.629682421684265e-05, 3.1732022762298584e-05, 3.7167221307754517e-05, 4.260241985321045e-05, 4.803761839866638e-05, 5.3472816944122314e-05, 5.890801548957825e-05, 6.434321403503418e-05, 6.977841258049011e-05, 7.521361112594604e-05, 8.064880967140198e-05, 8.608400821685791e-05, 9.151920676231384e-05, 9.695440530776978e-05, 0.00010238960385322571, 0.00010782480239868164, 0.00011326000094413757, 0.0001186951994895935, 0.00012413039803504944, 0.00012956559658050537, 0.0001350007951259613, 0.00014043599367141724, 0.00014587119221687317, 0.0001513063907623291, 0.00015674158930778503, 0.00016217678785324097, 0.0001676119863986969, 0.00017304718494415283, 0.00017848238348960876, 0.0001839175820350647, 0.00018935278058052063, 0.00019478797912597656]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 4.0, 7.0, 8.0, 7.0, 13.0, 12.0, 25.0, 42.0, 50.0, 93.0, 135.0, 267.0, 610.0, 1506.0, 4159.0, 13943.0, 60360.0, 380559.0, 480742.0, 80184.0, 17482.0, 5116.0, 1743.0, 691.0, 335.0, 166.0, 98.0, 41.0, 32.0, 22.0, 17.0, 9.0, 10.0, 16.0, 9.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.30908203125, -0.29845428466796875, -0.2878265380859375, -0.27719879150390625, -0.266571044921875, -0.25594329833984375, -0.2453155517578125, -0.23468780517578125, -0.22406005859375, -0.21343231201171875, -0.2028045654296875, -0.19217681884765625, -0.181549072265625, -0.17092132568359375, -0.1602935791015625, -0.14966583251953125, -0.1390380859375, -0.12841033935546875, -0.1177825927734375, -0.10715484619140625, -0.096527099609375, -0.08589935302734375, -0.0752716064453125, -0.06464385986328125, -0.05401611328125, -0.04338836669921875, -0.0327606201171875, -0.02213287353515625, -0.011505126953125, -0.00087738037109375, 0.0097503662109375, 0.02037811279296875, 0.031005859375, 0.04163360595703125, 0.0522613525390625, 0.06288909912109375, 0.073516845703125, 0.08414459228515625, 0.0947723388671875, 0.10540008544921875, 0.11602783203125, 0.12665557861328125, 0.1372833251953125, 0.14791107177734375, 0.158538818359375, 0.16916656494140625, 0.1797943115234375, 0.19042205810546875, 0.2010498046875, 0.21167755126953125, 0.2223052978515625, 0.23293304443359375, 0.243560791015625, 0.25418853759765625, 0.2648162841796875, 0.27544403076171875, 0.28607177734375, 0.29669952392578125, 0.3073272705078125, 0.31795501708984375, 0.328582763671875, 0.33921051025390625, 0.3498382568359375, 0.36046600341796875, 0.37109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 10.0, 9.0, 16.0, 14.0, 11.0, 18.0, 27.0, 23.0, 40.0, 46.0, 64.0, 62.0, 78.0, 74.0, 86.0, 69.0, 50.0, 51.0, 41.0, 32.0, 31.0, 33.0, 7.0, 20.0, 12.0, 13.0, 5.0, 7.0, 5.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042755126953125, -0.0410923957824707, -0.039429664611816406, -0.03776693344116211, -0.03610420227050781, -0.034441471099853516, -0.03277873992919922, -0.031116008758544922, -0.029453277587890625, -0.027790546417236328, -0.02612781524658203, -0.024465084075927734, -0.022802352905273438, -0.02113962173461914, -0.019476890563964844, -0.017814159393310547, -0.01615142822265625, -0.014488697052001953, -0.012825965881347656, -0.01116323471069336, -0.009500503540039062, -0.007837772369384766, -0.006175041198730469, -0.004512310028076172, -0.002849578857421875, -0.0011868476867675781, 0.00047588348388671875, 0.0021386146545410156, 0.0038013458251953125, 0.005464076995849609, 0.007126808166503906, 0.008789539337158203, 0.0104522705078125, 0.012115001678466797, 0.013777732849121094, 0.01544046401977539, 0.017103195190429688, 0.018765926361083984, 0.02042865753173828, 0.022091388702392578, 0.023754119873046875, 0.025416851043701172, 0.02707958221435547, 0.028742313385009766, 0.030405044555664062, 0.03206777572631836, 0.033730506896972656, 0.03539323806762695, 0.03705596923828125, 0.03871870040893555, 0.040381431579589844, 0.04204416275024414, 0.04370689392089844, 0.045369625091552734, 0.04703235626220703, 0.04869508743286133, 0.050357818603515625, 0.05202054977416992, 0.05368328094482422, 0.055346012115478516, 0.05700874328613281, 0.05867147445678711, 0.060334205627441406, 0.0619969367980957, 0.06365966796875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 8.0, 23.0, 29.0, 59.0, 104.0, 149.0, 166.0, 131.0, 131.0, 83.0, 45.0, 23.0, 20.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2450764179229736, -2.180626153945923, -2.116175651550293, -2.051725387573242, -1.9872751235961914, -1.9228248596191406, -1.8583744764328003, -1.79392409324646, -1.7294738292694092, -1.6650235652923584, -1.600573182106018, -1.5361227989196777, -1.471672534942627, -1.4072222709655762, -1.3427718877792358, -1.2783215045928955, -1.2138712406158447, -1.149420976638794, -1.0849705934524536, -1.0205202102661133, -0.9560699462890625, -0.8916196227073669, -0.8271692991256714, -0.7627189755439758, -0.6982686519622803, -0.6338183283805847, -0.5693680047988892, -0.5049176812171936, -0.44046735763549805, -0.3760170340538025, -0.31156671047210693, -0.24711638689041138, -0.18266618251800537, -0.11821585893630981, -0.05376553535461426, 0.010684788227081299, 0.07513511180877686, 0.1395854353904724, 0.20403575897216797, 0.2684860825538635, 0.3329364061355591, 0.39738672971725464, 0.4618370532989502, 0.5262873768806458, 0.5907377004623413, 0.6551880240440369, 0.7196383476257324, 0.784088671207428, 0.8485389947891235, 0.9129893183708191, 0.9774396419525146, 1.0418899059295654, 1.1063402891159058, 1.170790672302246, 1.2352409362792969, 1.2996912002563477, 1.364141583442688, 1.4285919666290283, 1.493042230606079, 1.5574924945831299, 1.6219428777694702, 1.6863932609558105, 1.7508435249328613, 1.815293788909912, 1.8797441720962524]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 9.0, 12.0, 10.0, 7.0, 12.0, 15.0, 13.0, 15.0, 21.0, 27.0, 23.0, 45.0, 30.0, 36.0, 42.0, 38.0, 53.0, 41.0, 52.0, 37.0, 43.0, 53.0, 30.0, 49.0, 49.0, 29.0, 36.0, 31.0, 23.0, 10.0, 21.0, 17.0, 10.0, 15.0, 5.0, 7.0, 6.0, 2.0, 8.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.8412993550300598, -0.8182972073554993, -0.795295000076294, -0.7722928524017334, -0.7492907047271729, -0.7262884974479675, -0.703286349773407, -0.6802841424942017, -0.6572819948196411, -0.6342798471450806, -0.6112776398658752, -0.5882754921913147, -0.5652733445167542, -0.5422711372375488, -0.5192689895629883, -0.49626681208610535, -0.4732646644115448, -0.45026248693466187, -0.4272603392601013, -0.4042581617832184, -0.38125598430633545, -0.3582538366317749, -0.33525165915489197, -0.31224948167800903, -0.2892473340034485, -0.26624515652656555, -0.2432429939508438, -0.22024083137512207, -0.19723865389823914, -0.1742364913225174, -0.15123432874679565, -0.12823215126991272, -0.10522997379302979, -0.08222780376672745, -0.05922563746571541, -0.03622347116470337, -0.013221301138401031, 0.009780868887901306, 0.03278303146362305, 0.05578520894050598, 0.07878737151622772, 0.10178954154253006, 0.1247917115688324, 0.14779387414455414, 0.17079603672027588, 0.1937982141971588, 0.21680037677288055, 0.2398025542497635, 0.26280471682548523, 0.28580689430236816, 0.3088090419769287, 0.33181121945381165, 0.3548133969306946, 0.3778155446052551, 0.40081772208213806, 0.423819899559021, 0.44682204723358154, 0.4698242247104645, 0.492826372385025, 0.515828549861908, 0.5388306975364685, 0.5618329048156738, 0.5848350524902344, 0.6078372001647949, 0.6308394074440002]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 2.0, 7.0, 10.0, 9.0, 11.0, 23.0, 45.0, 49.0, 79.0, 149.0, 260.0, 505.0, 1256.0, 2892.0, 7996.0, 23085.0, 81999.0, 327430.0, 429229.0, 123624.0, 32535.0, 10454.0, 3826.0, 1603.0, 714.0, 317.0, 156.0, 98.0, 65.0, 24.0, 33.0, 18.0, 11.0, 11.0, 9.0, 7.0, 2.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0888671875, -1.0560150146484375, -1.023162841796875, -0.9903106689453125, -0.95745849609375, -0.9246063232421875, -0.891754150390625, -0.8589019775390625, -0.8260498046875, -0.7931976318359375, -0.760345458984375, -0.7274932861328125, -0.69464111328125, -0.6617889404296875, -0.628936767578125, -0.5960845947265625, -0.563232421875, -0.5303802490234375, -0.497528076171875, -0.4646759033203125, -0.43182373046875, -0.3989715576171875, -0.366119384765625, -0.3332672119140625, -0.3004150390625, -0.2675628662109375, -0.234710693359375, -0.2018585205078125, -0.16900634765625, -0.1361541748046875, -0.103302001953125, -0.0704498291015625, -0.03759765625, -0.0047454833984375, 0.028106689453125, 0.0609588623046875, 0.09381103515625, 0.1266632080078125, 0.159515380859375, 0.1923675537109375, 0.2252197265625, 0.2580718994140625, 0.290924072265625, 0.3237762451171875, 0.35662841796875, 0.3894805908203125, 0.422332763671875, 0.4551849365234375, 0.488037109375, 0.5208892822265625, 0.553741455078125, 0.5865936279296875, 0.61944580078125, 0.6522979736328125, 0.685150146484375, 0.7180023193359375, 0.7508544921875, 0.7837066650390625, 0.816558837890625, 0.8494110107421875, 0.88226318359375, 0.9151153564453125, 0.947967529296875, 0.9808197021484375, 1.013671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 5.0, 11.0, 6.0, 11.0, 16.0, 5.0, 20.0, 14.0, 20.0, 22.0, 26.0, 25.0, 42.0, 35.0, 36.0, 27.0, 51.0, 60.0, 59.0, 37.0, 38.0, 44.0, 51.0, 39.0, 42.0, 34.0, 36.0, 32.0, 22.0, 25.0, 21.0, 14.0, 10.0, 9.0, 15.0, 8.0, 9.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.654296875, -1.6071319580078125, -1.559967041015625, -1.5128021240234375, -1.46563720703125, -1.4184722900390625, -1.371307373046875, -1.3241424560546875, -1.2769775390625, -1.2298126220703125, -1.182647705078125, -1.1354827880859375, -1.08831787109375, -1.0411529541015625, -0.993988037109375, -0.9468231201171875, -0.899658203125, -0.8524932861328125, -0.805328369140625, -0.7581634521484375, -0.71099853515625, -0.6638336181640625, -0.616668701171875, -0.5695037841796875, -0.5223388671875, -0.4751739501953125, -0.428009033203125, -0.3808441162109375, -0.33367919921875, -0.2865142822265625, -0.239349365234375, -0.1921844482421875, -0.14501953125, -0.0978546142578125, -0.050689697265625, -0.0035247802734375, 0.04364013671875, 0.0908050537109375, 0.137969970703125, 0.1851348876953125, 0.2322998046875, 0.2794647216796875, 0.326629638671875, 0.3737945556640625, 0.42095947265625, 0.4681243896484375, 0.515289306640625, 0.5624542236328125, 0.609619140625, 0.6567840576171875, 0.703948974609375, 0.7511138916015625, 0.79827880859375, 0.8454437255859375, 0.892608642578125, 0.9397735595703125, 0.9869384765625, 1.0341033935546875, 1.081268310546875, 1.1284332275390625, 1.17559814453125, 1.2227630615234375, 1.269927978515625, 1.3170928955078125, 1.3642578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 6.0, 7.0, 13.0, 8.0, 15.0, 24.0, 23.0, 26.0, 26.0, 50.0, 53.0, 61.0, 81.0, 146.0, 177.0, 285.0, 1007.0, 22327.0, 958685.0, 62671.0, 1678.0, 349.0, 216.0, 136.0, 98.0, 79.0, 60.0, 39.0, 36.0, 28.0, 19.0, 12.0, 16.0, 7.0, 7.0, 13.0, 7.0, 8.0, 7.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0], "bins": [-4.1484375, -4.0172119140625, -3.885986328125, -3.7547607421875, -3.62353515625, -3.4923095703125, -3.361083984375, -3.2298583984375, -3.0986328125, -2.9674072265625, -2.836181640625, -2.7049560546875, -2.57373046875, -2.4425048828125, -2.311279296875, -2.1800537109375, -2.048828125, -1.9176025390625, -1.786376953125, -1.6551513671875, -1.52392578125, -1.3927001953125, -1.261474609375, -1.1302490234375, -0.9990234375, -0.8677978515625, -0.736572265625, -0.6053466796875, -0.47412109375, -0.3428955078125, -0.211669921875, -0.0804443359375, 0.05078125, 0.1820068359375, 0.313232421875, 0.4444580078125, 0.57568359375, 0.7069091796875, 0.838134765625, 0.9693603515625, 1.1005859375, 1.2318115234375, 1.363037109375, 1.4942626953125, 1.62548828125, 1.7567138671875, 1.887939453125, 2.0191650390625, 2.150390625, 2.2816162109375, 2.412841796875, 2.5440673828125, 2.67529296875, 2.8065185546875, 2.937744140625, 3.0689697265625, 3.2001953125, 3.3314208984375, 3.462646484375, 3.5938720703125, 3.72509765625, 3.8563232421875, 3.987548828125, 4.1187744140625, 4.25]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 3.0, 6.0, 10.0, 11.0, 11.0, 11.0, 20.0, 27.0, 26.0, 40.0, 34.0, 35.0, 31.0, 37.0, 52.0, 41.0, 39.0, 48.0, 59.0, 55.0, 34.0, 52.0, 48.0, 44.0, 40.0, 38.0, 26.0, 18.0, 23.0, 14.0, 7.0, 12.0, 13.0, 3.0, 7.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.90234375, -1.847564697265625, -1.79278564453125, -1.738006591796875, -1.6832275390625, -1.628448486328125, -1.57366943359375, -1.518890380859375, -1.464111328125, -1.409332275390625, -1.35455322265625, -1.299774169921875, -1.2449951171875, -1.190216064453125, -1.13543701171875, -1.080657958984375, -1.02587890625, -0.971099853515625, -0.91632080078125, -0.861541748046875, -0.8067626953125, -0.751983642578125, -0.69720458984375, -0.642425537109375, -0.587646484375, -0.532867431640625, -0.47808837890625, -0.423309326171875, -0.3685302734375, -0.313751220703125, -0.25897216796875, -0.204193115234375, -0.1494140625, -0.094635009765625, -0.03985595703125, 0.014923095703125, 0.0697021484375, 0.124481201171875, 0.17926025390625, 0.234039306640625, 0.288818359375, 0.343597412109375, 0.39837646484375, 0.453155517578125, 0.5079345703125, 0.562713623046875, 0.61749267578125, 0.672271728515625, 0.72705078125, 0.781829833984375, 0.83660888671875, 0.891387939453125, 0.9461669921875, 1.000946044921875, 1.05572509765625, 1.110504150390625, 1.165283203125, 1.220062255859375, 1.27484130859375, 1.329620361328125, 1.3843994140625, 1.439178466796875, 1.49395751953125, 1.548736572265625, 1.603515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 4.0, 10.0, 15.0, 13.0, 23.0, 40.0, 60.0, 90.0, 155.0, 286.0, 631.0, 1253.0, 3240.0, 10457.0, 61093.0, 621494.0, 309585.0, 29466.0, 6505.0, 2201.0, 909.0, 438.0, 195.0, 110.0, 88.0, 54.0, 45.0, 21.0, 12.0, 12.0, 4.0, 7.0, 3.0, 3.0, 7.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39599609375, -0.3806610107421875, -0.365325927734375, -0.3499908447265625, -0.33465576171875, -0.3193206787109375, -0.303985595703125, -0.2886505126953125, -0.2733154296875, -0.2579803466796875, -0.242645263671875, -0.2273101806640625, -0.21197509765625, -0.1966400146484375, -0.181304931640625, -0.1659698486328125, -0.150634765625, -0.1352996826171875, -0.119964599609375, -0.1046295166015625, -0.08929443359375, -0.0739593505859375, -0.058624267578125, -0.0432891845703125, -0.0279541015625, -0.0126190185546875, 0.002716064453125, 0.0180511474609375, 0.03338623046875, 0.0487213134765625, 0.064056396484375, 0.0793914794921875, 0.0947265625, 0.1100616455078125, 0.125396728515625, 0.1407318115234375, 0.15606689453125, 0.1714019775390625, 0.186737060546875, 0.2020721435546875, 0.2174072265625, 0.2327423095703125, 0.248077392578125, 0.2634124755859375, 0.27874755859375, 0.2940826416015625, 0.309417724609375, 0.3247528076171875, 0.340087890625, 0.3554229736328125, 0.370758056640625, 0.3860931396484375, 0.40142822265625, 0.4167633056640625, 0.432098388671875, 0.4474334716796875, 0.4627685546875, 0.4781036376953125, 0.493438720703125, 0.5087738037109375, 0.52410888671875, 0.5394439697265625, 0.554779052734375, 0.5701141357421875, 0.58544921875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 2.0, 5.0, 12.0, 7.0, 16.0, 20.0, 22.0, 32.0, 48.0, 92.0, 114.0, 108.0, 128.0, 120.0, 76.0, 51.0, 41.0, 27.0, 14.0, 21.0, 8.0, 9.0, 8.0, 1.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.282329559326172e-05, -6.074737757444382e-05, -5.8671459555625916e-05, -5.6595541536808014e-05, -5.451962351799011e-05, -5.244370549917221e-05, -5.036778748035431e-05, -4.829186946153641e-05, -4.6215951442718506e-05, -4.4140033423900604e-05, -4.20641154050827e-05, -3.99881973862648e-05, -3.79122793674469e-05, -3.5836361348629e-05, -3.3760443329811096e-05, -3.1684525310993195e-05, -2.9608607292175293e-05, -2.753268927335739e-05, -2.545677125453949e-05, -2.3380853235721588e-05, -2.1304935216903687e-05, -1.9229017198085785e-05, -1.7153099179267883e-05, -1.5077181160449982e-05, -1.300126314163208e-05, -1.0925345122814178e-05, -8.849427103996277e-06, -6.773509085178375e-06, -4.697591066360474e-06, -2.621673047542572e-06, -5.457550287246704e-07, 1.5301629900932312e-06, 3.606081008911133e-06, 5.6819990277290344e-06, 7.757917046546936e-06, 9.833835065364838e-06, 1.190975308418274e-05, 1.3985671103000641e-05, 1.6061589121818542e-05, 1.8137507140636444e-05, 2.0213425159454346e-05, 2.2289343178272247e-05, 2.436526119709015e-05, 2.644117921590805e-05, 2.8517097234725952e-05, 3.0593015253543854e-05, 3.2668933272361755e-05, 3.474485129117966e-05, 3.682076930999756e-05, 3.889668732881546e-05, 4.097260534763336e-05, 4.3048523366451263e-05, 4.5124441385269165e-05, 4.720035940408707e-05, 4.927627742290497e-05, 5.135219544172287e-05, 5.342811346054077e-05, 5.550403147935867e-05, 5.7579949498176575e-05, 5.9655867516994476e-05, 6.173178553581238e-05, 6.380770355463028e-05, 6.588362157344818e-05, 6.795953959226608e-05, 7.003545761108398e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 0.0, 2.0, 1.0, 7.0, 9.0, 5.0, 17.0, 14.0, 11.0, 29.0, 47.0, 65.0, 117.0, 236.0, 589.0, 1850.0, 7562.0, 52832.0, 667949.0, 288651.0, 22567.0, 4045.0, 1101.0, 388.0, 188.0, 91.0, 60.0, 25.0, 20.0, 18.0, 13.0, 10.0, 8.0, 12.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55078125, -0.5323028564453125, -0.513824462890625, -0.4953460693359375, -0.47686767578125, -0.4583892822265625, -0.439910888671875, -0.4214324951171875, -0.4029541015625, -0.3844757080078125, -0.365997314453125, -0.3475189208984375, -0.32904052734375, -0.3105621337890625, -0.292083740234375, -0.2736053466796875, -0.255126953125, -0.2366485595703125, -0.218170166015625, -0.1996917724609375, -0.18121337890625, -0.1627349853515625, -0.144256591796875, -0.1257781982421875, -0.1072998046875, -0.0888214111328125, -0.070343017578125, -0.0518646240234375, -0.03338623046875, -0.0149078369140625, 0.003570556640625, 0.0220489501953125, 0.04052734375, 0.0590057373046875, 0.077484130859375, 0.0959625244140625, 0.11444091796875, 0.1329193115234375, 0.151397705078125, 0.1698760986328125, 0.1883544921875, 0.2068328857421875, 0.225311279296875, 0.2437896728515625, 0.26226806640625, 0.2807464599609375, 0.299224853515625, 0.3177032470703125, 0.336181640625, 0.3546600341796875, 0.373138427734375, 0.3916168212890625, 0.41009521484375, 0.4285736083984375, 0.447052001953125, 0.4655303955078125, 0.4840087890625, 0.5024871826171875, 0.520965576171875, 0.5394439697265625, 0.55792236328125, 0.5764007568359375, 0.594879150390625, 0.6133575439453125, 0.6318359375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 13.0, 8.0, 7.0, 14.0, 18.0, 24.0, 45.0, 51.0, 60.0, 71.0, 86.0, 98.0, 99.0, 80.0, 78.0, 58.0, 46.0, 36.0, 20.0, 19.0, 13.0, 7.0, 11.0, 3.0, 4.0, 2.0, 5.0, 6.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159912109375, -0.15454483032226562, -0.14917755126953125, -0.14381027221679688, -0.1384429931640625, -0.13307571411132812, -0.12770843505859375, -0.12234115600585938, -0.116973876953125, -0.11160659790039062, -0.10623931884765625, -0.10087203979492188, -0.0955047607421875, -0.09013748168945312, -0.08477020263671875, -0.07940292358398438, -0.07403564453125, -0.06866836547851562, -0.06330108642578125, -0.057933807373046875, -0.0525665283203125, -0.047199249267578125, -0.04183197021484375, -0.036464691162109375, -0.031097412109375, -0.025730133056640625, -0.02036285400390625, -0.014995574951171875, -0.0096282958984375, -0.004261016845703125, 0.00110626220703125, 0.006473541259765625, 0.0118408203125, 0.017208099365234375, 0.02257537841796875, 0.027942657470703125, 0.0333099365234375, 0.038677215576171875, 0.04404449462890625, 0.049411773681640625, 0.054779052734375, 0.060146331787109375, 0.06551361083984375, 0.07088088989257812, 0.0762481689453125, 0.08161544799804688, 0.08698272705078125, 0.09235000610351562, 0.09771728515625, 0.10308456420898438, 0.10845184326171875, 0.11381912231445312, 0.1191864013671875, 0.12455368041992188, 0.12992095947265625, 0.13528823852539062, 0.140655517578125, 0.14602279663085938, 0.15139007568359375, 0.15675735473632812, 0.1621246337890625, 0.16749191284179688, 0.17285919189453125, 0.17822647094726562, 0.18359375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 8.0, 12.0, 19.0, 35.0, 60.0, 116.0, 133.0, 144.0, 144.0, 118.0, 81.0, 53.0, 34.0, 11.0, 6.0, 8.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.344545841217041, -4.219826698303223, -4.095107555389404, -3.970388650894165, -3.845669746398926, -3.7209506034851074, -3.596231460571289, -3.47151255607605, -3.3467936515808105, -3.222074508666992, -3.097355604171753, -2.9726364612579346, -2.8479175567626953, -2.723198413848877, -2.5984792709350586, -2.4737603664398193, -2.349041223526001, -2.2243220806121826, -2.0996031761169434, -1.974884033203125, -1.8501651287078857, -1.7254459857940674, -1.6007269620895386, -1.4760079383850098, -1.351288914680481, -1.2265698909759521, -1.1018508672714233, -0.9771317839622498, -0.852412760257721, -0.7276937365531921, -0.6029746532440186, -0.47825562953948975, -0.35353636741638184, -0.22881732881069183, -0.10409829020500183, 0.020620763301849365, 0.14533978700637817, 0.270058810710907, 0.39477789402008057, 0.5194969177246094, 0.6442159414291382, 0.768934965133667, 0.8936539888381958, 1.0183730125427246, 1.143092155456543, 1.2678110599517822, 1.3925302028656006, 1.5172492265701294, 1.6419682502746582, 1.766687273979187, 1.8914062976837158, 2.016125440597534, 2.1408443450927734, 2.265563488006592, 2.39028263092041, 2.5150015354156494, 2.6397204399108887, 2.764439582824707, 2.8891584873199463, 3.0138776302337646, 3.138596534729004, 3.2633156776428223, 3.3880348205566406, 3.51275372505188, 3.6374728679656982]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 2.0, 4.0, 11.0, 4.0, 11.0, 13.0, 14.0, 15.0, 21.0, 21.0, 24.0, 31.0, 29.0, 26.0, 33.0, 44.0, 46.0, 43.0, 52.0, 52.0, 51.0, 48.0, 47.0, 29.0, 46.0, 32.0, 42.0, 18.0, 33.0, 19.0, 27.0, 14.0, 24.0, 15.0, 17.0, 9.0, 4.0, 8.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.8090808391571045, -2.7263031005859375, -2.6435253620147705, -2.5607473850250244, -2.4779696464538574, -2.3951919078826904, -2.3124141693115234, -2.2296364307403564, -2.1468586921691895, -2.0640809535980225, -1.981303095817566, -1.898525357246399, -1.8157474994659424, -1.7329697608947754, -1.6501920223236084, -1.5674142837524414, -1.4846363067626953, -1.4018585681915283, -1.3190807104110718, -1.2363029718399048, -1.1535251140594482, -1.0707473754882812, -0.9879696369171143, -0.9051918387413025, -0.8224140405654907, -0.739636242389679, -0.6568584442138672, -0.5740807056427002, -0.4913029074668884, -0.40852510929107666, -0.3257473409175873, -0.2429695725440979, -0.16019177436828613, -0.07741399109363556, 0.005363792181015015, 0.08814157545566559, 0.17091935873031616, 0.25369715690612793, 0.3364749252796173, 0.4192526936531067, 0.5020304918289185, 0.5848082900047302, 0.667586088180542, 0.750363826751709, 0.8331416249275208, 0.9159194231033325, 0.9986971616744995, 1.081475019454956, 1.164252758026123, 1.24703049659729, 1.3298083543777466, 1.4125860929489136, 1.4953639507293701, 1.578141689300537, 1.660919427871704, 1.743697166442871, 1.8264750242233276, 1.9092527627944946, 1.9920306205749512, 2.074808359146118, 2.157586097717285, 2.2403640747070312, 2.3231418132781982, 2.4059195518493652, 2.4886972904205322]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 5.0, 2.0, 2.0, 10.0, 8.0, 7.0, 6.0, 12.0, 18.0, 25.0, 33.0, 37.0, 50.0, 81.0, 126.0, 241.0, 496.0, 1175.0, 3010.0, 10224.0, 52328.0, 423901.0, 2222635.0, 1269760.0, 173115.0, 27468.0, 5915.0, 1946.0, 748.0, 349.0, 183.0, 121.0, 59.0, 49.0, 33.0, 23.0, 15.0, 15.0, 12.0, 7.0, 10.0, 6.0, 7.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7890625, -1.72900390625, -1.6689453125, -1.60888671875, -1.548828125, -1.48876953125, -1.4287109375, -1.36865234375, -1.30859375, -1.24853515625, -1.1884765625, -1.12841796875, -1.068359375, -1.00830078125, -0.9482421875, -0.88818359375, -0.828125, -0.76806640625, -0.7080078125, -0.64794921875, -0.587890625, -0.52783203125, -0.4677734375, -0.40771484375, -0.34765625, -0.28759765625, -0.2275390625, -0.16748046875, -0.107421875, -0.04736328125, 0.0126953125, 0.07275390625, 0.1328125, 0.19287109375, 0.2529296875, 0.31298828125, 0.373046875, 0.43310546875, 0.4931640625, 0.55322265625, 0.61328125, 0.67333984375, 0.7333984375, 0.79345703125, 0.853515625, 0.91357421875, 0.9736328125, 1.03369140625, 1.09375, 1.15380859375, 1.2138671875, 1.27392578125, 1.333984375, 1.39404296875, 1.4541015625, 1.51416015625, 1.57421875, 1.63427734375, 1.6943359375, 1.75439453125, 1.814453125, 1.87451171875, 1.9345703125, 1.99462890625, 2.0546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 4.0, 6.0, 2.0, 12.0, 5.0, 16.0, 10.0, 19.0, 22.0, 15.0, 23.0, 29.0, 28.0, 30.0, 41.0, 44.0, 39.0, 31.0, 53.0, 49.0, 50.0, 63.0, 45.0, 34.0, 41.0, 32.0, 32.0, 27.0, 26.0, 21.0, 28.0, 16.0, 15.0, 14.0, 15.0, 10.0, 9.0, 6.0, 5.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0], "bins": [-1.2548828125, -1.2197799682617188, -1.1846771240234375, -1.1495742797851562, -1.114471435546875, -1.0793685913085938, -1.0442657470703125, -1.0091629028320312, -0.97406005859375, -0.9389572143554688, -0.9038543701171875, -0.8687515258789062, -0.833648681640625, -0.7985458374023438, -0.7634429931640625, -0.7283401489257812, -0.6932373046875, -0.6581344604492188, -0.6230316162109375, -0.5879287719726562, -0.552825927734375, -0.5177230834960938, -0.4826202392578125, -0.44751739501953125, -0.41241455078125, -0.37731170654296875, -0.3422088623046875, -0.30710601806640625, -0.272003173828125, -0.23690032958984375, -0.2017974853515625, -0.16669464111328125, -0.131591796875, -0.09648895263671875, -0.0613861083984375, -0.02628326416015625, 0.008819580078125, 0.04392242431640625, 0.0790252685546875, 0.11412811279296875, 0.14923095703125, 0.18433380126953125, 0.2194366455078125, 0.25453948974609375, 0.289642333984375, 0.32474517822265625, 0.3598480224609375, 0.39495086669921875, 0.4300537109375, 0.46515655517578125, 0.5002593994140625, 0.5353622436523438, 0.570465087890625, 0.6055679321289062, 0.6406707763671875, 0.6757736206054688, 0.71087646484375, 0.7459793090820312, 0.7810821533203125, 0.8161849975585938, 0.851287841796875, 0.8863906860351562, 0.9214935302734375, 0.9565963745117188, 0.99169921875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 15.0, 12.0, 24.0, 40.0, 44.0, 63.0, 92.0, 147.0, 311.0, 859.0, 8474.0, 3812617.0, 367463.0, 2920.0, 552.0, 234.0, 119.0, 82.0, 48.0, 53.0, 38.0, 15.0, 14.0, 3.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.39453125, -6.19976806640625, -6.0050048828125, -5.81024169921875, -5.615478515625, -5.42071533203125, -5.2259521484375, -5.03118896484375, -4.83642578125, -4.64166259765625, -4.4468994140625, -4.25213623046875, -4.057373046875, -3.86260986328125, -3.6678466796875, -3.47308349609375, -3.2783203125, -3.08355712890625, -2.8887939453125, -2.69403076171875, -2.499267578125, -2.30450439453125, -2.1097412109375, -1.91497802734375, -1.72021484375, -1.52545166015625, -1.3306884765625, -1.13592529296875, -0.941162109375, -0.74639892578125, -0.5516357421875, -0.35687255859375, -0.162109375, 0.03265380859375, 0.2274169921875, 0.42218017578125, 0.616943359375, 0.81170654296875, 1.0064697265625, 1.20123291015625, 1.39599609375, 1.59075927734375, 1.7855224609375, 1.98028564453125, 2.175048828125, 2.36981201171875, 2.5645751953125, 2.75933837890625, 2.9541015625, 3.14886474609375, 3.3436279296875, 3.53839111328125, 3.733154296875, 3.92791748046875, 4.1226806640625, 4.31744384765625, 4.51220703125, 4.70697021484375, 4.9017333984375, 5.09649658203125, 5.291259765625, 5.48602294921875, 5.6807861328125, 5.87554931640625, 6.0703125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 1.0, 5.0, 5.0, 8.0, 4.0, 14.0, 17.0, 29.0, 31.0, 33.0, 48.0, 72.0, 99.0, 147.0, 177.0, 251.0, 348.0, 475.0, 470.0, 473.0, 343.0, 301.0, 204.0, 148.0, 103.0, 69.0, 50.0, 31.0, 24.0, 27.0, 22.0, 13.0, 10.0, 5.0, 1.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39501953125, -0.3811798095703125, -0.367340087890625, -0.3535003662109375, -0.33966064453125, -0.3258209228515625, -0.311981201171875, -0.2981414794921875, -0.2843017578125, -0.2704620361328125, -0.256622314453125, -0.2427825927734375, -0.22894287109375, -0.2151031494140625, -0.201263427734375, -0.1874237060546875, -0.173583984375, -0.1597442626953125, -0.145904541015625, -0.1320648193359375, -0.11822509765625, -0.1043853759765625, -0.090545654296875, -0.0767059326171875, -0.0628662109375, -0.0490264892578125, -0.035186767578125, -0.0213470458984375, -0.00750732421875, 0.0063323974609375, 0.020172119140625, 0.0340118408203125, 0.0478515625, 0.0616912841796875, 0.075531005859375, 0.0893707275390625, 0.10321044921875, 0.1170501708984375, 0.130889892578125, 0.1447296142578125, 0.1585693359375, 0.1724090576171875, 0.186248779296875, 0.2000885009765625, 0.21392822265625, 0.2277679443359375, 0.241607666015625, 0.2554473876953125, 0.269287109375, 0.2831268310546875, 0.296966552734375, 0.3108062744140625, 0.32464599609375, 0.3384857177734375, 0.352325439453125, 0.3661651611328125, 0.3800048828125, 0.3938446044921875, 0.407684326171875, 0.4215240478515625, 0.43536376953125, 0.4492034912109375, 0.463043212890625, 0.4768829345703125, 0.49072265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 8.0, 10.0, 8.0, 20.0, 27.0, 60.0, 71.0, 114.0, 160.0, 134.0, 134.0, 110.0, 56.0, 44.0, 22.0, 14.0, 8.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1752493381500244, -3.0769264698028564, -2.9786033630371094, -2.8802804946899414, -2.7819576263427734, -2.6836347579956055, -2.5853118896484375, -2.4869887828826904, -2.3886659145355225, -2.2903430461883545, -2.1920199394226074, -2.0936970710754395, -1.9953742027282715, -1.8970513343811035, -1.798728346824646, -1.7004053592681885, -1.6020824909210205, -1.5037596225738525, -1.405436635017395, -1.3071136474609375, -1.2087907791137695, -1.1104679107666016, -1.012144923210144, -0.9138219952583313, -0.8154990673065186, -0.7171761393547058, -0.6188532114028931, -0.5205302834510803, -0.4222073554992676, -0.32388442754745483, -0.2255614995956421, -0.12723857164382935, -0.0289154052734375, 0.06940752267837524, 0.167730450630188, 0.26605337858200073, 0.3643763065338135, 0.4626992344856262, 0.561022162437439, 0.6593450903892517, 0.7576680183410645, 0.8559909462928772, 0.9543138742446899, 1.0526368618011475, 1.1509597301483154, 1.2492825984954834, 1.347605586051941, 1.4459285736083984, 1.5442514419555664, 1.6425743103027344, 1.740897297859192, 1.8392202854156494, 1.9375431537628174, 2.0358660221099854, 2.1341891288757324, 2.2325119972229004, 2.3308348655700684, 2.4291577339172363, 2.5274806022644043, 2.6258037090301514, 2.7241265773773193, 2.8224494457244873, 2.9207725524902344, 3.0190954208374023, 3.1174182891845703]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 2.0, 9.0, 4.0, 5.0, 4.0, 7.0, 7.0, 6.0, 10.0, 9.0, 14.0, 16.0, 21.0, 25.0, 27.0, 27.0, 18.0, 32.0, 34.0, 33.0, 28.0, 37.0, 35.0, 45.0, 39.0, 37.0, 47.0, 36.0, 30.0, 39.0, 30.0, 34.0, 31.0, 28.0, 25.0, 24.0, 16.0, 17.0, 17.0, 15.0, 12.0, 12.0, 7.0, 12.0, 9.0, 10.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0], "bins": [-1.2031254768371582, -1.170365810394287, -1.137606143951416, -1.104846477508545, -1.0720868110656738, -1.0393271446228027, -1.0065674781799316, -0.9738078117370605, -0.9410481452941895, -0.9082884788513184, -0.8755288124084473, -0.8427691459655762, -0.8100094795227051, -0.777249813079834, -0.7444901466369629, -0.7117304801940918, -0.6789708137512207, -0.6462111473083496, -0.6134514808654785, -0.5806918144226074, -0.5479321479797363, -0.5151724815368652, -0.48241281509399414, -0.44965314865112305, -0.41689348220825195, -0.38413381576538086, -0.35137414932250977, -0.31861448287963867, -0.2858548164367676, -0.2530951499938965, -0.2203354835510254, -0.1875758171081543, -0.15481621026992798, -0.12205654382705688, -0.08929687738418579, -0.0565372109413147, -0.023777544498443604, 0.00898212194442749, 0.041741788387298584, 0.07450145483016968, 0.10726112127304077, 0.14002078771591187, 0.17278045415878296, 0.20554012060165405, 0.23829978704452515, 0.27105945348739624, 0.30381911993026733, 0.3365787863731384, 0.3693384528160095, 0.4020981192588806, 0.4348577857017517, 0.4676174521446228, 0.5003771185874939, 0.533136785030365, 0.5658964514732361, 0.5986561179161072, 0.6314157843589783, 0.6641754508018494, 0.6969351172447205, 0.7296947836875916, 0.7624544501304626, 0.7952141165733337, 0.8279737830162048, 0.8607334494590759, 0.893493115901947]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 6.0, 9.0, 7.0, 20.0, 34.0, 40.0, 65.0, 128.0, 216.0, 416.0, 769.0, 1751.0, 4728.0, 14130.0, 50591.0, 215598.0, 510488.0, 185466.0, 44124.0, 12497.0, 4235.0, 1635.0, 762.0, 362.0, 168.0, 115.0, 68.0, 37.0, 19.0, 20.0, 12.0, 10.0, 10.0, 7.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4677734375, -0.4518890380859375, -0.436004638671875, -0.4201202392578125, -0.40423583984375, -0.3883514404296875, -0.372467041015625, -0.3565826416015625, -0.3406982421875, -0.3248138427734375, -0.308929443359375, -0.2930450439453125, -0.27716064453125, -0.2612762451171875, -0.245391845703125, -0.2295074462890625, -0.213623046875, -0.1977386474609375, -0.181854248046875, -0.1659698486328125, -0.15008544921875, -0.1342010498046875, -0.118316650390625, -0.1024322509765625, -0.0865478515625, -0.0706634521484375, -0.054779052734375, -0.0388946533203125, -0.02301025390625, -0.0071258544921875, 0.008758544921875, 0.0246429443359375, 0.04052734375, 0.0564117431640625, 0.072296142578125, 0.0881805419921875, 0.10406494140625, 0.1199493408203125, 0.135833740234375, 0.1517181396484375, 0.1676025390625, 0.1834869384765625, 0.199371337890625, 0.2152557373046875, 0.23114013671875, 0.2470245361328125, 0.262908935546875, 0.2787933349609375, 0.294677734375, 0.3105621337890625, 0.326446533203125, 0.3423309326171875, 0.35821533203125, 0.3740997314453125, 0.389984130859375, 0.4058685302734375, 0.4217529296875, 0.4376373291015625, 0.453521728515625, 0.4694061279296875, 0.48529052734375, 0.5011749267578125, 0.517059326171875, 0.5329437255859375, 0.548828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 9.0, 7.0, 7.0, 6.0, 9.0, 7.0, 6.0, 4.0, 11.0, 20.0, 28.0, 19.0, 33.0, 37.0, 45.0, 29.0, 33.0, 36.0, 55.0, 42.0, 47.0, 61.0, 54.0, 44.0, 31.0, 33.0, 41.0, 38.0, 31.0, 26.0, 26.0, 15.0, 18.0, 16.0, 14.0, 13.0, 10.0, 5.0, 9.0, 9.0, 5.0, 3.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.86328125, -0.8398056030273438, -0.8163299560546875, -0.7928543090820312, -0.769378662109375, -0.7459030151367188, -0.7224273681640625, -0.6989517211914062, -0.67547607421875, -0.6520004272460938, -0.6285247802734375, -0.6050491333007812, -0.581573486328125, -0.5580978393554688, -0.5346221923828125, -0.5111465454101562, -0.4876708984375, -0.46419525146484375, -0.4407196044921875, -0.41724395751953125, -0.393768310546875, -0.37029266357421875, -0.3468170166015625, -0.32334136962890625, -0.29986572265625, -0.27639007568359375, -0.2529144287109375, -0.22943878173828125, -0.205963134765625, -0.18248748779296875, -0.1590118408203125, -0.13553619384765625, -0.112060546875, -0.08858489990234375, -0.0651092529296875, -0.04163360595703125, -0.018157958984375, 0.00531768798828125, 0.0287933349609375, 0.05226898193359375, 0.07574462890625, 0.09922027587890625, 0.1226959228515625, 0.14617156982421875, 0.169647216796875, 0.19312286376953125, 0.2165985107421875, 0.24007415771484375, 0.2635498046875, 0.28702545166015625, 0.3105010986328125, 0.33397674560546875, 0.357452392578125, 0.38092803955078125, 0.4044036865234375, 0.42787933349609375, 0.45135498046875, 0.47483062744140625, 0.4983062744140625, 0.5217819213867188, 0.545257568359375, 0.5687332153320312, 0.5922088623046875, 0.6156845092773438, 0.63916015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 11.0, 7.0, 11.0, 16.0, 27.0, 24.0, 48.0, 57.0, 87.0, 133.0, 207.0, 323.0, 549.0, 1030.0, 2109.0, 4743.0, 11339.0, 29674.0, 79582.0, 208538.0, 359452.0, 215936.0, 82030.0, 30967.0, 12064.0, 4842.0, 2177.0, 1013.0, 576.0, 330.0, 188.0, 109.0, 90.0, 74.0, 36.0, 36.0, 31.0, 16.0, 8.0, 10.0, 9.0, 11.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.359375, -0.3483238220214844, -0.33727264404296875, -0.3262214660644531, -0.3151702880859375, -0.3041191101074219, -0.29306793212890625, -0.2820167541503906, -0.270965576171875, -0.2599143981933594, -0.24886322021484375, -0.23781204223632812, -0.2267608642578125, -0.21570968627929688, -0.20465850830078125, -0.19360733032226562, -0.18255615234375, -0.17150497436523438, -0.16045379638671875, -0.14940261840820312, -0.1383514404296875, -0.12730026245117188, -0.11624908447265625, -0.10519790649414062, -0.094146728515625, -0.08309555053710938, -0.07204437255859375, -0.060993194580078125, -0.0499420166015625, -0.038890838623046875, -0.02783966064453125, -0.016788482666015625, -0.0057373046875, 0.005313873291015625, 0.01636505126953125, 0.027416229248046875, 0.0384674072265625, 0.049518585205078125, 0.06056976318359375, 0.07162094116210938, 0.082672119140625, 0.09372329711914062, 0.10477447509765625, 0.11582565307617188, 0.1268768310546875, 0.13792800903320312, 0.14897918701171875, 0.16003036499023438, 0.17108154296875, 0.18213272094726562, 0.19318389892578125, 0.20423507690429688, 0.2152862548828125, 0.22633743286132812, 0.23738861083984375, 0.24843978881835938, 0.259490966796875, 0.2705421447753906, 0.28159332275390625, 0.2926445007324219, 0.3036956787109375, 0.3147468566894531, 0.32579803466796875, 0.3368492126464844, 0.347900390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 8.0, 4.0, 3.0, 8.0, 7.0, 11.0, 19.0, 27.0, 13.0, 23.0, 24.0, 26.0, 38.0, 37.0, 40.0, 57.0, 55.0, 38.0, 47.0, 64.0, 53.0, 54.0, 55.0, 46.0, 49.0, 26.0, 25.0, 20.0, 16.0, 14.0, 16.0, 14.0, 14.0, 14.0, 6.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.48828125, -1.4355926513671875, -1.382904052734375, -1.3302154541015625, -1.27752685546875, -1.2248382568359375, -1.172149658203125, -1.1194610595703125, -1.0667724609375, -1.0140838623046875, -0.961395263671875, -0.9087066650390625, -0.85601806640625, -0.8033294677734375, -0.750640869140625, -0.6979522705078125, -0.645263671875, -0.5925750732421875, -0.539886474609375, -0.4871978759765625, -0.43450927734375, -0.3818206787109375, -0.329132080078125, -0.2764434814453125, -0.2237548828125, -0.1710662841796875, -0.118377685546875, -0.0656890869140625, -0.01300048828125, 0.0396881103515625, 0.092376708984375, 0.1450653076171875, 0.19775390625, 0.2504425048828125, 0.303131103515625, 0.3558197021484375, 0.40850830078125, 0.4611968994140625, 0.513885498046875, 0.5665740966796875, 0.6192626953125, 0.6719512939453125, 0.724639892578125, 0.7773284912109375, 0.83001708984375, 0.8827056884765625, 0.935394287109375, 0.9880828857421875, 1.040771484375, 1.0934600830078125, 1.146148681640625, 1.1988372802734375, 1.25152587890625, 1.3042144775390625, 1.356903076171875, 1.4095916748046875, 1.4622802734375, 1.5149688720703125, 1.567657470703125, 1.6203460693359375, 1.67303466796875, 1.7257232666015625, 1.778411865234375, 1.8311004638671875, 1.8837890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 5.0, 14.0, 16.0, 32.0, 55.0, 89.0, 171.0, 313.0, 730.0, 1837.0, 5362.0, 21754.0, 213525.0, 719323.0, 68492.0, 11265.0, 3202.0, 1211.0, 530.0, 277.0, 126.0, 91.0, 45.0, 29.0, 14.0, 10.0, 10.0, 9.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3056640625, -0.2935752868652344, -0.28148651123046875, -0.2693977355957031, -0.2573089599609375, -0.24522018432617188, -0.23313140869140625, -0.22104263305664062, -0.208953857421875, -0.19686508178710938, -0.18477630615234375, -0.17268753051757812, -0.1605987548828125, -0.14850997924804688, -0.13642120361328125, -0.12433242797851562, -0.11224365234375, -0.10015487670898438, -0.08806610107421875, -0.07597732543945312, -0.0638885498046875, -0.051799774169921875, -0.03971099853515625, -0.027622222900390625, -0.015533447265625, -0.003444671630859375, 0.00864410400390625, 0.020732879638671875, 0.0328216552734375, 0.044910430908203125, 0.05699920654296875, 0.06908798217773438, 0.0811767578125, 0.09326553344726562, 0.10535430908203125, 0.11744308471679688, 0.1295318603515625, 0.14162063598632812, 0.15370941162109375, 0.16579818725585938, 0.177886962890625, 0.18997573852539062, 0.20206451416015625, 0.21415328979492188, 0.2262420654296875, 0.23833084106445312, 0.25041961669921875, 0.2625083923339844, 0.27459716796875, 0.2866859436035156, 0.29877471923828125, 0.3108634948730469, 0.3229522705078125, 0.3350410461425781, 0.34712982177734375, 0.3592185974121094, 0.371307373046875, 0.3833961486816406, 0.39548492431640625, 0.4075736999511719, 0.4196624755859375, 0.4317512512207031, 0.44384002685546875, 0.4559288024902344, 0.468017578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 7.0, 10.0, 9.0, 21.0, 20.0, 37.0, 42.0, 74.0, 108.0, 109.0, 138.0, 128.0, 82.0, 45.0, 40.0, 38.0, 21.0, 13.0, 12.0, 11.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010085105895996094, -9.781122207641602e-05, -9.47713851928711e-05, -9.173154830932617e-05, -8.869171142578125e-05, -8.565187454223633e-05, -8.26120376586914e-05, -7.957220077514648e-05, -7.653236389160156e-05, -7.349252700805664e-05, -7.045269012451172e-05, -6.74128532409668e-05, -6.437301635742188e-05, -6.133317947387695e-05, -5.829334259033203e-05, -5.525350570678711e-05, -5.221366882324219e-05, -4.9173831939697266e-05, -4.6133995056152344e-05, -4.309415817260742e-05, -4.00543212890625e-05, -3.701448440551758e-05, -3.3974647521972656e-05, -3.0934810638427734e-05, -2.7894973754882812e-05, -2.485513687133789e-05, -2.181529998779297e-05, -1.8775463104248047e-05, -1.5735626220703125e-05, -1.2695789337158203e-05, -9.655952453613281e-06, -6.616115570068359e-06, -3.5762786865234375e-06, -5.364418029785156e-07, 2.5033950805664062e-06, 5.543231964111328e-06, 8.58306884765625e-06, 1.1622905731201172e-05, 1.4662742614746094e-05, 1.7702579498291016e-05, 2.0742416381835938e-05, 2.378225326538086e-05, 2.682209014892578e-05, 2.9861927032470703e-05, 3.2901763916015625e-05, 3.594160079956055e-05, 3.898143768310547e-05, 4.202127456665039e-05, 4.506111145019531e-05, 4.8100948333740234e-05, 5.1140785217285156e-05, 5.418062210083008e-05, 5.7220458984375e-05, 6.026029586791992e-05, 6.330013275146484e-05, 6.633996963500977e-05, 6.937980651855469e-05, 7.241964340209961e-05, 7.545948028564453e-05, 7.849931716918945e-05, 8.153915405273438e-05, 8.45789909362793e-05, 8.761882781982422e-05, 9.065866470336914e-05, 9.369850158691406e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 10.0, 3.0, 10.0, 17.0, 13.0, 21.0, 36.0, 40.0, 69.0, 126.0, 321.0, 688.0, 2255.0, 11477.0, 143290.0, 804978.0, 74876.0, 7550.0, 1669.0, 537.0, 246.0, 118.0, 66.0, 41.0, 17.0, 21.0, 15.0, 10.0, 10.0, 13.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.443603515625, -0.42990875244140625, -0.4162139892578125, -0.40251922607421875, -0.388824462890625, -0.37512969970703125, -0.3614349365234375, -0.34774017333984375, -0.33404541015625, -0.32035064697265625, -0.3066558837890625, -0.29296112060546875, -0.279266357421875, -0.26557159423828125, -0.2518768310546875, -0.23818206787109375, -0.2244873046875, -0.21079254150390625, -0.1970977783203125, -0.18340301513671875, -0.169708251953125, -0.15601348876953125, -0.1423187255859375, -0.12862396240234375, -0.11492919921875, -0.10123443603515625, -0.0875396728515625, -0.07384490966796875, -0.060150146484375, -0.04645538330078125, -0.0327606201171875, -0.01906585693359375, -0.00537109375, 0.00832366943359375, 0.0220184326171875, 0.03571319580078125, 0.049407958984375, 0.06310272216796875, 0.0767974853515625, 0.09049224853515625, 0.10418701171875, 0.11788177490234375, 0.1315765380859375, 0.14527130126953125, 0.158966064453125, 0.17266082763671875, 0.1863555908203125, 0.20005035400390625, 0.2137451171875, 0.22743988037109375, 0.2411346435546875, 0.25482940673828125, 0.268524169921875, 0.28221893310546875, 0.2959136962890625, 0.30960845947265625, 0.32330322265625, 0.33699798583984375, 0.3506927490234375, 0.36438751220703125, 0.378082275390625, 0.39177703857421875, 0.4054718017578125, 0.41916656494140625, 0.432861328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 5.0, 9.0, 12.0, 9.0, 15.0, 14.0, 25.0, 31.0, 58.0, 53.0, 84.0, 97.0, 115.0, 111.0, 86.0, 66.0, 45.0, 49.0, 33.0, 15.0, 14.0, 11.0, 7.0, 2.0, 12.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.073974609375, -0.07176780700683594, -0.06956100463867188, -0.06735420227050781, -0.06514739990234375, -0.06294059753417969, -0.060733795166015625, -0.05852699279785156, -0.0563201904296875, -0.05411338806152344, -0.051906585693359375, -0.04969978332519531, -0.04749298095703125, -0.04528617858886719, -0.043079376220703125, -0.04087257385253906, -0.038665771484375, -0.03645896911621094, -0.034252166748046875, -0.03204536437988281, -0.02983856201171875, -0.027631759643554688, -0.025424957275390625, -0.023218154907226562, -0.0210113525390625, -0.018804550170898438, -0.016597747802734375, -0.014390945434570312, -0.01218414306640625, -0.009977340698242188, -0.007770538330078125, -0.0055637359619140625, -0.00335693359375, -0.0011501312255859375, 0.001056671142578125, 0.0032634735107421875, 0.00547027587890625, 0.0076770782470703125, 0.009883880615234375, 0.012090682983398438, 0.0142974853515625, 0.016504287719726562, 0.018711090087890625, 0.020917892456054688, 0.02312469482421875, 0.025331497192382812, 0.027538299560546875, 0.029745101928710938, 0.031951904296875, 0.03415870666503906, 0.036365509033203125, 0.03857231140136719, 0.04077911376953125, 0.04298591613769531, 0.045192718505859375, 0.04739952087402344, 0.0496063232421875, 0.05181312561035156, 0.054019927978515625, 0.05622673034667969, 0.05843353271484375, 0.06064033508300781, 0.06284713745117188, 0.06505393981933594, 0.0672607421875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 11.0, 11.0, 19.0, 29.0, 51.0, 106.0, 163.0, 177.0, 164.0, 111.0, 65.0, 51.0, 18.0, 8.0, 9.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3199594020843506, -2.2529542446136475, -2.1859488487243652, -2.118943691253662, -2.05193829536438, -1.9849331378936768, -1.917927861213684, -1.8509225845336914, -1.7839174270629883, -1.7169121503829956, -1.649906873703003, -1.5829017162322998, -1.5158964395523071, -1.4488911628723145, -1.3818858861923218, -1.314880609512329, -1.2478753328323364, -1.1808700561523438, -1.113864779472351, -1.0468595027923584, -0.9798543453216553, -0.9128490686416626, -0.8458437919616699, -0.7788385152816772, -0.7118332982063293, -0.6448280215263367, -0.5778228044509888, -0.5108175277709961, -0.4438122808933258, -0.3768070340156555, -0.30980175733566284, -0.24279651045799255, -0.17579138278961182, -0.10878612846136093, -0.041780874133110046, 0.025224387645721436, 0.09222963452339172, 0.159234881401062, 0.2262401580810547, 0.293245404958725, 0.36025065183639526, 0.42725589871406555, 0.49426114559173584, 0.5612664222717285, 0.6282716989517212, 0.6952769160270691, 0.7622821927070618, 0.8292874097824097, 0.8962926864624023, 0.963297963142395, 1.0303032398223877, 1.0973083972930908, 1.1643136739730835, 1.2313189506530762, 1.2983242273330688, 1.3653295040130615, 1.4323346614837646, 1.4993399381637573, 1.56634521484375, 1.6333503723144531, 1.7003556489944458, 1.7673609256744385, 1.8343662023544312, 1.9013714790344238, 1.9683767557144165]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 12.0, 10.0, 4.0, 12.0, 15.0, 18.0, 23.0, 30.0, 30.0, 49.0, 53.0, 58.0, 45.0, 58.0, 74.0, 58.0, 56.0, 61.0, 52.0, 40.0, 49.0, 38.0, 26.0, 32.0, 16.0, 21.0, 16.0, 16.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.267939567565918, -1.23697030544281, -1.2060011625289917, -1.1750319004058838, -1.1440626382827759, -1.113093376159668, -1.0821242332458496, -1.0511549711227417, -1.0201857089996338, -0.9892165064811707, -0.9582472443580627, -0.9272780418395996, -0.8963087797164917, -0.8653395771980286, -0.8343703746795654, -0.8034011125564575, -0.7724319100379944, -0.7414627075195312, -0.7104934453964233, -0.6795242428779602, -0.6485549807548523, -0.6175857782363892, -0.5866165161132812, -0.5556473135948181, -0.524678111076355, -0.49370887875556946, -0.46273964643478394, -0.4317704439163208, -0.4008011817932129, -0.36983197927474976, -0.33886274695396423, -0.3078935146331787, -0.2769242525100708, -0.24595502018928528, -0.21498578786849976, -0.18401657044887543, -0.1530473381280899, -0.12207810580730438, -0.09110888838768005, -0.06013965606689453, -0.02917042374610901, 0.0017988048493862152, 0.03276803344488144, 0.06373725831508636, 0.09470649063587189, 0.1256757229566574, 0.15664494037628174, 0.18761417269706726, 0.21858340501785278, 0.2495526373386383, 0.28052186965942383, 0.31149107217788696, 0.3424603343009949, 0.373429536819458, 0.40439876914024353, 0.43536800146102905, 0.4663372337818146, 0.4973064661026001, 0.5282756686210632, 0.5592449307441711, 0.5902141332626343, 0.6211833953857422, 0.6521525979042053, 0.6831218004226685, 0.7140910625457764]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 9.0, 9.0, 16.0, 22.0, 31.0, 44.0, 91.0, 187.0, 3338.0, 765579.0, 277519.0, 1356.0, 135.0, 82.0, 45.0, 34.0, 23.0, 12.0, 12.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.17578125, -6.031768798828125, -5.88775634765625, -5.743743896484375, -5.5997314453125, -5.455718994140625, -5.31170654296875, -5.167694091796875, -5.023681640625, -4.879669189453125, -4.73565673828125, -4.591644287109375, -4.4476318359375, -4.303619384765625, -4.15960693359375, -4.015594482421875, -3.87158203125, -3.727569580078125, -3.58355712890625, -3.439544677734375, -3.2955322265625, -3.151519775390625, -3.00750732421875, -2.863494873046875, -2.719482421875, -2.575469970703125, -2.43145751953125, -2.287445068359375, -2.1434326171875, -1.999420166015625, -1.85540771484375, -1.711395263671875, -1.5673828125, -1.423370361328125, -1.27935791015625, -1.135345458984375, -0.9913330078125, -0.847320556640625, -0.70330810546875, -0.559295654296875, -0.415283203125, -0.271270751953125, -0.12725830078125, 0.016754150390625, 0.1607666015625, 0.304779052734375, 0.44879150390625, 0.592803955078125, 0.73681640625, 0.880828857421875, 1.02484130859375, 1.168853759765625, 1.3128662109375, 1.456878662109375, 1.60089111328125, 1.744903564453125, 1.888916015625, 2.032928466796875, 2.17694091796875, 2.320953369140625, 2.4649658203125, 2.608978271484375, 2.75299072265625, 2.897003173828125, 3.041015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 3.0, 9.0, 9.0, 17.0, 20.0, 33.0, 38.0, 63.0, 70.0, 111.0, 83.0, 106.0, 95.0, 108.0, 62.0, 49.0, 40.0, 33.0, 24.0, 11.0, 11.0, 7.0, 7.0], "bins": [-5.59765625, -5.4905242919921875, -5.383392333984375, -5.2762603759765625, -5.16912841796875, -5.0619964599609375, -4.954864501953125, -4.8477325439453125, -4.7406005859375, -4.6334686279296875, -4.526336669921875, -4.4192047119140625, -4.31207275390625, -4.2049407958984375, -4.097808837890625, -3.9906768798828125, -3.883544921875, -3.7764129638671875, -3.669281005859375, -3.5621490478515625, -3.45501708984375, -3.3478851318359375, -3.240753173828125, -3.1336212158203125, -3.0264892578125, -2.9193572998046875, -2.812225341796875, -2.7050933837890625, -2.59796142578125, -2.4908294677734375, -2.383697509765625, -2.2765655517578125, -2.16943359375, -2.0623016357421875, -1.955169677734375, -1.8480377197265625, -1.74090576171875, -1.6337738037109375, -1.526641845703125, -1.4195098876953125, -1.3123779296875, -1.2052459716796875, -1.098114013671875, -0.9909820556640625, -0.88385009765625, -0.7767181396484375, -0.669586181640625, -0.5624542236328125, -0.455322265625, -0.3481903076171875, -0.241058349609375, -0.1339263916015625, -0.02679443359375, 0.0803375244140625, 0.187469482421875, 0.2946014404296875, 0.4017333984375, 0.5088653564453125, 0.615997314453125, 0.7231292724609375, 0.83026123046875, 0.9373931884765625, 1.044525146484375, 1.1516571044921875, 1.2587890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 6.0, 13.0, 14.0, 10.0, 24.0, 22.0, 33.0, 30.0, 54.0, 53.0, 71.0, 83.0, 94.0, 143.0, 165.0, 208.0, 323.0, 688.0, 4927.0, 130685.0, 838407.0, 67404.0, 3239.0, 574.0, 294.0, 187.0, 136.0, 126.0, 109.0, 79.0, 75.0, 61.0, 43.0, 33.0, 33.0, 28.0, 19.0, 11.0, 9.0, 8.0, 5.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0], "bins": [-2.453125, -2.3818359375, -2.310546875, -2.2392578125, -2.16796875, -2.0966796875, -2.025390625, -1.9541015625, -1.8828125, -1.8115234375, -1.740234375, -1.6689453125, -1.59765625, -1.5263671875, -1.455078125, -1.3837890625, -1.3125, -1.2412109375, -1.169921875, -1.0986328125, -1.02734375, -0.9560546875, -0.884765625, -0.8134765625, -0.7421875, -0.6708984375, -0.599609375, -0.5283203125, -0.45703125, -0.3857421875, -0.314453125, -0.2431640625, -0.171875, -0.1005859375, -0.029296875, 0.0419921875, 0.11328125, 0.1845703125, 0.255859375, 0.3271484375, 0.3984375, 0.4697265625, 0.541015625, 0.6123046875, 0.68359375, 0.7548828125, 0.826171875, 0.8974609375, 0.96875, 1.0400390625, 1.111328125, 1.1826171875, 1.25390625, 1.3251953125, 1.396484375, 1.4677734375, 1.5390625, 1.6103515625, 1.681640625, 1.7529296875, 1.82421875, 1.8955078125, 1.966796875, 2.0380859375, 2.109375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 4.0, 5.0, 13.0, 15.0, 13.0, 18.0, 19.0, 20.0, 18.0, 16.0, 37.0, 30.0, 23.0, 47.0, 38.0, 28.0, 33.0, 38.0, 32.0, 45.0, 46.0, 48.0, 48.0, 45.0, 37.0, 24.0, 33.0, 30.0, 21.0, 31.0, 21.0, 15.0, 15.0, 11.0, 12.0, 8.0, 8.0, 12.0, 6.0, 5.0, 9.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.470703125, -1.4264984130859375, -1.382293701171875, -1.3380889892578125, -1.29388427734375, -1.2496795654296875, -1.205474853515625, -1.1612701416015625, -1.1170654296875, -1.0728607177734375, -1.028656005859375, -0.9844512939453125, -0.94024658203125, -0.8960418701171875, -0.851837158203125, -0.8076324462890625, -0.763427734375, -0.7192230224609375, -0.675018310546875, -0.6308135986328125, -0.58660888671875, -0.5424041748046875, -0.498199462890625, -0.4539947509765625, -0.4097900390625, -0.3655853271484375, -0.321380615234375, -0.2771759033203125, -0.23297119140625, -0.1887664794921875, -0.144561767578125, -0.1003570556640625, -0.05615234375, -0.0119476318359375, 0.032257080078125, 0.0764617919921875, 0.12066650390625, 0.1648712158203125, 0.209075927734375, 0.2532806396484375, 0.2974853515625, 0.3416900634765625, 0.385894775390625, 0.4300994873046875, 0.47430419921875, 0.5185089111328125, 0.562713623046875, 0.6069183349609375, 0.651123046875, 0.6953277587890625, 0.739532470703125, 0.7837371826171875, 0.82794189453125, 0.8721466064453125, 0.916351318359375, 0.9605560302734375, 1.0047607421875, 1.0489654541015625, 1.093170166015625, 1.1373748779296875, 1.18157958984375, 1.2257843017578125, 1.269989013671875, 1.3141937255859375, 1.3583984375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 7.0, 17.0, 14.0, 31.0, 38.0, 52.0, 77.0, 150.0, 290.0, 955.0, 4834.0, 51830.0, 695051.0, 276462.0, 15529.0, 2167.0, 534.0, 197.0, 93.0, 60.0, 41.0, 30.0, 32.0, 16.0, 8.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5419921875, -0.5264053344726562, -0.5108184814453125, -0.49523162841796875, -0.479644775390625, -0.46405792236328125, -0.4484710693359375, -0.43288421630859375, -0.41729736328125, -0.40171051025390625, -0.3861236572265625, -0.37053680419921875, -0.354949951171875, -0.33936309814453125, -0.3237762451171875, -0.30818939208984375, -0.2926025390625, -0.27701568603515625, -0.2614288330078125, -0.24584197998046875, -0.230255126953125, -0.21466827392578125, -0.1990814208984375, -0.18349456787109375, -0.16790771484375, -0.15232086181640625, -0.1367340087890625, -0.12114715576171875, -0.105560302734375, -0.08997344970703125, -0.0743865966796875, -0.05879974365234375, -0.043212890625, -0.02762603759765625, -0.0120391845703125, 0.00354766845703125, 0.019134521484375, 0.03472137451171875, 0.0503082275390625, 0.06589508056640625, 0.08148193359375, 0.09706878662109375, 0.1126556396484375, 0.12824249267578125, 0.143829345703125, 0.15941619873046875, 0.1750030517578125, 0.19058990478515625, 0.2061767578125, 0.22176361083984375, 0.2373504638671875, 0.25293731689453125, 0.268524169921875, 0.28411102294921875, 0.2996978759765625, 0.31528472900390625, 0.33087158203125, 0.34645843505859375, 0.3620452880859375, 0.37763214111328125, 0.393218994140625, 0.40880584716796875, 0.4243927001953125, 0.43997955322265625, 0.45556640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 10.0, 8.0, 15.0, 13.0, 14.0, 27.0, 33.0, 36.0, 47.0, 58.0, 59.0, 69.0, 66.0, 86.0, 72.0, 67.0, 64.0, 43.0, 42.0, 34.0, 37.0, 14.0, 19.0, 10.0, 12.0, 8.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.190206527709961e-05, -4.078354686498642e-05, -3.966502845287323e-05, -3.854651004076004e-05, -3.742799162864685e-05, -3.630947321653366e-05, -3.519095480442047e-05, -3.407243639230728e-05, -3.295391798019409e-05, -3.18353995680809e-05, -3.071688115596771e-05, -2.9598362743854523e-05, -2.8479844331741333e-05, -2.7361325919628143e-05, -2.6242807507514954e-05, -2.5124289095401764e-05, -2.4005770683288574e-05, -2.2887252271175385e-05, -2.1768733859062195e-05, -2.0650215446949005e-05, -1.9531697034835815e-05, -1.8413178622722626e-05, -1.7294660210609436e-05, -1.6176141798496246e-05, -1.5057623386383057e-05, -1.3939104974269867e-05, -1.2820586562156677e-05, -1.1702068150043488e-05, -1.0583549737930298e-05, -9.465031325817108e-06, -8.346512913703918e-06, -7.227994501590729e-06, -6.109476089477539e-06, -4.990957677364349e-06, -3.87243926525116e-06, -2.75392085313797e-06, -1.6354024410247803e-06, -5.168840289115906e-07, 6.016343832015991e-07, 1.7201527953147888e-06, 2.8386712074279785e-06, 3.957189619541168e-06, 5.075708031654358e-06, 6.194226443767548e-06, 7.312744855880737e-06, 8.431263267993927e-06, 9.549781680107117e-06, 1.0668300092220306e-05, 1.1786818504333496e-05, 1.2905336916446686e-05, 1.4023855328559875e-05, 1.5142373740673065e-05, 1.6260892152786255e-05, 1.7379410564899445e-05, 1.8497928977012634e-05, 1.9616447389125824e-05, 2.0734965801239014e-05, 2.1853484213352203e-05, 2.2972002625465393e-05, 2.4090521037578583e-05, 2.5209039449691772e-05, 2.6327557861804962e-05, 2.7446076273918152e-05, 2.856459468603134e-05, 2.968311309814453e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 8.0, 11.0, 11.0, 25.0, 22.0, 45.0, 56.0, 124.0, 257.0, 721.0, 3291.0, 43525.0, 898314.0, 96028.0, 4573.0, 864.0, 288.0, 154.0, 86.0, 56.0, 34.0, 16.0, 17.0, 3.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72412109375, -0.7004547119140625, -0.676788330078125, -0.6531219482421875, -0.62945556640625, -0.6057891845703125, -0.582122802734375, -0.5584564208984375, -0.5347900390625, -0.5111236572265625, -0.487457275390625, -0.4637908935546875, -0.44012451171875, -0.4164581298828125, -0.392791748046875, -0.3691253662109375, -0.345458984375, -0.3217926025390625, -0.298126220703125, -0.2744598388671875, -0.25079345703125, -0.2271270751953125, -0.203460693359375, -0.1797943115234375, -0.1561279296875, -0.1324615478515625, -0.108795166015625, -0.0851287841796875, -0.06146240234375, -0.0377960205078125, -0.014129638671875, 0.0095367431640625, 0.033203125, 0.0568695068359375, 0.080535888671875, 0.1042022705078125, 0.12786865234375, 0.1515350341796875, 0.175201416015625, 0.1988677978515625, 0.2225341796875, 0.2462005615234375, 0.269866943359375, 0.2935333251953125, 0.31719970703125, 0.3408660888671875, 0.364532470703125, 0.3881988525390625, 0.411865234375, 0.4355316162109375, 0.459197998046875, 0.4828643798828125, 0.50653076171875, 0.5301971435546875, 0.553863525390625, 0.5775299072265625, 0.6011962890625, 0.6248626708984375, 0.648529052734375, 0.6721954345703125, 0.69586181640625, 0.7195281982421875, 0.743194580078125, 0.7668609619140625, 0.79052734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 3.0, 13.0, 18.0, 21.0, 29.0, 34.0, 50.0, 65.0, 115.0, 107.0, 113.0, 106.0, 86.0, 71.0, 46.0, 38.0, 28.0, 10.0, 11.0, 7.0, 10.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2230224609375, -0.21706771850585938, -0.21111297607421875, -0.20515823364257812, -0.1992034912109375, -0.19324874877929688, -0.18729400634765625, -0.18133926391601562, -0.175384521484375, -0.16942977905273438, -0.16347503662109375, -0.15752029418945312, -0.1515655517578125, -0.14561080932617188, -0.13965606689453125, -0.13370132446289062, -0.12774658203125, -0.12179183959960938, -0.11583709716796875, -0.10988235473632812, -0.1039276123046875, -0.09797286987304688, -0.09201812744140625, -0.08606338500976562, -0.080108642578125, -0.07415390014648438, -0.06819915771484375, -0.062244415283203125, -0.0562896728515625, -0.050334930419921875, -0.04438018798828125, -0.038425445556640625, -0.032470703125, -0.026515960693359375, -0.02056121826171875, -0.014606475830078125, -0.0086517333984375, -0.002696990966796875, 0.00325775146484375, 0.009212493896484375, 0.015167236328125, 0.021121978759765625, 0.02707672119140625, 0.033031463623046875, 0.0389862060546875, 0.044940948486328125, 0.05089569091796875, 0.056850433349609375, 0.06280517578125, 0.06875991821289062, 0.07471466064453125, 0.08066940307617188, 0.0866241455078125, 0.09257888793945312, 0.09853363037109375, 0.10448837280273438, 0.110443115234375, 0.11639785766601562, 0.12235260009765625, 0.12830734252929688, 0.1342620849609375, 0.14021682739257812, 0.14617156982421875, 0.15212631225585938, 0.1580810546875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 12.0, 6.0, 27.0, 31.0, 60.0, 110.0, 147.0, 186.0, 143.0, 120.0, 69.0, 47.0, 18.0, 11.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33904504776001, -4.20599889755249, -4.072952747344971, -3.9399068355560303, -3.80686092376709, -3.6738147735595703, -3.540768623352051, -3.4077227115631104, -3.27467679977417, -3.1416306495666504, -3.00858473777771, -2.8755385875701904, -2.74249267578125, -2.6094465255737305, -2.476400375366211, -2.3433544635772705, -2.210308313369751, -2.0772621631622314, -1.944216251373291, -1.8111701011657715, -1.678124189376831, -1.5450780391693115, -1.4120320081710815, -1.2789859771728516, -1.1459399461746216, -1.0128939151763916, -0.8798478841781616, -0.7468017935752869, -0.6137557625770569, -0.4807097315788269, -0.34766364097595215, -0.21461760997772217, -0.08157157897949219, 0.05147446691989899, 0.18452051281929016, 0.31756657361984253, 0.4506126046180725, 0.5836586356163025, 0.7167047262191772, 0.8497507572174072, 0.9827967882156372, 1.1158428192138672, 1.2488888502120972, 1.3819348812103271, 1.5149810314178467, 1.648026943206787, 1.7810730934143066, 1.9141191244125366, 2.0471651554107666, 2.180211305618286, 2.3132572174072266, 2.446303367614746, 2.5793492794036865, 2.712395429611206, 2.8454413414001465, 2.978487491607666, 3.1115336418151855, 3.244579792022705, 3.3776257038116455, 3.510671854019165, 3.6437177658081055, 3.776763916015625, 3.9098100662231445, 4.042856216430664, 4.175901889801025]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 14.0, 13.0, 11.0, 23.0, 22.0, 38.0, 45.0, 39.0, 56.0, 74.0, 52.0, 66.0, 73.0, 76.0, 71.0, 75.0, 49.0, 52.0, 34.0, 33.0, 31.0, 21.0, 15.0, 13.0, 6.0, 2.0, 2.0, 6.0, 2.0], "bins": [-6.718866348266602, -6.577828407287598, -6.436790943145752, -6.295753002166748, -6.154715061187744, -6.013677597045898, -5.8726396560668945, -5.731601715087891, -5.590563774108887, -5.449525833129883, -5.308488368988037, -5.167450428009033, -5.026412487030029, -4.885375022888184, -4.74433708190918, -4.603299140930176, -4.46226167678833, -4.321223735809326, -4.1801862716674805, -4.039148330688477, -3.8981103897094727, -3.757072687149048, -3.616034984588623, -3.474997043609619, -3.3339593410491943, -3.1929216384887695, -3.0518836975097656, -2.910845994949341, -2.769808292388916, -2.628770351409912, -2.4877326488494873, -2.3466949462890625, -2.2056565284729004, -2.0646188259124756, -1.9235808849334717, -1.7825431823730469, -1.6415053606033325, -1.5004675388336182, -1.3594298362731934, -1.218392014503479, -1.0773541927337646, -0.9363163709640503, -0.7952786087989807, -0.6542408466339111, -0.5132030248641968, -0.3721652030944824, -0.23112744092941284, -0.09008967876434326, 0.050948143005371094, 0.19198593497276306, 0.33302372694015503, 0.474061518907547, 0.615099310874939, 0.7561371326446533, 0.8971748948097229, 1.0382126569747925, 1.1792504787445068, 1.3202883005142212, 1.4613261222839355, 1.6023638248443604, 1.7434016466140747, 1.884439468383789, 2.025477170944214, 2.1665148735046387, 2.3075528144836426]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 6.0, 6.0, 8.0, 9.0, 10.0, 19.0, 24.0, 43.0, 59.0, 92.0, 111.0, 168.0, 294.0, 476.0, 789.0, 1514.0, 3257.0, 7631.0, 23083.0, 91941.0, 477992.0, 1794871.0, 1378635.0, 313107.0, 68599.0, 18957.0, 6426.0, 2806.0, 1399.0, 777.0, 397.0, 257.0, 143.0, 112.0, 79.0, 53.0, 30.0, 30.0, 22.0, 16.0, 12.0, 5.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2548828125, -1.2142333984375, -1.173583984375, -1.1329345703125, -1.09228515625, -1.0516357421875, -1.010986328125, -0.9703369140625, -0.9296875, -0.8890380859375, -0.848388671875, -0.8077392578125, -0.76708984375, -0.7264404296875, -0.685791015625, -0.6451416015625, -0.6044921875, -0.5638427734375, -0.523193359375, -0.4825439453125, -0.44189453125, -0.4012451171875, -0.360595703125, -0.3199462890625, -0.279296875, -0.2386474609375, -0.197998046875, -0.1573486328125, -0.11669921875, -0.0760498046875, -0.035400390625, 0.0052490234375, 0.0458984375, 0.0865478515625, 0.127197265625, 0.1678466796875, 0.20849609375, 0.2491455078125, 0.289794921875, 0.3304443359375, 0.37109375, 0.4117431640625, 0.452392578125, 0.4930419921875, 0.53369140625, 0.5743408203125, 0.614990234375, 0.6556396484375, 0.6962890625, 0.7369384765625, 0.777587890625, 0.8182373046875, 0.85888671875, 0.8995361328125, 0.940185546875, 0.9808349609375, 1.021484375, 1.0621337890625, 1.102783203125, 1.1434326171875, 1.18408203125, 1.2247314453125, 1.265380859375, 1.3060302734375, 1.3466796875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 2.0, 4.0, 14.0, 19.0, 18.0, 18.0, 29.0, 33.0, 32.0, 40.0, 39.0, 41.0, 48.0, 42.0, 54.0, 47.0, 47.0, 64.0, 46.0, 52.0, 45.0, 35.0, 24.0, 34.0, 30.0, 16.0, 20.0, 23.0, 13.0, 17.0, 7.0, 6.0, 11.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1643524169921875, -1.126556396484375, -1.0887603759765625, -1.05096435546875, -1.0131683349609375, -0.975372314453125, -0.9375762939453125, -0.8997802734375, -0.8619842529296875, -0.824188232421875, -0.7863922119140625, -0.74859619140625, -0.7108001708984375, -0.673004150390625, -0.6352081298828125, -0.597412109375, -0.5596160888671875, -0.521820068359375, -0.4840240478515625, -0.44622802734375, -0.4084320068359375, -0.370635986328125, -0.3328399658203125, -0.2950439453125, -0.2572479248046875, -0.219451904296875, -0.1816558837890625, -0.14385986328125, -0.1060638427734375, -0.068267822265625, -0.0304718017578125, 0.00732421875, 0.0451202392578125, 0.082916259765625, 0.1207122802734375, 0.15850830078125, 0.1963043212890625, 0.234100341796875, 0.2718963623046875, 0.3096923828125, 0.3474884033203125, 0.385284423828125, 0.4230804443359375, 0.46087646484375, 0.4986724853515625, 0.536468505859375, 0.5742645263671875, 0.612060546875, 0.6498565673828125, 0.687652587890625, 0.7254486083984375, 0.76324462890625, 0.8010406494140625, 0.838836669921875, 0.8766326904296875, 0.9144287109375, 0.9522247314453125, 0.990020751953125, 1.0278167724609375, 1.06561279296875, 1.1034088134765625, 1.141204833984375, 1.1790008544921875, 1.216796875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 15.0, 25.0, 52.0, 106.0, 170.0, 418.0, 1240.0, 13067.0, 4072636.0, 102994.0, 2419.0, 571.0, 250.0, 145.0, 74.0, 40.0, 22.0, 14.0, 11.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.775726318359375, -8.57489013671875, -8.374053955078125, -8.1732177734375, -7.972381591796875, -7.77154541015625, -7.570709228515625, -7.369873046875, -7.169036865234375, -6.96820068359375, -6.767364501953125, -6.5665283203125, -6.365692138671875, -6.16485595703125, -5.964019775390625, -5.76318359375, -5.562347412109375, -5.36151123046875, -5.160675048828125, -4.9598388671875, -4.759002685546875, -4.55816650390625, -4.357330322265625, -4.156494140625, -3.955657958984375, -3.75482177734375, -3.553985595703125, -3.3531494140625, -3.152313232421875, -2.95147705078125, -2.750640869140625, -2.5498046875, -2.348968505859375, -2.14813232421875, -1.947296142578125, -1.7464599609375, -1.545623779296875, -1.34478759765625, -1.143951416015625, -0.943115234375, -0.742279052734375, -0.54144287109375, -0.340606689453125, -0.1397705078125, 0.061065673828125, 0.26190185546875, 0.462738037109375, 0.66357421875, 0.864410400390625, 1.06524658203125, 1.266082763671875, 1.4669189453125, 1.667755126953125, 1.86859130859375, 2.069427490234375, 2.270263671875, 2.471099853515625, 2.67193603515625, 2.872772216796875, 3.0736083984375, 3.274444580078125, 3.47528076171875, 3.676116943359375, 3.876953125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 6.0, 3.0, 5.0, 10.0, 16.0, 17.0, 30.0, 31.0, 47.0, 64.0, 128.0, 161.0, 284.0, 471.0, 628.0, 661.0, 519.0, 377.0, 229.0, 130.0, 86.0, 46.0, 41.0, 26.0, 20.0, 12.0, 11.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55908203125, -0.5411605834960938, -0.5232391357421875, -0.5053176879882812, -0.487396240234375, -0.46947479248046875, -0.4515533447265625, -0.43363189697265625, -0.41571044921875, -0.39778900146484375, -0.3798675537109375, -0.36194610595703125, -0.344024658203125, -0.32610321044921875, -0.3081817626953125, -0.29026031494140625, -0.2723388671875, -0.25441741943359375, -0.2364959716796875, -0.21857452392578125, -0.200653076171875, -0.18273162841796875, -0.1648101806640625, -0.14688873291015625, -0.12896728515625, -0.11104583740234375, -0.0931243896484375, -0.07520294189453125, -0.057281494140625, -0.03936004638671875, -0.0214385986328125, -0.00351715087890625, 0.014404296875, 0.03232574462890625, 0.0502471923828125, 0.06816864013671875, 0.086090087890625, 0.10401153564453125, 0.1219329833984375, 0.13985443115234375, 0.15777587890625, 0.17569732666015625, 0.1936187744140625, 0.21154022216796875, 0.229461669921875, 0.24738311767578125, 0.2653045654296875, 0.28322601318359375, 0.3011474609375, 0.31906890869140625, 0.3369903564453125, 0.35491180419921875, 0.372833251953125, 0.39075469970703125, 0.4086761474609375, 0.42659759521484375, 0.44451904296875, 0.46244049072265625, 0.4803619384765625, 0.49828338623046875, 0.516204833984375, 0.5341262817382812, 0.5520477294921875, 0.5699691772460938, 0.587890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 12.0, 26.0, 36.0, 47.0, 53.0, 79.0, 104.0, 116.0, 135.0, 117.0, 89.0, 55.0, 44.0, 32.0, 17.0, 11.0, 9.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.475778818130493, -2.396470785140991, -2.3171629905700684, -2.2378549575805664, -2.1585469245910645, -2.0792391300201416, -1.9999310970306396, -1.9206231832504272, -1.8413152694702148, -1.7620073556900024, -1.68269944190979, -1.603391408920288, -1.5240834951400757, -1.4447755813598633, -1.3654675483703613, -1.286159634590149, -1.2068517208099365, -1.1275438070297241, -1.0482358932495117, -0.9689278602600098, -0.8896199464797974, -0.810312032699585, -0.7310040593147278, -0.6516960859298706, -0.5723881721496582, -0.4930802285671234, -0.4137722849845886, -0.33446434140205383, -0.25515639781951904, -0.17584845423698425, -0.09654051065444946, -0.017232537269592285, 0.06207537651062012, 0.1413833200931549, 0.2206912636756897, 0.2999992072582245, 0.3793071508407593, 0.45861509442329407, 0.5379230380058289, 0.617231011390686, 0.6965389251708984, 0.7758468389511108, 0.855154812335968, 0.9344627857208252, 1.0137706995010376, 1.09307861328125, 1.172386646270752, 1.2516945600509644, 1.3310024738311768, 1.4103103876113892, 1.4896183013916016, 1.5689263343811035, 1.648234248161316, 1.7275421619415283, 1.8068501949310303, 1.8861581087112427, 1.965466022491455, 2.044774055480957, 2.12408185005188, 2.203389883041382, 2.2826976776123047, 2.3620057106018066, 2.4413137435913086, 2.5206217765808105, 2.5999295711517334]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 6.0, 6.0, 5.0, 8.0, 10.0, 13.0, 17.0, 12.0, 24.0, 26.0, 26.0, 20.0, 24.0, 30.0, 30.0, 33.0, 31.0, 39.0, 32.0, 47.0, 39.0, 42.0, 41.0, 43.0, 37.0, 27.0, 37.0, 31.0, 29.0, 18.0, 36.0, 27.0, 26.0, 14.0, 17.0, 12.0, 10.0, 11.0, 9.0, 7.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.0165743827819824, -0.9838593602180481, -0.9511443376541138, -0.9184293150901794, -0.8857142925262451, -0.8529993295669556, -0.8202843070030212, -0.7875692844390869, -0.7548542618751526, -0.7221392393112183, -0.6894242167472839, -0.6567091941833496, -0.6239942312240601, -0.591279149055481, -0.5585641860961914, -0.5258491635322571, -0.49313414096832275, -0.4604191184043884, -0.4277040958404541, -0.39498910307884216, -0.36227408051490784, -0.3295590579509735, -0.2968440651893616, -0.26412904262542725, -0.23141402006149292, -0.1986989974975586, -0.16598398983478546, -0.13326898217201233, -0.100553959608078, -0.06783893704414368, -0.035123929381370544, -0.002408921718597412, 0.030306100845336914, 0.06302111595869064, 0.09573613107204437, 0.1284511387348175, 0.16116616129875183, 0.19388118386268616, 0.2265961915254593, 0.2593111991882324, 0.29202622175216675, 0.3247412443161011, 0.3574562668800354, 0.39017125964164734, 0.42288628220558167, 0.455601304769516, 0.48831629753112793, 0.5210313200950623, 0.5537463426589966, 0.5864613652229309, 0.6191763877868652, 0.6518914103507996, 0.6846064329147339, 0.7173213958740234, 0.7500364184379578, 0.7827514410018921, 0.8154664635658264, 0.8481814861297607, 0.8808965086936951, 0.9136115312576294, 0.946326494216919, 0.979041576385498, 1.0117565393447876, 1.0444715023040771, 1.0771865844726562]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 15.0, 10.0, 11.0, 29.0, 77.0, 209.0, 724.0, 2950.0, 15396.0, 119165.0, 830441.0, 66373.0, 10299.0, 2046.0, 520.0, 146.0, 54.0, 25.0, 23.0, 8.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.1875, -1.1548614501953125, -1.122222900390625, -1.0895843505859375, -1.05694580078125, -1.0243072509765625, -0.991668701171875, -0.9590301513671875, -0.9263916015625, -0.8937530517578125, -0.861114501953125, -0.8284759521484375, -0.79583740234375, -0.7631988525390625, -0.730560302734375, -0.6979217529296875, -0.665283203125, -0.6326446533203125, -0.600006103515625, -0.5673675537109375, -0.53472900390625, -0.5020904541015625, -0.469451904296875, -0.4368133544921875, -0.4041748046875, -0.3715362548828125, -0.338897705078125, -0.3062591552734375, -0.27362060546875, -0.2409820556640625, -0.208343505859375, -0.1757049560546875, -0.14306640625, -0.1104278564453125, -0.077789306640625, -0.0451507568359375, -0.01251220703125, 0.0201263427734375, 0.052764892578125, 0.0854034423828125, 0.1180419921875, 0.1506805419921875, 0.183319091796875, 0.2159576416015625, 0.24859619140625, 0.2812347412109375, 0.313873291015625, 0.3465118408203125, 0.379150390625, 0.4117889404296875, 0.444427490234375, 0.4770660400390625, 0.50970458984375, 0.5423431396484375, 0.574981689453125, 0.6076202392578125, 0.6402587890625, 0.6728973388671875, 0.705535888671875, 0.7381744384765625, 0.77081298828125, 0.8034515380859375, 0.836090087890625, 0.8687286376953125, 0.9013671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 4.0, 7.0, 16.0, 30.0, 25.0, 45.0, 66.0, 88.0, 95.0, 83.0, 101.0, 102.0, 92.0, 85.0, 50.0, 42.0, 31.0, 12.0, 10.0, 10.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.65234375, -2.5973129272460938, -2.5422821044921875, -2.4872512817382812, -2.432220458984375, -2.3771896362304688, -2.3221588134765625, -2.2671279907226562, -2.21209716796875, -2.1570663452148438, -2.1020355224609375, -2.0470046997070312, -1.991973876953125, -1.9369430541992188, -1.8819122314453125, -1.8268814086914062, -1.7718505859375, -1.7168197631835938, -1.6617889404296875, -1.6067581176757812, -1.551727294921875, -1.4966964721679688, -1.4416656494140625, -1.3866348266601562, -1.33160400390625, -1.2765731811523438, -1.2215423583984375, -1.1665115356445312, -1.111480712890625, -1.0564498901367188, -1.0014190673828125, -0.9463882446289062, -0.891357421875, -0.8363265991210938, -0.7812957763671875, -0.7262649536132812, -0.671234130859375, -0.6162033081054688, -0.5611724853515625, -0.5061416625976562, -0.45111083984375, -0.39608001708984375, -0.3410491943359375, -0.28601837158203125, -0.230987548828125, -0.17595672607421875, -0.1209259033203125, -0.06589508056640625, -0.0108642578125, 0.04416656494140625, 0.0991973876953125, 0.15422821044921875, 0.209259033203125, 0.26428985595703125, 0.3193206787109375, 0.37435150146484375, 0.42938232421875, 0.48441314697265625, 0.5394439697265625, 0.5944747924804688, 0.649505615234375, 0.7045364379882812, 0.7595672607421875, 0.8145980834960938, 0.86962890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 10.0, 12.0, 20.0, 26.0, 46.0, 80.0, 107.0, 227.0, 507.0, 1273.0, 3446.0, 10933.0, 37918.0, 271273.0, 618266.0, 76824.0, 18459.0, 5656.0, 1955.0, 754.0, 322.0, 175.0, 88.0, 54.0, 39.0, 26.0, 15.0, 9.0, 10.0, 7.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64453125, -0.6245269775390625, -0.604522705078125, -0.5845184326171875, -0.56451416015625, -0.5445098876953125, -0.524505615234375, -0.5045013427734375, -0.4844970703125, -0.4644927978515625, -0.444488525390625, -0.4244842529296875, -0.40447998046875, -0.3844757080078125, -0.364471435546875, -0.3444671630859375, -0.324462890625, -0.3044586181640625, -0.284454345703125, -0.2644500732421875, -0.24444580078125, -0.2244415283203125, -0.204437255859375, -0.1844329833984375, -0.1644287109375, -0.1444244384765625, -0.124420166015625, -0.1044158935546875, -0.08441162109375, -0.0644073486328125, -0.044403076171875, -0.0243988037109375, -0.00439453125, 0.0156097412109375, 0.035614013671875, 0.0556182861328125, 0.07562255859375, 0.0956268310546875, 0.115631103515625, 0.1356353759765625, 0.1556396484375, 0.1756439208984375, 0.195648193359375, 0.2156524658203125, 0.23565673828125, 0.2556610107421875, 0.275665283203125, 0.2956695556640625, 0.315673828125, 0.3356781005859375, 0.355682373046875, 0.3756866455078125, 0.39569091796875, 0.4156951904296875, 0.435699462890625, 0.4557037353515625, 0.4757080078125, 0.4957122802734375, 0.515716552734375, 0.5357208251953125, 0.55572509765625, 0.5757293701171875, 0.595733642578125, 0.6157379150390625, 0.6357421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 8.0, 10.0, 16.0, 17.0, 39.0, 42.0, 47.0, 56.0, 56.0, 77.0, 64.0, 69.0, 89.0, 75.0, 63.0, 53.0, 49.0, 32.0, 30.0, 31.0, 17.0, 19.0, 19.0, 7.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.481048583984375, -2.39764404296875, -2.314239501953125, -2.2308349609375, -2.147430419921875, -2.06402587890625, -1.980621337890625, -1.897216796875, -1.813812255859375, -1.73040771484375, -1.647003173828125, -1.5635986328125, -1.480194091796875, -1.39678955078125, -1.313385009765625, -1.22998046875, -1.146575927734375, -1.06317138671875, -0.979766845703125, -0.8963623046875, -0.812957763671875, -0.72955322265625, -0.646148681640625, -0.562744140625, -0.479339599609375, -0.39593505859375, -0.312530517578125, -0.2291259765625, -0.145721435546875, -0.06231689453125, 0.021087646484375, 0.1044921875, 0.187896728515625, 0.27130126953125, 0.354705810546875, 0.4381103515625, 0.521514892578125, 0.60491943359375, 0.688323974609375, 0.771728515625, 0.855133056640625, 0.93853759765625, 1.021942138671875, 1.1053466796875, 1.188751220703125, 1.27215576171875, 1.355560302734375, 1.43896484375, 1.522369384765625, 1.60577392578125, 1.689178466796875, 1.7725830078125, 1.855987548828125, 1.93939208984375, 2.022796630859375, 2.106201171875, 2.189605712890625, 2.27301025390625, 2.356414794921875, 2.4398193359375, 2.523223876953125, 2.60662841796875, 2.690032958984375, 2.7734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 11.0, 12.0, 17.0, 20.0, 33.0, 69.0, 83.0, 109.0, 189.0, 328.0, 560.0, 979.0, 1907.0, 3897.0, 8186.0, 20404.0, 59893.0, 265173.0, 502428.0, 124395.0, 35269.0, 13175.0, 5669.0, 2571.0, 1420.0, 714.0, 398.0, 230.0, 159.0, 71.0, 55.0, 45.0, 22.0, 26.0, 8.0, 6.0, 6.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.17529296875, -0.17032241821289062, -0.16535186767578125, -0.16038131713867188, -0.1554107666015625, -0.15044021606445312, -0.14546966552734375, -0.14049911499023438, -0.135528564453125, -0.13055801391601562, -0.12558746337890625, -0.12061691284179688, -0.1156463623046875, -0.11067581176757812, -0.10570526123046875, -0.10073471069335938, -0.09576416015625, -0.09079360961914062, -0.08582305908203125, -0.08085250854492188, -0.0758819580078125, -0.07091140747070312, -0.06594085693359375, -0.060970306396484375, -0.055999755859375, -0.051029205322265625, -0.04605865478515625, -0.041088104248046875, -0.0361175537109375, -0.031147003173828125, -0.02617645263671875, -0.021205902099609375, -0.0162353515625, -0.011264801025390625, -0.00629425048828125, -0.001323699951171875, 0.0036468505859375, 0.008617401123046875, 0.01358795166015625, 0.018558502197265625, 0.023529052734375, 0.028499603271484375, 0.03347015380859375, 0.038440704345703125, 0.0434112548828125, 0.048381805419921875, 0.05335235595703125, 0.058322906494140625, 0.06329345703125, 0.06826400756835938, 0.07323455810546875, 0.07820510864257812, 0.0831756591796875, 0.08814620971679688, 0.09311676025390625, 0.09808731079101562, 0.103057861328125, 0.10802841186523438, 0.11299896240234375, 0.11796951293945312, 0.1229400634765625, 0.12791061401367188, 0.13288116455078125, 0.13785171508789062, 0.142822265625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 10.0, 9.0, 7.0, 11.0, 19.0, 34.0, 41.0, 60.0, 113.0, 135.0, 136.0, 112.0, 95.0, 65.0, 38.0, 25.0, 15.0, 14.0, 13.0, 10.0, 6.0, 5.0, 2.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.347894668579102e-05, -6.106030195951462e-05, -5.864165723323822e-05, -5.622301250696182e-05, -5.3804367780685425e-05, -5.138572305440903e-05, -4.896707832813263e-05, -4.654843360185623e-05, -4.4129788875579834e-05, -4.1711144149303436e-05, -3.929249942302704e-05, -3.687385469675064e-05, -3.445520997047424e-05, -3.2036565244197845e-05, -2.9617920517921448e-05, -2.719927579164505e-05, -2.4780631065368652e-05, -2.2361986339092255e-05, -1.9943341612815857e-05, -1.752469688653946e-05, -1.5106052160263062e-05, -1.2687407433986664e-05, -1.0268762707710266e-05, -7.850117981433868e-06, -5.431473255157471e-06, -3.012828528881073e-06, -5.941838026046753e-07, 1.8244609236717224e-06, 4.24310564994812e-06, 6.661750376224518e-06, 9.080395102500916e-06, 1.1499039828777313e-05, 1.3917684555053711e-05, 1.633632928133011e-05, 1.8754974007606506e-05, 2.1173618733882904e-05, 2.3592263460159302e-05, 2.60109081864357e-05, 2.8429552912712097e-05, 3.0848197638988495e-05, 3.326684236526489e-05, 3.568548709154129e-05, 3.810413181781769e-05, 4.0522776544094086e-05, 4.2941421270370483e-05, 4.536006599664688e-05, 4.777871072292328e-05, 5.0197355449199677e-05, 5.2616000175476074e-05, 5.503464490175247e-05, 5.745328962802887e-05, 5.987193435430527e-05, 6.229057908058167e-05, 6.470922380685806e-05, 6.712786853313446e-05, 6.954651325941086e-05, 7.196515798568726e-05, 7.438380271196365e-05, 7.680244743824005e-05, 7.922109216451645e-05, 8.163973689079285e-05, 8.405838161706924e-05, 8.647702634334564e-05, 8.889567106962204e-05, 9.131431579589844e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 6.0, 6.0, 6.0, 11.0, 12.0, 8.0, 12.0, 23.0, 37.0, 45.0, 79.0, 127.0, 316.0, 852.0, 3103.0, 13080.0, 73565.0, 711691.0, 211341.0, 26249.0, 5649.0, 1377.0, 487.0, 183.0, 98.0, 45.0, 33.0, 25.0, 12.0, 18.0, 6.0, 8.0, 8.0, 2.0, 6.0, 6.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.2792816162109375, -0.270477294921875, -0.2616729736328125, -0.25286865234375, -0.2440643310546875, -0.235260009765625, -0.2264556884765625, -0.2176513671875, -0.2088470458984375, -0.200042724609375, -0.1912384033203125, -0.18243408203125, -0.1736297607421875, -0.164825439453125, -0.1560211181640625, -0.147216796875, -0.1384124755859375, -0.129608154296875, -0.1208038330078125, -0.11199951171875, -0.1031951904296875, -0.094390869140625, -0.0855865478515625, -0.0767822265625, -0.0679779052734375, -0.059173583984375, -0.0503692626953125, -0.04156494140625, -0.0327606201171875, -0.023956298828125, -0.0151519775390625, -0.00634765625, 0.0024566650390625, 0.011260986328125, 0.0200653076171875, 0.02886962890625, 0.0376739501953125, 0.046478271484375, 0.0552825927734375, 0.0640869140625, 0.0728912353515625, 0.081695556640625, 0.0904998779296875, 0.09930419921875, 0.1081085205078125, 0.116912841796875, 0.1257171630859375, 0.134521484375, 0.1433258056640625, 0.152130126953125, 0.1609344482421875, 0.16973876953125, 0.1785430908203125, 0.187347412109375, 0.1961517333984375, 0.2049560546875, 0.2137603759765625, 0.222564697265625, 0.2313690185546875, 0.24017333984375, 0.2489776611328125, 0.257781982421875, 0.2665863037109375, 0.275390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 5.0, 7.0, 11.0, 6.0, 13.0, 20.0, 21.0, 51.0, 38.0, 66.0, 81.0, 85.0, 104.0, 95.0, 87.0, 78.0, 46.0, 30.0, 29.0, 25.0, 20.0, 17.0, 6.0, 7.0, 3.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040985107421875, -0.03960466384887695, -0.038224220275878906, -0.03684377670288086, -0.03546333312988281, -0.034082889556884766, -0.03270244598388672, -0.03132200241088867, -0.029941558837890625, -0.028561115264892578, -0.02718067169189453, -0.025800228118896484, -0.024419784545898438, -0.02303934097290039, -0.021658897399902344, -0.020278453826904297, -0.01889801025390625, -0.017517566680908203, -0.016137123107910156, -0.01475667953491211, -0.013376235961914062, -0.011995792388916016, -0.010615348815917969, -0.009234905242919922, -0.007854461669921875, -0.006474018096923828, -0.005093574523925781, -0.0037131309509277344, -0.0023326873779296875, -0.0009522438049316406, 0.00042819976806640625, 0.0018086433410644531, 0.0031890869140625, 0.004569530487060547, 0.005949974060058594, 0.007330417633056641, 0.008710861206054688, 0.010091304779052734, 0.011471748352050781, 0.012852191925048828, 0.014232635498046875, 0.015613079071044922, 0.01699352264404297, 0.018373966217041016, 0.019754409790039062, 0.02113485336303711, 0.022515296936035156, 0.023895740509033203, 0.02527618408203125, 0.026656627655029297, 0.028037071228027344, 0.02941751480102539, 0.030797958374023438, 0.032178401947021484, 0.03355884552001953, 0.03493928909301758, 0.036319732666015625, 0.03770017623901367, 0.03908061981201172, 0.040461063385009766, 0.04184150695800781, 0.04322195053100586, 0.044602394104003906, 0.04598283767700195, 0.04736328125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 15.0, 34.0, 36.0, 65.0, 87.0, 148.0, 174.0, 153.0, 99.0, 71.0, 42.0, 25.0, 15.0, 11.0, 4.0, 8.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8319793939590454, -1.7723743915557861, -1.7127693891525269, -1.6531643867492676, -1.5935593843460083, -1.533954381942749, -1.4743494987487793, -1.41474449634552, -1.3551394939422607, -1.2955344915390015, -1.2359294891357422, -1.176324486732483, -1.1167194843292236, -1.057114601135254, -0.9975095391273499, -0.9379045963287354, -0.8782995343208313, -0.818694531917572, -0.7590895295143127, -0.6994845867156982, -0.639879584312439, -0.5802745819091797, -0.5206695795059204, -0.4610646069049835, -0.40145960450172424, -0.34185460209846497, -0.2822496294975281, -0.2226446270942688, -0.16303963959217072, -0.10343465209007263, -0.043829649686813354, 0.015775322914123535, 0.07538032531738281, 0.1349853128194809, 0.19459030032157898, 0.25419530272483826, 0.31380027532577515, 0.3734052777290344, 0.4330102801322937, 0.4926152527332306, 0.5522202253341675, 0.6118252277374268, 0.671430230140686, 0.7310352325439453, 0.7906401753425598, 0.8502451777458191, 0.9098501801490784, 0.9694551229476929, 1.0290601253509521, 1.0886651277542114, 1.1482701301574707, 1.20787513256073, 1.2674801349639893, 1.327085018157959, 1.3866901397705078, 1.4462950229644775, 1.5059001445770264, 1.5655051469802856, 1.625110149383545, 1.6847151517868042, 1.7443201541900635, 1.8039250373840332, 1.863530158996582, 1.9231350421905518, 1.982740044593811]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 7.0, 5.0, 9.0, 15.0, 27.0, 26.0, 37.0, 48.0, 61.0, 56.0, 70.0, 85.0, 82.0, 62.0, 81.0, 69.0, 57.0, 55.0, 40.0, 34.0, 16.0, 17.0, 12.0, 13.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7790000438690186, -1.7380934953689575, -1.697186827659607, -1.656280279159546, -1.6153736114501953, -1.5744670629501343, -1.5335603952407837, -1.4926538467407227, -1.451747179031372, -1.410840630531311, -1.3699339628219604, -1.3290274143218994, -1.2881207466125488, -1.2472141981124878, -1.2063075304031372, -1.1654009819030762, -1.1244944334030151, -1.083587884902954, -1.0426812171936035, -1.0017746686935425, -0.9608680009841919, -0.9199614524841309, -0.879054844379425, -0.8381482362747192, -0.7972416281700134, -0.7563350200653076, -0.7154284119606018, -0.674521803855896, -0.633615255355835, -0.5927085876464844, -0.5518020391464233, -0.5108954310417175, -0.46998870372772217, -0.42908209562301636, -0.38817548751831055, -0.3472689092159271, -0.3063623011112213, -0.2654556930065155, -0.2245490998029709, -0.18364250659942627, -0.14273589849472046, -0.10182929784059525, -0.06092269718647003, -0.020016096532344818, 0.020890504121780396, 0.061797112226486206, 0.10270370543003082, 0.14361029863357544, 0.18451690673828125, 0.22542351484298706, 0.26633012294769287, 0.3072367012500763, 0.3481433093547821, 0.3890499174594879, 0.42995649576187134, 0.47086310386657715, 0.511769711971283, 0.5526763200759888, 0.5935829281806946, 0.6344895362854004, 0.6753960847854614, 0.716302752494812, 0.757209300994873, 0.7981159090995789, 0.8390225172042847]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 1.0, 7.0, 2.0, 7.0, 12.0, 12.0, 21.0, 11.0, 37.0, 53.0, 97.0, 522.0, 9425.0, 963256.0, 73322.0, 1356.0, 179.0, 62.0, 34.0, 35.0, 23.0, 19.0, 11.0, 15.0, 5.0, 9.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.15625, -5.029571533203125, -4.90289306640625, -4.776214599609375, -4.6495361328125, -4.522857666015625, -4.39617919921875, -4.269500732421875, -4.142822265625, -4.016143798828125, -3.88946533203125, -3.762786865234375, -3.6361083984375, -3.509429931640625, -3.38275146484375, -3.256072998046875, -3.12939453125, -3.002716064453125, -2.87603759765625, -2.749359130859375, -2.6226806640625, -2.496002197265625, -2.36932373046875, -2.242645263671875, -2.115966796875, -1.989288330078125, -1.86260986328125, -1.735931396484375, -1.6092529296875, -1.482574462890625, -1.35589599609375, -1.229217529296875, -1.1025390625, -0.975860595703125, -0.84918212890625, -0.722503662109375, -0.5958251953125, -0.469146728515625, -0.34246826171875, -0.215789794921875, -0.089111328125, 0.037567138671875, 0.16424560546875, 0.290924072265625, 0.4176025390625, 0.544281005859375, 0.67095947265625, 0.797637939453125, 0.92431640625, 1.050994873046875, 1.17767333984375, 1.304351806640625, 1.4310302734375, 1.557708740234375, 1.68438720703125, 1.811065673828125, 1.937744140625, 2.064422607421875, 2.19110107421875, 2.317779541015625, 2.4444580078125, 2.571136474609375, 2.69781494140625, 2.824493408203125, 2.951171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 13.0, 14.0, 35.0, 72.0, 109.0, 166.0, 193.0, 161.0, 117.0, 69.0, 35.0, 18.0, 8.0, 6.0], "bins": [-10.8671875, -10.674575805664062, -10.481964111328125, -10.289352416992188, -10.09674072265625, -9.904129028320312, -9.711517333984375, -9.518905639648438, -9.3262939453125, -9.133682250976562, -8.941070556640625, -8.748458862304688, -8.55584716796875, -8.363235473632812, -8.170623779296875, -7.9780120849609375, -7.785400390625, -7.5927886962890625, -7.400177001953125, -7.2075653076171875, -7.01495361328125, -6.8223419189453125, -6.629730224609375, -6.4371185302734375, -6.2445068359375, -6.0518951416015625, -5.859283447265625, -5.6666717529296875, -5.47406005859375, -5.2814483642578125, -5.088836669921875, -4.8962249755859375, -4.70361328125, -4.5110015869140625, -4.318389892578125, -4.1257781982421875, -3.93316650390625, -3.7405548095703125, -3.547943115234375, -3.3553314208984375, -3.1627197265625, -2.9701080322265625, -2.777496337890625, -2.5848846435546875, -2.39227294921875, -2.1996612548828125, -2.007049560546875, -1.8144378662109375, -1.621826171875, -1.4292144775390625, -1.236602783203125, -1.0439910888671875, -0.85137939453125, -0.6587677001953125, -0.466156005859375, -0.2735443115234375, -0.0809326171875, 0.1116790771484375, 0.304290771484375, 0.4969024658203125, 0.68951416015625, 0.8821258544921875, 1.074737548828125, 1.2673492431640625, 1.4599609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 9.0, 13.0, 10.0, 16.0, 19.0, 25.0, 37.0, 41.0, 60.0, 52.0, 94.0, 104.0, 147.0, 209.0, 406.0, 1317.0, 10130.0, 334266.0, 677923.0, 20222.0, 2002.0, 533.0, 249.0, 177.0, 125.0, 75.0, 64.0, 59.0, 37.0, 26.0, 19.0, 20.0, 17.0, 6.0, 12.0, 6.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.033203125, -1.967864990234375, -1.90252685546875, -1.837188720703125, -1.7718505859375, -1.706512451171875, -1.64117431640625, -1.575836181640625, -1.510498046875, -1.445159912109375, -1.37982177734375, -1.314483642578125, -1.2491455078125, -1.183807373046875, -1.11846923828125, -1.053131103515625, -0.98779296875, -0.922454833984375, -0.85711669921875, -0.791778564453125, -0.7264404296875, -0.661102294921875, -0.59576416015625, -0.530426025390625, -0.465087890625, -0.399749755859375, -0.33441162109375, -0.269073486328125, -0.2037353515625, -0.138397216796875, -0.07305908203125, -0.007720947265625, 0.0576171875, 0.122955322265625, 0.18829345703125, 0.253631591796875, 0.3189697265625, 0.384307861328125, 0.44964599609375, 0.514984130859375, 0.580322265625, 0.645660400390625, 0.71099853515625, 0.776336669921875, 0.8416748046875, 0.907012939453125, 0.97235107421875, 1.037689208984375, 1.10302734375, 1.168365478515625, 1.23370361328125, 1.299041748046875, 1.3643798828125, 1.429718017578125, 1.49505615234375, 1.560394287109375, 1.625732421875, 1.691070556640625, 1.75640869140625, 1.821746826171875, 1.8870849609375, 1.952423095703125, 2.01776123046875, 2.083099365234375, 2.1484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 6.0, 1.0, 2.0, 8.0, 9.0, 7.0, 19.0, 12.0, 18.0, 18.0, 19.0, 21.0, 22.0, 21.0, 35.0, 34.0, 28.0, 42.0, 29.0, 47.0, 44.0, 43.0, 49.0, 42.0, 45.0, 31.0, 38.0, 37.0, 40.0, 28.0, 26.0, 29.0, 26.0, 18.0, 14.0, 17.0, 18.0, 10.0, 8.0, 7.0, 6.0, 6.0, 5.0, 2.0, 4.0, 4.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.8203125, -1.765899658203125, -1.71148681640625, -1.657073974609375, -1.6026611328125, -1.548248291015625, -1.49383544921875, -1.439422607421875, -1.385009765625, -1.330596923828125, -1.27618408203125, -1.221771240234375, -1.1673583984375, -1.112945556640625, -1.05853271484375, -1.004119873046875, -0.94970703125, -0.895294189453125, -0.84088134765625, -0.786468505859375, -0.7320556640625, -0.677642822265625, -0.62322998046875, -0.568817138671875, -0.514404296875, -0.459991455078125, -0.40557861328125, -0.351165771484375, -0.2967529296875, -0.242340087890625, -0.18792724609375, -0.133514404296875, -0.0791015625, -0.024688720703125, 0.02972412109375, 0.084136962890625, 0.1385498046875, 0.192962646484375, 0.24737548828125, 0.301788330078125, 0.356201171875, 0.410614013671875, 0.46502685546875, 0.519439697265625, 0.5738525390625, 0.628265380859375, 0.68267822265625, 0.737091064453125, 0.79150390625, 0.845916748046875, 0.90032958984375, 0.954742431640625, 1.0091552734375, 1.063568115234375, 1.11798095703125, 1.172393798828125, 1.226806640625, 1.281219482421875, 1.33563232421875, 1.390045166015625, 1.4444580078125, 1.498870849609375, 1.55328369140625, 1.607696533203125, 1.662109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 6.0, 2.0, 8.0, 7.0, 19.0, 21.0, 38.0, 68.0, 147.0, 481.0, 2379.0, 41845.0, 958264.0, 42085.0, 2381.0, 466.0, 160.0, 71.0, 46.0, 22.0, 13.0, 9.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1640625, -1.1338272094726562, -1.1035919189453125, -1.0733566284179688, -1.043121337890625, -1.0128860473632812, -0.9826507568359375, -0.9524154663085938, -0.92218017578125, -0.8919448852539062, -0.8617095947265625, -0.8314743041992188, -0.801239013671875, -0.7710037231445312, -0.7407684326171875, -0.7105331420898438, -0.6802978515625, -0.6500625610351562, -0.6198272705078125, -0.5895919799804688, -0.559356689453125, -0.5291213989257812, -0.4988861083984375, -0.46865081787109375, -0.43841552734375, -0.40818023681640625, -0.3779449462890625, -0.34770965576171875, -0.317474365234375, -0.28723907470703125, -0.2570037841796875, -0.22676849365234375, -0.196533203125, -0.16629791259765625, -0.1360626220703125, -0.10582733154296875, -0.075592041015625, -0.04535675048828125, -0.0151214599609375, 0.01511383056640625, 0.04534912109375, 0.07558441162109375, 0.1058197021484375, 0.13605499267578125, 0.166290283203125, 0.19652557373046875, 0.2267608642578125, 0.25699615478515625, 0.2872314453125, 0.31746673583984375, 0.3477020263671875, 0.37793731689453125, 0.408172607421875, 0.43840789794921875, 0.4686431884765625, 0.49887847900390625, 0.52911376953125, 0.5593490600585938, 0.5895843505859375, 0.6198196411132812, 0.650054931640625, 0.6802902221679688, 0.7105255126953125, 0.7407608032226562, 0.77099609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 9.0, 11.0, 12.0, 25.0, 47.0, 91.0, 124.0, 166.0, 150.0, 113.0, 92.0, 64.0, 33.0, 20.0, 12.0, 11.0, 7.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.56978988647461e-05, -7.308833301067352e-05, -7.047876715660095e-05, -6.786920130252838e-05, -6.525963544845581e-05, -6.265006959438324e-05, -6.004050374031067e-05, -5.74309378862381e-05, -5.482137203216553e-05, -5.2211806178092957e-05, -4.9602240324020386e-05, -4.6992674469947815e-05, -4.4383108615875244e-05, -4.177354276180267e-05, -3.91639769077301e-05, -3.655441105365753e-05, -3.394484519958496e-05, -3.133527934551239e-05, -2.872571349143982e-05, -2.611614763736725e-05, -2.3506581783294678e-05, -2.0897015929222107e-05, -1.8287450075149536e-05, -1.5677884221076965e-05, -1.3068318367004395e-05, -1.0458752512931824e-05, -7.849186658859253e-06, -5.239620804786682e-06, -2.6300549507141113e-06, -2.0489096641540527e-08, 2.5890767574310303e-06, 5.198642611503601e-06, 7.808208465576172e-06, 1.0417774319648743e-05, 1.3027340173721313e-05, 1.5636906027793884e-05, 1.8246471881866455e-05, 2.0856037735939026e-05, 2.3465603590011597e-05, 2.6075169444084167e-05, 2.8684735298156738e-05, 3.129430115222931e-05, 3.390386700630188e-05, 3.651343286037445e-05, 3.912299871444702e-05, 4.173256456851959e-05, 4.434213042259216e-05, 4.6951696276664734e-05, 4.9561262130737305e-05, 5.2170827984809875e-05, 5.4780393838882446e-05, 5.738995969295502e-05, 5.999952554702759e-05, 6.260909140110016e-05, 6.521865725517273e-05, 6.78282231092453e-05, 7.043778896331787e-05, 7.304735481739044e-05, 7.565692067146301e-05, 7.826648652553558e-05, 8.087605237960815e-05, 8.348561823368073e-05, 8.60951840877533e-05, 8.870474994182587e-05, 9.131431579589844e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 9.0, 17.0, 19.0, 20.0, 52.0, 88.0, 183.0, 479.0, 1822.0, 19189.0, 930105.0, 91323.0, 3876.0, 808.0, 283.0, 106.0, 74.0, 28.0, 19.0, 13.0, 9.0, 8.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1684646606445312, -1.1347808837890625, -1.1010971069335938, -1.067413330078125, -1.0337295532226562, -1.0000457763671875, -0.9663619995117188, -0.93267822265625, -0.8989944458007812, -0.8653106689453125, -0.8316268920898438, -0.797943115234375, -0.7642593383789062, -0.7305755615234375, -0.6968917846679688, -0.6632080078125, -0.6295242309570312, -0.5958404541015625, -0.5621566772460938, -0.528472900390625, -0.49478912353515625, -0.4611053466796875, -0.42742156982421875, -0.39373779296875, -0.36005401611328125, -0.3263702392578125, -0.29268646240234375, -0.259002685546875, -0.22531890869140625, -0.1916351318359375, -0.15795135498046875, -0.124267578125, -0.09058380126953125, -0.0569000244140625, -0.02321624755859375, 0.010467529296875, 0.04415130615234375, 0.0778350830078125, 0.11151885986328125, 0.14520263671875, 0.17888641357421875, 0.2125701904296875, 0.24625396728515625, 0.279937744140625, 0.31362152099609375, 0.3473052978515625, 0.38098907470703125, 0.4146728515625, 0.44835662841796875, 0.4820404052734375, 0.5157241821289062, 0.549407958984375, 0.5830917358398438, 0.6167755126953125, 0.6504592895507812, 0.68414306640625, 0.7178268432617188, 0.7515106201171875, 0.7851943969726562, 0.818878173828125, 0.8525619506835938, 0.8862457275390625, 0.9199295043945312, 0.95361328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 11.0, 16.0, 15.0, 24.0, 38.0, 60.0, 64.0, 112.0, 125.0, 129.0, 104.0, 82.0, 67.0, 49.0, 26.0, 16.0, 15.0, 16.0, 7.0, 2.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1781005859375, -0.17127418518066406, -0.16444778442382812, -0.1576213836669922, -0.15079498291015625, -0.1439685821533203, -0.13714218139648438, -0.13031578063964844, -0.1234893798828125, -0.11666297912597656, -0.10983657836914062, -0.10301017761230469, -0.09618377685546875, -0.08935737609863281, -0.08253097534179688, -0.07570457458496094, -0.068878173828125, -0.06205177307128906, -0.055225372314453125, -0.04839897155761719, -0.04157257080078125, -0.03474617004394531, -0.027919769287109375, -0.021093368530273438, -0.0142669677734375, -0.0074405670166015625, -0.000614166259765625, 0.0062122344970703125, 0.01303863525390625, 0.019865036010742188, 0.026691436767578125, 0.03351783752441406, 0.04034423828125, 0.04717063903808594, 0.053997039794921875, 0.06082344055175781, 0.06764984130859375, 0.07447624206542969, 0.08130264282226562, 0.08812904357910156, 0.0949554443359375, 0.10178184509277344, 0.10860824584960938, 0.11543464660644531, 0.12226104736328125, 0.1290874481201172, 0.13591384887695312, 0.14274024963378906, 0.149566650390625, 0.15639305114746094, 0.16321945190429688, 0.1700458526611328, 0.17687225341796875, 0.1836986541748047, 0.19052505493164062, 0.19735145568847656, 0.2041778564453125, 0.21100425720214844, 0.21783065795898438, 0.2246570587158203, 0.23148345947265625, 0.2383098602294922, 0.24513626098632812, 0.25196266174316406, 0.2587890625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 14.0, 27.0, 60.0, 106.0, 183.0, 190.0, 189.0, 111.0, 46.0, 34.0, 13.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.292221784591675, -3.1399030685424805, -2.987584352493286, -2.835265636444092, -2.6829471588134766, -2.5306284427642822, -2.378309726715088, -2.2259912490844727, -2.073672294616699, -1.9213535785675049, -1.7690349817276, -1.6167162656784058, -1.464397668838501, -1.3120789527893066, -1.1597602367401123, -1.0074416399002075, -0.8551230430603027, -0.7028043866157532, -0.5504857301712036, -0.3981670141220093, -0.24584835767745972, -0.09352970123291016, 0.05878901481628418, 0.21110761165618896, 0.3634263277053833, 0.5157449841499329, 0.6680636405944824, 0.8203823566436768, 0.9727010130882263, 1.1250196695327759, 1.2773383855819702, 1.429656982421875, 1.5819754600524902, 1.7342941761016846, 1.8866127729415894, 2.038931369781494, 2.1912500858306885, 2.343568801879883, 2.495887517929077, 2.6482062339782715, 2.8005247116088867, 2.952843427658081, 3.1051621437072754, 3.2574806213378906, 3.409799337387085, 3.5621180534362793, 3.7144367694854736, 3.866755485534668, 4.019074440002441, 4.171392917633057, 4.32371187210083, 4.476030349731445, 4.628349304199219, 4.780667781829834, 4.932986259460449, 5.085305213928223, 5.237623691558838, 5.389942169189453, 5.542261123657227, 5.694579601287842, 5.846898555755615, 5.9992170333862305, 6.151535987854004, 6.303854465484619, 6.456172943115234]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 16.0, 13.0, 29.0, 31.0, 28.0, 40.0, 47.0, 60.0, 58.0, 98.0, 83.0, 65.0, 71.0, 69.0, 59.0, 59.0, 37.0, 39.0, 37.0, 25.0, 23.0, 9.0, 8.0, 7.0], "bins": [-8.575007438659668, -8.407403945922852, -8.239800453186035, -8.072196960449219, -7.904592990875244, -7.736989498138428, -7.569386005401611, -7.401782512664795, -7.2341790199279785, -7.066575527191162, -6.898972034454346, -6.731368064880371, -6.563764572143555, -6.396161079406738, -6.228557586669922, -6.0609540939331055, -5.893350601196289, -5.725747108459473, -5.558143615722656, -5.39054012298584, -5.222936153411865, -5.055332660675049, -4.887729167938232, -4.720125675201416, -4.552521705627441, -4.384918212890625, -4.217314720153809, -4.049711227416992, -3.8821074962615967, -3.714503765106201, -3.5469002723693848, -3.3792967796325684, -3.211693048477173, -3.0440895557403564, -2.876485824584961, -2.7088823318481445, -2.541278839111328, -2.3736753463745117, -2.206071615219116, -2.0384681224823, -1.8708645105361938, -1.703260898590088, -1.5356574058532715, -1.3680537939071655, -1.2004501819610596, -1.0328466892242432, -0.8652430772781372, -0.6976395845413208, -0.5300359725952148, -0.36243242025375366, -0.1948288381099701, -0.027225255966186523, 0.14037829637527466, 0.30798184871673584, 0.4755854606628418, 0.6431889533996582, 0.8107925653457642, 0.9783961176872253, 1.1459996700286865, 1.3136032819747925, 1.4812068939208984, 1.6488103866577148, 1.8164139986038208, 1.9840174913406372, 2.151621103286743]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 10.0, 12.0, 17.0, 24.0, 34.0, 65.0, 84.0, 132.0, 242.0, 437.0, 878.0, 1783.0, 4099.0, 11850.0, 45513.0, 269701.0, 1576463.0, 1862057.0, 343067.0, 55804.0, 13166.0, 4503.0, 2023.0, 1026.0, 521.0, 310.0, 173.0, 103.0, 62.0, 39.0, 20.0, 20.0, 8.0, 8.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6923828125, -1.646728515625, -1.60107421875, -1.555419921875, -1.509765625, -1.464111328125, -1.41845703125, -1.372802734375, -1.3271484375, -1.281494140625, -1.23583984375, -1.190185546875, -1.14453125, -1.098876953125, -1.05322265625, -1.007568359375, -0.9619140625, -0.916259765625, -0.87060546875, -0.824951171875, -0.779296875, -0.733642578125, -0.68798828125, -0.642333984375, -0.5966796875, -0.551025390625, -0.50537109375, -0.459716796875, -0.4140625, -0.368408203125, -0.32275390625, -0.277099609375, -0.2314453125, -0.185791015625, -0.14013671875, -0.094482421875, -0.048828125, -0.003173828125, 0.04248046875, 0.088134765625, 0.1337890625, 0.179443359375, 0.22509765625, 0.270751953125, 0.31640625, 0.362060546875, 0.40771484375, 0.453369140625, 0.4990234375, 0.544677734375, 0.59033203125, 0.635986328125, 0.681640625, 0.727294921875, 0.77294921875, 0.818603515625, 0.8642578125, 0.909912109375, 0.95556640625, 1.001220703125, 1.046875, 1.092529296875, 1.13818359375, 1.183837890625, 1.2294921875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 16.0, 11.0, 18.0, 26.0, 21.0, 22.0, 35.0, 31.0, 42.0, 35.0, 41.0, 55.0, 52.0, 59.0, 68.0, 46.0, 56.0, 43.0, 48.0, 31.0, 34.0, 39.0, 41.0, 17.0, 19.0, 7.0, 11.0, 13.0, 7.0, 5.0, 10.0, 3.0, 7.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1220703125, -1.0846405029296875, -1.047210693359375, -1.0097808837890625, -0.97235107421875, -0.9349212646484375, -0.897491455078125, -0.8600616455078125, -0.8226318359375, -0.7852020263671875, -0.747772216796875, -0.7103424072265625, -0.67291259765625, -0.6354827880859375, -0.598052978515625, -0.5606231689453125, -0.523193359375, -0.4857635498046875, -0.448333740234375, -0.4109039306640625, -0.37347412109375, -0.3360443115234375, -0.298614501953125, -0.2611846923828125, -0.2237548828125, -0.1863250732421875, -0.148895263671875, -0.1114654541015625, -0.07403564453125, -0.0366058349609375, 0.000823974609375, 0.0382537841796875, 0.07568359375, 0.1131134033203125, 0.150543212890625, 0.1879730224609375, 0.22540283203125, 0.2628326416015625, 0.300262451171875, 0.3376922607421875, 0.3751220703125, 0.4125518798828125, 0.449981689453125, 0.4874114990234375, 0.52484130859375, 0.5622711181640625, 0.599700927734375, 0.6371307373046875, 0.674560546875, 0.7119903564453125, 0.749420166015625, 0.7868499755859375, 0.82427978515625, 0.8617095947265625, 0.899139404296875, 0.9365692138671875, 0.9739990234375, 1.0114288330078125, 1.048858642578125, 1.0862884521484375, 1.12371826171875, 1.1611480712890625, 1.198577880859375, 1.2360076904296875, 1.2734375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 7.0, 15.0, 9.0, 15.0, 26.0, 41.0, 52.0, 69.0, 119.0, 166.0, 306.0, 631.0, 1410.0, 4793.0, 29436.0, 744288.0, 3313587.0, 85640.0, 9419.0, 2329.0, 840.0, 376.0, 212.0, 138.0, 78.0, 64.0, 50.0, 38.0, 36.0, 18.0, 11.0, 9.0, 9.0, 9.0, 8.0, 1.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.1953125, -2.120147705078125, -2.04498291015625, -1.969818115234375, -1.8946533203125, -1.819488525390625, -1.74432373046875, -1.669158935546875, -1.593994140625, -1.518829345703125, -1.44366455078125, -1.368499755859375, -1.2933349609375, -1.218170166015625, -1.14300537109375, -1.067840576171875, -0.99267578125, -0.917510986328125, -0.84234619140625, -0.767181396484375, -0.6920166015625, -0.616851806640625, -0.54168701171875, -0.466522216796875, -0.391357421875, -0.316192626953125, -0.24102783203125, -0.165863037109375, -0.0906982421875, -0.015533447265625, 0.05963134765625, 0.134796142578125, 0.2099609375, 0.285125732421875, 0.36029052734375, 0.435455322265625, 0.5106201171875, 0.585784912109375, 0.66094970703125, 0.736114501953125, 0.811279296875, 0.886444091796875, 0.96160888671875, 1.036773681640625, 1.1119384765625, 1.187103271484375, 1.26226806640625, 1.337432861328125, 1.41259765625, 1.487762451171875, 1.56292724609375, 1.638092041015625, 1.7132568359375, 1.788421630859375, 1.86358642578125, 1.938751220703125, 2.013916015625, 2.089080810546875, 2.16424560546875, 2.239410400390625, 2.3145751953125, 2.389739990234375, 2.46490478515625, 2.540069580078125, 2.615234375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 12.0, 9.0, 12.0, 10.0, 21.0, 28.0, 29.0, 43.0, 42.0, 63.0, 94.0, 148.0, 204.0, 332.0, 426.0, 495.0, 517.0, 438.0, 329.0, 273.0, 153.0, 99.0, 68.0, 55.0, 42.0, 23.0, 25.0, 16.0, 9.0, 16.0, 8.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45166015625, -0.4384193420410156, -0.42517852783203125, -0.4119377136230469, -0.3986968994140625, -0.3854560852050781, -0.37221527099609375, -0.3589744567871094, -0.345733642578125, -0.3324928283691406, -0.31925201416015625, -0.3060111999511719, -0.2927703857421875, -0.2795295715332031, -0.26628875732421875, -0.2530479431152344, -0.23980712890625, -0.22656631469726562, -0.21332550048828125, -0.20008468627929688, -0.1868438720703125, -0.17360305786132812, -0.16036224365234375, -0.14712142944335938, -0.133880615234375, -0.12063980102539062, -0.10739898681640625, -0.09415817260742188, -0.0809173583984375, -0.06767654418945312, -0.05443572998046875, -0.041194915771484375, -0.0279541015625, -0.014713287353515625, -0.00147247314453125, 0.011768341064453125, 0.0250091552734375, 0.038249969482421875, 0.05149078369140625, 0.06473159790039062, 0.077972412109375, 0.09121322631835938, 0.10445404052734375, 0.11769485473632812, 0.1309356689453125, 0.14417648315429688, 0.15741729736328125, 0.17065811157226562, 0.18389892578125, 0.19713973999023438, 0.21038055419921875, 0.22362136840820312, 0.2368621826171875, 0.2501029968261719, 0.26334381103515625, 0.2765846252441406, 0.289825439453125, 0.3030662536621094, 0.31630706787109375, 0.3295478820800781, 0.3427886962890625, 0.3560295104980469, 0.36927032470703125, 0.3825111389160156, 0.395751953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 6.0, 20.0, 23.0, 35.0, 43.0, 73.0, 94.0, 101.0, 125.0, 135.0, 98.0, 78.0, 56.0, 39.0, 25.0, 16.0, 12.0, 3.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.3336222171783447, -2.2580389976501465, -2.1824557781219482, -2.10687255859375, -2.031289577484131, -1.955706238746643, -1.8801231384277344, -1.8045399188995361, -1.728956699371338, -1.6533734798431396, -1.5777902603149414, -1.5022071599960327, -1.4266239404678345, -1.3510407209396362, -1.2754576206207275, -1.1998744010925293, -1.124291181564331, -1.0487079620361328, -0.9731248021125793, -0.8975416421890259, -0.8219584226608276, -0.7463752031326294, -0.6707920432090759, -0.5952088832855225, -0.5196256637573242, -0.44404247403144836, -0.3684592843055725, -0.29287609457969666, -0.2172929048538208, -0.14170971512794495, -0.06612652540206909, 0.009456634521484375, 0.08504009246826172, 0.16062328219413757, 0.23620647192001343, 0.3117896616458893, 0.38737285137176514, 0.462956041097641, 0.5385392308235168, 0.6141223907470703, 0.6897056102752686, 0.7652888298034668, 0.8408719897270203, 0.9164551496505737, 0.992038369178772, 1.0676215887069702, 1.143204689025879, 1.2187879085540771, 1.2943711280822754, 1.3699543476104736, 1.4455375671386719, 1.5211206674575806, 1.5967038869857788, 1.672287106513977, 1.7478702068328857, 1.823453426361084, 1.8990366458892822, 1.9746198654174805, 2.0502030849456787, 2.125786304473877, 2.201369285583496, 2.2769525051116943, 2.3525357246398926, 2.428118944168091, 2.503702163696289]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 6.0, 8.0, 4.0, 13.0, 19.0, 15.0, 20.0, 21.0, 26.0, 35.0, 25.0, 36.0, 37.0, 38.0, 42.0, 39.0, 41.0, 57.0, 43.0, 49.0, 44.0, 51.0, 46.0, 41.0, 36.0, 27.0, 27.0, 28.0, 25.0, 17.0, 13.0, 13.0, 4.0, 7.0, 11.0, 5.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.130346655845642, -1.093722939491272, -1.0570991039276123, -1.0204753875732422, -0.9838516712188721, -0.9472278952598572, -0.9106041193008423, -0.8739804029464722, -0.8373566269874573, -0.8007328510284424, -0.7641091346740723, -0.7274853587150574, -0.6908615827560425, -0.6542378664016724, -0.6176140904426575, -0.5809903144836426, -0.5443665981292725, -0.5077428221702576, -0.47111910581588745, -0.43449532985687256, -0.39787158370018005, -0.36124783754348755, -0.32462406158447266, -0.28800031542778015, -0.25137656927108765, -0.21475282311439514, -0.17812906205654144, -0.14150530099868774, -0.10488155484199524, -0.06825780868530273, -0.031634047627449036, 0.004989713430404663, 0.04161334037780762, 0.07823709398508072, 0.11486084759235382, 0.15148460865020752, 0.18810835480690002, 0.22473210096359253, 0.2613558769226074, 0.2979796230792999, 0.33460336923599243, 0.37122711539268494, 0.40785086154937744, 0.44447463750839233, 0.48109838366508484, 0.5177221298217773, 0.5543459057807922, 0.5909696817398071, 0.6275933980941772, 0.6642171740531921, 0.7008408904075623, 0.7374646663665771, 0.7740883827209473, 0.8107121586799622, 0.847335934638977, 0.8839596509933472, 0.9205834269523621, 0.957207202911377, 0.9938309192657471, 1.0304546356201172, 1.0670784711837769, 1.103702187538147, 1.140325903892517, 1.1769497394561768, 1.2135734558105469]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 7.0, 6.0, 9.0, 14.0, 11.0, 20.0, 29.0, 51.0, 84.0, 97.0, 155.0, 237.0, 417.0, 640.0, 1137.0, 1949.0, 3824.0, 7274.0, 14821.0, 31996.0, 72921.0, 164020.0, 285878.0, 243800.0, 119427.0, 52732.0, 23576.0, 10899.0, 5572.0, 2964.0, 1659.0, 867.0, 485.0, 323.0, 199.0, 142.0, 101.0, 55.0, 38.0, 31.0, 26.0, 15.0, 17.0, 11.0, 2.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2025146484375, -0.19634056091308594, -0.19016647338867188, -0.1839923858642578, -0.17781829833984375, -0.1716442108154297, -0.16547012329101562, -0.15929603576660156, -0.1531219482421875, -0.14694786071777344, -0.14077377319335938, -0.1345996856689453, -0.12842559814453125, -0.12225151062011719, -0.11607742309570312, -0.10990333557128906, -0.103729248046875, -0.09755516052246094, -0.09138107299804688, -0.08520698547363281, -0.07903289794921875, -0.07285881042480469, -0.06668472290039062, -0.06051063537597656, -0.0543365478515625, -0.04816246032714844, -0.041988372802734375, -0.03581428527832031, -0.02964019775390625, -0.023466110229492188, -0.017292022705078125, -0.011117935180664062, -0.00494384765625, 0.0012302398681640625, 0.007404327392578125, 0.013578414916992188, 0.01975250244140625, 0.025926589965820312, 0.032100677490234375, 0.03827476501464844, 0.0444488525390625, 0.05062294006347656, 0.056797027587890625, 0.06297111511230469, 0.06914520263671875, 0.07531929016113281, 0.08149337768554688, 0.08766746520996094, 0.093841552734375, 0.10001564025878906, 0.10618972778320312, 0.11236381530761719, 0.11853790283203125, 0.12471199035644531, 0.13088607788085938, 0.13706016540527344, 0.1432342529296875, 0.14940834045410156, 0.15558242797851562, 0.1617565155029297, 0.16793060302734375, 0.1741046905517578, 0.18027877807617188, 0.18645286560058594, 0.192626953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 6.0, 5.0, 7.0, 13.0, 11.0, 17.0, 26.0, 21.0, 27.0, 33.0, 35.0, 39.0, 41.0, 48.0, 48.0, 60.0, 56.0, 46.0, 53.0, 59.0, 56.0, 42.0, 33.0, 38.0, 33.0, 25.0, 22.0, 27.0, 15.0, 7.0, 6.0, 11.0, 4.0, 11.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6787109375, -0.6525802612304688, -0.6264495849609375, -0.6003189086914062, -0.574188232421875, -0.5480575561523438, -0.5219268798828125, -0.49579620361328125, -0.46966552734375, -0.44353485107421875, -0.4174041748046875, -0.39127349853515625, -0.365142822265625, -0.33901214599609375, -0.3128814697265625, -0.28675079345703125, -0.2606201171875, -0.23448944091796875, -0.2083587646484375, -0.18222808837890625, -0.156097412109375, -0.12996673583984375, -0.1038360595703125, -0.07770538330078125, -0.05157470703125, -0.02544403076171875, 0.0006866455078125, 0.02681732177734375, 0.052947998046875, 0.07907867431640625, 0.1052093505859375, 0.13134002685546875, 0.157470703125, 0.18360137939453125, 0.2097320556640625, 0.23586273193359375, 0.261993408203125, 0.28812408447265625, 0.3142547607421875, 0.34038543701171875, 0.36651611328125, 0.39264678955078125, 0.4187774658203125, 0.44490814208984375, 0.471038818359375, 0.49716949462890625, 0.5233001708984375, 0.5494308471679688, 0.5755615234375, 0.6016921997070312, 0.6278228759765625, 0.6539535522460938, 0.680084228515625, 0.7062149047851562, 0.7323455810546875, 0.7584762573242188, 0.78460693359375, 0.8107376098632812, 0.8368682861328125, 0.8629989624023438, 0.889129638671875, 0.9152603149414062, 0.9413909912109375, 0.9675216674804688, 0.99365234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 4.0, 10.0, 11.0, 11.0, 23.0, 32.0, 53.0, 105.0, 184.0, 292.0, 476.0, 865.0, 1946.0, 4544.0, 12581.0, 38918.0, 126202.0, 331036.0, 338264.0, 130951.0, 40239.0, 13015.0, 4716.0, 1940.0, 933.0, 486.0, 259.0, 170.0, 99.0, 80.0, 36.0, 22.0, 24.0, 8.0, 3.0, 9.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.244873046875, -0.23613357543945312, -0.22739410400390625, -0.21865463256835938, -0.2099151611328125, -0.20117568969726562, -0.19243621826171875, -0.18369674682617188, -0.174957275390625, -0.16621780395507812, -0.15747833251953125, -0.14873886108398438, -0.1399993896484375, -0.13125991821289062, -0.12252044677734375, -0.11378097534179688, -0.10504150390625, -0.09630203247070312, -0.08756256103515625, -0.07882308959960938, -0.0700836181640625, -0.061344146728515625, -0.05260467529296875, -0.043865203857421875, -0.035125732421875, -0.026386260986328125, -0.01764678955078125, -0.008907318115234375, -0.0001678466796875, 0.008571624755859375, 0.01731109619140625, 0.026050567626953125, 0.0347900390625, 0.043529510498046875, 0.05226898193359375, 0.061008453369140625, 0.0697479248046875, 0.07848739624023438, 0.08722686767578125, 0.09596633911132812, 0.104705810546875, 0.11344528198242188, 0.12218475341796875, 0.13092422485351562, 0.1396636962890625, 0.14840316772460938, 0.15714263916015625, 0.16588211059570312, 0.17462158203125, 0.18336105346679688, 0.19210052490234375, 0.20083999633789062, 0.2095794677734375, 0.21831893920898438, 0.22705841064453125, 0.23579788208007812, 0.244537353515625, 0.2532768249511719, 0.26201629638671875, 0.2707557678222656, 0.2794952392578125, 0.2882347106933594, 0.29697418212890625, 0.3057136535644531, 0.314453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 4.0, 5.0, 14.0, 14.0, 17.0, 18.0, 21.0, 24.0, 24.0, 36.0, 43.0, 48.0, 53.0, 51.0, 55.0, 65.0, 66.0, 49.0, 52.0, 50.0, 55.0, 33.0, 35.0, 22.0, 21.0, 25.0, 21.0, 11.0, 18.0, 10.0, 13.0, 8.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.080078125, -2.0226593017578125, -1.965240478515625, -1.9078216552734375, -1.85040283203125, -1.7929840087890625, -1.735565185546875, -1.6781463623046875, -1.6207275390625, -1.5633087158203125, -1.505889892578125, -1.4484710693359375, -1.39105224609375, -1.3336334228515625, -1.276214599609375, -1.2187957763671875, -1.161376953125, -1.1039581298828125, -1.046539306640625, -0.9891204833984375, -0.93170166015625, -0.8742828369140625, -0.816864013671875, -0.7594451904296875, -0.7020263671875, -0.6446075439453125, -0.587188720703125, -0.5297698974609375, -0.47235107421875, -0.4149322509765625, -0.357513427734375, -0.3000946044921875, -0.24267578125, -0.1852569580078125, -0.127838134765625, -0.0704193115234375, -0.01300048828125, 0.0444183349609375, 0.101837158203125, 0.1592559814453125, 0.2166748046875, 0.2740936279296875, 0.331512451171875, 0.3889312744140625, 0.44635009765625, 0.5037689208984375, 0.561187744140625, 0.6186065673828125, 0.676025390625, 0.7334442138671875, 0.790863037109375, 0.8482818603515625, 0.90570068359375, 0.9631195068359375, 1.020538330078125, 1.0779571533203125, 1.1353759765625, 1.1927947998046875, 1.250213623046875, 1.3076324462890625, 1.36505126953125, 1.4224700927734375, 1.479888916015625, 1.5373077392578125, 1.5947265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 6.0, 10.0, 13.0, 18.0, 36.0, 47.0, 69.0, 103.0, 162.0, 285.0, 501.0, 940.0, 2034.0, 4681.0, 13961.0, 61460.0, 334073.0, 485199.0, 110870.0, 22008.0, 6683.0, 2636.0, 1198.0, 616.0, 326.0, 226.0, 122.0, 75.0, 50.0, 39.0, 38.0, 23.0, 14.0, 8.0, 2.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14208984375, -0.13753128051757812, -0.13297271728515625, -0.12841415405273438, -0.1238555908203125, -0.11929702758789062, -0.11473846435546875, -0.11017990112304688, -0.105621337890625, -0.10106277465820312, -0.09650421142578125, -0.09194564819335938, -0.0873870849609375, -0.08282852172851562, -0.07826995849609375, -0.07371139526367188, -0.06915283203125, -0.06459426879882812, -0.06003570556640625, -0.055477142333984375, -0.0509185791015625, -0.046360015869140625, -0.04180145263671875, -0.037242889404296875, -0.032684326171875, -0.028125762939453125, -0.02356719970703125, -0.019008636474609375, -0.0144500732421875, -0.009891510009765625, -0.00533294677734375, -0.000774383544921875, 0.0037841796875, 0.008342742919921875, 0.01290130615234375, 0.017459869384765625, 0.0220184326171875, 0.026576995849609375, 0.03113555908203125, 0.035694122314453125, 0.040252685546875, 0.044811248779296875, 0.04936981201171875, 0.053928375244140625, 0.0584869384765625, 0.06304550170898438, 0.06760406494140625, 0.07216262817382812, 0.07672119140625, 0.08127975463867188, 0.08583831787109375, 0.09039688110351562, 0.0949554443359375, 0.09951400756835938, 0.10407257080078125, 0.10863113403320312, 0.113189697265625, 0.11774826049804688, 0.12230682373046875, 0.12686538696289062, 0.1314239501953125, 0.13598251342773438, 0.14054107666015625, 0.14509963989257812, 0.149658203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 7.0, 14.0, 16.0, 27.0, 43.0, 64.0, 72.0, 96.0, 97.0, 125.0, 117.0, 98.0, 66.0, 56.0, 34.0, 18.0, 12.0, 10.0, 11.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.87973403930664e-05, -7.68834725022316e-05, -7.496960461139679e-05, -7.305573672056198e-05, -7.114186882972717e-05, -6.922800093889236e-05, -6.731413304805756e-05, -6.540026515722275e-05, -6.348639726638794e-05, -6.157252937555313e-05, -5.965866148471832e-05, -5.7744793593883514e-05, -5.5830925703048706e-05, -5.39170578122139e-05, -5.200318992137909e-05, -5.008932203054428e-05, -4.817545413970947e-05, -4.6261586248874664e-05, -4.4347718358039856e-05, -4.243385046720505e-05, -4.051998257637024e-05, -3.860611468553543e-05, -3.669224679470062e-05, -3.4778378903865814e-05, -3.2864511013031006e-05, -3.09506431221962e-05, -2.903677523136139e-05, -2.712290734052658e-05, -2.5209039449691772e-05, -2.3295171558856964e-05, -2.1381303668022156e-05, -1.9467435777187347e-05, -1.755356788635254e-05, -1.563969999551773e-05, -1.3725832104682922e-05, -1.1811964213848114e-05, -9.898096323013306e-06, -7.984228432178497e-06, -6.070360541343689e-06, -4.156492650508881e-06, -2.2426247596740723e-06, -3.287568688392639e-07, 1.5851110219955444e-06, 3.4989789128303528e-06, 5.412846803665161e-06, 7.3267146944999695e-06, 9.240582585334778e-06, 1.1154450476169586e-05, 1.3068318367004395e-05, 1.4982186257839203e-05, 1.689605414867401e-05, 1.880992203950882e-05, 2.0723789930343628e-05, 2.2637657821178436e-05, 2.4551525712013245e-05, 2.6465393602848053e-05, 2.837926149368286e-05, 3.029312938451767e-05, 3.220699727535248e-05, 3.4120865166187286e-05, 3.6034733057022095e-05, 3.79486009478569e-05, 3.986246883869171e-05, 4.177633672952652e-05, 4.369020462036133e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 0.0, 6.0, 4.0, 13.0, 9.0, 11.0, 9.0, 11.0, 19.0, 22.0, 36.0, 67.0, 95.0, 143.0, 262.0, 616.0, 1472.0, 5574.0, 27218.0, 191105.0, 627930.0, 162501.0, 23734.0, 4973.0, 1439.0, 588.0, 287.0, 155.0, 72.0, 60.0, 37.0, 18.0, 19.0, 16.0, 12.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.2294921875, -0.22336578369140625, -0.2172393798828125, -0.21111297607421875, -0.204986572265625, -0.19886016845703125, -0.1927337646484375, -0.18660736083984375, -0.18048095703125, -0.17435455322265625, -0.1682281494140625, -0.16210174560546875, -0.155975341796875, -0.14984893798828125, -0.1437225341796875, -0.13759613037109375, -0.1314697265625, -0.12534332275390625, -0.1192169189453125, -0.11309051513671875, -0.106964111328125, -0.10083770751953125, -0.0947113037109375, -0.08858489990234375, -0.08245849609375, -0.07633209228515625, -0.0702056884765625, -0.06407928466796875, -0.057952880859375, -0.05182647705078125, -0.0457000732421875, -0.03957366943359375, -0.033447265625, -0.02732086181640625, -0.0211944580078125, -0.01506805419921875, -0.008941650390625, -0.00281524658203125, 0.0033111572265625, 0.00943756103515625, 0.01556396484375, 0.02169036865234375, 0.0278167724609375, 0.03394317626953125, 0.040069580078125, 0.04619598388671875, 0.0523223876953125, 0.05844879150390625, 0.0645751953125, 0.07070159912109375, 0.0768280029296875, 0.08295440673828125, 0.089080810546875, 0.09520721435546875, 0.1013336181640625, 0.10746002197265625, 0.11358642578125, 0.11971282958984375, 0.1258392333984375, 0.13196563720703125, 0.138092041015625, 0.14421844482421875, 0.1503448486328125, 0.15647125244140625, 0.16259765625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 11.0, 7.0, 13.0, 14.0, 16.0, 25.0, 26.0, 50.0, 40.0, 68.0, 56.0, 80.0, 82.0, 80.0, 87.0, 71.0, 66.0, 35.0, 40.0, 25.0, 20.0, 25.0, 13.0, 8.0, 8.0, 5.0, 9.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0304107666015625, -0.02928328514099121, -0.028155803680419922, -0.027028322219848633, -0.025900840759277344, -0.024773359298706055, -0.023645877838134766, -0.022518396377563477, -0.021390914916992188, -0.0202634334564209, -0.01913595199584961, -0.01800847053527832, -0.01688098907470703, -0.015753507614135742, -0.014626026153564453, -0.013498544692993164, -0.012371063232421875, -0.011243581771850586, -0.010116100311279297, -0.008988618850708008, -0.007861137390136719, -0.00673365592956543, -0.005606174468994141, -0.0044786930084228516, -0.0033512115478515625, -0.0022237300872802734, -0.0010962486267089844, 3.123283386230469e-05, 0.0011587142944335938, 0.002286195755004883, 0.003413677215576172, 0.004541158676147461, 0.00566864013671875, 0.006796121597290039, 0.007923603057861328, 0.009051084518432617, 0.010178565979003906, 0.011306047439575195, 0.012433528900146484, 0.013561010360717773, 0.014688491821289062, 0.01581597328186035, 0.01694345474243164, 0.01807093620300293, 0.01919841766357422, 0.020325899124145508, 0.021453380584716797, 0.022580862045288086, 0.023708343505859375, 0.024835824966430664, 0.025963306427001953, 0.027090787887573242, 0.02821826934814453, 0.02934575080871582, 0.03047323226928711, 0.0316007137298584, 0.03272819519042969, 0.03385567665100098, 0.034983158111572266, 0.036110639572143555, 0.037238121032714844, 0.03836560249328613, 0.03949308395385742, 0.04062056541442871, 0.041748046875]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 14.0, 29.0, 40.0, 90.0, 127.0, 170.0, 199.0, 122.0, 91.0, 49.0, 30.0, 15.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.035905599594116, -1.9725351333618164, -1.9091647863388062, -1.8457943201065063, -1.782423973083496, -1.7190535068511963, -1.6556830406188965, -1.5923125743865967, -1.5289422273635864, -1.4655717611312866, -1.4022014141082764, -1.3388309478759766, -1.2754604816436768, -1.2120901346206665, -1.1487196683883667, -1.0853493213653564, -1.0219788551330566, -0.9586084485054016, -0.8952380418777466, -0.8318675756454468, -0.7684971690177917, -0.7051267623901367, -0.6417562961578369, -0.5783858895301819, -0.5150154829025269, -0.4516450762748718, -0.3882746398448944, -0.324904203414917, -0.26153379678726196, -0.19816339015960693, -0.13479295372962952, -0.0714225172996521, -0.00805211067199707, 0.05531831085681915, 0.11868873238563538, 0.1820591539144516, 0.24542957544326782, 0.30879998207092285, 0.37217041850090027, 0.4355408549308777, 0.4989112615585327, 0.5622816681861877, 0.6256520748138428, 0.6890225410461426, 0.7523929476737976, 0.8157633543014526, 0.8791338205337524, 0.9425042271614075, 1.0058746337890625, 1.0692451000213623, 1.1326154470443726, 1.1959859132766724, 1.2593562602996826, 1.3227267265319824, 1.3860971927642822, 1.449467658996582, 1.5128380060195923, 1.576208472251892, 1.6395788192749023, 1.7029492855072021, 1.766319751739502, 1.8296900987625122, 1.893060564994812, 1.9564309120178223, 2.019801378250122]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 2.0, 7.0, 8.0, 12.0, 17.0, 10.0, 15.0, 21.0, 30.0, 33.0, 37.0, 34.0, 38.0, 54.0, 45.0, 48.0, 51.0, 66.0, 46.0, 55.0, 55.0, 45.0, 48.0, 29.0, 24.0, 39.0, 26.0, 13.0, 18.0, 16.0, 4.0, 8.0, 9.0, 7.0, 8.0, 6.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6306495070457458, -0.6057257056236267, -0.5808018445968628, -0.5558780431747437, -0.5309542417526245, -0.5060304403305054, -0.48110657930374146, -0.4561827778816223, -0.4312589466571808, -0.40633511543273926, -0.3814113140106201, -0.3564874827861786, -0.33156365156173706, -0.3066398501396179, -0.2817160189151764, -0.25679218769073486, -0.23186838626861572, -0.2069445699453354, -0.18202075362205505, -0.15709692239761353, -0.1321731060743332, -0.10724928975105286, -0.08232545852661133, -0.057401642203330994, -0.03247782588005066, -0.007554005831480026, 0.017369814217090607, 0.04229363799095154, 0.06721745431423187, 0.09214127063751221, 0.11706510186195374, 0.14198891818523407, 0.1669127345085144, 0.19183655083179474, 0.21676036715507507, 0.2416841983795166, 0.26660799980163574, 0.29153183102607727, 0.3164556622505188, 0.34137946367263794, 0.36630329489707947, 0.391227126121521, 0.41615092754364014, 0.44107475876808167, 0.4659985899925232, 0.49092239141464233, 0.5158462524414062, 0.5407700538635254, 0.5656938552856445, 0.5906176567077637, 0.6155415177345276, 0.6404653191566467, 0.6653891205787659, 0.6903129816055298, 0.7152367830276489, 0.7401605844497681, 0.7650843858718872, 0.7900081872940063, 0.8149320483207703, 0.8398558497428894, 0.8647796511650085, 0.8897035121917725, 0.9146273136138916, 0.9395511150360107, 0.9644749760627747]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 2.0, 9.0, 6.0, 22.0, 22.0, 39.0, 46.0, 84.0, 123.0, 219.0, 474.0, 877.0, 1762.0, 4290.0, 11457.0, 36329.0, 143029.0, 517698.0, 247705.0, 56627.0, 16903.0, 5923.0, 2484.0, 1146.0, 557.0, 254.0, 188.0, 117.0, 57.0, 39.0, 20.0, 15.0, 11.0, 12.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.0107421875, -0.9858932495117188, -0.9610443115234375, -0.9361953735351562, -0.911346435546875, -0.8864974975585938, -0.8616485595703125, -0.8367996215820312, -0.81195068359375, -0.7871017456054688, -0.7622528076171875, -0.7374038696289062, -0.712554931640625, -0.6877059936523438, -0.6628570556640625, -0.6380081176757812, -0.6131591796875, -0.5883102416992188, -0.5634613037109375, -0.5386123657226562, -0.513763427734375, -0.48891448974609375, -0.4640655517578125, -0.43921661376953125, -0.41436767578125, -0.38951873779296875, -0.3646697998046875, -0.33982086181640625, -0.314971923828125, -0.29012298583984375, -0.2652740478515625, -0.24042510986328125, -0.215576171875, -0.19072723388671875, -0.1658782958984375, -0.14102935791015625, -0.116180419921875, -0.09133148193359375, -0.0664825439453125, -0.04163360595703125, -0.01678466796875, 0.00806427001953125, 0.0329132080078125, 0.05776214599609375, 0.082611083984375, 0.10746002197265625, 0.1323089599609375, 0.15715789794921875, 0.1820068359375, 0.20685577392578125, 0.2317047119140625, 0.25655364990234375, 0.281402587890625, 0.30625152587890625, 0.3311004638671875, 0.35594940185546875, 0.38079833984375, 0.40564727783203125, 0.4304962158203125, 0.45534515380859375, 0.480194091796875, 0.5050430297851562, 0.5298919677734375, 0.5547409057617188, 0.57958984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 8.0, 7.0, 12.0, 18.0, 14.0, 23.0, 28.0, 42.0, 47.0, 50.0, 46.0, 66.0, 57.0, 70.0, 67.0, 54.0, 68.0, 66.0, 48.0, 48.0, 25.0, 19.0, 32.0, 16.0, 18.0, 9.0, 6.0, 8.0, 6.0, 9.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3251953125, -1.2624053955078125, -1.199615478515625, -1.1368255615234375, -1.07403564453125, -1.0112457275390625, -0.948455810546875, -0.8856658935546875, -0.8228759765625, -0.7600860595703125, -0.697296142578125, -0.6345062255859375, -0.57171630859375, -0.5089263916015625, -0.446136474609375, -0.3833465576171875, -0.320556640625, -0.2577667236328125, -0.194976806640625, -0.1321868896484375, -0.06939697265625, -0.0066070556640625, 0.056182861328125, 0.1189727783203125, 0.1817626953125, 0.2445526123046875, 0.307342529296875, 0.3701324462890625, 0.43292236328125, 0.4957122802734375, 0.558502197265625, 0.6212921142578125, 0.68408203125, 0.7468719482421875, 0.809661865234375, 0.8724517822265625, 0.93524169921875, 0.9980316162109375, 1.060821533203125, 1.1236114501953125, 1.1864013671875, 1.2491912841796875, 1.311981201171875, 1.3747711181640625, 1.43756103515625, 1.5003509521484375, 1.563140869140625, 1.6259307861328125, 1.688720703125, 1.7515106201171875, 1.814300537109375, 1.8770904541015625, 1.93988037109375, 2.0026702880859375, 2.065460205078125, 2.1282501220703125, 2.1910400390625, 2.2538299560546875, 2.316619873046875, 2.3794097900390625, 2.44219970703125, 2.5049896240234375, 2.567779541015625, 2.6305694580078125, 2.693359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 8.0, 3.0, 9.0, 8.0, 9.0, 23.0, 26.0, 36.0, 64.0, 74.0, 84.0, 151.0, 241.0, 465.0, 1097.0, 7606.0, 199562.0, 805890.0, 29121.0, 2409.0, 695.0, 325.0, 224.0, 117.0, 78.0, 58.0, 48.0, 25.0, 18.0, 17.0, 13.0, 15.0, 5.0, 6.0, 6.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.8480682373046875, -1.788909912109375, -1.7297515869140625, -1.67059326171875, -1.6114349365234375, -1.552276611328125, -1.4931182861328125, -1.4339599609375, -1.3748016357421875, -1.315643310546875, -1.2564849853515625, -1.19732666015625, -1.1381683349609375, -1.079010009765625, -1.0198516845703125, -0.960693359375, -0.9015350341796875, -0.842376708984375, -0.7832183837890625, -0.72406005859375, -0.6649017333984375, -0.605743408203125, -0.5465850830078125, -0.4874267578125, -0.4282684326171875, -0.369110107421875, -0.3099517822265625, -0.25079345703125, -0.1916351318359375, -0.132476806640625, -0.0733184814453125, -0.01416015625, 0.0449981689453125, 0.104156494140625, 0.1633148193359375, 0.22247314453125, 0.2816314697265625, 0.340789794921875, 0.3999481201171875, 0.4591064453125, 0.5182647705078125, 0.577423095703125, 0.6365814208984375, 0.69573974609375, 0.7548980712890625, 0.814056396484375, 0.8732147216796875, 0.932373046875, 0.9915313720703125, 1.050689697265625, 1.1098480224609375, 1.16900634765625, 1.2281646728515625, 1.287322998046875, 1.3464813232421875, 1.4056396484375, 1.4647979736328125, 1.523956298828125, 1.5831146240234375, 1.64227294921875, 1.7014312744140625, 1.760589599609375, 1.8197479248046875, 1.87890625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 3.0, 6.0, 5.0, 7.0, 17.0, 16.0, 24.0, 16.0, 26.0, 31.0, 24.0, 28.0, 27.0, 40.0, 37.0, 47.0, 54.0, 45.0, 39.0, 38.0, 50.0, 48.0, 47.0, 40.0, 28.0, 32.0, 31.0, 30.0, 34.0, 18.0, 13.0, 15.0, 11.0, 7.0, 12.0, 10.0, 6.0, 12.0, 2.0, 6.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6767578125, -1.624114990234375, -1.57147216796875, -1.518829345703125, -1.4661865234375, -1.413543701171875, -1.36090087890625, -1.308258056640625, -1.255615234375, -1.202972412109375, -1.15032958984375, -1.097686767578125, -1.0450439453125, -0.992401123046875, -0.93975830078125, -0.887115478515625, -0.83447265625, -0.781829833984375, -0.72918701171875, -0.676544189453125, -0.6239013671875, -0.571258544921875, -0.51861572265625, -0.465972900390625, -0.413330078125, -0.360687255859375, -0.30804443359375, -0.255401611328125, -0.2027587890625, -0.150115966796875, -0.09747314453125, -0.044830322265625, 0.0078125, 0.060455322265625, 0.11309814453125, 0.165740966796875, 0.2183837890625, 0.271026611328125, 0.32366943359375, 0.376312255859375, 0.428955078125, 0.481597900390625, 0.53424072265625, 0.586883544921875, 0.6395263671875, 0.692169189453125, 0.74481201171875, 0.797454833984375, 0.85009765625, 0.902740478515625, 0.95538330078125, 1.008026123046875, 1.0606689453125, 1.113311767578125, 1.16595458984375, 1.218597412109375, 1.271240234375, 1.323883056640625, 1.37652587890625, 1.429168701171875, 1.4818115234375, 1.534454345703125, 1.58709716796875, 1.639739990234375, 1.6923828125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 0.0, 9.0, 11.0, 17.0, 28.0, 49.0, 59.0, 123.0, 254.0, 813.0, 3290.0, 41345.0, 904692.0, 91334.0, 4793.0, 994.0, 351.0, 141.0, 84.0, 50.0, 30.0, 19.0, 15.0, 13.0, 12.0, 8.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.66546630859375, -0.6444091796875, -0.62335205078125, -0.602294921875, -0.58123779296875, -0.5601806640625, -0.53912353515625, -0.51806640625, -0.49700927734375, -0.4759521484375, -0.45489501953125, -0.433837890625, -0.41278076171875, -0.3917236328125, -0.37066650390625, -0.349609375, -0.32855224609375, -0.3074951171875, -0.28643798828125, -0.265380859375, -0.24432373046875, -0.2232666015625, -0.20220947265625, -0.18115234375, -0.16009521484375, -0.1390380859375, -0.11798095703125, -0.096923828125, -0.07586669921875, -0.0548095703125, -0.03375244140625, -0.0126953125, 0.00836181640625, 0.0294189453125, 0.05047607421875, 0.071533203125, 0.09259033203125, 0.1136474609375, 0.13470458984375, 0.15576171875, 0.17681884765625, 0.1978759765625, 0.21893310546875, 0.239990234375, 0.26104736328125, 0.2821044921875, 0.30316162109375, 0.32421875, 0.34527587890625, 0.3663330078125, 0.38739013671875, 0.408447265625, 0.42950439453125, 0.4505615234375, 0.47161865234375, 0.49267578125, 0.51373291015625, 0.5347900390625, 0.55584716796875, 0.576904296875, 0.59796142578125, 0.6190185546875, 0.64007568359375, 0.6611328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 19.0, 12.0, 30.0, 41.0, 60.0, 96.0, 170.0, 167.0, 156.0, 87.0, 61.0, 35.0, 23.0, 16.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00011008977890014648, -0.00010776985436677933, -0.00010544992983341217, -0.00010313000530004501, -0.00010081008076667786, -9.84901562333107e-05, -9.617023169994354e-05, -9.385030716657639e-05, -9.153038263320923e-05, -8.921045809984207e-05, -8.689053356647491e-05, -8.457060903310776e-05, -8.22506844997406e-05, -7.993075996637344e-05, -7.761083543300629e-05, -7.529091089963913e-05, -7.297098636627197e-05, -7.065106183290482e-05, -6.833113729953766e-05, -6.60112127661705e-05, -6.369128823280334e-05, -6.137136369943619e-05, -5.905143916606903e-05, -5.6731514632701874e-05, -5.441159009933472e-05, -5.209166556596756e-05, -4.97717410326004e-05, -4.7451816499233246e-05, -4.513189196586609e-05, -4.281196743249893e-05, -4.0492042899131775e-05, -3.817211836576462e-05, -3.585219383239746e-05, -3.3532269299030304e-05, -3.121234476566315e-05, -2.889242023229599e-05, -2.6572495698928833e-05, -2.4252571165561676e-05, -2.193264663219452e-05, -1.9612722098827362e-05, -1.7292797565460205e-05, -1.4972873032093048e-05, -1.2652948498725891e-05, -1.0333023965358734e-05, -8.013099431991577e-06, -5.69317489862442e-06, -3.373250365257263e-06, -1.0533258318901062e-06, 1.2665987014770508e-06, 3.5865232348442078e-06, 5.906447768211365e-06, 8.226372301578522e-06, 1.0546296834945679e-05, 1.2866221368312836e-05, 1.5186145901679993e-05, 1.750607043504715e-05, 1.9825994968414307e-05, 2.2145919501781464e-05, 2.446584403514862e-05, 2.6785768568515778e-05, 2.9105693101882935e-05, 3.142561763525009e-05, 3.374554216861725e-05, 3.6065466701984406e-05, 3.838539123535156e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 4.0, 18.0, 17.0, 41.0, 59.0, 175.0, 406.0, 1774.0, 11633.0, 874560.0, 153671.0, 4651.0, 942.0, 332.0, 123.0, 52.0, 26.0, 16.0, 12.0, 5.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.099609375, -1.0688934326171875, -1.038177490234375, -1.0074615478515625, -0.97674560546875, -0.9460296630859375, -0.915313720703125, -0.8845977783203125, -0.8538818359375, -0.8231658935546875, -0.792449951171875, -0.7617340087890625, -0.73101806640625, -0.7003021240234375, -0.669586181640625, -0.6388702392578125, -0.608154296875, -0.5774383544921875, -0.546722412109375, -0.5160064697265625, -0.48529052734375, -0.4545745849609375, -0.423858642578125, -0.3931427001953125, -0.3624267578125, -0.3317108154296875, -0.300994873046875, -0.2702789306640625, -0.23956298828125, -0.2088470458984375, -0.178131103515625, -0.1474151611328125, -0.11669921875, -0.0859832763671875, -0.055267333984375, -0.0245513916015625, 0.00616455078125, 0.0368804931640625, 0.067596435546875, 0.0983123779296875, 0.1290283203125, 0.1597442626953125, 0.190460205078125, 0.2211761474609375, 0.25189208984375, 0.2826080322265625, 0.313323974609375, 0.3440399169921875, 0.374755859375, 0.4054718017578125, 0.436187744140625, 0.4669036865234375, 0.49761962890625, 0.5283355712890625, 0.559051513671875, 0.5897674560546875, 0.6204833984375, 0.6511993408203125, 0.681915283203125, 0.7126312255859375, 0.74334716796875, 0.7740631103515625, 0.804779052734375, 0.8354949951171875, 0.8662109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 2.0, 6.0, 18.0, 17.0, 31.0, 52.0, 69.0, 91.0, 135.0, 170.0, 128.0, 93.0, 61.0, 42.0, 26.0, 10.0, 21.0, 14.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1864013671875, -0.1796245574951172, -0.17284774780273438, -0.16607093811035156, -0.15929412841796875, -0.15251731872558594, -0.14574050903320312, -0.1389636993408203, -0.1321868896484375, -0.1254100799560547, -0.11863327026367188, -0.11185646057128906, -0.10507965087890625, -0.09830284118652344, -0.09152603149414062, -0.08474922180175781, -0.077972412109375, -0.07119560241699219, -0.06441879272460938, -0.05764198303222656, -0.05086517333984375, -0.04408836364746094, -0.037311553955078125, -0.030534744262695312, -0.0237579345703125, -0.016981124877929688, -0.010204315185546875, -0.0034275054931640625, 0.00334930419921875, 0.010126113891601562, 0.016902923583984375, 0.023679733276367188, 0.03045654296875, 0.03723335266113281, 0.044010162353515625, 0.05078697204589844, 0.05756378173828125, 0.06434059143066406, 0.07111740112304688, 0.07789421081542969, 0.0846710205078125, 0.09144783020019531, 0.09822463989257812, 0.10500144958496094, 0.11177825927734375, 0.11855506896972656, 0.12533187866210938, 0.1321086883544922, 0.138885498046875, 0.1456623077392578, 0.15243911743164062, 0.15921592712402344, 0.16599273681640625, 0.17276954650878906, 0.17954635620117188, 0.1863231658935547, 0.1930999755859375, 0.1998767852783203, 0.20665359497070312, 0.21343040466308594, 0.22020721435546875, 0.22698402404785156, 0.23376083374023438, 0.2405376434326172, 0.247314453125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 8.0, 25.0, 40.0, 102.0, 220.0, 247.0, 177.0, 99.0, 54.0, 17.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.928035259246826, -7.749937057495117, -7.57183837890625, -7.393740177154541, -7.215641975402832, -7.037543773651123, -6.859445095062256, -6.681346893310547, -6.503248691558838, -6.325150489807129, -6.147051811218262, -5.968953609466553, -5.790855407714844, -5.612757205963135, -5.434658527374268, -5.256560325622559, -5.078461647033691, -4.900363445281982, -4.722264766693115, -4.544166564941406, -4.366068363189697, -4.187970161437988, -4.009871482849121, -3.831773281097412, -3.653675079345703, -3.475576639175415, -3.297478437423706, -3.119379997253418, -2.941281795501709, -2.763183355331421, -2.585084915161133, -2.406986713409424, -2.2288882732391357, -2.0507898330688477, -1.8726916313171387, -1.6945931911468506, -1.5164949893951416, -1.3383965492248535, -1.160298228263855, -0.9821999073028564, -0.8041015863418579, -0.6260032653808594, -0.44790491461753845, -0.26980656385421753, -0.091708242893219, 0.08639007806777954, 0.26448845863342285, 0.4425867795944214, 0.6206851005554199, 0.7987834215164185, 0.976881742477417, 1.154980182647705, 1.333078384399414, 1.5111768245697021, 1.6892751455307007, 1.8673734664916992, 2.045471668243408, 2.2235701084136963, 2.4016683101654053, 2.5797667503356934, 2.7578649520874023, 2.9359633922576904, 3.1140618324279785, 3.2921600341796875, 3.4702584743499756]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 7.0, 4.0, 2.0, 7.0, 8.0, 13.0, 8.0, 13.0, 15.0, 22.0, 19.0, 22.0, 25.0, 24.0, 28.0, 33.0, 39.0, 51.0, 35.0, 64.0, 50.0, 52.0, 47.0, 53.0, 40.0, 33.0, 40.0, 28.0, 35.0, 39.0, 18.0, 28.0, 16.0, 14.0, 14.0, 8.0, 8.0, 10.0, 11.0, 7.0, 1.0, 4.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5424437522888184, -2.4560534954071045, -2.3696634769439697, -2.283273220062256, -2.196883201599121, -2.1104929447174072, -2.0241029262542725, -1.9377126693725586, -1.8513226509094238, -1.7649325132369995, -1.6785423755645752, -1.5921522378921509, -1.5057621002197266, -1.4193719625473022, -1.332981824874878, -1.246591567993164, -1.1602014303207397, -1.0738112926483154, -0.9874211549758911, -0.9010310173034668, -0.8146408796310425, -0.7282507419586182, -0.6418605446815491, -0.5554704070091248, -0.46908026933670044, -0.3826901316642761, -0.2962999939918518, -0.2099098265171051, -0.12351968884468079, -0.03712955117225647, 0.049260616302490234, 0.13565075397491455, 0.22204089164733887, 0.3084310293197632, 0.3948211669921875, 0.4812113344669342, 0.5676014423370361, 0.6539915800094604, 0.7403817772865295, 0.8267719149589539, 0.9131620526313782, 0.9995521903038025, 1.0859423875808716, 1.172332525253296, 1.2587226629257202, 1.3451128005981445, 1.4315029382705688, 1.5178930759429932, 1.6042832136154175, 1.6906733512878418, 1.7770634889602661, 1.8634536266326904, 1.9498437643051147, 2.036233901977539, 2.122624158859253, 2.2090141773223877, 2.2954044342041016, 2.3817946910858154, 2.46818470954895, 2.554574966430664, 2.640964984893799, 2.7273552417755127, 2.8137452602386475, 2.9001355171203613, 2.986525535583496]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 7.0, 7.0, 11.0, 17.0, 34.0, 47.0, 88.0, 142.0, 255.0, 484.0, 1035.0, 2384.0, 6349.0, 23359.0, 125216.0, 945327.0, 2424779.0, 563429.0, 76914.0, 15835.0, 4869.0, 1871.0, 843.0, 397.0, 208.0, 136.0, 81.0, 53.0, 41.0, 19.0, 14.0, 8.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55859375, -1.5118865966796875, -1.465179443359375, -1.4184722900390625, -1.37176513671875, -1.3250579833984375, -1.278350830078125, -1.2316436767578125, -1.1849365234375, -1.1382293701171875, -1.091522216796875, -1.0448150634765625, -0.99810791015625, -0.9514007568359375, -0.904693603515625, -0.8579864501953125, -0.811279296875, -0.7645721435546875, -0.717864990234375, -0.6711578369140625, -0.62445068359375, -0.5777435302734375, -0.531036376953125, -0.4843292236328125, -0.4376220703125, -0.3909149169921875, -0.344207763671875, -0.2975006103515625, -0.25079345703125, -0.2040863037109375, -0.157379150390625, -0.1106719970703125, -0.06396484375, -0.0172576904296875, 0.029449462890625, 0.0761566162109375, 0.12286376953125, 0.1695709228515625, 0.216278076171875, 0.2629852294921875, 0.3096923828125, 0.3563995361328125, 0.403106689453125, 0.4498138427734375, 0.49652099609375, 0.5432281494140625, 0.589935302734375, 0.6366424560546875, 0.683349609375, 0.7300567626953125, 0.776763916015625, 0.8234710693359375, 0.87017822265625, 0.9168853759765625, 0.963592529296875, 1.0102996826171875, 1.0570068359375, 1.1037139892578125, 1.150421142578125, 1.1971282958984375, 1.24383544921875, 1.2905426025390625, 1.337249755859375, 1.3839569091796875, 1.4306640625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 7.0, 8.0, 11.0, 21.0, 19.0, 33.0, 36.0, 38.0, 40.0, 41.0, 57.0, 47.0, 60.0, 59.0, 67.0, 49.0, 70.0, 62.0, 37.0, 36.0, 37.0, 29.0, 22.0, 18.0, 17.0, 12.0, 10.0, 8.0, 7.0, 8.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1025390625, -1.065948486328125, -1.02935791015625, -0.992767333984375, -0.9561767578125, -0.919586181640625, -0.88299560546875, -0.846405029296875, -0.809814453125, -0.773223876953125, -0.73663330078125, -0.700042724609375, -0.6634521484375, -0.626861572265625, -0.59027099609375, -0.553680419921875, -0.51708984375, -0.480499267578125, -0.44390869140625, -0.407318115234375, -0.3707275390625, -0.334136962890625, -0.29754638671875, -0.260955810546875, -0.224365234375, -0.187774658203125, -0.15118408203125, -0.114593505859375, -0.0780029296875, -0.041412353515625, -0.00482177734375, 0.031768798828125, 0.068359375, 0.104949951171875, 0.14154052734375, 0.178131103515625, 0.2147216796875, 0.251312255859375, 0.28790283203125, 0.324493408203125, 0.361083984375, 0.397674560546875, 0.43426513671875, 0.470855712890625, 0.5074462890625, 0.544036865234375, 0.58062744140625, 0.617218017578125, 0.65380859375, 0.690399169921875, 0.72698974609375, 0.763580322265625, 0.8001708984375, 0.836761474609375, 0.87335205078125, 0.909942626953125, 0.946533203125, 0.983123779296875, 1.01971435546875, 1.056304931640625, 1.0928955078125, 1.129486083984375, 1.16607666015625, 1.202667236328125, 1.2392578125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 4.0, 6.0, 8.0, 23.0, 27.0, 56.0, 120.0, 185.0, 450.0, 1051.0, 4097.0, 44968.0, 3811728.0, 318932.0, 9568.0, 1853.0, 611.0, 272.0, 140.0, 76.0, 44.0, 17.0, 13.0, 12.0, 6.0, 9.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.478240966796875, -3.36859130859375, -3.258941650390625, -3.1492919921875, -3.039642333984375, -2.92999267578125, -2.820343017578125, -2.710693359375, -2.601043701171875, -2.49139404296875, -2.381744384765625, -2.2720947265625, -2.162445068359375, -2.05279541015625, -1.943145751953125, -1.83349609375, -1.723846435546875, -1.61419677734375, -1.504547119140625, -1.3948974609375, -1.285247802734375, -1.17559814453125, -1.065948486328125, -0.956298828125, -0.846649169921875, -0.73699951171875, -0.627349853515625, -0.5177001953125, -0.408050537109375, -0.29840087890625, -0.188751220703125, -0.0791015625, 0.030548095703125, 0.14019775390625, 0.249847412109375, 0.3594970703125, 0.469146728515625, 0.57879638671875, 0.688446044921875, 0.798095703125, 0.907745361328125, 1.01739501953125, 1.127044677734375, 1.2366943359375, 1.346343994140625, 1.45599365234375, 1.565643310546875, 1.67529296875, 1.784942626953125, 1.89459228515625, 2.004241943359375, 2.1138916015625, 2.223541259765625, 2.33319091796875, 2.442840576171875, 2.552490234375, 2.662139892578125, 2.77178955078125, 2.881439208984375, 2.9910888671875, 3.100738525390625, 3.21038818359375, 3.320037841796875, 3.4296875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 7.0, 8.0, 15.0, 14.0, 35.0, 46.0, 102.0, 200.0, 365.0, 650.0, 903.0, 733.0, 471.0, 224.0, 127.0, 75.0, 41.0, 33.0, 13.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43408203125, -0.41089630126953125, -0.3877105712890625, -0.36452484130859375, -0.341339111328125, -0.31815338134765625, -0.2949676513671875, -0.27178192138671875, -0.24859619140625, -0.22541046142578125, -0.2022247314453125, -0.17903900146484375, -0.155853271484375, -0.13266754150390625, -0.1094818115234375, -0.08629608154296875, -0.0631103515625, -0.03992462158203125, -0.0167388916015625, 0.00644683837890625, 0.029632568359375, 0.05281829833984375, 0.0760040283203125, 0.09918975830078125, 0.12237548828125, 0.14556121826171875, 0.1687469482421875, 0.19193267822265625, 0.215118408203125, 0.23830413818359375, 0.2614898681640625, 0.28467559814453125, 0.307861328125, 0.33104705810546875, 0.3542327880859375, 0.37741851806640625, 0.400604248046875, 0.42378997802734375, 0.4469757080078125, 0.47016143798828125, 0.49334716796875, 0.5165328979492188, 0.5397186279296875, 0.5629043579101562, 0.586090087890625, 0.6092758178710938, 0.6324615478515625, 0.6556472778320312, 0.6788330078125, 0.7020187377929688, 0.7252044677734375, 0.7483901977539062, 0.771575927734375, 0.7947616577148438, 0.8179473876953125, 0.8411331176757812, 0.86431884765625, 0.8875045776367188, 0.9106903076171875, 0.9338760375976562, 0.957061767578125, 0.9802474975585938, 1.0034332275390625, 1.0266189575195312, 1.0498046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 14.0, 11.0, 24.0, 35.0, 34.0, 59.0, 99.0, 101.0, 128.0, 110.0, 74.0, 85.0, 75.0, 60.0, 27.0, 27.0, 13.0, 5.0, 5.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2227377891540527, -2.1516666412353516, -2.0805954933166504, -2.009524345397949, -1.9384530782699585, -1.8673819303512573, -1.7963106632232666, -1.7252395153045654, -1.6541683673858643, -1.583097219467163, -1.512026071548462, -1.4409548044204712, -1.36988365650177, -1.2988125085830688, -1.2277412414550781, -1.156670093536377, -1.0855989456176758, -1.0145277976989746, -0.9434565901756287, -0.8723853826522827, -0.8013142347335815, -0.7302430868148804, -0.6591718792915344, -0.5881006717681885, -0.5170295238494873, -0.44595834612846375, -0.3748871684074402, -0.3038159906864166, -0.23274481296539307, -0.1616736352443695, -0.09060245752334595, -0.019531279802322388, 0.05154013633728027, 0.12261131405830383, 0.1936824917793274, 0.26475366950035095, 0.3358248472213745, 0.40689602494239807, 0.47796720266342163, 0.5490384101867676, 0.6201095581054688, 0.6911807060241699, 0.7622519135475159, 0.8333231210708618, 0.904394268989563, 0.9754654169082642, 1.0465366840362549, 1.117607831954956, 1.1886789798736572, 1.2597501277923584, 1.3308212757110596, 1.4018925428390503, 1.4729636907577515, 1.5440348386764526, 1.6151061058044434, 1.6861772537231445, 1.7572484016418457, 1.8283195495605469, 1.899390697479248, 1.9704619646072388, 2.0415329933166504, 2.1126043796539307, 2.183675527572632, 2.254746675491333, 2.325817823410034]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 5.0, 4.0, 4.0, 14.0, 11.0, 20.0, 30.0, 15.0, 34.0, 28.0, 27.0, 41.0, 28.0, 31.0, 41.0, 38.0, 57.0, 43.0, 48.0, 52.0, 51.0, 45.0, 38.0, 37.0, 35.0, 31.0, 28.0, 27.0, 10.0, 28.0, 16.0, 15.0, 12.0, 12.0, 12.0, 7.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1532191038131714, -1.1176023483276367, -1.0819854736328125, -1.0463687181472778, -1.0107519626617432, -0.9751352071762085, -0.939518392086029, -0.9039015769958496, -0.8682848215103149, -0.8326680660247803, -0.7970512509346008, -0.7614344358444214, -0.7258176803588867, -0.690200924873352, -0.6545841097831726, -0.6189672946929932, -0.5833505392074585, -0.5477337837219238, -0.5121169686317444, -0.47650018334388733, -0.4408833980560303, -0.4052666127681732, -0.36964982748031616, -0.3340330421924591, -0.29841625690460205, -0.262799471616745, -0.22718268632888794, -0.19156590104103088, -0.15594911575317383, -0.12033233046531677, -0.08471554517745972, -0.04909875988960266, -0.013481855392456055, 0.022134929895401, 0.05775171518325806, 0.09336850047111511, 0.12898528575897217, 0.16460207104682922, 0.20021885633468628, 0.23583564162254333, 0.2714524269104004, 0.30706921219825745, 0.3426859974861145, 0.37830278277397156, 0.4139195680618286, 0.44953635334968567, 0.4851531386375427, 0.5207699537277222, 0.5563867092132568, 0.5920034646987915, 0.627620279788971, 0.6632370948791504, 0.6988538503646851, 0.7344706058502197, 0.7700874209403992, 0.8057042360305786, 0.8413209915161133, 0.876937747001648, 0.9125545620918274, 0.9481713771820068, 0.9837881326675415, 1.0194048881530762, 1.0550217628479004, 1.090638518333435, 1.1262552738189697]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 8.0, 8.0, 11.0, 22.0, 34.0, 59.0, 77.0, 141.0, 264.0, 422.0, 1003.0, 2364.0, 6556.0, 21185.0, 76918.0, 315318.0, 444586.0, 130164.0, 33150.0, 10014.0, 3458.0, 1428.0, 591.0, 286.0, 185.0, 112.0, 70.0, 37.0, 20.0, 16.0, 9.0, 9.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326416015625, -0.3152313232421875, -0.304046630859375, -0.2928619384765625, -0.28167724609375, -0.2704925537109375, -0.259307861328125, -0.2481231689453125, -0.2369384765625, -0.2257537841796875, -0.214569091796875, -0.2033843994140625, -0.19219970703125, -0.1810150146484375, -0.169830322265625, -0.1586456298828125, -0.1474609375, -0.1362762451171875, -0.125091552734375, -0.1139068603515625, -0.10272216796875, -0.0915374755859375, -0.080352783203125, -0.0691680908203125, -0.0579833984375, -0.0467987060546875, -0.035614013671875, -0.0244293212890625, -0.01324462890625, -0.0020599365234375, 0.009124755859375, 0.0203094482421875, 0.031494140625, 0.0426788330078125, 0.053863525390625, 0.0650482177734375, 0.07623291015625, 0.0874176025390625, 0.098602294921875, 0.1097869873046875, 0.1209716796875, 0.1321563720703125, 0.143341064453125, 0.1545257568359375, 0.16571044921875, 0.1768951416015625, 0.188079833984375, 0.1992645263671875, 0.21044921875, 0.2216339111328125, 0.232818603515625, 0.2440032958984375, 0.25518798828125, 0.2663726806640625, 0.277557373046875, 0.2887420654296875, 0.2999267578125, 0.3111114501953125, 0.322296142578125, 0.3334808349609375, 0.34466552734375, 0.3558502197265625, 0.367034912109375, 0.3782196044921875, 0.389404296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 5.0, 7.0, 9.0, 4.0, 11.0, 18.0, 15.0, 32.0, 22.0, 21.0, 23.0, 38.0, 38.0, 40.0, 44.0, 41.0, 50.0, 52.0, 40.0, 58.0, 58.0, 45.0, 38.0, 37.0, 38.0, 43.0, 32.0, 12.0, 18.0, 23.0, 20.0, 10.0, 13.0, 8.0, 8.0, 5.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74365234375, -0.718353271484375, -0.69305419921875, -0.667755126953125, -0.6424560546875, -0.617156982421875, -0.59185791015625, -0.566558837890625, -0.541259765625, -0.515960693359375, -0.49066162109375, -0.465362548828125, -0.4400634765625, -0.414764404296875, -0.38946533203125, -0.364166259765625, -0.3388671875, -0.313568115234375, -0.28826904296875, -0.262969970703125, -0.2376708984375, -0.212371826171875, -0.18707275390625, -0.161773681640625, -0.136474609375, -0.111175537109375, -0.08587646484375, -0.060577392578125, -0.0352783203125, -0.009979248046875, 0.01531982421875, 0.040618896484375, 0.06591796875, 0.091217041015625, 0.11651611328125, 0.141815185546875, 0.1671142578125, 0.192413330078125, 0.21771240234375, 0.243011474609375, 0.268310546875, 0.293609619140625, 0.31890869140625, 0.344207763671875, 0.3695068359375, 0.394805908203125, 0.42010498046875, 0.445404052734375, 0.470703125, 0.496002197265625, 0.52130126953125, 0.546600341796875, 0.5718994140625, 0.597198486328125, 0.62249755859375, 0.647796630859375, 0.673095703125, 0.698394775390625, 0.72369384765625, 0.748992919921875, 0.7742919921875, 0.799591064453125, 0.82489013671875, 0.850189208984375, 0.87548828125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 16.0, 14.0, 10.0, 29.0, 41.0, 66.0, 83.0, 174.0, 248.0, 426.0, 882.0, 1892.0, 4396.0, 11325.0, 31146.0, 100432.0, 315923.0, 377670.0, 137714.0, 41411.0, 14369.0, 5578.0, 2387.0, 1057.0, 506.0, 271.0, 172.0, 97.0, 61.0, 42.0, 31.0, 21.0, 15.0, 9.0, 11.0, 11.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.25444793701171875, -0.2457122802734375, -0.23697662353515625, -0.228240966796875, -0.21950531005859375, -0.2107696533203125, -0.20203399658203125, -0.19329833984375, -0.18456268310546875, -0.1758270263671875, -0.16709136962890625, -0.158355712890625, -0.14962005615234375, -0.1408843994140625, -0.13214874267578125, -0.1234130859375, -0.11467742919921875, -0.1059417724609375, -0.09720611572265625, -0.088470458984375, -0.07973480224609375, -0.0709991455078125, -0.06226348876953125, -0.05352783203125, -0.04479217529296875, -0.0360565185546875, -0.02732086181640625, -0.018585205078125, -0.00984954833984375, -0.0011138916015625, 0.00762176513671875, 0.016357421875, 0.02509307861328125, 0.0338287353515625, 0.04256439208984375, 0.051300048828125, 0.06003570556640625, 0.0687713623046875, 0.07750701904296875, 0.08624267578125, 0.09497833251953125, 0.1037139892578125, 0.11244964599609375, 0.121185302734375, 0.12992095947265625, 0.1386566162109375, 0.14739227294921875, 0.1561279296875, 0.16486358642578125, 0.1735992431640625, 0.18233489990234375, 0.191070556640625, 0.19980621337890625, 0.2085418701171875, 0.21727752685546875, 0.22601318359375, 0.23474884033203125, 0.2434844970703125, 0.25222015380859375, 0.260955810546875, 0.26969146728515625, 0.2784271240234375, 0.28716278076171875, 0.2958984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 2.0, 6.0, 8.0, 12.0, 11.0, 12.0, 20.0, 13.0, 26.0, 29.0, 19.0, 29.0, 30.0, 33.0, 39.0, 49.0, 40.0, 53.0, 51.0, 55.0, 66.0, 47.0, 48.0, 30.0, 32.0, 48.0, 33.0, 22.0, 31.0, 19.0, 14.0, 17.0, 22.0, 9.0, 5.0, 2.0, 4.0, 7.0, 4.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7822265625, -1.731658935546875, -1.68109130859375, -1.630523681640625, -1.5799560546875, -1.529388427734375, -1.47882080078125, -1.428253173828125, -1.377685546875, -1.327117919921875, -1.27655029296875, -1.225982666015625, -1.1754150390625, -1.124847412109375, -1.07427978515625, -1.023712158203125, -0.97314453125, -0.922576904296875, -0.87200927734375, -0.821441650390625, -0.7708740234375, -0.720306396484375, -0.66973876953125, -0.619171142578125, -0.568603515625, -0.518035888671875, -0.46746826171875, -0.416900634765625, -0.3663330078125, -0.315765380859375, -0.26519775390625, -0.214630126953125, -0.1640625, -0.113494873046875, -0.06292724609375, -0.012359619140625, 0.0382080078125, 0.088775634765625, 0.13934326171875, 0.189910888671875, 0.240478515625, 0.291046142578125, 0.34161376953125, 0.392181396484375, 0.4427490234375, 0.493316650390625, 0.54388427734375, 0.594451904296875, 0.64501953125, 0.695587158203125, 0.74615478515625, 0.796722412109375, 0.8472900390625, 0.897857666015625, 0.94842529296875, 0.998992919921875, 1.049560546875, 1.100128173828125, 1.15069580078125, 1.201263427734375, 1.2518310546875, 1.302398681640625, 1.35296630859375, 1.403533935546875, 1.4541015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 7.0, 7.0, 8.0, 20.0, 20.0, 40.0, 53.0, 118.0, 170.0, 314.0, 564.0, 1177.0, 2457.0, 6320.0, 21170.0, 82764.0, 331288.0, 431903.0, 124672.0, 30357.0, 8860.0, 3196.0, 1445.0, 644.0, 386.0, 234.0, 143.0, 72.0, 49.0, 16.0, 29.0, 13.0, 13.0, 6.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1170654296875, -0.11304855346679688, -0.10903167724609375, -0.10501480102539062, -0.1009979248046875, -0.09698104858398438, -0.09296417236328125, -0.08894729614257812, -0.084930419921875, -0.08091354370117188, -0.07689666748046875, -0.07287979125976562, -0.0688629150390625, -0.06484603881835938, -0.06082916259765625, -0.056812286376953125, -0.05279541015625, -0.048778533935546875, -0.04476165771484375, -0.040744781494140625, -0.0367279052734375, -0.032711029052734375, -0.02869415283203125, -0.024677276611328125, -0.020660400390625, -0.016643524169921875, -0.01262664794921875, -0.008609771728515625, -0.0045928955078125, -0.000576019287109375, 0.00344085693359375, 0.007457733154296875, 0.011474609375, 0.015491485595703125, 0.01950836181640625, 0.023525238037109375, 0.0275421142578125, 0.031558990478515625, 0.03557586669921875, 0.039592742919921875, 0.043609619140625, 0.047626495361328125, 0.05164337158203125, 0.055660247802734375, 0.0596771240234375, 0.06369400024414062, 0.06771087646484375, 0.07172775268554688, 0.07574462890625, 0.07976150512695312, 0.08377838134765625, 0.08779525756835938, 0.0918121337890625, 0.09582901000976562, 0.09984588623046875, 0.10386276245117188, 0.107879638671875, 0.11189651489257812, 0.11591339111328125, 0.11993026733398438, 0.1239471435546875, 0.12796401977539062, 0.13198089599609375, 0.13599777221679688, 0.1400146484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 9.0, 8.0, 10.0, 14.0, 22.0, 33.0, 27.0, 68.0, 68.0, 85.0, 91.0, 103.0, 99.0, 94.0, 74.0, 58.0, 36.0, 24.0, 20.0, 14.0, 14.0, 8.0, 10.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.681680679321289e-05, -6.51627779006958e-05, -6.350874900817871e-05, -6.185472011566162e-05, -6.020069122314453e-05, -5.854666233062744e-05, -5.689263343811035e-05, -5.523860454559326e-05, -5.358457565307617e-05, -5.193054676055908e-05, -5.027651786804199e-05, -4.86224889755249e-05, -4.696846008300781e-05, -4.531443119049072e-05, -4.366040229797363e-05, -4.200637340545654e-05, -4.035234451293945e-05, -3.869831562042236e-05, -3.7044286727905273e-05, -3.5390257835388184e-05, -3.3736228942871094e-05, -3.2082200050354004e-05, -3.0428171157836914e-05, -2.8774142265319824e-05, -2.7120113372802734e-05, -2.5466084480285645e-05, -2.3812055587768555e-05, -2.2158026695251465e-05, -2.0503997802734375e-05, -1.8849968910217285e-05, -1.7195940017700195e-05, -1.5541911125183105e-05, -1.3887882232666016e-05, -1.2233853340148926e-05, -1.0579824447631836e-05, -8.925795555114746e-06, -7.271766662597656e-06, -5.617737770080566e-06, -3.9637088775634766e-06, -2.3096799850463867e-06, -6.556510925292969e-07, 9.98377799987793e-07, 2.652406692504883e-06, 4.306435585021973e-06, 5.9604644775390625e-06, 7.614493370056152e-06, 9.268522262573242e-06, 1.0922551155090332e-05, 1.2576580047607422e-05, 1.4230608940124512e-05, 1.58846378326416e-05, 1.753866672515869e-05, 1.919269561767578e-05, 2.084672451019287e-05, 2.250075340270996e-05, 2.415478229522705e-05, 2.580881118774414e-05, 2.746284008026123e-05, 2.911686897277832e-05, 3.077089786529541e-05, 3.24249267578125e-05, 3.407895565032959e-05, 3.573298454284668e-05, 3.738701343536377e-05, 3.904104232788086e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 7.0, 4.0, 13.0, 6.0, 15.0, 10.0, 35.0, 47.0, 60.0, 82.0, 154.0, 266.0, 622.0, 1593.0, 5491.0, 26081.0, 177334.0, 634711.0, 169101.0, 24775.0, 5345.0, 1508.0, 626.0, 285.0, 147.0, 79.0, 42.0, 27.0, 29.0, 21.0, 12.0, 9.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2091064453125, -0.20286178588867188, -0.19661712646484375, -0.19037246704101562, -0.1841278076171875, -0.17788314819335938, -0.17163848876953125, -0.16539382934570312, -0.159149169921875, -0.15290451049804688, -0.14665985107421875, -0.14041519165039062, -0.1341705322265625, -0.12792587280273438, -0.12168121337890625, -0.11543655395507812, -0.10919189453125, -0.10294723510742188, -0.09670257568359375, -0.09045791625976562, -0.0842132568359375, -0.07796859741210938, -0.07172393798828125, -0.06547927856445312, -0.059234619140625, -0.052989959716796875, -0.04674530029296875, -0.040500640869140625, -0.0342559814453125, -0.028011322021484375, -0.02176666259765625, -0.015522003173828125, -0.00927734375, -0.003032684326171875, 0.00321197509765625, 0.009456634521484375, 0.0157012939453125, 0.021945953369140625, 0.02819061279296875, 0.034435272216796875, 0.040679931640625, 0.046924591064453125, 0.05316925048828125, 0.059413909912109375, 0.0656585693359375, 0.07190322875976562, 0.07814788818359375, 0.08439254760742188, 0.09063720703125, 0.09688186645507812, 0.10312652587890625, 0.10937118530273438, 0.1156158447265625, 0.12186050415039062, 0.12810516357421875, 0.13434982299804688, 0.140594482421875, 0.14683914184570312, 0.15308380126953125, 0.15932846069335938, 0.1655731201171875, 0.17181777954101562, 0.17806243896484375, 0.18430709838867188, 0.1905517578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 8.0, 16.0, 25.0, 26.0, 34.0, 42.0, 46.0, 68.0, 106.0, 84.0, 93.0, 85.0, 68.0, 63.0, 49.0, 44.0, 28.0, 18.0, 16.0, 19.0, 12.0, 8.0, 6.0, 5.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03863525390625, -0.037210941314697266, -0.03578662872314453, -0.0343623161315918, -0.03293800354003906, -0.03151369094848633, -0.030089378356933594, -0.02866506576538086, -0.027240753173828125, -0.02581644058227539, -0.024392127990722656, -0.022967815399169922, -0.021543502807617188, -0.020119190216064453, -0.01869487762451172, -0.017270565032958984, -0.01584625244140625, -0.014421939849853516, -0.012997627258300781, -0.011573314666748047, -0.010149002075195312, -0.008724689483642578, -0.007300376892089844, -0.005876064300537109, -0.004451751708984375, -0.0030274391174316406, -0.0016031265258789062, -0.00017881393432617188, 0.0012454986572265625, 0.002669811248779297, 0.004094123840332031, 0.005518436431884766, 0.0069427490234375, 0.008367061614990234, 0.009791374206542969, 0.011215686798095703, 0.012639999389648438, 0.014064311981201172, 0.015488624572753906, 0.01691293716430664, 0.018337249755859375, 0.01976156234741211, 0.021185874938964844, 0.022610187530517578, 0.024034500122070312, 0.025458812713623047, 0.02688312530517578, 0.028307437896728516, 0.02973175048828125, 0.031156063079833984, 0.03258037567138672, 0.03400468826293945, 0.03542900085449219, 0.03685331344604492, 0.038277626037597656, 0.03970193862915039, 0.041126251220703125, 0.04255056381225586, 0.043974876403808594, 0.04539918899536133, 0.04682350158691406, 0.0482478141784668, 0.04967212677001953, 0.051096439361572266, 0.052520751953125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 5.0, 16.0, 19.0, 46.0, 44.0, 80.0, 125.0, 140.0, 155.0, 127.0, 93.0, 57.0, 31.0, 27.0, 15.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.9136167764663696, -1.8592132329940796, -1.8048096895217896, -1.750406265258789, -1.696002721786499, -1.641599178314209, -1.587195634841919, -1.532792091369629, -1.4783885478973389, -1.4239850044250488, -1.3695814609527588, -1.3151779174804688, -1.2607744932174683, -1.2063709497451782, -1.1519674062728882, -1.0975638628005981, -1.0431604385375977, -0.9887568950653076, -0.9343534111976624, -0.8799498677253723, -0.825546383857727, -0.771142840385437, -0.716739296913147, -0.6623357534408569, -0.6079322695732117, -0.5535287261009216, -0.49912524223327637, -0.44472169876098633, -0.3903181850910187, -0.335914671421051, -0.281511127948761, -0.22710761427879333, -0.17270398139953613, -0.11830046027898788, -0.06389693915843964, -0.009493410587310791, 0.04491010308265686, 0.09931361675262451, 0.15371716022491455, 0.2081206738948822, 0.26252418756484985, 0.3169277012348175, 0.37133121490478516, 0.4257347583770752, 0.48013827204704285, 0.5345417857170105, 0.5889453291893005, 0.6433488130569458, 0.6977523565292358, 0.7521559000015259, 0.8065593838691711, 0.8609629273414612, 0.9153664112091064, 0.9697699546813965, 1.0241734981536865, 1.0785770416259766, 1.1329805850982666, 1.1873841285705566, 1.2417876720428467, 1.2961912155151367, 1.3505946397781372, 1.4049981832504272, 1.4594017267227173, 1.5138052701950073, 1.5682086944580078]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 5.0, 3.0, 6.0, 5.0, 4.0, 8.0, 6.0, 24.0, 19.0, 26.0, 28.0, 26.0, 24.0, 42.0, 36.0, 27.0, 38.0, 42.0, 44.0, 48.0, 45.0, 51.0, 46.0, 49.0, 40.0, 35.0, 39.0, 43.0, 28.0, 24.0, 26.0, 16.0, 14.0, 21.0, 12.0, 11.0, 10.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6900408267974854, -0.6668879389762878, -0.6437351107597351, -0.6205822229385376, -0.5974293947219849, -0.5742765069007874, -0.5511236190795898, -0.5279707908630371, -0.5048179626464844, -0.48166510462760925, -0.45851224660873413, -0.4353593587875366, -0.4122065305709839, -0.3890536427497864, -0.36590078473091125, -0.34274792671203613, -0.3195950388908386, -0.2964421808719635, -0.2732893228530884, -0.25013643503189087, -0.22698359191417694, -0.20383073389530182, -0.1806778609752655, -0.15752500295639038, -0.13437214493751526, -0.11121928691864014, -0.08806642144918442, -0.0649135559797287, -0.04176069796085358, -0.018607839941978455, 0.004545032978057861, 0.027697890996932983, 0.05085068941116333, 0.07400354743003845, 0.09715641289949417, 0.12030927836894989, 0.143462136387825, 0.16661499440670013, 0.18976786732673645, 0.21292072534561157, 0.2360735833644867, 0.2592264413833618, 0.28237929940223694, 0.30553215742111206, 0.32868504524230957, 0.3518378734588623, 0.3749907612800598, 0.39814361929893494, 0.42129647731781006, 0.4444493353366852, 0.4676021933555603, 0.4907550811767578, 0.5139079093933105, 0.5370607972145081, 0.5602136850357056, 0.5833665132522583, 0.606519341468811, 0.6296722292900085, 0.6528250575065613, 0.6759779453277588, 0.6991307735443115, 0.722283661365509, 0.7454365491867065, 0.7685893774032593, 0.7917422652244568]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 22.0, 11.0, 14.0, 37.0, 58.0, 69.0, 113.0, 190.0, 250.0, 401.0, 650.0, 1077.0, 1981.0, 3666.0, 7669.0, 16575.0, 37859.0, 96839.0, 273034.0, 373937.0, 138502.0, 52737.0, 22162.0, 9997.0, 4762.0, 2435.0, 1358.0, 806.0, 450.0, 290.0, 181.0, 130.0, 86.0, 60.0, 30.0, 29.0, 17.0, 17.0, 12.0, 9.0, 4.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.52685546875, -0.5104827880859375, -0.494110107421875, -0.4777374267578125, -0.46136474609375, -0.4449920654296875, -0.428619384765625, -0.4122467041015625, -0.3958740234375, -0.3795013427734375, -0.363128662109375, -0.3467559814453125, -0.33038330078125, -0.3140106201171875, -0.297637939453125, -0.2812652587890625, -0.264892578125, -0.2485198974609375, -0.232147216796875, -0.2157745361328125, -0.19940185546875, -0.1830291748046875, -0.166656494140625, -0.1502838134765625, -0.1339111328125, -0.1175384521484375, -0.101165771484375, -0.0847930908203125, -0.06842041015625, -0.0520477294921875, -0.035675048828125, -0.0193023681640625, -0.0029296875, 0.0134429931640625, 0.029815673828125, 0.0461883544921875, 0.06256103515625, 0.0789337158203125, 0.095306396484375, 0.1116790771484375, 0.1280517578125, 0.1444244384765625, 0.160797119140625, 0.1771697998046875, 0.19354248046875, 0.2099151611328125, 0.226287841796875, 0.2426605224609375, 0.259033203125, 0.2754058837890625, 0.291778564453125, 0.3081512451171875, 0.32452392578125, 0.3408966064453125, 0.357269287109375, 0.3736419677734375, 0.3900146484375, 0.4063873291015625, 0.422760009765625, 0.4391326904296875, 0.45550537109375, 0.4718780517578125, 0.488250732421875, 0.5046234130859375, 0.52099609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 4.0, 5.0, 6.0, 12.0, 9.0, 11.0, 11.0, 26.0, 22.0, 31.0, 33.0, 19.0, 31.0, 46.0, 35.0, 40.0, 43.0, 50.0, 57.0, 46.0, 53.0, 54.0, 43.0, 37.0, 41.0, 42.0, 29.0, 32.0, 18.0, 19.0, 11.0, 20.0, 14.0, 13.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.369140625, -1.3199920654296875, -1.270843505859375, -1.2216949462890625, -1.17254638671875, -1.1233978271484375, -1.074249267578125, -1.0251007080078125, -0.9759521484375, -0.9268035888671875, -0.877655029296875, -0.8285064697265625, -0.77935791015625, -0.7302093505859375, -0.681060791015625, -0.6319122314453125, -0.582763671875, -0.5336151123046875, -0.484466552734375, -0.4353179931640625, -0.38616943359375, -0.3370208740234375, -0.287872314453125, -0.2387237548828125, -0.1895751953125, -0.1404266357421875, -0.091278076171875, -0.0421295166015625, 0.00701904296875, 0.0561676025390625, 0.105316162109375, 0.1544647216796875, 0.20361328125, 0.2527618408203125, 0.301910400390625, 0.3510589599609375, 0.40020751953125, 0.4493560791015625, 0.498504638671875, 0.5476531982421875, 0.5968017578125, 0.6459503173828125, 0.695098876953125, 0.7442474365234375, 0.79339599609375, 0.8425445556640625, 0.891693115234375, 0.9408416748046875, 0.989990234375, 1.0391387939453125, 1.088287353515625, 1.1374359130859375, 1.18658447265625, 1.2357330322265625, 1.284881591796875, 1.3340301513671875, 1.3831787109375, 1.4323272705078125, 1.481475830078125, 1.5306243896484375, 1.57977294921875, 1.6289215087890625, 1.678070068359375, 1.7272186279296875, 1.7763671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 9.0, 3.0, 10.0, 12.0, 10.0, 24.0, 22.0, 37.0, 40.0, 71.0, 107.0, 127.0, 216.0, 375.0, 839.0, 3478.0, 41929.0, 795689.0, 193562.0, 9163.0, 1478.0, 545.0, 273.0, 166.0, 103.0, 80.0, 57.0, 32.0, 26.0, 21.0, 8.0, 13.0, 6.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9853515625, -1.9312896728515625, -1.877227783203125, -1.8231658935546875, -1.76910400390625, -1.7150421142578125, -1.660980224609375, -1.6069183349609375, -1.5528564453125, -1.4987945556640625, -1.444732666015625, -1.3906707763671875, -1.33660888671875, -1.2825469970703125, -1.228485107421875, -1.1744232177734375, -1.120361328125, -1.0662994384765625, -1.012237548828125, -0.9581756591796875, -0.90411376953125, -0.8500518798828125, -0.795989990234375, -0.7419281005859375, -0.6878662109375, -0.6338043212890625, -0.579742431640625, -0.5256805419921875, -0.47161865234375, -0.4175567626953125, -0.363494873046875, -0.3094329833984375, -0.25537109375, -0.2013092041015625, -0.147247314453125, -0.0931854248046875, -0.03912353515625, 0.0149383544921875, 0.069000244140625, 0.1230621337890625, 0.1771240234375, 0.2311859130859375, 0.285247802734375, 0.3393096923828125, 0.39337158203125, 0.4474334716796875, 0.501495361328125, 0.5555572509765625, 0.609619140625, 0.6636810302734375, 0.717742919921875, 0.7718048095703125, 0.82586669921875, 0.8799285888671875, 0.933990478515625, 0.9880523681640625, 1.0421142578125, 1.0961761474609375, 1.150238037109375, 1.2042999267578125, 1.25836181640625, 1.3124237060546875, 1.366485595703125, 1.4205474853515625, 1.474609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 7.0, 3.0, 6.0, 8.0, 5.0, 10.0, 9.0, 7.0, 13.0, 12.0, 12.0, 15.0, 21.0, 23.0, 20.0, 29.0, 42.0, 35.0, 37.0, 43.0, 43.0, 34.0, 37.0, 30.0, 50.0, 44.0, 39.0, 36.0, 35.0, 33.0, 21.0, 27.0, 33.0, 37.0, 19.0, 17.0, 12.0, 17.0, 5.0, 19.0, 6.0, 13.0, 8.0, 8.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0], "bins": [-1.701171875, -1.6514739990234375, -1.601776123046875, -1.5520782470703125, -1.50238037109375, -1.4526824951171875, -1.402984619140625, -1.3532867431640625, -1.3035888671875, -1.2538909912109375, -1.204193115234375, -1.1544952392578125, -1.10479736328125, -1.0550994873046875, -1.005401611328125, -0.9557037353515625, -0.906005859375, -0.8563079833984375, -0.806610107421875, -0.7569122314453125, -0.70721435546875, -0.6575164794921875, -0.607818603515625, -0.5581207275390625, -0.5084228515625, -0.4587249755859375, -0.409027099609375, -0.3593292236328125, -0.30963134765625, -0.2599334716796875, -0.210235595703125, -0.1605377197265625, -0.11083984375, -0.0611419677734375, -0.011444091796875, 0.0382537841796875, 0.08795166015625, 0.1376495361328125, 0.187347412109375, 0.2370452880859375, 0.2867431640625, 0.3364410400390625, 0.386138916015625, 0.4358367919921875, 0.48553466796875, 0.5352325439453125, 0.584930419921875, 0.6346282958984375, 0.684326171875, 0.7340240478515625, 0.783721923828125, 0.8334197998046875, 0.88311767578125, 0.9328155517578125, 0.982513427734375, 1.0322113037109375, 1.0819091796875, 1.1316070556640625, 1.181304931640625, 1.2310028076171875, 1.28070068359375, 1.3303985595703125, 1.380096435546875, 1.4297943115234375, 1.4794921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 6.0, 22.0, 44.0, 84.0, 209.0, 1260.0, 119956.0, 923073.0, 3244.0, 401.0, 122.0, 53.0, 26.0, 13.0, 8.0, 6.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.2867584228515625, -1.237579345703125, -1.1884002685546875, -1.13922119140625, -1.0900421142578125, -1.040863037109375, -0.9916839599609375, -0.9425048828125, -0.8933258056640625, -0.844146728515625, -0.7949676513671875, -0.74578857421875, -0.6966094970703125, -0.647430419921875, -0.5982513427734375, -0.549072265625, -0.4998931884765625, -0.450714111328125, -0.4015350341796875, -0.35235595703125, -0.3031768798828125, -0.253997802734375, -0.2048187255859375, -0.1556396484375, -0.1064605712890625, -0.057281494140625, -0.0081024169921875, 0.04107666015625, 0.0902557373046875, 0.139434814453125, 0.1886138916015625, 0.23779296875, 0.2869720458984375, 0.336151123046875, 0.3853302001953125, 0.43450927734375, 0.4836883544921875, 0.532867431640625, 0.5820465087890625, 0.6312255859375, 0.6804046630859375, 0.729583740234375, 0.7787628173828125, 0.82794189453125, 0.8771209716796875, 0.926300048828125, 0.9754791259765625, 1.024658203125, 1.0738372802734375, 1.123016357421875, 1.1721954345703125, 1.22137451171875, 1.2705535888671875, 1.319732666015625, 1.3689117431640625, 1.4180908203125, 1.4672698974609375, 1.516448974609375, 1.5656280517578125, 1.61480712890625, 1.6639862060546875, 1.713165283203125, 1.7623443603515625, 1.8115234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 10.0, 7.0, 5.0, 10.0, 14.0, 20.0, 39.0, 58.0, 107.0, 143.0, 166.0, 141.0, 110.0, 61.0, 45.0, 19.0, 20.0, 13.0, 10.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010859966278076172, -0.0001061074435710907, -0.00010361522436141968, -0.00010112300515174866, -9.863078594207764e-05, -9.613856673240662e-05, -9.36463475227356e-05, -9.115412831306458e-05, -8.866190910339355e-05, -8.616968989372253e-05, -8.367747068405151e-05, -8.118525147438049e-05, -7.869303226470947e-05, -7.620081305503845e-05, -7.370859384536743e-05, -7.121637463569641e-05, -6.872415542602539e-05, -6.623193621635437e-05, -6.373971700668335e-05, -6.124749779701233e-05, -5.875527858734131e-05, -5.626305937767029e-05, -5.377084016799927e-05, -5.127862095832825e-05, -4.8786401748657227e-05, -4.6294182538986206e-05, -4.3801963329315186e-05, -4.1309744119644165e-05, -3.8817524909973145e-05, -3.6325305700302124e-05, -3.3833086490631104e-05, -3.134086728096008e-05, -2.8848648071289062e-05, -2.6356428861618042e-05, -2.386420965194702e-05, -2.1371990442276e-05, -1.887977123260498e-05, -1.638755202293396e-05, -1.389533281326294e-05, -1.1403113603591919e-05, -8.910894393920898e-06, -6.418675184249878e-06, -3.926455974578857e-06, -1.434236764907837e-06, 1.0579824447631836e-06, 3.550201654434204e-06, 6.042420864105225e-06, 8.534640073776245e-06, 1.1026859283447266e-05, 1.3519078493118286e-05, 1.6011297702789307e-05, 1.8503516912460327e-05, 2.0995736122131348e-05, 2.3487955331802368e-05, 2.598017454147339e-05, 2.847239375114441e-05, 3.096461296081543e-05, 3.345683217048645e-05, 3.594905138015747e-05, 3.844127058982849e-05, 4.093348979949951e-05, 4.342570900917053e-05, 4.591792821884155e-05, 4.841014742851257e-05, 5.0902366638183594e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 8.0, 9.0, 12.0, 19.0, 24.0, 56.0, 88.0, 219.0, 772.0, 4735.0, 702743.0, 335381.0, 3555.0, 583.0, 168.0, 74.0, 32.0, 22.0, 20.0, 12.0, 10.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.884765625, -1.8418731689453125, -1.798980712890625, -1.7560882568359375, -1.71319580078125, -1.6703033447265625, -1.627410888671875, -1.5845184326171875, -1.5416259765625, -1.4987335205078125, -1.455841064453125, -1.4129486083984375, -1.37005615234375, -1.3271636962890625, -1.284271240234375, -1.2413787841796875, -1.198486328125, -1.1555938720703125, -1.112701416015625, -1.0698089599609375, -1.02691650390625, -0.9840240478515625, -0.941131591796875, -0.8982391357421875, -0.8553466796875, -0.8124542236328125, -0.769561767578125, -0.7266693115234375, -0.68377685546875, -0.6408843994140625, -0.597991943359375, -0.5550994873046875, -0.51220703125, -0.4693145751953125, -0.426422119140625, -0.3835296630859375, -0.34063720703125, -0.2977447509765625, -0.254852294921875, -0.2119598388671875, -0.1690673828125, -0.1261749267578125, -0.083282470703125, -0.0403900146484375, 0.00250244140625, 0.0453948974609375, 0.088287353515625, 0.1311798095703125, 0.174072265625, 0.2169647216796875, 0.259857177734375, 0.3027496337890625, 0.34564208984375, 0.3885345458984375, 0.431427001953125, 0.4743194580078125, 0.5172119140625, 0.5601043701171875, 0.602996826171875, 0.6458892822265625, 0.68878173828125, 0.7316741943359375, 0.774566650390625, 0.8174591064453125, 0.8603515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 6.0, 15.0, 20.0, 54.0, 69.0, 124.0, 163.0, 187.0, 127.0, 76.0, 53.0, 36.0, 20.0, 10.0, 10.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.25634765625, -0.24568557739257812, -0.23502349853515625, -0.22436141967773438, -0.2136993408203125, -0.20303726196289062, -0.19237518310546875, -0.18171310424804688, -0.171051025390625, -0.16038894653320312, -0.14972686767578125, -0.13906478881835938, -0.1284027099609375, -0.11774063110351562, -0.10707855224609375, -0.09641647338867188, -0.08575439453125, -0.07509231567382812, -0.06443023681640625, -0.053768157958984375, -0.0431060791015625, -0.032444000244140625, -0.02178192138671875, -0.011119842529296875, -0.000457763671875, 0.010204315185546875, 0.02086639404296875, 0.031528472900390625, 0.0421905517578125, 0.052852630615234375, 0.06351470947265625, 0.07417678833007812, 0.0848388671875, 0.09550094604492188, 0.10616302490234375, 0.11682510375976562, 0.1274871826171875, 0.13814926147460938, 0.14881134033203125, 0.15947341918945312, 0.170135498046875, 0.18079757690429688, 0.19145965576171875, 0.20212173461914062, 0.2127838134765625, 0.22344589233398438, 0.23410797119140625, 0.24477005004882812, 0.25543212890625, 0.2660942077636719, 0.27675628662109375, 0.2874183654785156, 0.2980804443359375, 0.3087425231933594, 0.31940460205078125, 0.3300666809082031, 0.340728759765625, 0.3513908386230469, 0.36205291748046875, 0.3727149963378906, 0.3833770751953125, 0.3940391540527344, 0.40470123291015625, 0.4153633117675781, 0.426025390625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 10.0, 40.0, 60.0, 105.0, 170.0, 201.0, 169.0, 100.0, 68.0, 34.0, 16.0, 9.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.5707292556762695, -6.426671028137207, -6.2826128005981445, -6.13855504989624, -5.994496822357178, -5.850438594818115, -5.706380367279053, -5.56232213973999, -5.418264389038086, -5.274206161499023, -5.130147933959961, -4.986090183258057, -4.842031955718994, -4.697973728179932, -4.553915500640869, -4.409857273101807, -4.265799045562744, -4.121740818023682, -3.9776828289031982, -3.8336246013641357, -3.6895666122436523, -3.54550838470459, -3.4014501571655273, -3.257391929626465, -3.1133339405059814, -2.969275712966919, -2.8252177238464355, -2.681159496307373, -2.5371012687683105, -2.393043279647827, -2.2489850521087646, -2.1049270629882812, -1.9608688354492188, -1.8168107271194458, -1.6727526187896729, -1.5286943912506104, -1.3846362829208374, -1.2405781745910645, -1.096519947052002, -0.952461838722229, -0.808403730392456, -0.6643456220626831, -0.5202874541282654, -0.37622931599617004, -0.2321711778640747, -0.08811306953430176, 0.05594509840011597, 0.2000032663345337, 0.34406137466430664, 0.488119512796402, 0.6321776509284973, 0.776235818862915, 0.920293927192688, 1.064352035522461, 1.2084102630615234, 1.3524683713912964, 1.4965264797210693, 1.6405845880508423, 1.7846426963806152, 1.9287009239196777, 2.0727591514587402, 2.2168171405792236, 2.360875368118286, 2.5049333572387695, 2.648991584777832]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 0.0, 5.0, 6.0, 6.0, 12.0, 10.0, 11.0, 18.0, 24.0, 16.0, 26.0, 22.0, 19.0, 21.0, 40.0, 40.0, 34.0, 49.0, 35.0, 36.0, 28.0, 42.0, 40.0, 20.0, 45.0, 34.0, 51.0, 41.0, 34.0, 28.0, 28.0, 27.0, 32.0, 23.0, 12.0, 12.0, 16.0, 17.0, 8.0, 2.0, 8.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.7254226207733154, -2.6395819187164307, -2.553741216659546, -2.467900514602661, -2.3820598125457764, -2.2962191104888916, -2.210378646850586, -2.124537944793701, -2.0386972427368164, -1.9528565406799316, -1.8670158386230469, -1.781175136566162, -1.6953344345092773, -1.6094937324523926, -1.5236531496047974, -1.4378124475479126, -1.3519716262817383, -1.2661309242248535, -1.1802902221679688, -1.094449520111084, -1.0086088180541992, -0.9227681756019592, -0.8369275331497192, -0.7510868310928345, -0.6652461290359497, -0.5794054269790649, -0.49356475472450256, -0.4077240824699402, -0.3218833804130554, -0.23604267835617065, -0.15020203590393066, -0.0643613338470459, 0.021479368209838867, 0.10732005536556244, 0.193160742521286, 0.2790014147758484, 0.36484211683273315, 0.4506828188896179, 0.5365234613418579, 0.6223641633987427, 0.7082048654556274, 0.7940455675125122, 0.879886269569397, 0.965726912021637, 1.051567554473877, 1.1374082565307617, 1.2232489585876465, 1.3090896606445312, 1.394930362701416, 1.4807710647583008, 1.5666117668151855, 1.6524524688720703, 1.738293170928955, 1.8241338729858398, 1.909974455833435, 1.9958151578903198, 2.081655979156494, 2.167496681213379, 2.2533373832702637, 2.3391780853271484, 2.425018787384033, 2.510859489440918, 2.5967001914978027, 2.6825408935546875, 2.768381357192993]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 10.0, 17.0, 8.0, 8.0, 19.0, 26.0, 29.0, 27.0, 56.0, 65.0, 104.0, 166.0, 252.0, 403.0, 743.0, 1316.0, 2641.0, 5989.0, 16103.0, 56159.0, 270214.0, 1298996.0, 1871141.0, 525483.0, 102917.0, 25506.0, 8461.0, 3402.0, 1620.0, 889.0, 515.0, 325.0, 213.0, 118.0, 110.0, 71.0, 45.0, 36.0, 24.0, 17.0, 8.0, 15.0, 0.0, 7.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.201171875, -1.1649932861328125, -1.128814697265625, -1.0926361083984375, -1.05645751953125, -1.0202789306640625, -0.984100341796875, -0.9479217529296875, -0.9117431640625, -0.8755645751953125, -0.839385986328125, -0.8032073974609375, -0.76702880859375, -0.7308502197265625, -0.694671630859375, -0.6584930419921875, -0.622314453125, -0.5861358642578125, -0.549957275390625, -0.5137786865234375, -0.47760009765625, -0.4414215087890625, -0.405242919921875, -0.3690643310546875, -0.3328857421875, -0.2967071533203125, -0.260528564453125, -0.2243499755859375, -0.18817138671875, -0.1519927978515625, -0.115814208984375, -0.0796356201171875, -0.04345703125, -0.0072784423828125, 0.028900146484375, 0.0650787353515625, 0.10125732421875, 0.1374359130859375, 0.173614501953125, 0.2097930908203125, 0.2459716796875, 0.2821502685546875, 0.318328857421875, 0.3545074462890625, 0.39068603515625, 0.4268646240234375, 0.463043212890625, 0.4992218017578125, 0.535400390625, 0.5715789794921875, 0.607757568359375, 0.6439361572265625, 0.68011474609375, 0.7162933349609375, 0.752471923828125, 0.7886505126953125, 0.8248291015625, 0.8610076904296875, 0.897186279296875, 0.9333648681640625, 0.96954345703125, 1.0057220458984375, 1.041900634765625, 1.0780792236328125, 1.1142578125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 12.0, 8.0, 17.0, 25.0, 21.0, 22.0, 25.0, 43.0, 46.0, 48.0, 60.0, 45.0, 60.0, 54.0, 54.0, 61.0, 56.0, 44.0, 50.0, 45.0, 40.0, 39.0, 32.0, 11.0, 13.0, 19.0, 10.0, 6.0, 8.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.919921875, -0.8827056884765625, -0.845489501953125, -0.8082733154296875, -0.77105712890625, -0.7338409423828125, -0.696624755859375, -0.6594085693359375, -0.6221923828125, -0.5849761962890625, -0.547760009765625, -0.5105438232421875, -0.47332763671875, -0.4361114501953125, -0.398895263671875, -0.3616790771484375, -0.324462890625, -0.2872467041015625, -0.250030517578125, -0.2128143310546875, -0.17559814453125, -0.1383819580078125, -0.101165771484375, -0.0639495849609375, -0.0267333984375, 0.0104827880859375, 0.047698974609375, 0.0849151611328125, 0.12213134765625, 0.1593475341796875, 0.196563720703125, 0.2337799072265625, 0.27099609375, 0.3082122802734375, 0.345428466796875, 0.3826446533203125, 0.41986083984375, 0.4570770263671875, 0.494293212890625, 0.5315093994140625, 0.5687255859375, 0.6059417724609375, 0.643157958984375, 0.6803741455078125, 0.71759033203125, 0.7548065185546875, 0.792022705078125, 0.8292388916015625, 0.866455078125, 0.9036712646484375, 0.940887451171875, 0.9781036376953125, 1.01531982421875, 1.0525360107421875, 1.089752197265625, 1.1269683837890625, 1.1641845703125, 1.2014007568359375, 1.238616943359375, 1.2758331298828125, 1.31304931640625, 1.3502655029296875, 1.387481689453125, 1.4246978759765625, 1.4619140625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 8.0, 10.0, 15.0, 27.0, 32.0, 50.0, 108.0, 171.0, 340.0, 713.0, 1875.0, 7454.0, 82703.0, 3764510.0, 316663.0, 14816.0, 2857.0, 937.0, 441.0, 195.0, 128.0, 85.0, 45.0, 22.0, 21.0, 9.0, 13.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849609375, -2.753570556640625, -2.65753173828125, -2.561492919921875, -2.4654541015625, -2.369415283203125, -2.27337646484375, -2.177337646484375, -2.081298828125, -1.985260009765625, -1.88922119140625, -1.793182373046875, -1.6971435546875, -1.601104736328125, -1.50506591796875, -1.409027099609375, -1.31298828125, -1.216949462890625, -1.12091064453125, -1.024871826171875, -0.9288330078125, -0.832794189453125, -0.73675537109375, -0.640716552734375, -0.544677734375, -0.448638916015625, -0.35260009765625, -0.256561279296875, -0.1605224609375, -0.064483642578125, 0.03155517578125, 0.127593994140625, 0.2236328125, 0.319671630859375, 0.41571044921875, 0.511749267578125, 0.6077880859375, 0.703826904296875, 0.79986572265625, 0.895904541015625, 0.991943359375, 1.087982177734375, 1.18402099609375, 1.280059814453125, 1.3760986328125, 1.472137451171875, 1.56817626953125, 1.664215087890625, 1.76025390625, 1.856292724609375, 1.95233154296875, 2.048370361328125, 2.1444091796875, 2.240447998046875, 2.33648681640625, 2.432525634765625, 2.528564453125, 2.624603271484375, 2.72064208984375, 2.816680908203125, 2.9127197265625, 3.008758544921875, 3.10479736328125, 3.200836181640625, 3.296875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 9.0, 6.0, 14.0, 21.0, 24.0, 41.0, 64.0, 104.0, 164.0, 300.0, 550.0, 782.0, 770.0, 509.0, 304.0, 168.0, 97.0, 37.0, 37.0, 25.0, 17.0, 6.0, 7.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.5859603881835938, -0.5649871826171875, -0.5440139770507812, -0.523040771484375, -0.5020675659179688, -0.4810943603515625, -0.46012115478515625, -0.43914794921875, -0.41817474365234375, -0.3972015380859375, -0.37622833251953125, -0.355255126953125, -0.33428192138671875, -0.3133087158203125, -0.29233551025390625, -0.2713623046875, -0.25038909912109375, -0.2294158935546875, -0.20844268798828125, -0.187469482421875, -0.16649627685546875, -0.1455230712890625, -0.12454986572265625, -0.10357666015625, -0.08260345458984375, -0.0616302490234375, -0.04065704345703125, -0.019683837890625, 0.00128936767578125, 0.0222625732421875, 0.04323577880859375, 0.064208984375, 0.08518218994140625, 0.1061553955078125, 0.12712860107421875, 0.148101806640625, 0.16907501220703125, 0.1900482177734375, 0.21102142333984375, 0.23199462890625, 0.25296783447265625, 0.2739410400390625, 0.29491424560546875, 0.315887451171875, 0.33686065673828125, 0.3578338623046875, 0.37880706787109375, 0.3997802734375, 0.42075347900390625, 0.4417266845703125, 0.46269989013671875, 0.483673095703125, 0.5046463012695312, 0.5256195068359375, 0.5465927124023438, 0.56756591796875, 0.5885391235351562, 0.6095123291015625, 0.6304855346679688, 0.651458740234375, 0.6724319458007812, 0.6934051513671875, 0.7143783569335938, 0.7353515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 12.0, 7.0, 29.0, 36.0, 62.0, 84.0, 101.0, 138.0, 134.0, 123.0, 100.0, 74.0, 41.0, 25.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4242005348205566, -2.33559513092041, -2.2469897270202637, -2.158384323120117, -2.0697786808013916, -1.9811732769012451, -1.8925678730010986, -1.8039624691009521, -1.7153569459915161, -1.6267515420913696, -1.5381460189819336, -1.449540615081787, -1.3609352111816406, -1.2723296880722046, -1.183724284172058, -1.095118761062622, -1.0065133571624756, -0.9179078936576843, -0.8293024301528931, -0.7406970262527466, -0.6520915627479553, -0.5634860992431641, -0.4748806953430176, -0.3862752318382263, -0.29766976833343506, -0.209064319729805, -0.12045887112617493, -0.031853437423706055, 0.056752026081085205, 0.14535748958587646, 0.23396289348602295, 0.3225683569908142, 0.41117382049560547, 0.49977928400039673, 0.588384747505188, 0.6769901514053345, 0.7655956149101257, 0.854201078414917, 0.9428064823150635, 1.03141188621521, 1.120017409324646, 1.2086228132247925, 1.2972283363342285, 1.385833740234375, 1.4744391441345215, 1.5630446672439575, 1.651650071144104, 1.74025559425354, 1.8288609981536865, 1.917466402053833, 2.0060718059539795, 2.094677448272705, 2.1832828521728516, 2.271888256072998, 2.3604936599731445, 2.449099063873291, 2.5377044677734375, 2.626309871673584, 2.7149152755737305, 2.803520679473877, 2.8921263217926025, 2.980731725692749, 3.0693371295928955, 3.157942533493042, 3.2465481758117676]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 10.0, 11.0, 13.0, 20.0, 16.0, 27.0, 27.0, 18.0, 20.0, 34.0, 39.0, 42.0, 31.0, 35.0, 40.0, 46.0, 31.0, 39.0, 39.0, 35.0, 35.0, 50.0, 34.0, 48.0, 41.0, 36.0, 23.0, 24.0, 23.0, 29.0, 13.0, 15.0, 13.0, 4.0, 8.0, 1.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0734831094741821, -1.0392005443572998, -1.0049179792404175, -0.9706354737281799, -0.9363529086112976, -0.9020703434944153, -0.8677878379821777, -0.8335052728652954, -0.7992227077484131, -0.7649401426315308, -0.7306575775146484, -0.6963750720024109, -0.6620925068855286, -0.6278099417686462, -0.5935274362564087, -0.5592448711395264, -0.524962306022644, -0.4906797409057617, -0.4563972055912018, -0.42211467027664185, -0.3878321051597595, -0.3535495400428772, -0.31926700472831726, -0.2849844694137573, -0.250701904296875, -0.21641935408115387, -0.18213680386543274, -0.1478542536497116, -0.11357170343399048, -0.07928915321826935, -0.04500660300254822, -0.010724052786827087, 0.023558378219604492, 0.05784092843532562, 0.09212347865104675, 0.12640602886676788, 0.160688579082489, 0.19497112929821014, 0.22925367951393127, 0.2635362148284912, 0.29781877994537354, 0.33210134506225586, 0.3663838803768158, 0.40066641569137573, 0.43494898080825806, 0.4692315459251404, 0.5035140514373779, 0.5377966165542603, 0.5720791816711426, 0.6063617467880249, 0.6406443119049072, 0.6749268174171448, 0.7092093825340271, 0.7434919476509094, 0.777774453163147, 0.8120570182800293, 0.8463395833969116, 0.880622148513794, 0.9149047136306763, 0.9491872191429138, 0.9834697842597961, 1.0177522897720337, 1.052034854888916, 1.0863174200057983, 1.1205999851226807]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 6.0, 11.0, 14.0, 17.0, 29.0, 66.0, 101.0, 165.0, 235.0, 463.0, 841.0, 1497.0, 3073.0, 6903.0, 17291.0, 61097.0, 286285.0, 487876.0, 131387.0, 31189.0, 10664.0, 4571.0, 2180.0, 1121.0, 598.0, 319.0, 218.0, 115.0, 86.0, 49.0, 26.0, 18.0, 8.0, 13.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.51513671875, -0.5013084411621094, -0.48748016357421875, -0.4736518859863281, -0.4598236083984375, -0.4459953308105469, -0.43216705322265625, -0.4183387756347656, -0.404510498046875, -0.3906822204589844, -0.37685394287109375, -0.3630256652832031, -0.3491973876953125, -0.3353691101074219, -0.32154083251953125, -0.3077125549316406, -0.29388427734375, -0.2800559997558594, -0.26622772216796875, -0.2523994445800781, -0.2385711669921875, -0.22474288940429688, -0.21091461181640625, -0.19708633422851562, -0.183258056640625, -0.16942977905273438, -0.15560150146484375, -0.14177322387695312, -0.1279449462890625, -0.11411666870117188, -0.10028839111328125, -0.08646011352539062, -0.0726318359375, -0.058803558349609375, -0.04497528076171875, -0.031147003173828125, -0.0173187255859375, -0.003490447998046875, 0.01033782958984375, 0.024166107177734375, 0.037994384765625, 0.051822662353515625, 0.06565093994140625, 0.07947921752929688, 0.0933074951171875, 0.10713577270507812, 0.12096405029296875, 0.13479232788085938, 0.14862060546875, 0.16244888305664062, 0.17627716064453125, 0.19010543823242188, 0.2039337158203125, 0.21776199340820312, 0.23159027099609375, 0.24541854858398438, 0.259246826171875, 0.2730751037597656, 0.28690338134765625, 0.3007316589355469, 0.3145599365234375, 0.3283882141113281, 0.34221649169921875, 0.3560447692871094, 0.369873046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 12.0, 9.0, 7.0, 11.0, 23.0, 28.0, 25.0, 33.0, 38.0, 47.0, 36.0, 44.0, 60.0, 51.0, 43.0, 44.0, 40.0, 54.0, 51.0, 59.0, 55.0, 48.0, 39.0, 30.0, 26.0, 26.0, 14.0, 13.0, 10.0, 10.0, 3.0, 1.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81005859375, -0.78265380859375, -0.7552490234375, -0.72784423828125, -0.700439453125, -0.67303466796875, -0.6456298828125, -0.61822509765625, -0.5908203125, -0.56341552734375, -0.5360107421875, -0.50860595703125, -0.481201171875, -0.45379638671875, -0.4263916015625, -0.39898681640625, -0.37158203125, -0.34417724609375, -0.3167724609375, -0.28936767578125, -0.261962890625, -0.23455810546875, -0.2071533203125, -0.17974853515625, -0.15234375, -0.12493896484375, -0.0975341796875, -0.07012939453125, -0.042724609375, -0.01531982421875, 0.0120849609375, 0.03948974609375, 0.06689453125, 0.09429931640625, 0.1217041015625, 0.14910888671875, 0.176513671875, 0.20391845703125, 0.2313232421875, 0.25872802734375, 0.2861328125, 0.31353759765625, 0.3409423828125, 0.36834716796875, 0.395751953125, 0.42315673828125, 0.4505615234375, 0.47796630859375, 0.50537109375, 0.53277587890625, 0.5601806640625, 0.58758544921875, 0.614990234375, 0.64239501953125, 0.6697998046875, 0.69720458984375, 0.724609375, 0.75201416015625, 0.7794189453125, 0.80682373046875, 0.834228515625, 0.86163330078125, 0.8890380859375, 0.91644287109375, 0.94384765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 5.0, 5.0, 6.0, 9.0, 11.0, 16.0, 24.0, 38.0, 54.0, 92.0, 119.0, 171.0, 250.0, 406.0, 658.0, 1112.0, 2173.0, 4531.0, 12902.0, 72985.0, 587100.0, 316645.0, 33425.0, 8131.0, 3408.0, 1691.0, 900.0, 604.0, 351.0, 246.0, 154.0, 95.0, 78.0, 37.0, 37.0, 23.0, 15.0, 15.0, 8.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.53125, -0.513427734375, -0.49560546875, -0.477783203125, -0.4599609375, -0.442138671875, -0.42431640625, -0.406494140625, -0.388671875, -0.370849609375, -0.35302734375, -0.335205078125, -0.3173828125, -0.299560546875, -0.28173828125, -0.263916015625, -0.24609375, -0.228271484375, -0.21044921875, -0.192626953125, -0.1748046875, -0.156982421875, -0.13916015625, -0.121337890625, -0.103515625, -0.085693359375, -0.06787109375, -0.050048828125, -0.0322265625, -0.014404296875, 0.00341796875, 0.021240234375, 0.0390625, 0.056884765625, 0.07470703125, 0.092529296875, 0.1103515625, 0.128173828125, 0.14599609375, 0.163818359375, 0.181640625, 0.199462890625, 0.21728515625, 0.235107421875, 0.2529296875, 0.270751953125, 0.28857421875, 0.306396484375, 0.32421875, 0.342041015625, 0.35986328125, 0.377685546875, 0.3955078125, 0.413330078125, 0.43115234375, 0.448974609375, 0.466796875, 0.484619140625, 0.50244140625, 0.520263671875, 0.5380859375, 0.555908203125, 0.57373046875, 0.591552734375, 0.609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 9.0, 6.0, 2.0, 7.0, 11.0, 14.0, 25.0, 20.0, 27.0, 21.0, 34.0, 31.0, 38.0, 41.0, 55.0, 60.0, 44.0, 47.0, 61.0, 52.0, 47.0, 48.0, 49.0, 30.0, 29.0, 54.0, 28.0, 27.0, 18.0, 16.0, 9.0, 8.0, 6.0, 10.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.58984375, -1.5363922119140625, -1.482940673828125, -1.4294891357421875, -1.37603759765625, -1.3225860595703125, -1.269134521484375, -1.2156829833984375, -1.1622314453125, -1.1087799072265625, -1.055328369140625, -1.0018768310546875, -0.94842529296875, -0.8949737548828125, -0.841522216796875, -0.7880706787109375, -0.734619140625, -0.6811676025390625, -0.627716064453125, -0.5742645263671875, -0.52081298828125, -0.4673614501953125, -0.413909912109375, -0.3604583740234375, -0.3070068359375, -0.2535552978515625, -0.200103759765625, -0.1466522216796875, -0.09320068359375, -0.0397491455078125, 0.013702392578125, 0.0671539306640625, 0.12060546875, 0.1740570068359375, 0.227508544921875, 0.2809600830078125, 0.33441162109375, 0.3878631591796875, 0.441314697265625, 0.4947662353515625, 0.5482177734375, 0.6016693115234375, 0.655120849609375, 0.7085723876953125, 0.76202392578125, 0.8154754638671875, 0.868927001953125, 0.9223785400390625, 0.975830078125, 1.0292816162109375, 1.082733154296875, 1.1361846923828125, 1.18963623046875, 1.2430877685546875, 1.296539306640625, 1.3499908447265625, 1.4034423828125, 1.4568939208984375, 1.510345458984375, 1.5637969970703125, 1.61724853515625, 1.6707000732421875, 1.724151611328125, 1.7776031494140625, 1.8310546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 10.0, 17.0, 18.0, 18.0, 36.0, 64.0, 84.0, 138.0, 229.0, 416.0, 705.0, 1348.0, 2461.0, 5103.0, 10859.0, 26338.0, 88487.0, 437763.0, 360720.0, 71263.0, 22954.0, 9793.0, 4600.0, 2270.0, 1205.0, 697.0, 353.0, 242.0, 130.0, 84.0, 54.0, 27.0, 19.0, 16.0, 14.0, 10.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.14468765258789062, -0.13910675048828125, -0.13352584838867188, -0.1279449462890625, -0.12236404418945312, -0.11678314208984375, -0.11120223999023438, -0.105621337890625, -0.10004043579101562, -0.09445953369140625, -0.08887863159179688, -0.0832977294921875, -0.07771682739257812, -0.07213592529296875, -0.06655502319335938, -0.06097412109375, -0.055393218994140625, -0.04981231689453125, -0.044231414794921875, -0.0386505126953125, -0.033069610595703125, -0.02748870849609375, -0.021907806396484375, -0.016326904296875, -0.010746002197265625, -0.00516510009765625, 0.000415802001953125, 0.0059967041015625, 0.011577606201171875, 0.01715850830078125, 0.022739410400390625, 0.0283203125, 0.033901214599609375, 0.03948211669921875, 0.045063018798828125, 0.0506439208984375, 0.056224822998046875, 0.06180572509765625, 0.06738662719726562, 0.072967529296875, 0.07854843139648438, 0.08412933349609375, 0.08971023559570312, 0.0952911376953125, 0.10087203979492188, 0.10645294189453125, 0.11203384399414062, 0.11761474609375, 0.12319564819335938, 0.12877655029296875, 0.13435745239257812, 0.1399383544921875, 0.14551925659179688, 0.15110015869140625, 0.15668106079101562, 0.162261962890625, 0.16784286499023438, 0.17342376708984375, 0.17900466918945312, 0.1845855712890625, 0.19016647338867188, 0.19574737548828125, 0.20132827758789062, 0.2069091796875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 10.0, 13.0, 13.0, 41.0, 99.0, 183.0, 315.0, 171.0, 83.0, 26.0, 19.0, 9.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001766681671142578, -0.00017168372869491577, -0.00016669929027557373, -0.0001617148518562317, -0.00015673041343688965, -0.0001517459750175476, -0.00014676153659820557, -0.00014177709817886353, -0.00013679265975952148, -0.00013180822134017944, -0.0001268237829208374, -0.00012183934450149536, -0.00011685490608215332, -0.00011187046766281128, -0.00010688602924346924, -0.0001019015908241272, -9.691715240478516e-05, -9.193271398544312e-05, -8.694827556610107e-05, -8.196383714675903e-05, -7.697939872741699e-05, -7.199496030807495e-05, -6.701052188873291e-05, -6.202608346939087e-05, -5.704164505004883e-05, -5.205720663070679e-05, -4.7072768211364746e-05, -4.2088329792022705e-05, -3.7103891372680664e-05, -3.211945295333862e-05, -2.7135014533996582e-05, -2.215057611465454e-05, -1.71661376953125e-05, -1.2181699275970459e-05, -7.197260856628418e-06, -2.212822437286377e-06, 2.771615982055664e-06, 7.756054401397705e-06, 1.2740492820739746e-05, 1.7724931240081787e-05, 2.2709369659423828e-05, 2.769380807876587e-05, 3.267824649810791e-05, 3.766268491744995e-05, 4.264712333679199e-05, 4.763156175613403e-05, 5.2616000175476074e-05, 5.7600438594818115e-05, 6.258487701416016e-05, 6.75693154335022e-05, 7.255375385284424e-05, 7.753819227218628e-05, 8.252263069152832e-05, 8.750706911087036e-05, 9.24915075302124e-05, 9.747594594955444e-05, 0.00010246038436889648, 0.00010744482278823853, 0.00011242926120758057, 0.00011741369962692261, 0.00012239813804626465, 0.0001273825764656067, 0.00013236701488494873, 0.00013735145330429077, 0.0001423358917236328]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 12.0, 7.0, 8.0, 11.0, 16.0, 28.0, 39.0, 47.0, 81.0, 140.0, 177.0, 290.0, 506.0, 967.0, 1819.0, 3557.0, 7683.0, 18442.0, 52822.0, 236453.0, 530000.0, 133896.0, 35902.0, 13515.0, 5903.0, 2792.0, 1449.0, 773.0, 459.0, 271.0, 144.0, 94.0, 78.0, 51.0, 24.0, 23.0, 19.0, 17.0, 9.0, 4.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.1939697265625, -0.18777847290039062, -0.18158721923828125, -0.17539596557617188, -0.1692047119140625, -0.16301345825195312, -0.15682220458984375, -0.15063095092773438, -0.144439697265625, -0.13824844360351562, -0.13205718994140625, -0.12586593627929688, -0.1196746826171875, -0.11348342895507812, -0.10729217529296875, -0.10110092163085938, -0.09490966796875, -0.08871841430664062, -0.08252716064453125, -0.07633590698242188, -0.0701446533203125, -0.06395339965820312, -0.05776214599609375, -0.051570892333984375, -0.045379638671875, -0.039188385009765625, -0.03299713134765625, -0.026805877685546875, -0.0206146240234375, -0.014423370361328125, -0.00823211669921875, -0.002040863037109375, 0.004150390625, 0.010341644287109375, 0.01653289794921875, 0.022724151611328125, 0.0289154052734375, 0.035106658935546875, 0.04129791259765625, 0.047489166259765625, 0.053680419921875, 0.059871673583984375, 0.06606292724609375, 0.07225418090820312, 0.0784454345703125, 0.08463668823242188, 0.09082794189453125, 0.09701919555664062, 0.10321044921875, 0.10940170288085938, 0.11559295654296875, 0.12178421020507812, 0.1279754638671875, 0.13416671752929688, 0.14035797119140625, 0.14654922485351562, 0.152740478515625, 0.15893173217773438, 0.16512298583984375, 0.17131423950195312, 0.1775054931640625, 0.18369674682617188, 0.18988800048828125, 0.19607925415039062, 0.2022705078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 10.0, 10.0, 7.0, 9.0, 9.0, 22.0, 18.0, 26.0, 39.0, 43.0, 63.0, 116.0, 109.0, 124.0, 94.0, 77.0, 51.0, 34.0, 29.0, 14.0, 20.0, 9.0, 8.0, 6.0, 10.0, 8.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.059051513671875, -0.057233333587646484, -0.05541515350341797, -0.05359697341918945, -0.05177879333496094, -0.04996061325073242, -0.048142433166503906, -0.04632425308227539, -0.044506072998046875, -0.04268789291381836, -0.040869712829589844, -0.03905153274536133, -0.03723335266113281, -0.0354151725769043, -0.03359699249267578, -0.031778812408447266, -0.02996063232421875, -0.028142452239990234, -0.02632427215576172, -0.024506092071533203, -0.022687911987304688, -0.020869731903076172, -0.019051551818847656, -0.01723337173461914, -0.015415191650390625, -0.01359701156616211, -0.011778831481933594, -0.009960651397705078, -0.008142471313476562, -0.006324291229248047, -0.004506111145019531, -0.0026879310607910156, -0.0008697509765625, 0.0009484291076660156, 0.0027666091918945312, 0.004584789276123047, 0.0064029693603515625, 0.008221149444580078, 0.010039329528808594, 0.01185750961303711, 0.013675689697265625, 0.01549386978149414, 0.017312049865722656, 0.019130229949951172, 0.020948410034179688, 0.022766590118408203, 0.02458477020263672, 0.026402950286865234, 0.02822113037109375, 0.030039310455322266, 0.03185749053955078, 0.0336756706237793, 0.03549385070800781, 0.03731203079223633, 0.039130210876464844, 0.04094839096069336, 0.042766571044921875, 0.04458475112915039, 0.046402931213378906, 0.04822111129760742, 0.05003929138183594, 0.05185747146606445, 0.05367565155029297, 0.055493831634521484, 0.05731201171875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 15.0, 19.0, 51.0, 81.0, 115.0, 145.0, 179.0, 145.0, 111.0, 56.0, 31.0, 21.0, 9.0, 8.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.060208320617676, -1.9967817068099976, -1.9333550930023193, -1.8699283599853516, -1.8065017461776733, -1.7430751323699951, -1.679648518562317, -1.6162219047546387, -1.552795171737671, -1.4893685579299927, -1.4259419441223145, -1.3625152111053467, -1.2990885972976685, -1.2356619834899902, -1.172235369682312, -1.1088087558746338, -1.0453821420669556, -0.9819555282592773, -0.9185288548469543, -0.8551022410392761, -0.7916755676269531, -0.7282489538192749, -0.6648223400115967, -0.6013957262039185, -0.5379690527915955, -0.47454240918159485, -0.41111576557159424, -0.347689151763916, -0.2842625081539154, -0.2208358645439148, -0.15740925073623657, -0.09398260712623596, -0.0305558443069458, 0.03287079185247421, 0.09629742801189423, 0.15972405672073364, 0.22315070033073425, 0.28657734394073486, 0.3500039577484131, 0.4134306013584137, 0.4768572449684143, 0.5402838587760925, 0.6037105321884155, 0.6671371459960938, 0.730563759803772, 0.793990433216095, 0.8574170470237732, 0.9208437204360962, 0.9842703342437744, 1.0476969480514526, 1.1111235618591309, 1.1745502948760986, 1.2379769086837769, 1.301403522491455, 1.3648301362991333, 1.4282567501068115, 1.4916834831237793, 1.5551100969314575, 1.6185367107391357, 1.6819634437561035, 1.7453900575637817, 1.80881667137146, 1.8722432851791382, 1.9356698989868164, 1.9990965127944946]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 15.0, 8.0, 14.0, 21.0, 25.0, 22.0, 30.0, 29.0, 29.0, 43.0, 49.0, 38.0, 47.0, 39.0, 59.0, 52.0, 35.0, 48.0, 46.0, 51.0, 54.0, 36.0, 34.0, 36.0, 36.0, 27.0, 21.0, 9.0, 11.0, 6.0, 3.0, 7.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.8579243421554565, -0.8328648209571838, -0.8078052997589111, -0.7827457785606384, -0.7576862573623657, -0.732626736164093, -0.7075672149658203, -0.6825076937675476, -0.6574481725692749, -0.6323886513710022, -0.6073291301727295, -0.5822696089744568, -0.5572100877761841, -0.5321505665779114, -0.5070910453796387, -0.48203152418136597, -0.45697200298309326, -0.43191248178482056, -0.40685296058654785, -0.38179343938827515, -0.35673391819000244, -0.33167439699172974, -0.30661487579345703, -0.2815553545951843, -0.2564958333969116, -0.23143631219863892, -0.2063767910003662, -0.1813172698020935, -0.1562577486038208, -0.1311982274055481, -0.10613870620727539, -0.08107918500900269, -0.05601966381072998, -0.030960142612457275, -0.00590062141418457, 0.019158899784088135, 0.04421842098236084, 0.06927794218063354, 0.09433746337890625, 0.11939698457717896, 0.14445650577545166, 0.16951602697372437, 0.19457554817199707, 0.21963506937026978, 0.24469459056854248, 0.2697541117668152, 0.2948136329650879, 0.3198731541633606, 0.3449326753616333, 0.369992196559906, 0.3950517177581787, 0.4201112389564514, 0.4451707601547241, 0.4702302813529968, 0.49528980255126953, 0.5203493237495422, 0.5454088449478149, 0.5704683661460876, 0.5955278873443604, 0.6205874085426331, 0.6456469297409058, 0.6707064509391785, 0.6957659721374512, 0.7208254933357239, 0.7458850145339966]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 16.0, 24.0, 50.0, 68.0, 149.0, 290.0, 546.0, 1500.0, 4508.0, 15311.0, 73450.0, 716081.0, 197768.0, 27460.0, 7387.0, 2261.0, 873.0, 381.0, 198.0, 85.0, 67.0, 33.0, 20.0, 12.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1015625, -1.0656890869140625, -1.029815673828125, -0.9939422607421875, -0.95806884765625, -0.9221954345703125, -0.886322021484375, -0.8504486083984375, -0.8145751953125, -0.7787017822265625, -0.742828369140625, -0.7069549560546875, -0.67108154296875, -0.6352081298828125, -0.599334716796875, -0.5634613037109375, -0.527587890625, -0.4917144775390625, -0.455841064453125, -0.4199676513671875, -0.38409423828125, -0.3482208251953125, -0.312347412109375, -0.2764739990234375, -0.2406005859375, -0.2047271728515625, -0.168853759765625, -0.1329803466796875, -0.09710693359375, -0.0612335205078125, -0.025360107421875, 0.0105133056640625, 0.04638671875, 0.0822601318359375, 0.118133544921875, 0.1540069580078125, 0.18988037109375, 0.2257537841796875, 0.261627197265625, 0.2975006103515625, 0.3333740234375, 0.3692474365234375, 0.405120849609375, 0.4409942626953125, 0.47686767578125, 0.5127410888671875, 0.548614501953125, 0.5844879150390625, 0.620361328125, 0.6562347412109375, 0.692108154296875, 0.7279815673828125, 0.76385498046875, 0.7997283935546875, 0.835601806640625, 0.8714752197265625, 0.9073486328125, 0.9432220458984375, 0.979095458984375, 1.0149688720703125, 1.05084228515625, 1.0867156982421875, 1.122589111328125, 1.1584625244140625, 1.1943359375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 6.0, 7.0, 18.0, 20.0, 17.0, 28.0, 44.0, 49.0, 40.0, 65.0, 68.0, 67.0, 82.0, 63.0, 65.0, 83.0, 63.0, 60.0, 41.0, 38.0, 28.0, 15.0, 15.0, 5.0, 6.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83203125, -2.7590789794921875, -2.686126708984375, -2.6131744384765625, -2.54022216796875, -2.4672698974609375, -2.394317626953125, -2.3213653564453125, -2.2484130859375, -2.1754608154296875, -2.102508544921875, -2.0295562744140625, -1.95660400390625, -1.8836517333984375, -1.810699462890625, -1.7377471923828125, -1.664794921875, -1.5918426513671875, -1.518890380859375, -1.4459381103515625, -1.37298583984375, -1.3000335693359375, -1.227081298828125, -1.1541290283203125, -1.0811767578125, -1.0082244873046875, -0.935272216796875, -0.8623199462890625, -0.78936767578125, -0.7164154052734375, -0.643463134765625, -0.5705108642578125, -0.49755859375, -0.4246063232421875, -0.351654052734375, -0.2787017822265625, -0.20574951171875, -0.1327972412109375, -0.059844970703125, 0.0131072998046875, 0.0860595703125, 0.1590118408203125, 0.231964111328125, 0.3049163818359375, 0.37786865234375, 0.4508209228515625, 0.523773193359375, 0.5967254638671875, 0.669677734375, 0.7426300048828125, 0.815582275390625, 0.8885345458984375, 0.96148681640625, 1.0344390869140625, 1.107391357421875, 1.1803436279296875, 1.2532958984375, 1.3262481689453125, 1.399200439453125, 1.4721527099609375, 1.54510498046875, 1.6180572509765625, 1.691009521484375, 1.7639617919921875, 1.8369140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 7.0, 7.0, 7.0, 9.0, 8.0, 13.0, 20.0, 24.0, 24.0, 25.0, 42.0, 53.0, 97.0, 120.0, 212.0, 483.0, 1507.0, 21615.0, 970441.0, 50223.0, 2307.0, 564.0, 233.0, 154.0, 94.0, 58.0, 45.0, 31.0, 26.0, 21.0, 15.0, 14.0, 8.0, 7.0, 7.0, 4.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.06640625, -2.972381591796875, -2.87835693359375, -2.784332275390625, -2.6903076171875, -2.596282958984375, -2.50225830078125, -2.408233642578125, -2.314208984375, -2.220184326171875, -2.12615966796875, -2.032135009765625, -1.9381103515625, -1.844085693359375, -1.75006103515625, -1.656036376953125, -1.56201171875, -1.467987060546875, -1.37396240234375, -1.279937744140625, -1.1859130859375, -1.091888427734375, -0.99786376953125, -0.903839111328125, -0.809814453125, -0.715789794921875, -0.62176513671875, -0.527740478515625, -0.4337158203125, -0.339691162109375, -0.24566650390625, -0.151641845703125, -0.0576171875, 0.036407470703125, 0.13043212890625, 0.224456787109375, 0.3184814453125, 0.412506103515625, 0.50653076171875, 0.600555419921875, 0.694580078125, 0.788604736328125, 0.88262939453125, 0.976654052734375, 1.0706787109375, 1.164703369140625, 1.25872802734375, 1.352752685546875, 1.44677734375, 1.540802001953125, 1.63482666015625, 1.728851318359375, 1.8228759765625, 1.916900634765625, 2.01092529296875, 2.104949951171875, 2.198974609375, 2.292999267578125, 2.38702392578125, 2.481048583984375, 2.5750732421875, 2.669097900390625, 2.76312255859375, 2.857147216796875, 2.951171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 4.0, 7.0, 5.0, 15.0, 6.0, 10.0, 11.0, 11.0, 24.0, 14.0, 22.0, 29.0, 35.0, 28.0, 45.0, 34.0, 50.0, 47.0, 59.0, 52.0, 40.0, 61.0, 53.0, 63.0, 35.0, 42.0, 30.0, 21.0, 28.0, 23.0, 16.0, 12.0, 8.0, 13.0, 6.0, 9.0, 9.0, 7.0, 4.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0], "bins": [-2.25390625, -2.1930694580078125, -2.132232666015625, -2.0713958740234375, -2.01055908203125, -1.9497222900390625, -1.888885498046875, -1.8280487060546875, -1.7672119140625, -1.7063751220703125, -1.645538330078125, -1.5847015380859375, -1.52386474609375, -1.4630279541015625, -1.402191162109375, -1.3413543701171875, -1.280517578125, -1.2196807861328125, -1.158843994140625, -1.0980072021484375, -1.03717041015625, -0.9763336181640625, -0.915496826171875, -0.8546600341796875, -0.7938232421875, -0.7329864501953125, -0.672149658203125, -0.6113128662109375, -0.55047607421875, -0.4896392822265625, -0.428802490234375, -0.3679656982421875, -0.30712890625, -0.2462921142578125, -0.185455322265625, -0.1246185302734375, -0.06378173828125, -0.0029449462890625, 0.057891845703125, 0.1187286376953125, 0.1795654296875, 0.2404022216796875, 0.301239013671875, 0.3620758056640625, 0.42291259765625, 0.4837493896484375, 0.544586181640625, 0.6054229736328125, 0.666259765625, 0.7270965576171875, 0.787933349609375, 0.8487701416015625, 0.90960693359375, 0.9704437255859375, 1.031280517578125, 1.0921173095703125, 1.1529541015625, 1.2137908935546875, 1.274627685546875, 1.3354644775390625, 1.39630126953125, 1.4571380615234375, 1.517974853515625, 1.5788116455078125, 1.6396484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 9.0, 8.0, 21.0, 29.0, 41.0, 109.0, 170.0, 548.0, 1671.0, 9158.0, 144354.0, 858601.0, 29087.0, 3417.0, 776.0, 306.0, 113.0, 58.0, 21.0, 26.0, 13.0, 9.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.27034759521484375, -0.2526092529296875, -0.23487091064453125, -0.217132568359375, -0.19939422607421875, -0.1816558837890625, -0.16391754150390625, -0.14617919921875, -0.12844085693359375, -0.1107025146484375, -0.09296417236328125, -0.075225830078125, -0.05748748779296875, -0.0397491455078125, -0.02201080322265625, -0.0042724609375, 0.01346588134765625, 0.0312042236328125, 0.04894256591796875, 0.066680908203125, 0.08441925048828125, 0.1021575927734375, 0.11989593505859375, 0.13763427734375, 0.15537261962890625, 0.1731109619140625, 0.19084930419921875, 0.208587646484375, 0.22632598876953125, 0.2440643310546875, 0.26180267333984375, 0.279541015625, 0.29727935791015625, 0.3150177001953125, 0.33275604248046875, 0.350494384765625, 0.36823272705078125, 0.3859710693359375, 0.40370941162109375, 0.42144775390625, 0.43918609619140625, 0.4569244384765625, 0.47466278076171875, 0.492401123046875, 0.5101394653320312, 0.5278778076171875, 0.5456161499023438, 0.5633544921875, 0.5810928344726562, 0.5988311767578125, 0.6165695190429688, 0.634307861328125, 0.6520462036132812, 0.6697845458984375, 0.6875228881835938, 0.70526123046875, 0.7229995727539062, 0.7407379150390625, 0.7584762573242188, 0.776214599609375, 0.7939529418945312, 0.8116912841796875, 0.8294296264648438, 0.84716796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 5.0, 9.0, 8.0, 21.0, 28.0, 62.0, 102.0, 169.0, 234.0, 118.0, 89.0, 63.0, 36.0, 17.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4717063903808594e-05, -5.285162478685379e-05, -5.098618566989899e-05, -4.912074655294418e-05, -4.725530743598938e-05, -4.5389868319034576e-05, -4.352442920207977e-05, -4.165899008512497e-05, -3.9793550968170166e-05, -3.792811185121536e-05, -3.606267273426056e-05, -3.4197233617305756e-05, -3.233179450035095e-05, -3.046635538339615e-05, -2.8600916266441345e-05, -2.6735477149486542e-05, -2.4870038032531738e-05, -2.3004598915576935e-05, -2.113915979862213e-05, -1.9273720681667328e-05, -1.7408281564712524e-05, -1.554284244775772e-05, -1.3677403330802917e-05, -1.1811964213848114e-05, -9.94652509689331e-06, -8.081085979938507e-06, -6.215646862983704e-06, -4.3502077460289e-06, -2.4847686290740967e-06, -6.193295121192932e-07, 1.2461096048355103e-06, 3.1115487217903137e-06, 4.976987838745117e-06, 6.842426955699921e-06, 8.707866072654724e-06, 1.0573305189609528e-05, 1.2438744306564331e-05, 1.4304183423519135e-05, 1.6169622540473938e-05, 1.803506165742874e-05, 1.9900500774383545e-05, 2.176593989133835e-05, 2.3631379008293152e-05, 2.5496818125247955e-05, 2.736225724220276e-05, 2.9227696359157562e-05, 3.1093135476112366e-05, 3.295857459306717e-05, 3.482401371002197e-05, 3.6689452826976776e-05, 3.855489194393158e-05, 4.042033106088638e-05, 4.2285770177841187e-05, 4.415120929479599e-05, 4.6016648411750793e-05, 4.78820875287056e-05, 4.97475266456604e-05, 5.1612965762615204e-05, 5.347840487957001e-05, 5.534384399652481e-05, 5.7209283113479614e-05, 5.907472223043442e-05, 6.094016134738922e-05, 6.280560046434402e-05, 6.467103958129883e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 11.0, 8.0, 10.0, 16.0, 30.0, 42.0, 108.0, 145.0, 280.0, 615.0, 1598.0, 5696.0, 40779.0, 858710.0, 124939.0, 11351.0, 2448.0, 883.0, 402.0, 208.0, 101.0, 78.0, 38.0, 19.0, 14.0, 5.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.74365234375, -0.7253799438476562, -0.7071075439453125, -0.6888351440429688, -0.670562744140625, -0.6522903442382812, -0.6340179443359375, -0.6157455444335938, -0.59747314453125, -0.5792007446289062, -0.5609283447265625, -0.5426559448242188, -0.524383544921875, -0.5061111450195312, -0.4878387451171875, -0.46956634521484375, -0.4512939453125, -0.43302154541015625, -0.4147491455078125, -0.39647674560546875, -0.378204345703125, -0.35993194580078125, -0.3416595458984375, -0.32338714599609375, -0.30511474609375, -0.28684234619140625, -0.2685699462890625, -0.25029754638671875, -0.232025146484375, -0.21375274658203125, -0.1954803466796875, -0.17720794677734375, -0.158935546875, -0.14066314697265625, -0.1223907470703125, -0.10411834716796875, -0.085845947265625, -0.06757354736328125, -0.0493011474609375, -0.03102874755859375, -0.01275634765625, 0.00551605224609375, 0.0237884521484375, 0.04206085205078125, 0.060333251953125, 0.07860565185546875, 0.0968780517578125, 0.11515045166015625, 0.1334228515625, 0.15169525146484375, 0.1699676513671875, 0.18824005126953125, 0.206512451171875, 0.22478485107421875, 0.2430572509765625, 0.26132965087890625, 0.27960205078125, 0.29787445068359375, 0.3161468505859375, 0.33441925048828125, 0.352691650390625, 0.37096405029296875, 0.3892364501953125, 0.40750885009765625, 0.42578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 10.0, 10.0, 20.0, 21.0, 27.0, 38.0, 50.0, 133.0, 146.0, 199.0, 113.0, 59.0, 47.0, 28.0, 23.0, 10.0, 12.0, 10.0, 9.0, 6.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1282958984375, -0.12276458740234375, -0.1172332763671875, -0.11170196533203125, -0.106170654296875, -0.10063934326171875, -0.0951080322265625, -0.08957672119140625, -0.08404541015625, -0.07851409912109375, -0.0729827880859375, -0.06745147705078125, -0.061920166015625, -0.05638885498046875, -0.0508575439453125, -0.04532623291015625, -0.039794921875, -0.03426361083984375, -0.0287322998046875, -0.02320098876953125, -0.017669677734375, -0.01213836669921875, -0.0066070556640625, -0.00107574462890625, 0.00445556640625, 0.00998687744140625, 0.0155181884765625, 0.02104949951171875, 0.026580810546875, 0.03211212158203125, 0.0376434326171875, 0.04317474365234375, 0.0487060546875, 0.05423736572265625, 0.0597686767578125, 0.06529998779296875, 0.070831298828125, 0.07636260986328125, 0.0818939208984375, 0.08742523193359375, 0.09295654296875, 0.09848785400390625, 0.1040191650390625, 0.10955047607421875, 0.115081787109375, 0.12061309814453125, 0.1261444091796875, 0.13167572021484375, 0.13720703125, 0.14273834228515625, 0.1482696533203125, 0.15380096435546875, 0.159332275390625, 0.16486358642578125, 0.1703948974609375, 0.17592620849609375, 0.18145751953125, 0.18698883056640625, 0.1925201416015625, 0.19805145263671875, 0.203582763671875, 0.20911407470703125, 0.2146453857421875, 0.22017669677734375, 0.2257080078125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 29.0, 44.0, 112.0, 162.0, 215.0, 199.0, 133.0, 51.0, 20.0, 16.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.017664909362793, -5.844317436218262, -5.670969486236572, -5.497621536254883, -5.324274063110352, -5.15092658996582, -4.977578639984131, -4.804230690002441, -4.63088321685791, -4.457535743713379, -4.2841877937316895, -4.11083984375, -3.9374923706054688, -3.7641446590423584, -3.590796947479248, -3.4174492359161377, -3.2441015243530273, -3.070753812789917, -2.8974061012268066, -2.7240583896636963, -2.550710678100586, -2.3773629665374756, -2.2040152549743652, -2.030667543411255, -1.8573198318481445, -1.6839721202850342, -1.5106244087219238, -1.3372766971588135, -1.1639289855957031, -0.9905812740325928, -0.8172335624694824, -0.6438858509063721, -0.4705386161804199, -0.29719090461730957, -0.12384319305419922, 0.04950451850891113, 0.22285223007202148, 0.39619994163513184, 0.5695476531982422, 0.7428953647613525, 0.9162430763244629, 1.0895907878875732, 1.2629384994506836, 1.436286211013794, 1.6096339225769043, 1.7829816341400146, 1.956329345703125, 2.1296770572662354, 2.3030247688293457, 2.476372480392456, 2.6497201919555664, 2.8230679035186768, 2.996415615081787, 3.1697633266448975, 3.343111038208008, 3.516458749771118, 3.6898064613342285, 3.863154172897339, 4.036501884460449, 4.2098493576049805, 4.38319730758667, 4.556545257568359, 4.729892730712891, 4.903240203857422, 5.076588153839111]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 12.0, 8.0, 8.0, 16.0, 14.0, 23.0, 8.0, 25.0, 37.0, 28.0, 31.0, 34.0, 58.0, 41.0, 49.0, 44.0, 51.0, 47.0, 65.0, 37.0, 39.0, 49.0, 42.0, 43.0, 35.0, 26.0, 22.0, 37.0, 16.0, 15.0, 11.0, 10.0, 6.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.8116557598114014, -3.7090628147125244, -3.6064701080322266, -3.5038771629333496, -3.4012842178344727, -3.298691511154175, -3.196098566055298, -3.093505859375, -2.990912914276123, -2.888319969177246, -2.7857272624969482, -2.6831343173980713, -2.5805416107177734, -2.4779486656188965, -2.3753557205200195, -2.2727627754211426, -2.1701700687408447, -2.0675771236419678, -1.96498441696167, -1.862391471862793, -1.7597986459732056, -1.6572058200836182, -1.5546128749847412, -1.4520200490951538, -1.3494272232055664, -1.246834397315979, -1.1442415714263916, -1.0416486263275146, -0.9390558004379272, -0.8364629745483398, -0.7338700890541077, -0.6312772035598755, -0.5286843776702881, -0.4260915219783783, -0.3234986662864685, -0.22090581059455872, -0.11831295490264893, -0.015720129013061523, 0.08687275648117065, 0.18946564197540283, 0.29205846786499023, 0.3946513235569, 0.4972441792488098, 0.599837064743042, 0.7024298906326294, 0.8050227165222168, 0.907615602016449, 1.0102084875106812, 1.1128013134002686, 1.215394139289856, 1.3179869651794434, 1.4205799102783203, 1.5231727361679077, 1.6257655620574951, 1.728358507156372, 1.8309513330459595, 1.9335441589355469, 2.036137104034424, 2.1387298107147217, 2.2413227558135986, 2.3439154624938965, 2.4465084075927734, 2.5491013526916504, 2.6516942977905273, 2.754287004470825]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 8.0, 7.0, 5.0, 12.0, 11.0, 13.0, 16.0, 21.0, 31.0, 43.0, 46.0, 63.0, 101.0, 163.0, 442.0, 1369.0, 7793.0, 144285.0, 3647339.0, 377858.0, 11628.0, 1874.0, 539.0, 205.0, 118.0, 90.0, 45.0, 42.0, 33.0, 21.0, 17.0, 18.0, 8.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.51171875, -3.410247802734375, -3.30877685546875, -3.207305908203125, -3.1058349609375, -3.004364013671875, -2.90289306640625, -2.801422119140625, -2.699951171875, -2.598480224609375, -2.49700927734375, -2.395538330078125, -2.2940673828125, -2.192596435546875, -2.09112548828125, -1.989654541015625, -1.88818359375, -1.786712646484375, -1.68524169921875, -1.583770751953125, -1.4822998046875, -1.380828857421875, -1.27935791015625, -1.177886962890625, -1.076416015625, -0.974945068359375, -0.87347412109375, -0.772003173828125, -0.6705322265625, -0.569061279296875, -0.46759033203125, -0.366119384765625, -0.2646484375, -0.163177490234375, -0.06170654296875, 0.039764404296875, 0.1412353515625, 0.242706298828125, 0.34417724609375, 0.445648193359375, 0.547119140625, 0.648590087890625, 0.75006103515625, 0.851531982421875, 0.9530029296875, 1.054473876953125, 1.15594482421875, 1.257415771484375, 1.35888671875, 1.460357666015625, 1.56182861328125, 1.663299560546875, 1.7647705078125, 1.866241455078125, 1.96771240234375, 2.069183349609375, 2.170654296875, 2.272125244140625, 2.37359619140625, 2.475067138671875, 2.5765380859375, 2.678009033203125, 2.77947998046875, 2.880950927734375, 2.982421875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 7.0, 6.0, 15.0, 11.0, 19.0, 17.0, 22.0, 23.0, 36.0, 33.0, 42.0, 48.0, 38.0, 46.0, 48.0, 41.0, 51.0, 36.0, 39.0, 50.0, 49.0, 43.0, 35.0, 41.0, 49.0, 24.0, 28.0, 21.0, 12.0, 13.0, 8.0, 11.0, 9.0, 3.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85400390625, -0.8232345581054688, -0.7924652099609375, -0.7616958618164062, -0.730926513671875, -0.7001571655273438, -0.6693878173828125, -0.6386184692382812, -0.60784912109375, -0.5770797729492188, -0.5463104248046875, -0.5155410766601562, -0.484771728515625, -0.45400238037109375, -0.4232330322265625, -0.39246368408203125, -0.3616943359375, -0.33092498779296875, -0.3001556396484375, -0.26938629150390625, -0.238616943359375, -0.20784759521484375, -0.1770782470703125, -0.14630889892578125, -0.11553955078125, -0.08477020263671875, -0.0540008544921875, -0.02323150634765625, 0.007537841796875, 0.03830718994140625, 0.0690765380859375, 0.09984588623046875, 0.130615234375, 0.16138458251953125, 0.1921539306640625, 0.22292327880859375, 0.253692626953125, 0.28446197509765625, 0.3152313232421875, 0.34600067138671875, 0.37677001953125, 0.40753936767578125, 0.4383087158203125, 0.46907806396484375, 0.499847412109375, 0.5306167602539062, 0.5613861083984375, 0.5921554565429688, 0.6229248046875, 0.6536941528320312, 0.6844635009765625, 0.7152328491210938, 0.746002197265625, 0.7767715454101562, 0.8075408935546875, 0.8383102416992188, 0.86907958984375, 0.8998489379882812, 0.9306182861328125, 0.9613876342773438, 0.992156982421875, 1.0229263305664062, 1.0536956787109375, 1.0844650268554688, 1.115234375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 12.0, 12.0, 23.0, 44.0, 82.0, 167.0, 427.0, 1489.0, 8546.0, 465643.0, 3692374.0, 21799.0, 2536.0, 663.0, 227.0, 102.0, 45.0, 36.0, 21.0, 10.0, 5.0, 5.0, 2.0, 4.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.9205322265625, -3.770751953125, -3.6209716796875, -3.47119140625, -3.3214111328125, -3.171630859375, -3.0218505859375, -2.8720703125, -2.7222900390625, -2.572509765625, -2.4227294921875, -2.27294921875, -2.1231689453125, -1.973388671875, -1.8236083984375, -1.673828125, -1.5240478515625, -1.374267578125, -1.2244873046875, -1.07470703125, -0.9249267578125, -0.775146484375, -0.6253662109375, -0.4755859375, -0.3258056640625, -0.176025390625, -0.0262451171875, 0.12353515625, 0.2733154296875, 0.423095703125, 0.5728759765625, 0.72265625, 0.8724365234375, 1.022216796875, 1.1719970703125, 1.32177734375, 1.4715576171875, 1.621337890625, 1.7711181640625, 1.9208984375, 2.0706787109375, 2.220458984375, 2.3702392578125, 2.52001953125, 2.6697998046875, 2.819580078125, 2.9693603515625, 3.119140625, 3.2689208984375, 3.418701171875, 3.5684814453125, 3.71826171875, 3.8680419921875, 4.017822265625, 4.1676025390625, 4.3173828125, 4.4671630859375, 4.616943359375, 4.7667236328125, 4.91650390625, 5.0662841796875, 5.216064453125, 5.3658447265625, 5.515625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 11.0, 12.0, 20.0, 48.0, 73.0, 115.0, 236.0, 485.0, 900.0, 954.0, 588.0, 279.0, 146.0, 81.0, 51.0, 31.0, 19.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.958984375, -0.9308853149414062, -0.9027862548828125, -0.8746871948242188, -0.846588134765625, -0.8184890747070312, -0.7903900146484375, -0.7622909545898438, -0.73419189453125, -0.7060928344726562, -0.6779937744140625, -0.6498947143554688, -0.621795654296875, -0.5936965942382812, -0.5655975341796875, -0.5374984741210938, -0.5093994140625, -0.48130035400390625, -0.4532012939453125, -0.42510223388671875, -0.397003173828125, -0.36890411376953125, -0.3408050537109375, -0.31270599365234375, -0.28460693359375, -0.25650787353515625, -0.2284088134765625, -0.20030975341796875, -0.172210693359375, -0.14411163330078125, -0.1160125732421875, -0.08791351318359375, -0.059814453125, -0.03171539306640625, -0.0036163330078125, 0.02448272705078125, 0.052581787109375, 0.08068084716796875, 0.1087799072265625, 0.13687896728515625, 0.16497802734375, 0.19307708740234375, 0.2211761474609375, 0.24927520751953125, 0.277374267578125, 0.30547332763671875, 0.3335723876953125, 0.36167144775390625, 0.3897705078125, 0.41786956787109375, 0.4459686279296875, 0.47406768798828125, 0.502166748046875, 0.5302658081054688, 0.5583648681640625, 0.5864639282226562, 0.61456298828125, 0.6426620483398438, 0.6707611083984375, 0.6988601684570312, 0.726959228515625, 0.7550582885742188, 0.7831573486328125, 0.8112564086914062, 0.83935546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 9.0, 14.0, 21.0, 22.0, 32.0, 47.0, 46.0, 75.0, 76.0, 95.0, 94.0, 105.0, 91.0, 71.0, 55.0, 45.0, 27.0, 28.0, 14.0, 13.0, 12.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.474672555923462, -2.410276174545288, -2.3458797931671143, -2.2814831733703613, -2.2170867919921875, -2.1526904106140137, -2.08829402923584, -2.023897647857666, -1.9595011472702026, -1.8951047658920288, -1.8307082653045654, -1.7663118839263916, -1.7019155025482178, -1.6375190019607544, -1.5731226205825806, -1.5087261199951172, -1.4443297386169434, -1.3799333572387695, -1.3155368566513062, -1.2511404752731323, -1.186743974685669, -1.1223475933074951, -1.0579512119293213, -0.9935547709465027, -0.9291583299636841, -0.8647618889808655, -0.8003654479980469, -0.735969066619873, -0.6715726256370544, -0.6071761846542358, -0.542779803276062, -0.4783833622932434, -0.4139869213104248, -0.3495904803276062, -0.28519406914711, -0.22079764306545258, -0.15640121698379517, -0.09200477600097656, -0.027608364820480347, 0.03678804636001587, 0.10118448734283447, 0.16558091342449188, 0.2299773395061493, 0.2943737506866455, 0.3587701916694641, 0.4231666326522827, 0.48756304383277893, 0.5519594550132751, 0.6163558959960938, 0.6807523369789124, 0.745148777961731, 0.8095451593399048, 0.8739416003227234, 0.938338041305542, 1.0027344226837158, 1.0671308040618896, 1.131527304649353, 1.1959236860275269, 1.2603201866149902, 1.324716567993164, 1.389112949371338, 1.4535094499588013, 1.517905831336975, 1.5823023319244385, 1.6466987133026123]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 4.0, 3.0, 14.0, 7.0, 18.0, 14.0, 13.0, 20.0, 18.0, 25.0, 31.0, 34.0, 40.0, 47.0, 41.0, 50.0, 46.0, 53.0, 41.0, 43.0, 42.0, 42.0, 44.0, 45.0, 28.0, 39.0, 31.0, 22.0, 26.0, 25.0, 22.0, 16.0, 13.0, 7.0, 6.0, 12.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.220424771308899, -1.1819335222244263, -1.1434423923492432, -1.1049511432647705, -1.0664600133895874, -1.0279687643051147, -0.9894775748252869, -0.950986385345459, -0.9124951958656311, -0.8740040063858032, -0.8355128169059753, -0.7970216274261475, -0.7585303783416748, -0.7200392484664917, -0.681547999382019, -0.6430568099021912, -0.6045656204223633, -0.5660744309425354, -0.5275832414627075, -0.48909202218055725, -0.45060083270072937, -0.4121096432209015, -0.3736184239387512, -0.33512723445892334, -0.29663604497909546, -0.2581448554992676, -0.2196536511182785, -0.18116244673728943, -0.14267125725746155, -0.10418006777763367, -0.06568886339664459, -0.027197659015655518, 0.011293649673461914, 0.04978484660387039, 0.08827604353427887, 0.12676724791526794, 0.16525843739509583, 0.2037496268749237, 0.24224083125591278, 0.28073203563690186, 0.31922322511672974, 0.3577144145965576, 0.3962056040763855, 0.43469682335853577, 0.47318801283836365, 0.5116791725158691, 0.5501704216003418, 0.5886616110801697, 0.6271528005599976, 0.6656439900398254, 0.7041351795196533, 0.7426263689994812, 0.7811175584793091, 0.8196088075637817, 0.8580999970436096, 0.8965911865234375, 0.9350823760032654, 0.9735735654830933, 1.012064814567566, 1.050555944442749, 1.0890471935272217, 1.1275383234024048, 1.1660295724868774, 1.2045207023620605, 1.2430119514465332]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 3.0, 8.0, 10.0, 20.0, 33.0, 49.0, 67.0, 134.0, 278.0, 494.0, 933.0, 1847.0, 3912.0, 10614.0, 59890.0, 639871.0, 291750.0, 25923.0, 6828.0, 2910.0, 1328.0, 738.0, 386.0, 224.0, 130.0, 72.0, 37.0, 26.0, 14.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.853515625, -0.8266754150390625, -0.799835205078125, -0.7729949951171875, -0.74615478515625, -0.7193145751953125, -0.692474365234375, -0.6656341552734375, -0.6387939453125, -0.6119537353515625, -0.585113525390625, -0.5582733154296875, -0.53143310546875, -0.5045928955078125, -0.477752685546875, -0.4509124755859375, -0.424072265625, -0.3972320556640625, -0.370391845703125, -0.3435516357421875, -0.31671142578125, -0.2898712158203125, -0.263031005859375, -0.2361907958984375, -0.2093505859375, -0.1825103759765625, -0.155670166015625, -0.1288299560546875, -0.10198974609375, -0.0751495361328125, -0.048309326171875, -0.0214691162109375, 0.00537109375, 0.0322113037109375, 0.059051513671875, 0.0858917236328125, 0.11273193359375, 0.1395721435546875, 0.166412353515625, 0.1932525634765625, 0.2200927734375, 0.2469329833984375, 0.273773193359375, 0.3006134033203125, 0.32745361328125, 0.3542938232421875, 0.381134033203125, 0.4079742431640625, 0.434814453125, 0.4616546630859375, 0.488494873046875, 0.5153350830078125, 0.54217529296875, 0.5690155029296875, 0.595855712890625, 0.6226959228515625, 0.6495361328125, 0.6763763427734375, 0.703216552734375, 0.7300567626953125, 0.75689697265625, 0.7837371826171875, 0.810577392578125, 0.8374176025390625, 0.8642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 11.0, 9.0, 8.0, 10.0, 11.0, 16.0, 15.0, 20.0, 23.0, 27.0, 46.0, 43.0, 40.0, 60.0, 63.0, 44.0, 47.0, 44.0, 50.0, 31.0, 49.0, 39.0, 33.0, 30.0, 33.0, 37.0, 26.0, 28.0, 22.0, 20.0, 15.0, 11.0, 10.0, 8.0, 7.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.931640625, -0.904449462890625, -0.87725830078125, -0.850067138671875, -0.8228759765625, -0.795684814453125, -0.76849365234375, -0.741302490234375, -0.714111328125, -0.686920166015625, -0.65972900390625, -0.632537841796875, -0.6053466796875, -0.578155517578125, -0.55096435546875, -0.523773193359375, -0.49658203125, -0.469390869140625, -0.44219970703125, -0.415008544921875, -0.3878173828125, -0.360626220703125, -0.33343505859375, -0.306243896484375, -0.279052734375, -0.251861572265625, -0.22467041015625, -0.197479248046875, -0.1702880859375, -0.143096923828125, -0.11590576171875, -0.088714599609375, -0.0615234375, -0.034332275390625, -0.00714111328125, 0.020050048828125, 0.0472412109375, 0.074432373046875, 0.10162353515625, 0.128814697265625, 0.156005859375, 0.183197021484375, 0.21038818359375, 0.237579345703125, 0.2647705078125, 0.291961669921875, 0.31915283203125, 0.346343994140625, 0.37353515625, 0.400726318359375, 0.42791748046875, 0.455108642578125, 0.4822998046875, 0.509490966796875, 0.53668212890625, 0.563873291015625, 0.591064453125, 0.618255615234375, 0.64544677734375, 0.672637939453125, 0.6998291015625, 0.727020263671875, 0.75421142578125, 0.781402587890625, 0.80859375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 10.0, 13.0, 18.0, 19.0, 36.0, 56.0, 67.0, 115.0, 172.0, 254.0, 389.0, 599.0, 1092.0, 2212.0, 4774.0, 13473.0, 237743.0, 736886.0, 36829.0, 6940.0, 3121.0, 1462.0, 831.0, 471.0, 321.0, 212.0, 141.0, 78.0, 61.0, 44.0, 33.0, 22.0, 12.0, 13.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8466796875, -0.815582275390625, -0.78448486328125, -0.753387451171875, -0.7222900390625, -0.691192626953125, -0.66009521484375, -0.628997802734375, -0.597900390625, -0.566802978515625, -0.53570556640625, -0.504608154296875, -0.4735107421875, -0.442413330078125, -0.41131591796875, -0.380218505859375, -0.34912109375, -0.318023681640625, -0.28692626953125, -0.255828857421875, -0.2247314453125, -0.193634033203125, -0.16253662109375, -0.131439208984375, -0.100341796875, -0.069244384765625, -0.03814697265625, -0.007049560546875, 0.0240478515625, 0.055145263671875, 0.08624267578125, 0.117340087890625, 0.1484375, 0.179534912109375, 0.21063232421875, 0.241729736328125, 0.2728271484375, 0.303924560546875, 0.33502197265625, 0.366119384765625, 0.397216796875, 0.428314208984375, 0.45941162109375, 0.490509033203125, 0.5216064453125, 0.552703857421875, 0.58380126953125, 0.614898681640625, 0.64599609375, 0.677093505859375, 0.70819091796875, 0.739288330078125, 0.7703857421875, 0.801483154296875, 0.83258056640625, 0.863677978515625, 0.894775390625, 0.925872802734375, 0.95697021484375, 0.988067626953125, 1.0191650390625, 1.050262451171875, 1.08135986328125, 1.112457275390625, 1.1435546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 12.0, 9.0, 16.0, 24.0, 16.0, 26.0, 30.0, 24.0, 43.0, 39.0, 38.0, 49.0, 56.0, 53.0, 50.0, 53.0, 48.0, 51.0, 48.0, 37.0, 45.0, 32.0, 33.0, 26.0, 21.0, 25.0, 9.0, 19.0, 8.0, 12.0, 10.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.0845947265625, -2.024658203125, -1.9647216796875, -1.90478515625, -1.8448486328125, -1.784912109375, -1.7249755859375, -1.6650390625, -1.6051025390625, -1.545166015625, -1.4852294921875, -1.42529296875, -1.3653564453125, -1.305419921875, -1.2454833984375, -1.185546875, -1.1256103515625, -1.065673828125, -1.0057373046875, -0.94580078125, -0.8858642578125, -0.825927734375, -0.7659912109375, -0.7060546875, -0.6461181640625, -0.586181640625, -0.5262451171875, -0.46630859375, -0.4063720703125, -0.346435546875, -0.2864990234375, -0.2265625, -0.1666259765625, -0.106689453125, -0.0467529296875, 0.01318359375, 0.0731201171875, 0.133056640625, 0.1929931640625, 0.2529296875, 0.3128662109375, 0.372802734375, 0.4327392578125, 0.49267578125, 0.5526123046875, 0.612548828125, 0.6724853515625, 0.732421875, 0.7923583984375, 0.852294921875, 0.9122314453125, 0.97216796875, 1.0321044921875, 1.092041015625, 1.1519775390625, 1.2119140625, 1.2718505859375, 1.331787109375, 1.3917236328125, 1.45166015625, 1.5115966796875, 1.571533203125, 1.6314697265625, 1.69140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 9.0, 6.0, 10.0, 12.0, 27.0, 31.0, 47.0, 77.0, 88.0, 143.0, 270.0, 487.0, 825.0, 1511.0, 3226.0, 7423.0, 20270.0, 70811.0, 331725.0, 459063.0, 106544.0, 27820.0, 9849.0, 4017.0, 1872.0, 941.0, 583.0, 329.0, 186.0, 128.0, 79.0, 54.0, 20.0, 24.0, 14.0, 11.0, 10.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1778564453125, -0.17248916625976562, -0.16712188720703125, -0.16175460815429688, -0.1563873291015625, -0.15102005004882812, -0.14565277099609375, -0.14028549194335938, -0.134918212890625, -0.12955093383789062, -0.12418365478515625, -0.11881637573242188, -0.1134490966796875, -0.10808181762695312, -0.10271453857421875, -0.09734725952148438, -0.09197998046875, -0.08661270141601562, -0.08124542236328125, -0.07587814331054688, -0.0705108642578125, -0.06514358520507812, -0.05977630615234375, -0.054409027099609375, -0.049041748046875, -0.043674468994140625, -0.03830718994140625, -0.032939910888671875, -0.0275726318359375, -0.022205352783203125, -0.01683807373046875, -0.011470794677734375, -0.006103515625, -0.000736236572265625, 0.00463104248046875, 0.009998321533203125, 0.0153656005859375, 0.020732879638671875, 0.02610015869140625, 0.031467437744140625, 0.036834716796875, 0.042201995849609375, 0.04756927490234375, 0.052936553955078125, 0.0583038330078125, 0.06367111206054688, 0.06903839111328125, 0.07440567016601562, 0.07977294921875, 0.08514022827148438, 0.09050750732421875, 0.09587478637695312, 0.1012420654296875, 0.10660934448242188, 0.11197662353515625, 0.11734390258789062, 0.122711181640625, 0.12807846069335938, 0.13344573974609375, 0.13881301879882812, 0.1441802978515625, 0.14954757690429688, 0.15491485595703125, 0.16028213500976562, 0.1656494140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 5.0, 8.0, 9.0, 17.0, 24.0, 39.0, 62.0, 91.0, 109.0, 149.0, 146.0, 103.0, 72.0, 35.0, 37.0, 24.0, 15.0, 11.0, 9.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.749961853027344e-05, -8.497387170791626e-05, -8.244812488555908e-05, -7.99223780632019e-05, -7.739663124084473e-05, -7.487088441848755e-05, -7.234513759613037e-05, -6.98193907737732e-05, -6.729364395141602e-05, -6.476789712905884e-05, -6.224215030670166e-05, -5.971640348434448e-05, -5.7190656661987305e-05, -5.466490983963013e-05, -5.213916301727295e-05, -4.961341619491577e-05, -4.7087669372558594e-05, -4.4561922550201416e-05, -4.203617572784424e-05, -3.951042890548706e-05, -3.698468208312988e-05, -3.4458935260772705e-05, -3.193318843841553e-05, -2.940744161605835e-05, -2.6881694793701172e-05, -2.4355947971343994e-05, -2.1830201148986816e-05, -1.930445432662964e-05, -1.677870750427246e-05, -1.4252960681915283e-05, -1.1727213859558105e-05, -9.201467037200928e-06, -6.67572021484375e-06, -4.149973392486572e-06, -1.6242265701293945e-06, 9.015202522277832e-07, 3.427267074584961e-06, 5.953013896942139e-06, 8.478760719299316e-06, 1.1004507541656494e-05, 1.3530254364013672e-05, 1.605600118637085e-05, 1.8581748008728027e-05, 2.1107494831085205e-05, 2.3633241653442383e-05, 2.615898847579956e-05, 2.8684735298156738e-05, 3.1210482120513916e-05, 3.3736228942871094e-05, 3.626197576522827e-05, 3.878772258758545e-05, 4.131346940994263e-05, 4.3839216232299805e-05, 4.636496305465698e-05, 4.889070987701416e-05, 5.141645669937134e-05, 5.3942203521728516e-05, 5.646795034408569e-05, 5.899369716644287e-05, 6.151944398880005e-05, 6.404519081115723e-05, 6.65709376335144e-05, 6.909668445587158e-05, 7.162243127822876e-05, 7.414817810058594e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 4.0, 8.0, 9.0, 8.0, 15.0, 21.0, 25.0, 47.0, 84.0, 123.0, 244.0, 574.0, 1387.0, 4112.0, 14092.0, 62056.0, 436201.0, 445198.0, 62993.0, 14229.0, 4465.0, 1477.0, 580.0, 237.0, 133.0, 74.0, 52.0, 22.0, 34.0, 13.0, 12.0, 5.0, 4.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.30810546875, -0.29977989196777344, -0.2914543151855469, -0.2831287384033203, -0.27480316162109375, -0.2664775848388672, -0.2581520080566406, -0.24982643127441406, -0.2415008544921875, -0.23317527770996094, -0.22484970092773438, -0.2165241241455078, -0.20819854736328125, -0.1998729705810547, -0.19154739379882812, -0.18322181701660156, -0.174896240234375, -0.16657066345214844, -0.15824508666992188, -0.1499195098876953, -0.14159393310546875, -0.1332683563232422, -0.12494277954101562, -0.11661720275878906, -0.1082916259765625, -0.09996604919433594, -0.09164047241210938, -0.08331489562988281, -0.07498931884765625, -0.06666374206542969, -0.058338165283203125, -0.05001258850097656, -0.04168701171875, -0.03336143493652344, -0.025035858154296875, -0.016710281372070312, -0.00838470458984375, -5.91278076171875e-05, 0.008266448974609375, 0.016592025756835938, 0.0249176025390625, 0.03324317932128906, 0.041568756103515625, 0.04989433288574219, 0.05821990966796875, 0.06654548645019531, 0.07487106323242188, 0.08319664001464844, 0.091522216796875, 0.09984779357910156, 0.10817337036132812, 0.11649894714355469, 0.12482452392578125, 0.1331501007080078, 0.14147567749023438, 0.14980125427246094, 0.1581268310546875, 0.16645240783691406, 0.17477798461914062, 0.1831035614013672, 0.19142913818359375, 0.1997547149658203, 0.20808029174804688, 0.21640586853027344, 0.2247314453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 12.0, 5.0, 17.0, 14.0, 24.0, 24.0, 31.0, 43.0, 46.0, 45.0, 76.0, 52.0, 86.0, 71.0, 78.0, 82.0, 55.0, 46.0, 33.0, 23.0, 23.0, 24.0, 13.0, 13.0, 13.0, 7.0, 5.0, 3.0, 6.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046783447265625, -0.04524421691894531, -0.043704986572265625, -0.04216575622558594, -0.04062652587890625, -0.03908729553222656, -0.037548065185546875, -0.03600883483886719, -0.0344696044921875, -0.03293037414550781, -0.031391143798828125, -0.029851913452148438, -0.02831268310546875, -0.026773452758789062, -0.025234222412109375, -0.023694992065429688, -0.02215576171875, -0.020616531372070312, -0.019077301025390625, -0.017538070678710938, -0.01599884033203125, -0.014459609985351562, -0.012920379638671875, -0.011381149291992188, -0.0098419189453125, -0.008302688598632812, -0.006763458251953125, -0.0052242279052734375, -0.00368499755859375, -0.0021457672119140625, -0.000606536865234375, 0.0009326934814453125, 0.002471923828125, 0.0040111541748046875, 0.005550384521484375, 0.0070896148681640625, 0.00862884521484375, 0.010168075561523438, 0.011707305908203125, 0.013246536254882812, 0.0147857666015625, 0.016324996948242188, 0.017864227294921875, 0.019403457641601562, 0.02094268798828125, 0.022481918334960938, 0.024021148681640625, 0.025560379028320312, 0.027099609375, 0.028638839721679688, 0.030178070068359375, 0.03171730041503906, 0.03325653076171875, 0.03479576110839844, 0.036334991455078125, 0.03787422180175781, 0.0394134521484375, 0.04095268249511719, 0.042491912841796875, 0.04403114318847656, 0.04557037353515625, 0.04710960388183594, 0.048648834228515625, 0.05018806457519531, 0.051727294921875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 9.0, 13.0, 17.0, 32.0, 41.0, 53.0, 58.0, 108.0, 118.0, 142.0, 106.0, 94.0, 62.0, 50.0, 32.0, 25.0, 22.0, 7.0, 10.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9193627834320068, -1.8680018186569214, -1.8166407346725464, -1.765279769897461, -1.7139188051223755, -1.66255784034729, -1.611196756362915, -1.5598357915878296, -1.5084748268127441, -1.4571138620376587, -1.4057527780532837, -1.3543918132781982, -1.3030308485031128, -1.2516698837280273, -1.2003087997436523, -1.148947834968567, -1.097586750984192, -1.0462257862091064, -0.9948647618293762, -0.943503737449646, -0.8921427726745605, -0.8407817482948303, -0.7894207239151001, -0.7380597591400146, -0.6866987347602844, -0.6353377103805542, -0.5839767456054688, -0.5326157212257385, -0.4812547266483307, -0.42989373207092285, -0.3785327076911926, -0.3271717131137848, -0.27581071853637695, -0.22444972395896912, -0.17308871448040009, -0.12172770500183105, -0.07036671042442322, -0.01900571584701538, 0.032355308532714844, 0.08371630311012268, 0.13507729768753052, 0.18643829226493835, 0.23779930174350739, 0.2891603112220764, 0.34052130579948425, 0.3918823003768921, 0.4432433247566223, 0.49460431933403015, 0.545965313911438, 0.5973263382911682, 0.6486873030662537, 0.7000483274459839, 0.7514092922210693, 0.8027703166007996, 0.8541313409805298, 0.9054923057556152, 0.9568533301353455, 1.0082143545150757, 1.0595753192901611, 1.1109364032745361, 1.1622973680496216, 1.213658332824707, 1.265019416809082, 1.3163803815841675, 1.367741346359253]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 4.0, 10.0, 9.0, 8.0, 19.0, 17.0, 13.0, 23.0, 17.0, 26.0, 44.0, 34.0, 42.0, 48.0, 46.0, 47.0, 46.0, 45.0, 46.0, 45.0, 41.0, 47.0, 40.0, 37.0, 32.0, 30.0, 36.0, 32.0, 17.0, 23.0, 17.0, 10.0, 12.0, 9.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8063705563545227, -0.7802299857139587, -0.75408935546875, -0.727948784828186, -0.7018081545829773, -0.6756675839424133, -0.6495269536972046, -0.6233863830566406, -0.5972458124160767, -0.5711052417755127, -0.544964611530304, -0.51882404088974, -0.49268341064453125, -0.4665428400039673, -0.44040223956108093, -0.4142616391181946, -0.38812100887298584, -0.3619804084300995, -0.33583980798721313, -0.30969923734664917, -0.28355860710144043, -0.25741803646087646, -0.2312774360179901, -0.20513683557510376, -0.1789962351322174, -0.15285563468933105, -0.1267150342464447, -0.10057444870471954, -0.07443384826183319, -0.04829324781894684, -0.02215266227722168, 0.003987938165664673, 0.03012847900390625, 0.056269075721502304, 0.08240967243909836, 0.10855026543140411, 0.13469086587429047, 0.16083146631717682, 0.18697205185890198, 0.21311265230178833, 0.23925325274467468, 0.26539385318756104, 0.2915344536304474, 0.31767505407333374, 0.3438156247138977, 0.36995625495910645, 0.3960968255996704, 0.42223742604255676, 0.4483780264854431, 0.47451862692832947, 0.5006592273712158, 0.5267997980117798, 0.5529404282569885, 0.5790809988975525, 0.6052216291427612, 0.6313621997833252, 0.6575027704238892, 0.6836433410644531, 0.7097839713096619, 0.7359245419502258, 0.7620651721954346, 0.7882057428359985, 0.8143463134765625, 0.8404869437217712, 0.86662757396698]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 6.0, 11.0, 5.0, 15.0, 9.0, 21.0, 20.0, 23.0, 35.0, 52.0, 84.0, 92.0, 169.0, 237.0, 360.0, 611.0, 1092.0, 2245.0, 4899.0, 11218.0, 29642.0, 87474.0, 385766.0, 386464.0, 87394.0, 29306.0, 11454.0, 4805.0, 2203.0, 1085.0, 625.0, 375.0, 221.0, 167.0, 103.0, 81.0, 37.0, 35.0, 25.0, 28.0, 16.0, 10.0, 10.0, 10.0, 9.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7197265625, -0.6930694580078125, -0.666412353515625, -0.6397552490234375, -0.61309814453125, -0.5864410400390625, -0.559783935546875, -0.5331268310546875, -0.5064697265625, -0.4798126220703125, -0.453155517578125, -0.4264984130859375, -0.39984130859375, -0.3731842041015625, -0.346527099609375, -0.3198699951171875, -0.293212890625, -0.2665557861328125, -0.239898681640625, -0.2132415771484375, -0.18658447265625, -0.1599273681640625, -0.133270263671875, -0.1066131591796875, -0.0799560546875, -0.0532989501953125, -0.026641845703125, 1.52587890625e-05, 0.02667236328125, 0.0533294677734375, 0.079986572265625, 0.1066436767578125, 0.13330078125, 0.1599578857421875, 0.186614990234375, 0.2132720947265625, 0.23992919921875, 0.2665863037109375, 0.293243408203125, 0.3199005126953125, 0.3465576171875, 0.3732147216796875, 0.399871826171875, 0.4265289306640625, 0.45318603515625, 0.4798431396484375, 0.506500244140625, 0.5331573486328125, 0.559814453125, 0.5864715576171875, 0.613128662109375, 0.6397857666015625, 0.66644287109375, 0.6930999755859375, 0.719757080078125, 0.7464141845703125, 0.7730712890625, 0.7997283935546875, 0.826385498046875, 0.8530426025390625, 0.87969970703125, 0.9063568115234375, 0.933013916015625, 0.9596710205078125, 0.986328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 10.0, 12.0, 16.0, 17.0, 25.0, 17.0, 30.0, 14.0, 34.0, 38.0, 47.0, 55.0, 49.0, 49.0, 42.0, 52.0, 39.0, 46.0, 42.0, 42.0, 32.0, 39.0, 38.0, 41.0, 30.0, 21.0, 21.0, 19.0, 10.0, 14.0, 6.0, 9.0, 4.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5869140625, -1.538177490234375, -1.48944091796875, -1.440704345703125, -1.3919677734375, -1.343231201171875, -1.29449462890625, -1.245758056640625, -1.197021484375, -1.148284912109375, -1.09954833984375, -1.050811767578125, -1.0020751953125, -0.953338623046875, -0.90460205078125, -0.855865478515625, -0.80712890625, -0.758392333984375, -0.70965576171875, -0.660919189453125, -0.6121826171875, -0.563446044921875, -0.51470947265625, -0.465972900390625, -0.417236328125, -0.368499755859375, -0.31976318359375, -0.271026611328125, -0.2222900390625, -0.173553466796875, -0.12481689453125, -0.076080322265625, -0.02734375, 0.021392822265625, 0.07012939453125, 0.118865966796875, 0.1676025390625, 0.216339111328125, 0.26507568359375, 0.313812255859375, 0.362548828125, 0.411285400390625, 0.46002197265625, 0.508758544921875, 0.5574951171875, 0.606231689453125, 0.65496826171875, 0.703704833984375, 0.75244140625, 0.801177978515625, 0.84991455078125, 0.898651123046875, 0.9473876953125, 0.996124267578125, 1.04486083984375, 1.093597412109375, 1.142333984375, 1.191070556640625, 1.23980712890625, 1.288543701171875, 1.3372802734375, 1.386016845703125, 1.43475341796875, 1.483489990234375, 1.5322265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 6.0, 2.0, 6.0, 4.0, 3.0, 7.0, 11.0, 19.0, 16.0, 26.0, 27.0, 45.0, 57.0, 100.0, 163.0, 373.0, 885.0, 8394.0, 731791.0, 300175.0, 4954.0, 702.0, 311.0, 147.0, 87.0, 59.0, 42.0, 33.0, 31.0, 25.0, 9.0, 10.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.96484375, -3.854461669921875, -3.74407958984375, -3.633697509765625, -3.5233154296875, -3.412933349609375, -3.30255126953125, -3.192169189453125, -3.081787109375, -2.971405029296875, -2.86102294921875, -2.750640869140625, -2.6402587890625, -2.529876708984375, -2.41949462890625, -2.309112548828125, -2.19873046875, -2.088348388671875, -1.97796630859375, -1.867584228515625, -1.7572021484375, -1.646820068359375, -1.53643798828125, -1.426055908203125, -1.315673828125, -1.205291748046875, -1.09490966796875, -0.984527587890625, -0.8741455078125, -0.763763427734375, -0.65338134765625, -0.542999267578125, -0.4326171875, -0.322235107421875, -0.21185302734375, -0.101470947265625, 0.0089111328125, 0.119293212890625, 0.22967529296875, 0.340057373046875, 0.450439453125, 0.560821533203125, 0.67120361328125, 0.781585693359375, 0.8919677734375, 1.002349853515625, 1.11273193359375, 1.223114013671875, 1.33349609375, 1.443878173828125, 1.55426025390625, 1.664642333984375, 1.7750244140625, 1.885406494140625, 1.99578857421875, 2.106170654296875, 2.216552734375, 2.326934814453125, 2.43731689453125, 2.547698974609375, 2.6580810546875, 2.768463134765625, 2.87884521484375, 2.989227294921875, 3.099609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 5.0, 4.0, 9.0, 10.0, 11.0, 12.0, 7.0, 9.0, 11.0, 16.0, 30.0, 35.0, 34.0, 39.0, 42.0, 36.0, 40.0, 56.0, 51.0, 66.0, 47.0, 46.0, 48.0, 38.0, 49.0, 47.0, 31.0, 34.0, 18.0, 13.0, 23.0, 19.0, 15.0, 10.0, 9.0, 8.0, 3.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.080078125, -2.0183258056640625, -1.956573486328125, -1.8948211669921875, -1.83306884765625, -1.7713165283203125, -1.709564208984375, -1.6478118896484375, -1.5860595703125, -1.5243072509765625, -1.462554931640625, -1.4008026123046875, -1.33905029296875, -1.2772979736328125, -1.215545654296875, -1.1537933349609375, -1.092041015625, -1.0302886962890625, -0.968536376953125, -0.9067840576171875, -0.84503173828125, -0.7832794189453125, -0.721527099609375, -0.6597747802734375, -0.5980224609375, -0.5362701416015625, -0.474517822265625, -0.4127655029296875, -0.35101318359375, -0.2892608642578125, -0.227508544921875, -0.1657562255859375, -0.10400390625, -0.0422515869140625, 0.019500732421875, 0.0812530517578125, 0.14300537109375, 0.2047576904296875, 0.266510009765625, 0.3282623291015625, 0.3900146484375, 0.4517669677734375, 0.513519287109375, 0.5752716064453125, 0.63702392578125, 0.6987762451171875, 0.760528564453125, 0.8222808837890625, 0.884033203125, 0.9457855224609375, 1.007537841796875, 1.0692901611328125, 1.13104248046875, 1.1927947998046875, 1.254547119140625, 1.3162994384765625, 1.3780517578125, 1.4398040771484375, 1.501556396484375, 1.5633087158203125, 1.62506103515625, 1.6868133544921875, 1.748565673828125, 1.8103179931640625, 1.8720703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 3.0, 6.0, 0.0, 5.0, 7.0, 9.0, 18.0, 14.0, 18.0, 29.0, 40.0, 63.0, 74.0, 158.0, 266.0, 486.0, 1154.0, 3570.0, 15344.0, 101234.0, 701830.0, 191129.0, 24916.0, 5225.0, 1532.0, 601.0, 293.0, 134.0, 95.0, 75.0, 49.0, 32.0, 35.0, 34.0, 17.0, 14.0, 9.0, 11.0, 2.0, 5.0, 2.0, 7.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.325439453125, -0.31446075439453125, -0.3034820556640625, -0.29250335693359375, -0.281524658203125, -0.27054595947265625, -0.2595672607421875, -0.24858856201171875, -0.23760986328125, -0.22663116455078125, -0.2156524658203125, -0.20467376708984375, -0.193695068359375, -0.18271636962890625, -0.1717376708984375, -0.16075897216796875, -0.1497802734375, -0.13880157470703125, -0.1278228759765625, -0.11684417724609375, -0.105865478515625, -0.09488677978515625, -0.0839080810546875, -0.07292938232421875, -0.06195068359375, -0.05097198486328125, -0.0399932861328125, -0.02901458740234375, -0.018035888671875, -0.00705718994140625, 0.0039215087890625, 0.01490020751953125, 0.02587890625, 0.03685760498046875, 0.0478363037109375, 0.05881500244140625, 0.069793701171875, 0.08077239990234375, 0.0917510986328125, 0.10272979736328125, 0.11370849609375, 0.12468719482421875, 0.1356658935546875, 0.14664459228515625, 0.157623291015625, 0.16860198974609375, 0.1795806884765625, 0.19055938720703125, 0.2015380859375, 0.21251678466796875, 0.2234954833984375, 0.23447418212890625, 0.245452880859375, 0.25643157958984375, 0.2674102783203125, 0.27838897705078125, 0.28936767578125, 0.30034637451171875, 0.3113250732421875, 0.32230377197265625, 0.333282470703125, 0.34426116943359375, 0.3552398681640625, 0.36621856689453125, 0.377197265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 8.0, 12.0, 10.0, 16.0, 15.0, 25.0, 43.0, 49.0, 56.0, 80.0, 106.0, 95.0, 84.0, 67.0, 56.0, 38.0, 40.0, 24.0, 42.0, 29.0, 17.0, 10.0, 16.0, 4.0, 16.0, 8.0, 6.0, 2.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.0650367736816406e-05, -3.9548613131046295e-05, -3.8446858525276184e-05, -3.734510391950607e-05, -3.624334931373596e-05, -3.514159470796585e-05, -3.403984010219574e-05, -3.293808549642563e-05, -3.183633089065552e-05, -3.0734576284885406e-05, -2.9632821679115295e-05, -2.8531067073345184e-05, -2.7429312467575073e-05, -2.6327557861804962e-05, -2.522580325603485e-05, -2.412404865026474e-05, -2.302229404449463e-05, -2.1920539438724518e-05, -2.0818784832954407e-05, -1.9717030227184296e-05, -1.8615275621414185e-05, -1.7513521015644073e-05, -1.6411766409873962e-05, -1.531001180410385e-05, -1.420825719833374e-05, -1.3106502592563629e-05, -1.2004747986793518e-05, -1.0902993381023407e-05, -9.801238775253296e-06, -8.699484169483185e-06, -7.597729563713074e-06, -6.495974957942963e-06, -5.3942203521728516e-06, -4.2924657464027405e-06, -3.1907111406326294e-06, -2.0889565348625183e-06, -9.872019290924072e-07, 1.1455267667770386e-07, 1.216307282447815e-06, 2.318061888217926e-06, 3.419816493988037e-06, 4.521571099758148e-06, 5.623325705528259e-06, 6.72508031129837e-06, 7.826834917068481e-06, 8.928589522838593e-06, 1.0030344128608704e-05, 1.1132098734378815e-05, 1.2233853340148926e-05, 1.3335607945919037e-05, 1.4437362551689148e-05, 1.553911715745926e-05, 1.664087176322937e-05, 1.774262636899948e-05, 1.8844380974769592e-05, 1.9946135580539703e-05, 2.1047890186309814e-05, 2.2149644792079926e-05, 2.3251399397850037e-05, 2.4353154003620148e-05, 2.545490860939026e-05, 2.655666321516037e-05, 2.765841782093048e-05, 2.8760172426700592e-05, 2.9861927032470703e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 9.0, 10.0, 21.0, 36.0, 61.0, 103.0, 224.0, 648.0, 2417.0, 28924.0, 915568.0, 94508.0, 4550.0, 846.0, 308.0, 144.0, 72.0, 37.0, 22.0, 8.0, 8.0, 5.0, 3.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8984375, -0.8717422485351562, -0.8450469970703125, -0.8183517456054688, -0.791656494140625, -0.7649612426757812, -0.7382659912109375, -0.7115707397460938, -0.68487548828125, -0.6581802368164062, -0.6314849853515625, -0.6047897338867188, -0.578094482421875, -0.5513992309570312, -0.5247039794921875, -0.49800872802734375, -0.4713134765625, -0.44461822509765625, -0.4179229736328125, -0.39122772216796875, -0.364532470703125, -0.33783721923828125, -0.3111419677734375, -0.28444671630859375, -0.25775146484375, -0.23105621337890625, -0.2043609619140625, -0.17766571044921875, -0.150970458984375, -0.12427520751953125, -0.0975799560546875, -0.07088470458984375, -0.044189453125, -0.01749420166015625, 0.0092010498046875, 0.03589630126953125, 0.062591552734375, 0.08928680419921875, 0.1159820556640625, 0.14267730712890625, 0.16937255859375, 0.19606781005859375, 0.2227630615234375, 0.24945831298828125, 0.276153564453125, 0.30284881591796875, 0.3295440673828125, 0.35623931884765625, 0.3829345703125, 0.40962982177734375, 0.4363250732421875, 0.46302032470703125, 0.489715576171875, 0.5164108276367188, 0.5431060791015625, 0.5698013305664062, 0.59649658203125, 0.6231918334960938, 0.6498870849609375, 0.6765823364257812, 0.703277587890625, 0.7299728393554688, 0.7566680908203125, 0.7833633422851562, 0.81005859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 7.0, 18.0, 17.0, 35.0, 65.0, 99.0, 180.0, 274.0, 119.0, 69.0, 40.0, 19.0, 17.0, 12.0, 12.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.35791015625, -0.34827423095703125, -0.3386383056640625, -0.32900238037109375, -0.319366455078125, -0.30973052978515625, -0.3000946044921875, -0.29045867919921875, -0.28082275390625, -0.27118682861328125, -0.2615509033203125, -0.25191497802734375, -0.242279052734375, -0.23264312744140625, -0.2230072021484375, -0.21337127685546875, -0.2037353515625, -0.19409942626953125, -0.1844635009765625, -0.17482757568359375, -0.165191650390625, -0.15555572509765625, -0.1459197998046875, -0.13628387451171875, -0.12664794921875, -0.11701202392578125, -0.1073760986328125, -0.09774017333984375, -0.088104248046875, -0.07846832275390625, -0.0688323974609375, -0.05919647216796875, -0.049560546875, -0.03992462158203125, -0.0302886962890625, -0.02065277099609375, -0.011016845703125, -0.00138092041015625, 0.0082550048828125, 0.01789093017578125, 0.02752685546875, 0.03716278076171875, 0.0467987060546875, 0.05643463134765625, 0.066070556640625, 0.07570648193359375, 0.0853424072265625, 0.09497833251953125, 0.1046142578125, 0.11425018310546875, 0.1238861083984375, 0.13352203369140625, 0.143157958984375, 0.15279388427734375, 0.1624298095703125, 0.17206573486328125, 0.18170166015625, 0.19133758544921875, 0.2009735107421875, 0.21060943603515625, 0.220245361328125, 0.22988128662109375, 0.2395172119140625, 0.24915313720703125, 0.2587890625]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 18.0, 55.0, 120.0, 208.0, 268.0, 188.0, 102.0, 34.0, 16.0, 5.0], "bins": [-13.263665199279785, -13.036294937133789, -12.808924674987793, -12.581554412841797, -12.3541841506958, -12.126813888549805, -11.899443626403809, -11.672073364257812, -11.444703102111816, -11.21733283996582, -10.989962577819824, -10.762592315673828, -10.535222053527832, -10.307851791381836, -10.08048152923584, -9.853111267089844, -9.625741004943848, -9.398370742797852, -9.171000480651855, -8.94363021850586, -8.716259956359863, -8.488889694213867, -8.261519432067871, -8.034149169921875, -7.806778907775879, -7.579408645629883, -7.352038383483887, -7.124668121337891, -6.8972978591918945, -6.669927597045898, -6.442557334899902, -6.215187072753906, -5.987817287445068, -5.760447025299072, -5.533076763153076, -5.30570650100708, -5.078336238861084, -4.850965976715088, -4.623595714569092, -4.396225452423096, -4.1688551902771, -3.9414849281311035, -3.7141146659851074, -3.4867444038391113, -3.2593741416931152, -3.032003879547119, -2.804633617401123, -2.577263355255127, -2.349893093109131, -2.1225228309631348, -1.8951525688171387, -1.6677823066711426, -1.4404120445251465, -1.2130417823791504, -0.9856715202331543, -0.7583012580871582, -0.5309308767318726, -0.30356061458587646, -0.07619035243988037, 0.15117990970611572, 0.3785501718521118, 0.6059204339981079, 0.833290696144104, 1.0606609582901, 1.2880312204360962]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 3.0, 9.0, 11.0, 12.0, 13.0, 8.0, 28.0, 27.0, 26.0, 29.0, 42.0, 28.0, 33.0, 29.0, 42.0, 42.0, 45.0, 44.0, 30.0, 41.0, 44.0, 32.0, 50.0, 35.0, 31.0, 41.0, 34.0, 19.0, 24.0, 26.0, 22.0, 16.0, 11.0, 15.0, 11.0, 9.0, 8.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.86728572845459, -2.7767083644866943, -2.686131000518799, -2.5955538749694824, -2.504976511001587, -2.4143991470336914, -2.323822021484375, -2.2332446575164795, -2.142667293548584, -2.0520899295806885, -1.9615126848220825, -1.8709354400634766, -1.780358076095581, -1.6897807121276855, -1.5992034673690796, -1.5086262226104736, -1.4180488586425781, -1.3274714946746826, -1.2368942499160767, -1.1463170051574707, -1.0557396411895752, -0.9651623368263245, -0.8745850324630737, -0.784007728099823, -0.6934304237365723, -0.6028531193733215, -0.5122758150100708, -0.42169851064682007, -0.33112120628356934, -0.2405439019203186, -0.14996659755706787, -0.05938929319381714, 0.031188011169433594, 0.12176531553268433, 0.21234261989593506, 0.3029199242591858, 0.3934972286224365, 0.48407453298568726, 0.574651837348938, 0.6652291417121887, 0.7558064460754395, 0.8463837504386902, 0.9369610548019409, 1.0275382995605469, 1.1181156635284424, 1.208693027496338, 1.2992702722549438, 1.3898475170135498, 1.4804248809814453, 1.5710022449493408, 1.6615794897079468, 1.7521567344665527, 1.8427340984344482, 1.9333114624023438, 2.02388858795166, 2.1144659519195557, 2.205043315887451, 2.2956206798553467, 2.386198043823242, 2.4767751693725586, 2.567352533340454, 2.6579298973083496, 2.748507022857666, 2.8390843868255615, 2.929661750793457]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 6.0, 7.0, 10.0, 8.0, 12.0, 12.0, 16.0, 13.0, 30.0, 32.0, 48.0, 48.0, 83.0, 103.0, 132.0, 201.0, 300.0, 540.0, 902.0, 2011.0, 4915.0, 15344.0, 71477.0, 659501.0, 2591482.0, 740040.0, 81336.0, 16097.0, 4970.0, 2032.0, 984.0, 508.0, 315.0, 206.0, 151.0, 107.0, 75.0, 49.0, 49.0, 35.0, 14.0, 24.0, 15.0, 7.0, 9.0, 7.0, 13.0, 2.0, 6.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.5595703125, -1.510101318359375, -1.46063232421875, -1.411163330078125, -1.3616943359375, -1.312225341796875, -1.26275634765625, -1.213287353515625, -1.163818359375, -1.114349365234375, -1.06488037109375, -1.015411376953125, -0.9659423828125, -0.916473388671875, -0.86700439453125, -0.817535400390625, -0.76806640625, -0.718597412109375, -0.66912841796875, -0.619659423828125, -0.5701904296875, -0.520721435546875, -0.47125244140625, -0.421783447265625, -0.372314453125, -0.322845458984375, -0.27337646484375, -0.223907470703125, -0.1744384765625, -0.124969482421875, -0.07550048828125, -0.026031494140625, 0.0234375, 0.072906494140625, 0.12237548828125, 0.171844482421875, 0.2213134765625, 0.270782470703125, 0.32025146484375, 0.369720458984375, 0.419189453125, 0.468658447265625, 0.51812744140625, 0.567596435546875, 0.6170654296875, 0.666534423828125, 0.71600341796875, 0.765472412109375, 0.81494140625, 0.864410400390625, 0.91387939453125, 0.963348388671875, 1.0128173828125, 1.062286376953125, 1.11175537109375, 1.161224365234375, 1.210693359375, 1.260162353515625, 1.30963134765625, 1.359100341796875, 1.4085693359375, 1.458038330078125, 1.50750732421875, 1.556976318359375, 1.6064453125]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 13.0, 7.0, 7.0, 13.0, 21.0, 25.0, 36.0, 35.0, 33.0, 49.0, 38.0, 57.0, 50.0, 64.0, 53.0, 59.0, 52.0, 51.0, 36.0, 39.0, 45.0, 39.0, 27.0, 24.0, 31.0, 21.0, 19.0, 11.0, 9.0, 8.0, 4.0, 4.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1142578125, -1.0802154541015625, -1.046173095703125, -1.0121307373046875, -0.97808837890625, -0.9440460205078125, -0.910003662109375, -0.8759613037109375, -0.8419189453125, -0.8078765869140625, -0.773834228515625, -0.7397918701171875, -0.70574951171875, -0.6717071533203125, -0.637664794921875, -0.6036224365234375, -0.569580078125, -0.5355377197265625, -0.501495361328125, -0.4674530029296875, -0.43341064453125, -0.3993682861328125, -0.365325927734375, -0.3312835693359375, -0.2972412109375, -0.2631988525390625, -0.229156494140625, -0.1951141357421875, -0.16107177734375, -0.1270294189453125, -0.092987060546875, -0.0589447021484375, -0.02490234375, 0.0091400146484375, 0.043182373046875, 0.0772247314453125, 0.11126708984375, 0.1453094482421875, 0.179351806640625, 0.2133941650390625, 0.2474365234375, 0.2814788818359375, 0.315521240234375, 0.3495635986328125, 0.38360595703125, 0.4176483154296875, 0.451690673828125, 0.4857330322265625, 0.519775390625, 0.5538177490234375, 0.587860107421875, 0.6219024658203125, 0.65594482421875, 0.6899871826171875, 0.724029541015625, 0.7580718994140625, 0.7921142578125, 0.8261566162109375, 0.860198974609375, 0.8942413330078125, 0.92828369140625, 0.9623260498046875, 0.996368408203125, 1.0304107666015625, 1.064453125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 5.0, 2.0, 9.0, 16.0, 9.0, 28.0, 24.0, 46.0, 82.0, 124.0, 213.0, 443.0, 1183.0, 4600.0, 26871.0, 540900.0, 3507103.0, 98298.0, 10677.0, 2264.0, 694.0, 302.0, 165.0, 73.0, 51.0, 32.0, 25.0, 10.0, 5.0, 6.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.962890625, -2.871063232421875, -2.77923583984375, -2.687408447265625, -2.5955810546875, -2.503753662109375, -2.41192626953125, -2.320098876953125, -2.228271484375, -2.136444091796875, -2.04461669921875, -1.952789306640625, -1.8609619140625, -1.769134521484375, -1.67730712890625, -1.585479736328125, -1.49365234375, -1.401824951171875, -1.30999755859375, -1.218170166015625, -1.1263427734375, -1.034515380859375, -0.94268798828125, -0.850860595703125, -0.759033203125, -0.667205810546875, -0.57537841796875, -0.483551025390625, -0.3917236328125, -0.299896240234375, -0.20806884765625, -0.116241455078125, -0.0244140625, 0.067413330078125, 0.15924072265625, 0.251068115234375, 0.3428955078125, 0.434722900390625, 0.52655029296875, 0.618377685546875, 0.710205078125, 0.802032470703125, 0.89385986328125, 0.985687255859375, 1.0775146484375, 1.169342041015625, 1.26116943359375, 1.352996826171875, 1.44482421875, 1.536651611328125, 1.62847900390625, 1.720306396484375, 1.8121337890625, 1.903961181640625, 1.99578857421875, 2.087615966796875, 2.179443359375, 2.271270751953125, 2.36309814453125, 2.454925537109375, 2.5467529296875, 2.638580322265625, 2.73040771484375, 2.822235107421875, 2.9140625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 6.0, 19.0, 22.0, 21.0, 52.0, 64.0, 135.0, 212.0, 433.0, 665.0, 763.0, 634.0, 421.0, 255.0, 142.0, 76.0, 41.0, 27.0, 26.0, 11.0, 7.0, 7.0, 12.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.53814697265625, -0.5142822265625, -0.49041748046875, -0.466552734375, -0.44268798828125, -0.4188232421875, -0.39495849609375, -0.37109375, -0.34722900390625, -0.3233642578125, -0.29949951171875, -0.275634765625, -0.25177001953125, -0.2279052734375, -0.20404052734375, -0.18017578125, -0.15631103515625, -0.1324462890625, -0.10858154296875, -0.084716796875, -0.06085205078125, -0.0369873046875, -0.01312255859375, 0.0107421875, 0.03460693359375, 0.0584716796875, 0.08233642578125, 0.106201171875, 0.13006591796875, 0.1539306640625, 0.17779541015625, 0.20166015625, 0.22552490234375, 0.2493896484375, 0.27325439453125, 0.297119140625, 0.32098388671875, 0.3448486328125, 0.36871337890625, 0.392578125, 0.41644287109375, 0.4403076171875, 0.46417236328125, 0.488037109375, 0.51190185546875, 0.5357666015625, 0.55963134765625, 0.58349609375, 0.60736083984375, 0.6312255859375, 0.65509033203125, 0.678955078125, 0.70281982421875, 0.7266845703125, 0.75054931640625, 0.7744140625, 0.79827880859375, 0.8221435546875, 0.84600830078125, 0.869873046875, 0.89373779296875, 0.9176025390625, 0.94146728515625, 0.96533203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 10.0, 15.0, 15.0, 24.0, 41.0, 51.0, 66.0, 79.0, 130.0, 108.0, 103.0, 90.0, 82.0, 67.0, 46.0, 29.0, 21.0, 11.0, 9.0, 8.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.892338275909424, -2.8175418376922607, -2.7427456378936768, -2.6679491996765137, -2.5931529998779297, -2.5183565616607666, -2.4435603618621826, -2.3687639236450195, -2.2939677238464355, -2.2191712856292725, -2.1443750858306885, -2.0695786476135254, -1.9947824478149414, -1.9199861288070679, -1.8451898097991943, -1.7703933715820312, -1.6955970525741577, -1.6208007335662842, -1.5460044145584106, -1.471208095550537, -1.3964117765426636, -1.32161545753479, -1.246819019317627, -1.172022819519043, -1.0972263813018799, -1.0224300622940063, -0.9476337432861328, -0.8728374242782593, -0.7980411052703857, -0.7232447862625122, -0.6484484076499939, -0.5736520886421204, -0.49885571002960205, -0.4240593910217285, -0.349263072013855, -0.27446672320365906, -0.19967040419578552, -0.12487408518791199, -0.050077736377716064, 0.02471858263015747, 0.099514901638031, 0.17431122064590454, 0.24910755455493927, 0.323903888463974, 0.39870020747184753, 0.47349652647972107, 0.548292875289917, 0.6230891942977905, 0.6978855133056641, 0.7726818323135376, 0.8474781513214111, 0.9222744703292847, 0.9970707893371582, 1.0718671083450317, 1.1466634273529053, 1.2214598655700684, 1.2962560653686523, 1.3710523843765259, 1.4458487033843994, 1.520645022392273, 1.5954413414001465, 1.67023766040802, 1.7450339794158936, 1.8198304176330566, 1.8946267366409302]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 6.0, 9.0, 9.0, 11.0, 11.0, 16.0, 12.0, 21.0, 24.0, 18.0, 20.0, 28.0, 42.0, 27.0, 35.0, 34.0, 31.0, 54.0, 37.0, 50.0, 45.0, 41.0, 43.0, 35.0, 45.0, 42.0, 27.0, 21.0, 31.0, 24.0, 14.0, 22.0, 14.0, 10.0, 24.0, 14.0, 8.0, 11.0, 7.0, 3.0, 6.0, 5.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.1347416639328003, -1.1009100675582886, -1.0670783519744873, -1.0332467555999756, -0.9994151592254639, -0.9655835032463074, -0.9317518472671509, -0.8979202508926392, -0.8640885949134827, -0.8302569389343262, -0.7964253425598145, -0.762593686580658, -0.7287620306015015, -0.6949304342269897, -0.6610987782478333, -0.6272671222686768, -0.593435525894165, -0.5596038699150085, -0.5257722735404968, -0.49194061756134033, -0.4581089913845062, -0.4242773652076721, -0.3904457092285156, -0.3566140830516815, -0.3227824568748474, -0.2889508306980133, -0.2551192045211792, -0.2212875485420227, -0.1874559223651886, -0.1536242961883545, -0.11979265511035919, -0.08596101403236389, -0.052129387855529785, -0.018297754228115082, 0.015533879399299622, 0.049365513026714325, 0.08319714665412903, 0.11702877283096313, 0.15086041390895844, 0.18469205498695374, 0.21852368116378784, 0.25235530734062195, 0.28618693351745605, 0.32001858949661255, 0.35385021567344666, 0.38768184185028076, 0.42151349782943726, 0.45534512400627136, 0.48917675018310547, 0.523008406162262, 0.5568400025367737, 0.5906716585159302, 0.6245032548904419, 0.6583349108695984, 0.6921665668487549, 0.7259981632232666, 0.7598298192024231, 0.7936614751815796, 0.8274930715560913, 0.8613247275352478, 0.8951563835144043, 0.928987979888916, 0.9628196358680725, 0.996651291847229, 1.0304828882217407]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 10.0, 13.0, 14.0, 16.0, 20.0, 42.0, 55.0, 84.0, 111.0, 183.0, 275.0, 419.0, 587.0, 1014.0, 1655.0, 2687.0, 4726.0, 8525.0, 16409.0, 33963.0, 83649.0, 229899.0, 362409.0, 178086.0, 64651.0, 27707.0, 13716.0, 7311.0, 4065.0, 2332.0, 1388.0, 842.0, 588.0, 362.0, 267.0, 149.0, 101.0, 71.0, 34.0, 37.0, 20.0, 22.0, 5.0, 8.0, 8.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.3212890625, -0.3116607666015625, -0.302032470703125, -0.2924041748046875, -0.28277587890625, -0.2731475830078125, -0.263519287109375, -0.2538909912109375, -0.2442626953125, -0.2346343994140625, -0.225006103515625, -0.2153778076171875, -0.20574951171875, -0.1961212158203125, -0.186492919921875, -0.1768646240234375, -0.167236328125, -0.1576080322265625, -0.147979736328125, -0.1383514404296875, -0.12872314453125, -0.1190948486328125, -0.109466552734375, -0.0998382568359375, -0.0902099609375, -0.0805816650390625, -0.070953369140625, -0.0613250732421875, -0.05169677734375, -0.0420684814453125, -0.032440185546875, -0.0228118896484375, -0.01318359375, -0.0035552978515625, 0.006072998046875, 0.0157012939453125, 0.02532958984375, 0.0349578857421875, 0.044586181640625, 0.0542144775390625, 0.0638427734375, 0.0734710693359375, 0.083099365234375, 0.0927276611328125, 0.10235595703125, 0.1119842529296875, 0.121612548828125, 0.1312408447265625, 0.140869140625, 0.1504974365234375, 0.160125732421875, 0.1697540283203125, 0.17938232421875, 0.1890106201171875, 0.198638916015625, 0.2082672119140625, 0.2178955078125, 0.2275238037109375, 0.237152099609375, 0.2467803955078125, 0.25640869140625, 0.2660369873046875, 0.275665283203125, 0.2852935791015625, 0.294921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 5.0, 7.0, 2.0, 6.0, 4.0, 7.0, 14.0, 8.0, 22.0, 23.0, 30.0, 36.0, 27.0, 36.0, 38.0, 28.0, 39.0, 55.0, 52.0, 58.0, 56.0, 48.0, 37.0, 41.0, 42.0, 47.0, 38.0, 26.0, 31.0, 30.0, 17.0, 19.0, 13.0, 12.0, 11.0, 12.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.748046875, -0.7247772216796875, -0.701507568359375, -0.6782379150390625, -0.65496826171875, -0.6316986083984375, -0.608428955078125, -0.5851593017578125, -0.5618896484375, -0.5386199951171875, -0.515350341796875, -0.4920806884765625, -0.46881103515625, -0.4455413818359375, -0.422271728515625, -0.3990020751953125, -0.375732421875, -0.3524627685546875, -0.329193115234375, -0.3059234619140625, -0.28265380859375, -0.2593841552734375, -0.236114501953125, -0.2128448486328125, -0.1895751953125, -0.1663055419921875, -0.143035888671875, -0.1197662353515625, -0.09649658203125, -0.0732269287109375, -0.049957275390625, -0.0266876220703125, -0.00341796875, 0.0198516845703125, 0.043121337890625, 0.0663909912109375, 0.08966064453125, 0.1129302978515625, 0.136199951171875, 0.1594696044921875, 0.1827392578125, 0.2060089111328125, 0.229278564453125, 0.2525482177734375, 0.27581787109375, 0.2990875244140625, 0.322357177734375, 0.3456268310546875, 0.368896484375, 0.3921661376953125, 0.415435791015625, 0.4387054443359375, 0.46197509765625, 0.4852447509765625, 0.508514404296875, 0.5317840576171875, 0.5550537109375, 0.5783233642578125, 0.601593017578125, 0.6248626708984375, 0.64813232421875, 0.6714019775390625, 0.694671630859375, 0.7179412841796875, 0.7412109375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 8.0, 8.0, 13.0, 16.0, 18.0, 15.0, 24.0, 28.0, 30.0, 55.0, 81.0, 115.0, 190.0, 301.0, 458.0, 830.0, 1516.0, 2913.0, 5629.0, 12816.0, 31555.0, 99860.0, 338205.0, 373093.0, 117224.0, 36215.0, 14118.0, 6308.0, 3043.0, 1670.0, 815.0, 489.0, 270.0, 206.0, 117.0, 80.0, 49.0, 47.0, 38.0, 11.0, 21.0, 15.0, 8.0, 14.0, 8.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.366943359375, -0.356170654296875, -0.34539794921875, -0.334625244140625, -0.3238525390625, -0.313079833984375, -0.30230712890625, -0.291534423828125, -0.28076171875, -0.269989013671875, -0.25921630859375, -0.248443603515625, -0.2376708984375, -0.226898193359375, -0.21612548828125, -0.205352783203125, -0.194580078125, -0.183807373046875, -0.17303466796875, -0.162261962890625, -0.1514892578125, -0.140716552734375, -0.12994384765625, -0.119171142578125, -0.1083984375, -0.097625732421875, -0.08685302734375, -0.076080322265625, -0.0653076171875, -0.054534912109375, -0.04376220703125, -0.032989501953125, -0.022216796875, -0.011444091796875, -0.00067138671875, 0.010101318359375, 0.0208740234375, 0.031646728515625, 0.04241943359375, 0.053192138671875, 0.06396484375, 0.074737548828125, 0.08551025390625, 0.096282958984375, 0.1070556640625, 0.117828369140625, 0.12860107421875, 0.139373779296875, 0.150146484375, 0.160919189453125, 0.17169189453125, 0.182464599609375, 0.1932373046875, 0.204010009765625, 0.21478271484375, 0.225555419921875, 0.236328125, 0.247100830078125, 0.25787353515625, 0.268646240234375, 0.2794189453125, 0.290191650390625, 0.30096435546875, 0.311737060546875, 0.322509765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 3.0, 7.0, 8.0, 11.0, 7.0, 18.0, 12.0, 18.0, 22.0, 20.0, 32.0, 33.0, 46.0, 42.0, 39.0, 50.0, 51.0, 45.0, 42.0, 39.0, 44.0, 42.0, 42.0, 38.0, 30.0, 36.0, 33.0, 31.0, 15.0, 28.0, 18.0, 16.0, 10.0, 16.0, 10.0, 10.0, 6.0, 4.0, 5.0, 0.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5712890625, -1.5228118896484375, -1.474334716796875, -1.4258575439453125, -1.37738037109375, -1.3289031982421875, -1.280426025390625, -1.2319488525390625, -1.1834716796875, -1.1349945068359375, -1.086517333984375, -1.0380401611328125, -0.98956298828125, -0.9410858154296875, -0.892608642578125, -0.8441314697265625, -0.795654296875, -0.7471771240234375, -0.698699951171875, -0.6502227783203125, -0.60174560546875, -0.5532684326171875, -0.504791259765625, -0.4563140869140625, -0.4078369140625, -0.3593597412109375, -0.310882568359375, -0.2624053955078125, -0.21392822265625, -0.1654510498046875, -0.116973876953125, -0.0684967041015625, -0.02001953125, 0.0284576416015625, 0.076934814453125, 0.1254119873046875, 0.17388916015625, 0.2223663330078125, 0.270843505859375, 0.3193206787109375, 0.3677978515625, 0.4162750244140625, 0.464752197265625, 0.5132293701171875, 0.56170654296875, 0.6101837158203125, 0.658660888671875, 0.7071380615234375, 0.755615234375, 0.8040924072265625, 0.852569580078125, 0.9010467529296875, 0.94952392578125, 0.9980010986328125, 1.046478271484375, 1.0949554443359375, 1.1434326171875, 1.1919097900390625, 1.240386962890625, 1.2888641357421875, 1.33734130859375, 1.3858184814453125, 1.434295654296875, 1.4827728271484375, 1.53125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 10.0, 18.0, 14.0, 24.0, 32.0, 47.0, 67.0, 102.0, 141.0, 261.0, 341.0, 539.0, 944.0, 1616.0, 2996.0, 5921.0, 13500.0, 35536.0, 179451.0, 649091.0, 107821.0, 27655.0, 11203.0, 5026.0, 2548.0, 1402.0, 762.0, 487.0, 318.0, 212.0, 142.0, 87.0, 52.0, 47.0, 44.0, 25.0, 17.0, 14.0, 7.0, 5.0, 6.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.275390625, -0.2660179138183594, -0.25664520263671875, -0.24727249145507812, -0.2378997802734375, -0.22852706909179688, -0.21915435791015625, -0.20978164672851562, -0.200408935546875, -0.19103622436523438, -0.18166351318359375, -0.17229080200195312, -0.1629180908203125, -0.15354537963867188, -0.14417266845703125, -0.13479995727539062, -0.12542724609375, -0.11605453491210938, -0.10668182373046875, -0.09730911254882812, -0.0879364013671875, -0.07856369018554688, -0.06919097900390625, -0.059818267822265625, -0.050445556640625, -0.041072845458984375, -0.03170013427734375, -0.022327423095703125, -0.0129547119140625, -0.003582000732421875, 0.00579071044921875, 0.015163421630859375, 0.0245361328125, 0.033908843994140625, 0.04328155517578125, 0.052654266357421875, 0.0620269775390625, 0.07139968872070312, 0.08077239990234375, 0.09014511108398438, 0.099517822265625, 0.10889053344726562, 0.11826324462890625, 0.12763595581054688, 0.1370086669921875, 0.14638137817382812, 0.15575408935546875, 0.16512680053710938, 0.17449951171875, 0.18387222290039062, 0.19324493408203125, 0.20261764526367188, 0.2119903564453125, 0.22136306762695312, 0.23073577880859375, 0.24010848999023438, 0.249481201171875, 0.2588539123535156, 0.26822662353515625, 0.2775993347167969, 0.2869720458984375, 0.2963447570800781, 0.30571746826171875, 0.3150901794433594, 0.324462890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 1.0, 6.0, 11.0, 13.0, 8.0, 16.0, 26.0, 60.0, 109.0, 207.0, 198.0, 154.0, 79.0, 36.0, 29.0, 10.0, 8.0, 6.0, 10.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014638900756835938, -0.00014153867959976196, -0.00013668835163116455, -0.00013183802366256714, -0.00012698769569396973, -0.00012213736772537231, -0.0001172870397567749, -0.00011243671178817749, -0.00010758638381958008, -0.00010273605585098267, -9.788572788238525e-05, -9.303539991378784e-05, -8.818507194519043e-05, -8.333474397659302e-05, -7.84844160079956e-05, -7.36340880393982e-05, -6.878376007080078e-05, -6.393343210220337e-05, -5.908310413360596e-05, -5.4232776165008545e-05, -4.938244819641113e-05, -4.453212022781372e-05, -3.968179225921631e-05, -3.4831464290618896e-05, -2.9981136322021484e-05, -2.5130808353424072e-05, -2.028048038482666e-05, -1.5430152416229248e-05, -1.0579824447631836e-05, -5.729496479034424e-06, -8.791685104370117e-07, 3.9711594581604e-06, 8.821487426757812e-06, 1.3671815395355225e-05, 1.8522143363952637e-05, 2.337247133255005e-05, 2.822279930114746e-05, 3.307312726974487e-05, 3.7923455238342285e-05, 4.27737832069397e-05, 4.762411117553711e-05, 5.247443914413452e-05, 5.7324767112731934e-05, 6.217509508132935e-05, 6.702542304992676e-05, 7.187575101852417e-05, 7.672607898712158e-05, 8.1576406955719e-05, 8.64267349243164e-05, 9.127706289291382e-05, 9.612739086151123e-05, 0.00010097771883010864, 0.00010582804679870605, 0.00011067837476730347, 0.00011552870273590088, 0.00012037903070449829, 0.0001252293586730957, 0.00013007968664169312, 0.00013493001461029053, 0.00013978034257888794, 0.00014463067054748535, 0.00014948099851608276, 0.00015433132648468018, 0.0001591816544532776, 0.000164031982421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 4.0, 11.0, 11.0, 15.0, 35.0, 52.0, 84.0, 153.0, 266.0, 589.0, 1218.0, 2864.0, 7284.0, 21310.0, 107282.0, 737428.0, 132176.0, 23938.0, 7979.0, 3136.0, 1372.0, 628.0, 314.0, 151.0, 84.0, 57.0, 32.0, 19.0, 22.0, 15.0, 9.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.55224609375, -0.5379180908203125, -0.523590087890625, -0.5092620849609375, -0.49493408203125, -0.4806060791015625, -0.466278076171875, -0.4519500732421875, -0.4376220703125, -0.4232940673828125, -0.408966064453125, -0.3946380615234375, -0.38031005859375, -0.3659820556640625, -0.351654052734375, -0.3373260498046875, -0.322998046875, -0.3086700439453125, -0.294342041015625, -0.2800140380859375, -0.26568603515625, -0.2513580322265625, -0.237030029296875, -0.2227020263671875, -0.2083740234375, -0.1940460205078125, -0.179718017578125, -0.1653900146484375, -0.15106201171875, -0.1367340087890625, -0.122406005859375, -0.1080780029296875, -0.09375, -0.0794219970703125, -0.065093994140625, -0.0507659912109375, -0.03643798828125, -0.0221099853515625, -0.007781982421875, 0.0065460205078125, 0.0208740234375, 0.0352020263671875, 0.049530029296875, 0.0638580322265625, 0.07818603515625, 0.0925140380859375, 0.106842041015625, 0.1211700439453125, 0.135498046875, 0.1498260498046875, 0.164154052734375, 0.1784820556640625, 0.19281005859375, 0.2071380615234375, 0.221466064453125, 0.2357940673828125, 0.2501220703125, 0.2644500732421875, 0.278778076171875, 0.2931060791015625, 0.30743408203125, 0.3217620849609375, 0.336090087890625, 0.3504180908203125, 0.36474609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 4.0, 4.0, 7.0, 7.0, 17.0, 12.0, 16.0, 25.0, 37.0, 66.0, 95.0, 132.0, 164.0, 129.0, 99.0, 65.0, 36.0, 24.0, 11.0, 10.0, 7.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09588623046875, -0.09227275848388672, -0.08865928649902344, -0.08504581451416016, -0.08143234252929688, -0.0778188705444336, -0.07420539855957031, -0.07059192657470703, -0.06697845458984375, -0.06336498260498047, -0.05975151062011719, -0.056138038635253906, -0.052524566650390625, -0.048911094665527344, -0.04529762268066406, -0.04168415069580078, -0.0380706787109375, -0.03445720672607422, -0.030843734741210938, -0.027230262756347656, -0.023616790771484375, -0.020003318786621094, -0.016389846801757812, -0.012776374816894531, -0.00916290283203125, -0.005549430847167969, -0.0019359588623046875, 0.0016775131225585938, 0.005290985107421875, 0.008904457092285156, 0.012517929077148438, 0.01613140106201172, 0.019744873046875, 0.02335834503173828, 0.026971817016601562, 0.030585289001464844, 0.034198760986328125, 0.037812232971191406, 0.04142570495605469, 0.04503917694091797, 0.04865264892578125, 0.05226612091064453, 0.05587959289550781, 0.059493064880371094, 0.06310653686523438, 0.06672000885009766, 0.07033348083496094, 0.07394695281982422, 0.0775604248046875, 0.08117389678955078, 0.08478736877441406, 0.08840084075927734, 0.09201431274414062, 0.0956277847290039, 0.09924125671386719, 0.10285472869873047, 0.10646820068359375, 0.11008167266845703, 0.11369514465332031, 0.1173086166381836, 0.12092208862304688, 0.12453556060791016, 0.12814903259277344, 0.13176250457763672, 0.1353759765625]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 14.0, 18.0, 31.0, 35.0, 62.0, 84.0, 135.0, 123.0, 131.0, 100.0, 95.0, 57.0, 54.0, 18.0, 25.0, 10.0, 10.0, 5.0, 0.0, 4.0], "bins": [-2.4272518157958984, -2.3806257247924805, -2.3339996337890625, -2.2873733043670654, -2.2407472133636475, -2.1941211223602295, -2.1474950313568115, -2.1008687019348145, -2.0542426109313965, -2.0076165199279785, -1.960990309715271, -1.914364218711853, -1.8677380084991455, -1.8211119174957275, -1.7744858264923096, -1.727859616279602, -1.681233525276184, -1.6346074342727661, -1.5879812240600586, -1.5413551330566406, -1.494728922843933, -1.4481028318405151, -1.4014766216278076, -1.3548505306243896, -1.3082244396209717, -1.2615983486175537, -1.2149721384048462, -1.1683460474014282, -1.1217198371887207, -1.0750937461853027, -1.0284676551818848, -0.9818414449691772, -0.9352153539657593, -0.8885892033576965, -0.8419630527496338, -0.7953369617462158, -0.7487107515335083, -0.7020846605300903, -0.6554585099220276, -0.6088323593139648, -0.5622062087059021, -0.5155800580978394, -0.4689539074897766, -0.42232778668403625, -0.3757016360759735, -0.32907548546791077, -0.2824493646621704, -0.23582321405410767, -0.18919706344604492, -0.14257091283798218, -0.09594477713108063, -0.04931864142417908, -0.002692490816116333, 0.04393365979194641, 0.09055978059768677, 0.1371859312057495, 0.18381208181381226, 0.230438232421875, 0.27706438302993774, 0.3236905038356781, 0.37031665444374084, 0.4169428050518036, 0.46356892585754395, 0.5101950764656067, 0.5568212270736694]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 7.0, 6.0, 4.0, 9.0, 10.0, 22.0, 12.0, 19.0, 24.0, 21.0, 26.0, 40.0, 38.0, 24.0, 29.0, 36.0, 27.0, 42.0, 48.0, 42.0, 45.0, 34.0, 57.0, 34.0, 36.0, 33.0, 25.0, 33.0, 33.0, 24.0, 27.0, 17.0, 17.0, 15.0, 13.0, 10.0, 11.0, 8.0, 10.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.6026099920272827, -0.5838498473167419, -0.5650897026062012, -0.5463295578956604, -0.5275694131851196, -0.5088092088699341, -0.4900490939617157, -0.47128891944885254, -0.45252877473831177, -0.433768630027771, -0.4150084853172302, -0.39624834060668945, -0.3774881660938263, -0.3587280213832855, -0.33996787667274475, -0.3212077021598816, -0.3024475872516632, -0.28368744254112244, -0.26492729783058167, -0.2461671382188797, -0.22740697860717773, -0.20864683389663696, -0.1898866891860962, -0.17112652957439423, -0.15236638486385345, -0.13360624015331268, -0.11484608054161072, -0.09608593583106995, -0.07732578366994858, -0.05856563150882721, -0.03980548679828644, -0.021045327186584473, -0.002285182476043701, 0.016474967822432518, 0.03523511812090874, 0.05399526655673981, 0.07275541871786118, 0.09151557087898254, 0.11027571558952332, 0.12903587520122528, 0.14779601991176605, 0.16655616462230682, 0.1853163242340088, 0.20407646894454956, 0.22283661365509033, 0.2415967732667923, 0.2603569030761719, 0.27911707758903503, 0.2978772222995758, 0.3166373670101166, 0.33539751172065735, 0.3541576862335205, 0.3729178309440613, 0.39167797565460205, 0.4104381203651428, 0.4291982650756836, 0.44795840978622437, 0.46671855449676514, 0.4854786992073059, 0.5042388439178467, 0.5229989886283875, 0.5417591333389282, 0.5605193376541138, 0.5792794823646545, 0.5980396270751953]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 2.0, 5.0, 3.0, 2.0, 6.0, 9.0, 16.0, 28.0, 27.0, 59.0, 76.0, 127.0, 155.0, 293.0, 439.0, 782.0, 1327.0, 2556.0, 5204.0, 10615.0, 22776.0, 56244.0, 194453.0, 467077.0, 187959.0, 54480.0, 22490.0, 10165.0, 5103.0, 2626.0, 1368.0, 804.0, 473.0, 278.0, 166.0, 125.0, 72.0, 52.0, 36.0, 24.0, 16.0, 12.0, 11.0, 4.0, 8.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.9462890625, -0.9196243286132812, -0.8929595947265625, -0.8662948608398438, -0.839630126953125, -0.8129653930664062, -0.7863006591796875, -0.7596359252929688, -0.73297119140625, -0.7063064575195312, -0.6796417236328125, -0.6529769897460938, -0.626312255859375, -0.5996475219726562, -0.5729827880859375, -0.5463180541992188, -0.5196533203125, -0.49298858642578125, -0.4663238525390625, -0.43965911865234375, -0.412994384765625, -0.38632965087890625, -0.3596649169921875, -0.33300018310546875, -0.30633544921875, -0.27967071533203125, -0.2530059814453125, -0.22634124755859375, -0.199676513671875, -0.17301177978515625, -0.1463470458984375, -0.11968231201171875, -0.093017578125, -0.06635284423828125, -0.0396881103515625, -0.01302337646484375, 0.013641357421875, 0.04030609130859375, 0.0669708251953125, 0.09363555908203125, 0.12030029296875, 0.14696502685546875, 0.1736297607421875, 0.20029449462890625, 0.226959228515625, 0.25362396240234375, 0.2802886962890625, 0.30695343017578125, 0.3336181640625, 0.36028289794921875, 0.3869476318359375, 0.41361236572265625, 0.440277099609375, 0.46694183349609375, 0.4936065673828125, 0.5202713012695312, 0.54693603515625, 0.5736007690429688, 0.6002655029296875, 0.6269302368164062, 0.653594970703125, 0.6802597045898438, 0.7069244384765625, 0.7335891723632812, 0.76025390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 3.0, 6.0, 5.0, 5.0, 10.0, 15.0, 13.0, 20.0, 22.0, 21.0, 20.0, 41.0, 32.0, 31.0, 39.0, 37.0, 42.0, 40.0, 51.0, 53.0, 40.0, 48.0, 37.0, 43.0, 42.0, 40.0, 30.0, 20.0, 30.0, 18.0, 17.0, 25.0, 17.0, 20.0, 14.0, 13.0, 10.0, 4.0, 8.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1982421875, -1.1567535400390625, -1.115264892578125, -1.0737762451171875, -1.03228759765625, -0.9907989501953125, -0.949310302734375, -0.9078216552734375, -0.8663330078125, -0.8248443603515625, -0.783355712890625, -0.7418670654296875, -0.70037841796875, -0.6588897705078125, -0.617401123046875, -0.5759124755859375, -0.534423828125, -0.4929351806640625, -0.451446533203125, -0.4099578857421875, -0.36846923828125, -0.3269805908203125, -0.285491943359375, -0.2440032958984375, -0.2025146484375, -0.1610260009765625, -0.119537353515625, -0.0780487060546875, -0.03656005859375, 0.0049285888671875, 0.046417236328125, 0.0879058837890625, 0.12939453125, 0.1708831787109375, 0.212371826171875, 0.2538604736328125, 0.29534912109375, 0.3368377685546875, 0.378326416015625, 0.4198150634765625, 0.4613037109375, 0.5027923583984375, 0.544281005859375, 0.5857696533203125, 0.62725830078125, 0.6687469482421875, 0.710235595703125, 0.7517242431640625, 0.793212890625, 0.8347015380859375, 0.876190185546875, 0.9176788330078125, 0.95916748046875, 1.0006561279296875, 1.042144775390625, 1.0836334228515625, 1.1251220703125, 1.1666107177734375, 1.208099365234375, 1.2495880126953125, 1.29107666015625, 1.3325653076171875, 1.374053955078125, 1.4155426025390625, 1.45703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 10.0, 13.0, 18.0, 23.0, 29.0, 49.0, 58.0, 76.0, 137.0, 221.0, 522.0, 1397.0, 4422.0, 17380.0, 94864.0, 677484.0, 211006.0, 30230.0, 6990.0, 2006.0, 750.0, 322.0, 165.0, 110.0, 76.0, 48.0, 38.0, 29.0, 19.0, 7.0, 11.0, 14.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.7099609375, -1.6620330810546875, -1.614105224609375, -1.5661773681640625, -1.51824951171875, -1.4703216552734375, -1.422393798828125, -1.3744659423828125, -1.3265380859375, -1.2786102294921875, -1.230682373046875, -1.1827545166015625, -1.13482666015625, -1.0868988037109375, -1.038970947265625, -0.9910430908203125, -0.943115234375, -0.8951873779296875, -0.847259521484375, -0.7993316650390625, -0.75140380859375, -0.7034759521484375, -0.655548095703125, -0.6076202392578125, -0.5596923828125, -0.5117645263671875, -0.463836669921875, -0.4159088134765625, -0.36798095703125, -0.3200531005859375, -0.272125244140625, -0.2241973876953125, -0.17626953125, -0.1283416748046875, -0.080413818359375, -0.0324859619140625, 0.01544189453125, 0.0633697509765625, 0.111297607421875, 0.1592254638671875, 0.2071533203125, 0.2550811767578125, 0.303009033203125, 0.3509368896484375, 0.39886474609375, 0.4467926025390625, 0.494720458984375, 0.5426483154296875, 0.590576171875, 0.6385040283203125, 0.686431884765625, 0.7343597412109375, 0.78228759765625, 0.8302154541015625, 0.878143310546875, 0.9260711669921875, 0.9739990234375, 1.0219268798828125, 1.069854736328125, 1.1177825927734375, 1.16571044921875, 1.2136383056640625, 1.261566162109375, 1.3094940185546875, 1.357421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 5.0, 6.0, 10.0, 11.0, 13.0, 14.0, 13.0, 16.0, 20.0, 32.0, 32.0, 38.0, 33.0, 47.0, 50.0, 65.0, 58.0, 50.0, 54.0, 59.0, 52.0, 33.0, 53.0, 38.0, 36.0, 29.0, 18.0, 27.0, 20.0, 13.0, 11.0, 10.0, 5.0, 4.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.91796875, -1.865692138671875, -1.81341552734375, -1.761138916015625, -1.7088623046875, -1.656585693359375, -1.60430908203125, -1.552032470703125, -1.499755859375, -1.447479248046875, -1.39520263671875, -1.342926025390625, -1.2906494140625, -1.238372802734375, -1.18609619140625, -1.133819580078125, -1.08154296875, -1.029266357421875, -0.97698974609375, -0.924713134765625, -0.8724365234375, -0.820159912109375, -0.76788330078125, -0.715606689453125, -0.663330078125, -0.611053466796875, -0.55877685546875, -0.506500244140625, -0.4542236328125, -0.401947021484375, -0.34967041015625, -0.297393798828125, -0.2451171875, -0.192840576171875, -0.14056396484375, -0.088287353515625, -0.0360107421875, 0.016265869140625, 0.06854248046875, 0.120819091796875, 0.173095703125, 0.225372314453125, 0.27764892578125, 0.329925537109375, 0.3822021484375, 0.434478759765625, 0.48675537109375, 0.539031982421875, 0.59130859375, 0.643585205078125, 0.69586181640625, 0.748138427734375, 0.8004150390625, 0.852691650390625, 0.90496826171875, 0.957244873046875, 1.009521484375, 1.061798095703125, 1.11407470703125, 1.166351318359375, 1.2186279296875, 1.270904541015625, 1.32318115234375, 1.375457763671875, 1.427734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 7.0, 15.0, 16.0, 27.0, 50.0, 92.0, 160.0, 337.0, 779.0, 2106.0, 7879.0, 54057.0, 653840.0, 296322.0, 25576.0, 4686.0, 1463.0, 541.0, 277.0, 137.0, 70.0, 34.0, 28.0, 15.0, 9.0, 7.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4326171875, -0.4185829162597656, -0.40454864501953125, -0.3905143737792969, -0.3764801025390625, -0.3624458312988281, -0.34841156005859375, -0.3343772888183594, -0.320343017578125, -0.3063087463378906, -0.29227447509765625, -0.2782402038574219, -0.2642059326171875, -0.2501716613769531, -0.23613739013671875, -0.22210311889648438, -0.20806884765625, -0.19403457641601562, -0.18000030517578125, -0.16596603393554688, -0.1519317626953125, -0.13789749145507812, -0.12386322021484375, -0.10982894897460938, -0.095794677734375, -0.08176040649414062, -0.06772613525390625, -0.053691864013671875, -0.0396575927734375, -0.025623321533203125, -0.01158905029296875, 0.002445220947265625, 0.0164794921875, 0.030513763427734375, 0.04454803466796875, 0.058582305908203125, 0.0726165771484375, 0.08665084838867188, 0.10068511962890625, 0.11471939086914062, 0.128753662109375, 0.14278793334960938, 0.15682220458984375, 0.17085647583007812, 0.1848907470703125, 0.19892501831054688, 0.21295928955078125, 0.22699356079101562, 0.24102783203125, 0.2550621032714844, 0.26909637451171875, 0.2831306457519531, 0.2971649169921875, 0.3111991882324219, 0.32523345947265625, 0.3392677307128906, 0.353302001953125, 0.3673362731933594, 0.38137054443359375, 0.3954048156738281, 0.4094390869140625, 0.4234733581542969, 0.43750762939453125, 0.4515419006347656, 0.465576171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 1.0, 3.0, 4.0, 11.0, 9.0, 6.0, 7.0, 9.0, 13.0, 21.0, 19.0, 34.0, 39.0, 38.0, 53.0, 66.0, 87.0, 81.0, 93.0, 65.0, 48.0, 44.0, 37.0, 44.0, 42.0, 17.0, 15.0, 15.0, 13.0, 11.0, 9.0, 8.0, 5.0, 5.0, 6.0, 2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.254413604736328e-05, -3.145821392536163e-05, -3.0372291803359985e-05, -2.9286369681358337e-05, -2.820044755935669e-05, -2.711452543735504e-05, -2.6028603315353394e-05, -2.4942681193351746e-05, -2.3856759071350098e-05, -2.277083694934845e-05, -2.1684914827346802e-05, -2.0598992705345154e-05, -1.9513070583343506e-05, -1.8427148461341858e-05, -1.734122633934021e-05, -1.6255304217338562e-05, -1.5169382095336914e-05, -1.4083459973335266e-05, -1.2997537851333618e-05, -1.191161572933197e-05, -1.0825693607330322e-05, -9.739771485328674e-06, -8.653849363327026e-06, -7.567927241325378e-06, -6.4820051193237305e-06, -5.3960829973220825e-06, -4.3101608753204346e-06, -3.2242387533187866e-06, -2.1383166313171387e-06, -1.0523945093154907e-06, 3.3527612686157227e-08, 1.1194497346878052e-06, 2.205371856689453e-06, 3.291293978691101e-06, 4.377216100692749e-06, 5.463138222694397e-06, 6.549060344696045e-06, 7.634982466697693e-06, 8.72090458869934e-06, 9.806826710700989e-06, 1.0892748832702637e-05, 1.1978670954704285e-05, 1.3064593076705933e-05, 1.415051519870758e-05, 1.5236437320709229e-05, 1.6322359442710876e-05, 1.7408281564712524e-05, 1.8494203686714172e-05, 1.958012580871582e-05, 2.0666047930717468e-05, 2.1751970052719116e-05, 2.2837892174720764e-05, 2.3923814296722412e-05, 2.500973641872406e-05, 2.6095658540725708e-05, 2.7181580662727356e-05, 2.8267502784729004e-05, 2.9353424906730652e-05, 3.04393470287323e-05, 3.152526915073395e-05, 3.2611191272735596e-05, 3.3697113394737244e-05, 3.478303551673889e-05, 3.586895763874054e-05, 3.695487976074219e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 7.0, 4.0, 14.0, 10.0, 21.0, 30.0, 33.0, 48.0, 60.0, 88.0, 158.0, 274.0, 486.0, 850.0, 1876.0, 4035.0, 11653.0, 47616.0, 317325.0, 547726.0, 87567.0, 17972.0, 5687.0, 2454.0, 1124.0, 568.0, 324.0, 165.0, 113.0, 63.0, 43.0, 37.0, 26.0, 18.0, 14.0, 17.0, 11.0, 3.0, 2.0, 3.0, 5.0, 3.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.351318359375, -0.3392753601074219, -0.32723236083984375, -0.3151893615722656, -0.3031463623046875, -0.2911033630371094, -0.27906036376953125, -0.2670173645019531, -0.254974365234375, -0.24293136596679688, -0.23088836669921875, -0.21884536743164062, -0.2068023681640625, -0.19475936889648438, -0.18271636962890625, -0.17067337036132812, -0.15863037109375, -0.14658737182617188, -0.13454437255859375, -0.12250137329101562, -0.1104583740234375, -0.09841537475585938, -0.08637237548828125, -0.07432937622070312, -0.062286376953125, -0.050243377685546875, -0.03820037841796875, -0.026157379150390625, -0.0141143798828125, -0.002071380615234375, 0.00997161865234375, 0.022014617919921875, 0.0340576171875, 0.046100616455078125, 0.05814361572265625, 0.07018661499023438, 0.0822296142578125, 0.09427261352539062, 0.10631561279296875, 0.11835861206054688, 0.130401611328125, 0.14244461059570312, 0.15448760986328125, 0.16653060913085938, 0.1785736083984375, 0.19061660766601562, 0.20265960693359375, 0.21470260620117188, 0.22674560546875, 0.23878860473632812, 0.25083160400390625, 0.2628746032714844, 0.2749176025390625, 0.2869606018066406, 0.29900360107421875, 0.3110466003417969, 0.323089599609375, 0.3351325988769531, 0.34717559814453125, 0.3592185974121094, 0.3712615966796875, 0.3833045959472656, 0.39534759521484375, 0.4073905944824219, 0.41943359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 8.0, 7.0, 12.0, 18.0, 18.0, 21.0, 24.0, 49.0, 46.0, 67.0, 68.0, 78.0, 97.0, 89.0, 67.0, 65.0, 49.0, 37.0, 33.0, 30.0, 24.0, 15.0, 13.0, 11.0, 2.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.134765625, -0.13036155700683594, -0.12595748901367188, -0.12155342102050781, -0.11714935302734375, -0.11274528503417969, -0.10834121704101562, -0.10393714904785156, -0.0995330810546875, -0.09512901306152344, -0.09072494506835938, -0.08632087707519531, -0.08191680908203125, -0.07751274108886719, -0.07310867309570312, -0.06870460510253906, -0.064300537109375, -0.05989646911621094, -0.055492401123046875, -0.05108833312988281, -0.04668426513671875, -0.04228019714355469, -0.037876129150390625, -0.03347206115722656, -0.0290679931640625, -0.024663925170898438, -0.020259857177734375, -0.015855789184570312, -0.01145172119140625, -0.0070476531982421875, -0.002643585205078125, 0.0017604827880859375, 0.00616455078125, 0.010568618774414062, 0.014972686767578125, 0.019376754760742188, 0.02378082275390625, 0.028184890747070312, 0.032588958740234375, 0.03699302673339844, 0.0413970947265625, 0.04580116271972656, 0.050205230712890625, 0.05460929870605469, 0.05901336669921875, 0.06341743469238281, 0.06782150268554688, 0.07222557067871094, 0.076629638671875, 0.08103370666503906, 0.08543777465820312, 0.08984184265136719, 0.09424591064453125, 0.09864997863769531, 0.10305404663085938, 0.10745811462402344, 0.1118621826171875, 0.11626625061035156, 0.12067031860351562, 0.1250743865966797, 0.12947845458984375, 0.1338825225830078, 0.13828659057617188, 0.14269065856933594, 0.1470947265625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 14.0, 22.0, 49.0, 79.0, 147.0, 159.0, 149.0, 125.0, 105.0, 67.0, 50.0, 12.0, 13.0, 9.0, 4.0, 2.0, 1.0, 1.0], "bins": [-6.4617156982421875, -6.337893962860107, -6.214072227478027, -6.090250492095947, -5.966428756713867, -5.842607498168945, -5.718785762786865, -5.594964027404785, -5.471142292022705, -5.347320556640625, -5.223498821258545, -5.099677085876465, -4.975855827331543, -4.852034091949463, -4.728212356567383, -4.604390621185303, -4.480568885803223, -4.356747150421143, -4.2329254150390625, -4.109103679656982, -3.9852821826934814, -3.8614604473114014, -3.7376389503479004, -3.6138172149658203, -3.4899954795837402, -3.36617374420166, -3.24235200881958, -3.118530511856079, -2.994708776473999, -2.870887041091919, -2.747065544128418, -2.623243808746338, -2.499422073364258, -2.3756003379821777, -2.2517786026000977, -2.1279571056365967, -2.0041353702545166, -1.8803136348724365, -1.756492018699646, -1.6326704025268555, -1.508848786354065, -1.3850271701812744, -1.2612054347991943, -1.1373836994171143, -1.0135620832443237, -0.8897404074668884, -0.7659187316894531, -0.6420970559120178, -0.5182753801345825, -0.3944537043571472, -0.2706320285797119, -0.1468103528022766, -0.02298867702484131, 0.100832998752594, 0.2246546745300293, 0.3484763503074646, 0.4722980260848999, 0.5961197018623352, 0.7199413776397705, 0.8437630534172058, 0.9675847291946411, 1.0914063453674316, 1.2152280807495117, 1.3390498161315918, 1.4628714323043823]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 6.0, 6.0, 12.0, 10.0, 17.0, 18.0, 15.0, 14.0, 27.0, 34.0, 36.0, 37.0, 37.0, 28.0, 50.0, 53.0, 35.0, 41.0, 40.0, 43.0, 54.0, 44.0, 36.0, 36.0, 34.0, 25.0, 36.0, 35.0, 28.0, 25.0, 14.0, 9.0, 11.0, 10.0, 12.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.384341239929199, -2.3093955516815186, -2.234449863433838, -2.1595041751861572, -2.0845584869384766, -2.009612798690796, -1.9346672296524048, -1.8597215414047241, -1.7847758531570435, -1.7098301649093628, -1.6348844766616821, -1.5599387884140015, -1.4849932193756104, -1.4100475311279297, -1.335101842880249, -1.2601561546325684, -1.1852104663848877, -1.110264778137207, -1.0353190898895264, -0.9603734612464905, -0.8854277729988098, -0.8104820847511292, -0.7355364561080933, -0.6605907678604126, -0.5856450796127319, -0.5106993913650513, -0.435753732919693, -0.3608080744743347, -0.28586238622665405, -0.2109166979789734, -0.1359710395336151, -0.061025381088256836, 0.013920307159423828, 0.0888659805059433, 0.16381165385246277, 0.23875732719898224, 0.3137030005455017, 0.3886486887931824, 0.46359434723854065, 0.5385400056838989, 0.6134856939315796, 0.6884313821792603, 0.7633770704269409, 0.8383226990699768, 0.9132683873176575, 0.9882140755653381, 1.063159704208374, 1.1381053924560547, 1.2130510807037354, 1.287996768951416, 1.3629424571990967, 1.4378881454467773, 1.512833833694458, 1.5877795219421387, 1.6627250909805298, 1.7376707792282104, 1.8126164674758911, 1.8875621557235718, 1.9625078439712524, 2.0374534130096436, 2.112399101257324, 2.187344789505005, 2.2622904777526855, 2.337236166000366, 2.412181854248047]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 5.0, 7.0, 12.0, 5.0, 16.0, 12.0, 8.0, 13.0, 29.0, 42.0, 42.0, 110.0, 208.0, 312.0, 681.0, 1583.0, 4381.0, 14957.0, 92776.0, 1474468.0, 2394435.0, 179532.0, 21512.0, 5528.0, 1955.0, 772.0, 343.0, 223.0, 110.0, 71.0, 36.0, 25.0, 23.0, 11.0, 11.0, 6.0, 5.0, 8.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9716796875, -1.91217041015625, -1.8526611328125, -1.79315185546875, -1.733642578125, -1.67413330078125, -1.6146240234375, -1.55511474609375, -1.49560546875, -1.43609619140625, -1.3765869140625, -1.31707763671875, -1.257568359375, -1.19805908203125, -1.1385498046875, -1.07904052734375, -1.01953125, -0.96002197265625, -0.9005126953125, -0.84100341796875, -0.781494140625, -0.72198486328125, -0.6624755859375, -0.60296630859375, -0.54345703125, -0.48394775390625, -0.4244384765625, -0.36492919921875, -0.305419921875, -0.24591064453125, -0.1864013671875, -0.12689208984375, -0.0673828125, -0.00787353515625, 0.0516357421875, 0.11114501953125, 0.170654296875, 0.23016357421875, 0.2896728515625, 0.34918212890625, 0.40869140625, 0.46820068359375, 0.5277099609375, 0.58721923828125, 0.646728515625, 0.70623779296875, 0.7657470703125, 0.82525634765625, 0.884765625, 0.94427490234375, 1.0037841796875, 1.06329345703125, 1.122802734375, 1.18231201171875, 1.2418212890625, 1.30133056640625, 1.36083984375, 1.42034912109375, 1.4798583984375, 1.53936767578125, 1.598876953125, 1.65838623046875, 1.7178955078125, 1.77740478515625, 1.8369140625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 7.0, 7.0, 10.0, 12.0, 18.0, 25.0, 21.0, 15.0, 22.0, 31.0, 34.0, 45.0, 28.0, 33.0, 35.0, 54.0, 41.0, 45.0, 51.0, 42.0, 41.0, 31.0, 37.0, 35.0, 34.0, 31.0, 33.0, 28.0, 24.0, 22.0, 18.0, 6.0, 17.0, 14.0, 6.0, 10.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.67724609375, -0.6538925170898438, -0.6305389404296875, -0.6071853637695312, -0.583831787109375, -0.5604782104492188, -0.5371246337890625, -0.5137710571289062, -0.49041748046875, -0.46706390380859375, -0.4437103271484375, -0.42035675048828125, -0.397003173828125, -0.37364959716796875, -0.3502960205078125, -0.32694244384765625, -0.3035888671875, -0.28023529052734375, -0.2568817138671875, -0.23352813720703125, -0.210174560546875, -0.18682098388671875, -0.1634674072265625, -0.14011383056640625, -0.11676025390625, -0.09340667724609375, -0.0700531005859375, -0.04669952392578125, -0.023345947265625, 7.62939453125e-06, 0.0233612060546875, 0.04671478271484375, 0.070068359375, 0.09342193603515625, 0.1167755126953125, 0.14012908935546875, 0.163482666015625, 0.18683624267578125, 0.2101898193359375, 0.23354339599609375, 0.25689697265625, 0.28025054931640625, 0.3036041259765625, 0.32695770263671875, 0.350311279296875, 0.37366485595703125, 0.3970184326171875, 0.42037200927734375, 0.4437255859375, 0.46707916259765625, 0.4904327392578125, 0.5137863159179688, 0.537139892578125, 0.5604934692382812, 0.5838470458984375, 0.6072006225585938, 0.63055419921875, 0.6539077758789062, 0.6772613525390625, 0.7006149291992188, 0.723968505859375, 0.7473220825195312, 0.7706756591796875, 0.7940292358398438, 0.8173828125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 7.0, 9.0, 9.0, 27.0, 33.0, 66.0, 98.0, 225.0, 486.0, 1391.0, 5160.0, 36699.0, 2241169.0, 1867761.0, 34000.0, 4859.0, 1309.0, 440.0, 205.0, 111.0, 70.0, 43.0, 22.0, 21.0, 12.0, 10.0, 4.0, 9.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.49609375, -3.39892578125, -3.3017578125, -3.20458984375, -3.107421875, -3.01025390625, -2.9130859375, -2.81591796875, -2.71875, -2.62158203125, -2.5244140625, -2.42724609375, -2.330078125, -2.23291015625, -2.1357421875, -2.03857421875, -1.94140625, -1.84423828125, -1.7470703125, -1.64990234375, -1.552734375, -1.45556640625, -1.3583984375, -1.26123046875, -1.1640625, -1.06689453125, -0.9697265625, -0.87255859375, -0.775390625, -0.67822265625, -0.5810546875, -0.48388671875, -0.38671875, -0.28955078125, -0.1923828125, -0.09521484375, 0.001953125, 0.09912109375, 0.1962890625, 0.29345703125, 0.390625, 0.48779296875, 0.5849609375, 0.68212890625, 0.779296875, 0.87646484375, 0.9736328125, 1.07080078125, 1.16796875, 1.26513671875, 1.3623046875, 1.45947265625, 1.556640625, 1.65380859375, 1.7509765625, 1.84814453125, 1.9453125, 2.04248046875, 2.1396484375, 2.23681640625, 2.333984375, 2.43115234375, 2.5283203125, 2.62548828125, 2.72265625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 11.0, 10.0, 16.0, 20.0, 25.0, 52.0, 57.0, 109.0, 232.0, 377.0, 649.0, 775.0, 690.0, 464.0, 263.0, 123.0, 84.0, 31.0, 21.0, 17.0, 15.0, 8.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64697265625, -0.62353515625, -0.60009765625, -0.57666015625, -0.55322265625, -0.52978515625, -0.50634765625, -0.48291015625, -0.45947265625, -0.43603515625, -0.41259765625, -0.38916015625, -0.36572265625, -0.34228515625, -0.31884765625, -0.29541015625, -0.27197265625, -0.24853515625, -0.22509765625, -0.20166015625, -0.17822265625, -0.15478515625, -0.13134765625, -0.10791015625, -0.08447265625, -0.06103515625, -0.03759765625, -0.01416015625, 0.00927734375, 0.03271484375, 0.05615234375, 0.07958984375, 0.10302734375, 0.12646484375, 0.14990234375, 0.17333984375, 0.19677734375, 0.22021484375, 0.24365234375, 0.26708984375, 0.29052734375, 0.31396484375, 0.33740234375, 0.36083984375, 0.38427734375, 0.40771484375, 0.43115234375, 0.45458984375, 0.47802734375, 0.50146484375, 0.52490234375, 0.54833984375, 0.57177734375, 0.59521484375, 0.61865234375, 0.64208984375, 0.66552734375, 0.68896484375, 0.71240234375, 0.73583984375, 0.75927734375, 0.78271484375, 0.80615234375, 0.82958984375, 0.85302734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 9.0, 7.0, 11.0, 16.0, 12.0, 11.0, 16.0, 22.0, 25.0, 31.0, 33.0, 41.0, 50.0, 40.0, 49.0, 60.0, 51.0, 65.0, 53.0, 58.0, 45.0, 52.0, 35.0, 42.0, 32.0, 24.0, 20.0, 16.0, 15.0, 11.0, 10.0, 7.0, 10.0, 8.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9333469271659851, -0.8966100811958313, -0.8598732352256775, -0.8231363892555237, -0.7863996028900146, -0.7496627569198608, -0.712925910949707, -0.6761890649795532, -0.6394522190093994, -0.6027153730392456, -0.5659785270690918, -0.529241681098938, -0.49250486493110657, -0.45576801896095276, -0.41903120279312134, -0.38229435682296753, -0.3455575108528137, -0.3088206648826599, -0.2720838189125061, -0.23534700274467468, -0.19861015677452087, -0.16187331080436707, -0.12513647973537445, -0.08839964866638184, -0.05166280269622803, -0.014925964176654816, 0.021810874342918396, 0.05854771286249161, 0.09528455138206482, 0.13202139735221863, 0.16875822842121124, 0.20549505949020386, 0.24223196506500244, 0.27896881103515625, 0.31570565700531006, 0.3524424731731415, 0.3891793191432953, 0.4259161651134491, 0.4626529812812805, 0.4993898272514343, 0.5361266732215881, 0.5728635191917419, 0.6096003651618958, 0.6463372111320496, 0.6830739974975586, 0.7198108434677124, 0.7565476894378662, 0.79328453540802, 0.8300213813781738, 0.8667582273483276, 0.9034950733184814, 0.9402319192886353, 0.9769687652587891, 1.0137056112289429, 1.0504424571990967, 1.087179183959961, 1.1239161491394043, 1.160652995109558, 1.197389841079712, 1.2341266870498657, 1.2708635330200195, 1.3076003789901733, 1.3443372249603271, 1.3810739517211914, 1.4178107976913452]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 3.0, 13.0, 15.0, 17.0, 12.0, 17.0, 19.0, 22.0, 21.0, 23.0, 29.0, 32.0, 32.0, 37.0, 29.0, 42.0, 40.0, 43.0, 40.0, 41.0, 42.0, 37.0, 40.0, 34.0, 36.0, 34.0, 15.0, 13.0, 24.0, 31.0, 20.0, 29.0, 18.0, 14.0, 16.0, 9.0, 4.0, 10.0, 8.0, 9.0, 6.0, 3.0, 2.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7717025876045227, -0.7422186732292175, -0.7127347588539124, -0.6832508444786072, -0.653766930103302, -0.6242830157279968, -0.5947991013526917, -0.5653151869773865, -0.5358312726020813, -0.5063473582267761, -0.47686344385147095, -0.44737952947616577, -0.4178956151008606, -0.3884117007255554, -0.35892778635025024, -0.32944387197494507, -0.2999599575996399, -0.2704760432243347, -0.24099212884902954, -0.21150821447372437, -0.1820243000984192, -0.152540385723114, -0.12305647134780884, -0.09357255697250366, -0.06408864259719849, -0.03460472822189331, -0.005120813846588135, 0.02436310052871704, 0.05384701490402222, 0.08333092927932739, 0.11281484365463257, 0.14229875802993774, 0.17178261280059814, 0.20126652717590332, 0.2307504415512085, 0.26023435592651367, 0.28971827030181885, 0.319202184677124, 0.3486860990524292, 0.3781700134277344, 0.40765392780303955, 0.4371378421783447, 0.4666217565536499, 0.4961056709289551, 0.5255895853042603, 0.5550734996795654, 0.5845574140548706, 0.6140413284301758, 0.643525242805481, 0.6730091571807861, 0.7024930715560913, 0.7319769859313965, 0.7614609003067017, 0.7909448146820068, 0.820428729057312, 0.8499126434326172, 0.8793965578079224, 0.9088804721832275, 0.9383643865585327, 0.9678483009338379, 0.9973322153091431, 1.0268161296844482, 1.0563000440597534, 1.0857839584350586, 1.1152678728103638]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 4.0, 7.0, 14.0, 22.0, 29.0, 32.0, 37.0, 75.0, 97.0, 125.0, 202.0, 301.0, 494.0, 825.0, 1404.0, 2579.0, 5181.0, 13233.0, 67092.0, 477245.0, 404381.0, 52883.0, 11715.0, 4766.0, 2318.0, 1339.0, 737.0, 493.0, 306.0, 166.0, 113.0, 103.0, 67.0, 51.0, 42.0, 21.0, 18.0, 6.0, 5.0, 6.0, 3.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.414306640625, -0.4017295837402344, -0.38915252685546875, -0.3765754699707031, -0.3639984130859375, -0.3514213562011719, -0.33884429931640625, -0.3262672424316406, -0.313690185546875, -0.3011131286621094, -0.28853607177734375, -0.2759590148925781, -0.2633819580078125, -0.2508049011230469, -0.23822784423828125, -0.22565078735351562, -0.21307373046875, -0.20049667358398438, -0.18791961669921875, -0.17534255981445312, -0.1627655029296875, -0.15018844604492188, -0.13761138916015625, -0.12503433227539062, -0.112457275390625, -0.09988021850585938, -0.08730316162109375, -0.07472610473632812, -0.0621490478515625, -0.049571990966796875, -0.03699493408203125, -0.024417877197265625, -0.0118408203125, 0.000736236572265625, 0.01331329345703125, 0.025890350341796875, 0.0384674072265625, 0.051044464111328125, 0.06362152099609375, 0.07619857788085938, 0.088775634765625, 0.10135269165039062, 0.11392974853515625, 0.12650680541992188, 0.1390838623046875, 0.15166091918945312, 0.16423797607421875, 0.17681503295898438, 0.18939208984375, 0.20196914672851562, 0.21454620361328125, 0.22712326049804688, 0.2397003173828125, 0.2522773742675781, 0.26485443115234375, 0.2774314880371094, 0.290008544921875, 0.3025856018066406, 0.31516265869140625, 0.3277397155761719, 0.3403167724609375, 0.3528938293457031, 0.36547088623046875, 0.3780479431152344, 0.390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 9.0, 12.0, 11.0, 16.0, 20.0, 28.0, 15.0, 28.0, 29.0, 32.0, 42.0, 37.0, 34.0, 41.0, 45.0, 48.0, 41.0, 41.0, 46.0, 54.0, 31.0, 32.0, 34.0, 33.0, 27.0, 32.0, 36.0, 23.0, 15.0, 22.0, 13.0, 11.0, 16.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62451171875, -0.604278564453125, -0.58404541015625, -0.563812255859375, -0.5435791015625, -0.523345947265625, -0.50311279296875, -0.482879638671875, -0.462646484375, -0.442413330078125, -0.42218017578125, -0.401947021484375, -0.3817138671875, -0.361480712890625, -0.34124755859375, -0.321014404296875, -0.30078125, -0.280548095703125, -0.26031494140625, -0.240081787109375, -0.2198486328125, -0.199615478515625, -0.17938232421875, -0.159149169921875, -0.138916015625, -0.118682861328125, -0.09844970703125, -0.078216552734375, -0.0579833984375, -0.037750244140625, -0.01751708984375, 0.002716064453125, 0.02294921875, 0.043182373046875, 0.06341552734375, 0.083648681640625, 0.1038818359375, 0.124114990234375, 0.14434814453125, 0.164581298828125, 0.184814453125, 0.205047607421875, 0.22528076171875, 0.245513916015625, 0.2657470703125, 0.285980224609375, 0.30621337890625, 0.326446533203125, 0.3466796875, 0.366912841796875, 0.38714599609375, 0.407379150390625, 0.4276123046875, 0.447845458984375, 0.46807861328125, 0.488311767578125, 0.508544921875, 0.528778076171875, 0.54901123046875, 0.569244384765625, 0.5894775390625, 0.609710693359375, 0.62994384765625, 0.650177001953125, 0.67041015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 10.0, 19.0, 21.0, 30.0, 31.0, 49.0, 115.0, 151.0, 270.0, 481.0, 855.0, 1974.0, 5017.0, 23868.0, 431892.0, 542732.0, 30760.0, 5961.0, 2134.0, 965.0, 477.0, 255.0, 154.0, 105.0, 69.0, 48.0, 36.0, 16.0, 26.0, 7.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.7021484375, -0.6836967468261719, -0.6652450561523438, -0.6467933654785156, -0.6283416748046875, -0.6098899841308594, -0.5914382934570312, -0.5729866027832031, -0.554534912109375, -0.5360832214355469, -0.5176315307617188, -0.4991798400878906, -0.4807281494140625, -0.4622764587402344, -0.44382476806640625, -0.4253730773925781, -0.40692138671875, -0.3884696960449219, -0.37001800537109375, -0.3515663146972656, -0.3331146240234375, -0.3146629333496094, -0.29621124267578125, -0.2777595520019531, -0.259307861328125, -0.24085617065429688, -0.22240447998046875, -0.20395278930664062, -0.1855010986328125, -0.16704940795898438, -0.14859771728515625, -0.13014602661132812, -0.1116943359375, -0.09324264526367188, -0.07479095458984375, -0.056339263916015625, -0.0378875732421875, -0.019435882568359375, -0.00098419189453125, 0.017467498779296875, 0.035919189453125, 0.054370880126953125, 0.07282257080078125, 0.09127426147460938, 0.1097259521484375, 0.12817764282226562, 0.14662933349609375, 0.16508102416992188, 0.18353271484375, 0.20198440551757812, 0.22043609619140625, 0.23888778686523438, 0.2573394775390625, 0.2757911682128906, 0.29424285888671875, 0.3126945495605469, 0.331146240234375, 0.3495979309082031, 0.36804962158203125, 0.3865013122558594, 0.4049530029296875, 0.4234046936035156, 0.44185638427734375, 0.4603080749511719, 0.478759765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 23.0, 10.0, 13.0, 23.0, 23.0, 21.0, 30.0, 19.0, 24.0, 39.0, 42.0, 46.0, 50.0, 46.0, 55.0, 45.0, 31.0, 56.0, 42.0, 48.0, 33.0, 33.0, 23.0, 30.0, 25.0, 27.0, 25.0, 15.0, 11.0, 12.0, 11.0, 8.0, 9.0, 10.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.9002532958984375, -1.845428466796875, -1.7906036376953125, -1.73577880859375, -1.6809539794921875, -1.626129150390625, -1.5713043212890625, -1.5164794921875, -1.4616546630859375, -1.406829833984375, -1.3520050048828125, -1.29718017578125, -1.2423553466796875, -1.187530517578125, -1.1327056884765625, -1.077880859375, -1.0230560302734375, -0.968231201171875, -0.9134063720703125, -0.85858154296875, -0.8037567138671875, -0.748931884765625, -0.6941070556640625, -0.6392822265625, -0.5844573974609375, -0.529632568359375, -0.4748077392578125, -0.41998291015625, -0.3651580810546875, -0.310333251953125, -0.2555084228515625, -0.20068359375, -0.1458587646484375, -0.091033935546875, -0.0362091064453125, 0.01861572265625, 0.0734405517578125, 0.128265380859375, 0.1830902099609375, 0.2379150390625, 0.2927398681640625, 0.347564697265625, 0.4023895263671875, 0.45721435546875, 0.5120391845703125, 0.566864013671875, 0.6216888427734375, 0.676513671875, 0.7313385009765625, 0.786163330078125, 0.8409881591796875, 0.89581298828125, 0.9506378173828125, 1.005462646484375, 1.0602874755859375, 1.1151123046875, 1.1699371337890625, 1.224761962890625, 1.2795867919921875, 1.33441162109375, 1.3892364501953125, 1.444061279296875, 1.4988861083984375, 1.5537109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 0.0, 4.0, 6.0, 5.0, 4.0, 5.0, 7.0, 12.0, 20.0, 16.0, 31.0, 55.0, 87.0, 111.0, 166.0, 232.0, 404.0, 690.0, 1309.0, 2353.0, 4997.0, 11820.0, 43870.0, 322179.0, 544866.0, 84250.0, 17594.0, 6592.0, 3000.0, 1592.0, 860.0, 528.0, 302.0, 204.0, 122.0, 93.0, 53.0, 35.0, 19.0, 20.0, 9.0, 10.0, 7.0, 0.0, 5.0, 3.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1971435546875, -0.1906108856201172, -0.18407821655273438, -0.17754554748535156, -0.17101287841796875, -0.16448020935058594, -0.15794754028320312, -0.1514148712158203, -0.1448822021484375, -0.1383495330810547, -0.13181686401367188, -0.12528419494628906, -0.11875152587890625, -0.11221885681152344, -0.10568618774414062, -0.09915351867675781, -0.092620849609375, -0.08608818054199219, -0.07955551147460938, -0.07302284240722656, -0.06649017333984375, -0.05995750427246094, -0.053424835205078125, -0.04689216613769531, -0.0403594970703125, -0.03382682800292969, -0.027294158935546875, -0.020761489868164062, -0.01422882080078125, -0.0076961517333984375, -0.001163482666015625, 0.0053691864013671875, 0.01190185546875, 0.018434524536132812, 0.024967193603515625, 0.03149986267089844, 0.03803253173828125, 0.04456520080566406, 0.051097869873046875, 0.05763053894042969, 0.0641632080078125, 0.07069587707519531, 0.07722854614257812, 0.08376121520996094, 0.09029388427734375, 0.09682655334472656, 0.10335922241210938, 0.10989189147949219, 0.116424560546875, 0.12295722961425781, 0.12948989868164062, 0.13602256774902344, 0.14255523681640625, 0.14908790588378906, 0.15562057495117188, 0.1621532440185547, 0.1686859130859375, 0.1752185821533203, 0.18175125122070312, 0.18828392028808594, 0.19481658935546875, 0.20134925842285156, 0.20788192749023438, 0.2144145965576172, 0.220947265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 10.0, 10.0, 10.0, 33.0, 75.0, 204.0, 327.0, 178.0, 100.0, 32.0, 16.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002651214599609375, -0.0002587251365184784, -0.0002523288130760193, -0.0002459324896335602, -0.00023953616619110107, -0.00023313984274864197, -0.00022674351930618286, -0.00022034719586372375, -0.00021395087242126465, -0.00020755454897880554, -0.00020115822553634644, -0.00019476190209388733, -0.00018836557865142822, -0.00018196925520896912, -0.00017557293176651, -0.0001691766083240509, -0.0001627802848815918, -0.0001563839614391327, -0.00014998763799667358, -0.00014359131455421448, -0.00013719499111175537, -0.00013079866766929626, -0.00012440234422683716, -0.00011800602078437805, -0.00011160969734191895, -0.00010521337389945984, -9.881705045700073e-05, -9.242072701454163e-05, -8.602440357208252e-05, -7.962808012962341e-05, -7.32317566871643e-05, -6.68354332447052e-05, -6.0439109802246094e-05, -5.404278635978699e-05, -4.764646291732788e-05, -4.1250139474868774e-05, -3.485381603240967e-05, -2.845749258995056e-05, -2.2061169147491455e-05, -1.566484570503235e-05, -9.268522262573242e-06, -2.8721988201141357e-06, 3.5241246223449707e-06, 9.920448064804077e-06, 1.6316771507263184e-05, 2.271309494972229e-05, 2.9109418392181396e-05, 3.55057418346405e-05, 4.190206527709961e-05, 4.8298388719558716e-05, 5.469471216201782e-05, 6.109103560447693e-05, 6.748735904693604e-05, 7.388368248939514e-05, 8.028000593185425e-05, 8.667632937431335e-05, 9.307265281677246e-05, 9.946897625923157e-05, 0.00010586529970169067, 0.00011226162314414978, 0.00011865794658660889, 0.000125054270029068, 0.0001314505934715271, 0.0001378469169139862, 0.0001442432403564453]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 10.0, 8.0, 22.0, 20.0, 50.0, 63.0, 97.0, 169.0, 268.0, 422.0, 637.0, 1029.0, 1621.0, 2652.0, 4441.0, 8081.0, 17270.0, 46584.0, 158922.0, 392091.0, 276361.0, 83983.0, 27004.0, 11276.0, 5968.0, 3505.0, 2133.0, 1399.0, 866.0, 541.0, 336.0, 268.0, 154.0, 109.0, 71.0, 36.0, 35.0, 12.0, 13.0, 13.0, 7.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.136474609375, -0.13254642486572266, -0.1286182403564453, -0.12469005584716797, -0.12076187133789062, -0.11683368682861328, -0.11290550231933594, -0.1089773178100586, -0.10504913330078125, -0.1011209487915039, -0.09719276428222656, -0.09326457977294922, -0.08933639526367188, -0.08540821075439453, -0.08148002624511719, -0.07755184173583984, -0.0736236572265625, -0.06969547271728516, -0.06576728820800781, -0.06183910369873047, -0.057910919189453125, -0.05398273468017578, -0.05005455017089844, -0.046126365661621094, -0.04219818115234375, -0.038269996643066406, -0.03434181213378906, -0.03041362762451172, -0.026485443115234375, -0.02255725860595703, -0.018629074096679688, -0.014700889587402344, -0.010772705078125, -0.006844520568847656, -0.0029163360595703125, 0.0010118484497070312, 0.004940032958984375, 0.008868217468261719, 0.012796401977539062, 0.016724586486816406, 0.02065277099609375, 0.024580955505371094, 0.028509140014648438, 0.03243732452392578, 0.036365509033203125, 0.04029369354248047, 0.04422187805175781, 0.048150062561035156, 0.0520782470703125, 0.056006431579589844, 0.05993461608886719, 0.06386280059814453, 0.06779098510742188, 0.07171916961669922, 0.07564735412597656, 0.0795755386352539, 0.08350372314453125, 0.0874319076538086, 0.09136009216308594, 0.09528827667236328, 0.09921646118164062, 0.10314464569091797, 0.10707283020019531, 0.11100101470947266, 0.11492919921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 8.0, 5.0, 5.0, 9.0, 8.0, 14.0, 13.0, 22.0, 38.0, 59.0, 74.0, 84.0, 88.0, 99.0, 112.0, 92.0, 65.0, 62.0, 37.0, 31.0, 16.0, 13.0, 15.0, 6.0, 5.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048187255859375, -0.04643869400024414, -0.04469013214111328, -0.04294157028198242, -0.04119300842285156, -0.0394444465637207, -0.037695884704589844, -0.035947322845458984, -0.034198760986328125, -0.032450199127197266, -0.030701637268066406, -0.028953075408935547, -0.027204513549804688, -0.025455951690673828, -0.02370738983154297, -0.02195882797241211, -0.02021026611328125, -0.01846170425415039, -0.01671314239501953, -0.014964580535888672, -0.013216018676757812, -0.011467456817626953, -0.009718894958496094, -0.007970333099365234, -0.006221771240234375, -0.004473209381103516, -0.0027246475219726562, -0.0009760856628417969, 0.0007724761962890625, 0.002521038055419922, 0.004269599914550781, 0.006018161773681641, 0.0077667236328125, 0.00951528549194336, 0.011263847351074219, 0.013012409210205078, 0.014760971069335938, 0.016509532928466797, 0.018258094787597656, 0.020006656646728516, 0.021755218505859375, 0.023503780364990234, 0.025252342224121094, 0.027000904083251953, 0.028749465942382812, 0.030498027801513672, 0.03224658966064453, 0.03399515151977539, 0.03574371337890625, 0.03749227523803711, 0.03924083709716797, 0.04098939895629883, 0.04273796081542969, 0.04448652267456055, 0.046235084533691406, 0.047983646392822266, 0.049732208251953125, 0.051480770111083984, 0.053229331970214844, 0.0549778938293457, 0.05672645568847656, 0.05847501754760742, 0.06022357940673828, 0.06197214126586914, 0.063720703125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 9.0, 10.0, 3.0, 16.0, 9.0, 16.0, 20.0, 8.0, 24.0, 23.0, 33.0, 56.0, 32.0, 40.0, 38.0, 42.0, 55.0, 54.0, 47.0, 52.0, 67.0, 57.0, 31.0, 31.0, 43.0, 30.0, 30.0, 27.0, 24.0, 14.0, 11.0, 7.0, 9.0, 11.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5443191528320312, -0.5244734287261963, -0.5046277046203613, -0.48478201031684875, -0.4649362862110138, -0.4450905919075012, -0.42524486780166626, -0.4053991436958313, -0.38555341958999634, -0.3657076954841614, -0.3458620011806488, -0.32601627707481384, -0.3061705529689789, -0.2863248586654663, -0.26647913455963135, -0.2466334104537964, -0.2267877161502838, -0.20694200694561005, -0.18709628283977509, -0.16725057363510132, -0.14740484952926636, -0.1275591403245926, -0.10771343111991882, -0.08786770701408386, -0.0680219978094101, -0.04817628115415573, -0.028330568224191666, -0.0084848552942276, 0.011360861361026764, 0.031206578016281128, 0.051052287220954895, 0.07089801132678986, 0.09074372053146362, 0.11058943718671799, 0.13043515384197235, 0.15028086304664612, 0.17012658715248108, 0.18997229635715485, 0.2098180055618286, 0.22966372966766357, 0.24950943887233734, 0.2693551480770111, 0.28920087218284607, 0.30904656648635864, 0.3288922905921936, 0.34873801469802856, 0.3685837388038635, 0.3884294629096985, 0.40827515721321106, 0.428120881319046, 0.4479665756225586, 0.46781229972839355, 0.4876580238342285, 0.5075037479400635, 0.5273494720458984, 0.5471951961517334, 0.5670408606529236, 0.5868865847587585, 0.6067323088645935, 0.6265779733657837, 0.6464236974716187, 0.6662694215774536, 0.6861151456832886, 0.7059608697891235, 0.7258065938949585]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 5.0, 10.0, 8.0, 16.0, 4.0, 14.0, 11.0, 17.0, 24.0, 31.0, 19.0, 27.0, 24.0, 36.0, 26.0, 41.0, 41.0, 44.0, 35.0, 28.0, 50.0, 38.0, 46.0, 39.0, 44.0, 27.0, 38.0, 25.0, 17.0, 24.0, 22.0, 23.0, 20.0, 28.0, 18.0, 12.0, 12.0, 11.0, 8.0, 9.0, 2.0, 7.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5060173273086548, -0.48837611079216003, -0.4707348942756653, -0.45309364795684814, -0.4354524314403534, -0.41781121492385864, -0.4001699686050415, -0.38252875208854675, -0.364887535572052, -0.34724631905555725, -0.3296051025390625, -0.31196385622024536, -0.2943226397037506, -0.27668142318725586, -0.2590401768684387, -0.24139896035194397, -0.22375774383544922, -0.20611652731895447, -0.18847529590129852, -0.17083406448364258, -0.15319284796714783, -0.13555163145065308, -0.11791040003299713, -0.10026917606592178, -0.08262795209884644, -0.06498672813177109, -0.04734550416469574, -0.029704280197620392, -0.012063056230545044, 0.005578167736530304, 0.023219391703605652, 0.040860615670681, 0.05850178003311157, 0.07614300400018692, 0.09378422796726227, 0.11142545193433762, 0.12906667590141296, 0.14670789241790771, 0.16434912383556366, 0.1819903552532196, 0.19963157176971436, 0.2172727882862091, 0.23491401970386505, 0.252555251121521, 0.27019646763801575, 0.2878376841545105, 0.30547893047332764, 0.3231201469898224, 0.34076136350631714, 0.3584025800228119, 0.37604379653930664, 0.3936850428581238, 0.41132625937461853, 0.4289674758911133, 0.4466087222099304, 0.46424993872642517, 0.4818911552429199, 0.4995323717594147, 0.5171735882759094, 0.5348148345947266, 0.5524560213088989, 0.5700972676277161, 0.5877385139465332, 0.6053797006607056, 0.6230209469795227]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 10.0, 10.0, 21.0, 21.0, 21.0, 49.0, 64.0, 105.0, 114.0, 165.0, 265.0, 408.0, 686.0, 1126.0, 2045.0, 3581.0, 6429.0, 11831.0, 22300.0, 43841.0, 101899.0, 263866.0, 330599.0, 141017.0, 57318.0, 27740.0, 14721.0, 7947.0, 4247.0, 2418.0, 1396.0, 839.0, 484.0, 298.0, 186.0, 163.0, 90.0, 74.0, 40.0, 36.0, 23.0, 18.0, 5.0, 6.0, 11.0, 7.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70361328125, -0.6786346435546875, -0.653656005859375, -0.6286773681640625, -0.60369873046875, -0.5787200927734375, -0.553741455078125, -0.5287628173828125, -0.5037841796875, -0.4788055419921875, -0.453826904296875, -0.4288482666015625, -0.40386962890625, -0.3788909912109375, -0.353912353515625, -0.3289337158203125, -0.303955078125, -0.2789764404296875, -0.253997802734375, -0.2290191650390625, -0.20404052734375, -0.1790618896484375, -0.154083251953125, -0.1291046142578125, -0.1041259765625, -0.0791473388671875, -0.054168701171875, -0.0291900634765625, -0.00421142578125, 0.0207672119140625, 0.045745849609375, 0.0707244873046875, 0.095703125, 0.1206817626953125, 0.145660400390625, 0.1706390380859375, 0.19561767578125, 0.2205963134765625, 0.245574951171875, 0.2705535888671875, 0.2955322265625, 0.3205108642578125, 0.345489501953125, 0.3704681396484375, 0.39544677734375, 0.4204254150390625, 0.445404052734375, 0.4703826904296875, 0.495361328125, 0.5203399658203125, 0.545318603515625, 0.5702972412109375, 0.59527587890625, 0.6202545166015625, 0.645233154296875, 0.6702117919921875, 0.6951904296875, 0.7201690673828125, 0.745147705078125, 0.7701263427734375, 0.79510498046875, 0.8200836181640625, 0.845062255859375, 0.8700408935546875, 0.89501953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 6.0, 1.0, 6.0, 1.0, 9.0, 7.0, 11.0, 10.0, 15.0, 15.0, 7.0, 18.0, 19.0, 21.0, 34.0, 24.0, 31.0, 37.0, 36.0, 24.0, 33.0, 44.0, 50.0, 45.0, 41.0, 54.0, 34.0, 32.0, 43.0, 27.0, 31.0, 21.0, 28.0, 28.0, 27.0, 20.0, 13.0, 17.0, 22.0, 14.0, 12.0, 11.0, 6.0, 6.0, 6.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8283462524414062, -0.7968292236328125, -0.7653121948242188, -0.733795166015625, -0.7022781372070312, -0.6707611083984375, -0.6392440795898438, -0.60772705078125, -0.5762100219726562, -0.5446929931640625, -0.5131759643554688, -0.481658935546875, -0.45014190673828125, -0.4186248779296875, -0.38710784912109375, -0.3555908203125, -0.32407379150390625, -0.2925567626953125, -0.26103973388671875, -0.229522705078125, -0.19800567626953125, -0.1664886474609375, -0.13497161865234375, -0.10345458984375, -0.07193756103515625, -0.0404205322265625, -0.00890350341796875, 0.022613525390625, 0.05413055419921875, 0.0856475830078125, 0.11716461181640625, 0.148681640625, 0.18019866943359375, 0.2117156982421875, 0.24323272705078125, 0.274749755859375, 0.30626678466796875, 0.3377838134765625, 0.36930084228515625, 0.40081787109375, 0.43233489990234375, 0.4638519287109375, 0.49536895751953125, 0.526885986328125, 0.5584030151367188, 0.5899200439453125, 0.6214370727539062, 0.6529541015625, 0.6844711303710938, 0.7159881591796875, 0.7475051879882812, 0.779022216796875, 0.8105392456054688, 0.8420562744140625, 0.8735733032226562, 0.90509033203125, 0.9366073608398438, 0.9681243896484375, 0.9996414184570312, 1.031158447265625, 1.0626754760742188, 1.0941925048828125, 1.1257095336914062, 1.1572265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 16.0, 40.0, 34.0, 55.0, 84.0, 125.0, 175.0, 310.0, 514.0, 913.0, 1761.0, 3941.0, 10158.0, 27983.0, 90674.0, 361683.0, 398986.0, 100741.0, 30612.0, 10965.0, 4471.0, 1818.0, 949.0, 583.0, 333.0, 175.0, 141.0, 80.0, 62.0, 36.0, 28.0, 29.0, 16.0, 9.0, 12.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4296875, -1.38507080078125, -1.3404541015625, -1.29583740234375, -1.251220703125, -1.20660400390625, -1.1619873046875, -1.11737060546875, -1.07275390625, -1.02813720703125, -0.9835205078125, -0.93890380859375, -0.894287109375, -0.84967041015625, -0.8050537109375, -0.76043701171875, -0.7158203125, -0.67120361328125, -0.6265869140625, -0.58197021484375, -0.537353515625, -0.49273681640625, -0.4481201171875, -0.40350341796875, -0.35888671875, -0.31427001953125, -0.2696533203125, -0.22503662109375, -0.180419921875, -0.13580322265625, -0.0911865234375, -0.04656982421875, -0.001953125, 0.04266357421875, 0.0872802734375, 0.13189697265625, 0.176513671875, 0.22113037109375, 0.2657470703125, 0.31036376953125, 0.35498046875, 0.39959716796875, 0.4442138671875, 0.48883056640625, 0.533447265625, 0.57806396484375, 0.6226806640625, 0.66729736328125, 0.7119140625, 0.75653076171875, 0.8011474609375, 0.84576416015625, 0.890380859375, 0.93499755859375, 0.9796142578125, 1.02423095703125, 1.06884765625, 1.11346435546875, 1.1580810546875, 1.20269775390625, 1.247314453125, 1.29193115234375, 1.3365478515625, 1.38116455078125, 1.42578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 4.0, 8.0, 7.0, 16.0, 14.0, 23.0, 20.0, 26.0, 40.0, 31.0, 53.0, 51.0, 42.0, 53.0, 52.0, 49.0, 53.0, 57.0, 57.0, 34.0, 39.0, 34.0, 31.0, 40.0, 27.0, 32.0, 23.0, 14.0, 6.0, 12.0, 12.0, 10.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4873046875, -1.44317626953125, -1.3990478515625, -1.35491943359375, -1.310791015625, -1.26666259765625, -1.2225341796875, -1.17840576171875, -1.13427734375, -1.09014892578125, -1.0460205078125, -1.00189208984375, -0.957763671875, -0.91363525390625, -0.8695068359375, -0.82537841796875, -0.78125, -0.73712158203125, -0.6929931640625, -0.64886474609375, -0.604736328125, -0.56060791015625, -0.5164794921875, -0.47235107421875, -0.42822265625, -0.38409423828125, -0.3399658203125, -0.29583740234375, -0.251708984375, -0.20758056640625, -0.1634521484375, -0.11932373046875, -0.0751953125, -0.03106689453125, 0.0130615234375, 0.05718994140625, 0.101318359375, 0.14544677734375, 0.1895751953125, 0.23370361328125, 0.27783203125, 0.32196044921875, 0.3660888671875, 0.41021728515625, 0.454345703125, 0.49847412109375, 0.5426025390625, 0.58673095703125, 0.630859375, 0.67498779296875, 0.7191162109375, 0.76324462890625, 0.807373046875, 0.85150146484375, 0.8956298828125, 0.93975830078125, 0.98388671875, 1.02801513671875, 1.0721435546875, 1.11627197265625, 1.160400390625, 1.20452880859375, 1.2486572265625, 1.29278564453125, 1.3369140625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 6.0, 1.0, 9.0, 8.0, 15.0, 17.0, 18.0, 21.0, 42.0, 43.0, 73.0, 106.0, 145.0, 177.0, 315.0, 422.0, 700.0, 1171.0, 2159.0, 4276.0, 8591.0, 19152.0, 48538.0, 130863.0, 358859.0, 277772.0, 117405.0, 43183.0, 17632.0, 7838.0, 3810.0, 2038.0, 1165.0, 659.0, 392.0, 247.0, 188.0, 137.0, 81.0, 98.0, 50.0, 43.0, 21.0, 18.0, 12.0, 11.0, 12.0, 8.0, 4.0, 5.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.1705322265625, -0.16535568237304688, -0.16017913818359375, -0.15500259399414062, -0.1498260498046875, -0.14464950561523438, -0.13947296142578125, -0.13429641723632812, -0.129119873046875, -0.12394332885742188, -0.11876678466796875, -0.11359024047851562, -0.1084136962890625, -0.10323715209960938, -0.09806060791015625, -0.09288406372070312, -0.08770751953125, -0.08253097534179688, -0.07735443115234375, -0.07217788696289062, -0.0670013427734375, -0.061824798583984375, -0.05664825439453125, -0.051471710205078125, -0.046295166015625, -0.041118621826171875, -0.03594207763671875, -0.030765533447265625, -0.0255889892578125, -0.020412445068359375, -0.01523590087890625, -0.010059356689453125, -0.0048828125, 0.000293731689453125, 0.00547027587890625, 0.010646820068359375, 0.0158233642578125, 0.020999908447265625, 0.02617645263671875, 0.031352996826171875, 0.036529541015625, 0.041706085205078125, 0.04688262939453125, 0.052059173583984375, 0.0572357177734375, 0.062412261962890625, 0.06758880615234375, 0.07276535034179688, 0.07794189453125, 0.08311843872070312, 0.08829498291015625, 0.09347152709960938, 0.0986480712890625, 0.10382461547851562, 0.10900115966796875, 0.11417770385742188, 0.119354248046875, 0.12453079223632812, 0.12970733642578125, 0.13488388061523438, 0.1400604248046875, 0.14523696899414062, 0.15041351318359375, 0.15559005737304688, 0.1607666015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 7.0, 12.0, 12.0, 13.0, 22.0, 17.0, 17.0, 32.0, 38.0, 50.0, 60.0, 70.0, 102.0, 141.0, 76.0, 67.0, 63.0, 38.0, 49.0, 21.0, 22.0, 10.0, 13.0, 11.0, 9.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.738569259643555e-05, -4.587322473526001e-05, -4.436075687408447e-05, -4.2848289012908936e-05, -4.13358211517334e-05, -3.982335329055786e-05, -3.8310885429382324e-05, -3.679841756820679e-05, -3.528594970703125e-05, -3.377348184585571e-05, -3.2261013984680176e-05, -3.074854612350464e-05, -2.92360782623291e-05, -2.7723610401153564e-05, -2.6211142539978027e-05, -2.469867467880249e-05, -2.3186206817626953e-05, -2.1673738956451416e-05, -2.016127109527588e-05, -1.8648803234100342e-05, -1.7136335372924805e-05, -1.5623867511749268e-05, -1.411139965057373e-05, -1.2598931789398193e-05, -1.1086463928222656e-05, -9.573996067047119e-06, -8.061528205871582e-06, -6.549060344696045e-06, -5.036592483520508e-06, -3.5241246223449707e-06, -2.0116567611694336e-06, -4.991888999938965e-07, 1.0132789611816406e-06, 2.5257468223571777e-06, 4.038214683532715e-06, 5.550682544708252e-06, 7.063150405883789e-06, 8.575618267059326e-06, 1.0088086128234863e-05, 1.16005539894104e-05, 1.3113021850585938e-05, 1.4625489711761475e-05, 1.6137957572937012e-05, 1.765042543411255e-05, 1.9162893295288086e-05, 2.0675361156463623e-05, 2.218782901763916e-05, 2.3700296878814697e-05, 2.5212764739990234e-05, 2.672523260116577e-05, 2.823770046234131e-05, 2.9750168323516846e-05, 3.126263618469238e-05, 3.277510404586792e-05, 3.428757190704346e-05, 3.5800039768218994e-05, 3.731250762939453e-05, 3.882497549057007e-05, 4.0337443351745605e-05, 4.184991121292114e-05, 4.336237907409668e-05, 4.487484693527222e-05, 4.6387314796447754e-05, 4.789978265762329e-05, 4.941225051879883e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 0.0, 5.0, 9.0, 7.0, 17.0, 21.0, 42.0, 44.0, 55.0, 78.0, 120.0, 201.0, 298.0, 436.0, 669.0, 1062.0, 1818.0, 3064.0, 5765.0, 11771.0, 29429.0, 104953.0, 495299.0, 288799.0, 63549.0, 20808.0, 9037.0, 4569.0, 2508.0, 1511.0, 892.0, 590.0, 388.0, 250.0, 170.0, 112.0, 65.0, 48.0, 37.0, 15.0, 16.0, 7.0, 9.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.349853515625, -0.33919525146484375, -0.3285369873046875, -0.31787872314453125, -0.307220458984375, -0.29656219482421875, -0.2859039306640625, -0.27524566650390625, -0.26458740234375, -0.25392913818359375, -0.2432708740234375, -0.23261260986328125, -0.221954345703125, -0.21129608154296875, -0.2006378173828125, -0.18997955322265625, -0.1793212890625, -0.16866302490234375, -0.1580047607421875, -0.14734649658203125, -0.136688232421875, -0.12602996826171875, -0.1153717041015625, -0.10471343994140625, -0.09405517578125, -0.08339691162109375, -0.0727386474609375, -0.06208038330078125, -0.051422119140625, -0.04076385498046875, -0.0301055908203125, -0.01944732666015625, -0.0087890625, 0.00186920166015625, 0.0125274658203125, 0.02318572998046875, 0.033843994140625, 0.04450225830078125, 0.0551605224609375, 0.06581878662109375, 0.07647705078125, 0.08713531494140625, 0.0977935791015625, 0.10845184326171875, 0.119110107421875, 0.12976837158203125, 0.1404266357421875, 0.15108489990234375, 0.1617431640625, 0.17240142822265625, 0.1830596923828125, 0.19371795654296875, 0.204376220703125, 0.21503448486328125, 0.2256927490234375, 0.23635101318359375, 0.24700927734375, 0.25766754150390625, 0.2683258056640625, 0.27898406982421875, 0.289642333984375, 0.30030059814453125, 0.3109588623046875, 0.32161712646484375, 0.332275390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 8.0, 14.0, 16.0, 22.0, 46.0, 58.0, 83.0, 138.0, 185.0, 124.0, 84.0, 81.0, 37.0, 19.0, 20.0, 9.0, 9.0, 9.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27294921875, -0.2648277282714844, -0.25670623779296875, -0.24858474731445312, -0.2404632568359375, -0.23234176635742188, -0.22422027587890625, -0.21609878540039062, -0.207977294921875, -0.19985580444335938, -0.19173431396484375, -0.18361282348632812, -0.1754913330078125, -0.16736984252929688, -0.15924835205078125, -0.15112686157226562, -0.14300537109375, -0.13488388061523438, -0.12676239013671875, -0.11864089965820312, -0.1105194091796875, -0.10239791870117188, -0.09427642822265625, -0.08615493774414062, -0.078033447265625, -0.06991195678710938, -0.06179046630859375, -0.053668975830078125, -0.0455474853515625, -0.037425994873046875, -0.02930450439453125, -0.021183013916015625, -0.0130615234375, -0.004940032958984375, 0.00318145751953125, 0.011302947998046875, 0.0194244384765625, 0.027545928955078125, 0.03566741943359375, 0.043788909912109375, 0.051910400390625, 0.060031890869140625, 0.06815338134765625, 0.07627487182617188, 0.0843963623046875, 0.09251785278320312, 0.10063934326171875, 0.10876083374023438, 0.11688232421875, 0.12500381469726562, 0.13312530517578125, 0.14124679565429688, 0.1493682861328125, 0.15748977661132812, 0.16561126708984375, 0.17373275756835938, 0.181854248046875, 0.18997573852539062, 0.19809722900390625, 0.20621871948242188, 0.2143402099609375, 0.22246170043945312, 0.23058319091796875, 0.23870468139648438, 0.246826171875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 9.0, 21.0, 24.0, 58.0, 71.0, 127.0, 128.0, 141.0, 126.0, 109.0, 75.0, 46.0, 25.0, 17.0, 11.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.467543601989746, -2.367278575897217, -2.2670133113861084, -2.166748285293579, -2.06648325920105, -1.966218113899231, -1.865952968597412, -1.7656879425048828, -1.665422797203064, -1.5651576519012451, -1.4648926258087158, -1.364627480506897, -1.2643623352050781, -1.1640973091125488, -1.06383216381073, -0.9635670781135559, -0.8633019924163818, -0.7630369067192078, -0.6627718210220337, -0.5625066757202148, -0.46224159002304077, -0.3619765043258667, -0.26171135902404785, -0.16144627332687378, -0.06118118762969971, 0.03908391296863556, 0.13934901356697083, 0.23961412906646729, 0.33987921476364136, 0.44014430046081543, 0.5404094457626343, 0.6406745314598083, 0.7409393787384033, 0.8412044644355774, 0.9414695501327515, 1.0417346954345703, 1.1419997215270996, 1.2422648668289185, 1.3425300121307373, 1.4427950382232666, 1.5430601835250854, 1.6433253288269043, 1.7435903549194336, 1.8438555002212524, 1.9441206455230713, 2.0443856716156006, 2.144650936126709, 2.2449159622192383, 2.3451809883117676, 2.445446014404297, 2.5457112789154053, 2.6459763050079346, 2.746241331100464, 2.8465065956115723, 2.9467716217041016, 3.047036647796631, 3.14730167388916, 3.2475666999816895, 3.347831964492798, 3.448096990585327, 3.5483620166778564, 3.648627281188965, 3.748892307281494, 3.8491573333740234, 3.949422597885132]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 8.0, 9.0, 16.0, 16.0, 17.0, 16.0, 18.0, 25.0, 30.0, 29.0, 29.0, 33.0, 48.0, 52.0, 58.0, 46.0, 45.0, 43.0, 49.0, 46.0, 52.0, 39.0, 39.0, 36.0, 37.0, 30.0, 22.0, 18.0, 16.0, 20.0, 10.0, 9.0, 11.0, 10.0, 13.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4961495399475098, -2.424999475479126, -2.353849411010742, -2.2826995849609375, -2.2115495204925537, -2.14039945602417, -2.069249391555786, -1.9980993270874023, -1.9269492626190186, -1.8557991981506348, -1.7846492528915405, -1.7134991884231567, -1.642349123954773, -1.5711991786956787, -1.500049114227295, -1.4288990497589111, -1.357749104499817, -1.286599040031433, -1.2154490947723389, -1.144299030303955, -1.0731489658355713, -1.0019989013671875, -0.9308489561080933, -0.8596988916397095, -0.7885488867759705, -0.7173988819122314, -0.6462488174438477, -0.5750988125801086, -0.5039488077163696, -0.43279874324798584, -0.3616487383842468, -0.2904987037181854, -0.21934866905212402, -0.14819863438606262, -0.07704861462116241, -0.005898594856262207, 0.0652514398097992, 0.1364014744758606, 0.2075514793395996, 0.278701514005661, 0.3498515486717224, 0.4210015833377838, 0.4921516180038452, 0.5633016228675842, 0.6344516277313232, 0.705601692199707, 0.776751697063446, 0.8479017019271851, 0.9190517663955688, 0.9902017712593079, 1.0613517761230469, 1.1325018405914307, 1.2036519050598145, 1.2748019695281982, 1.3459519147872925, 1.4171019792556763, 1.4882519245147705, 1.5594019889831543, 1.6305519342422485, 1.7017019987106323, 1.7728520631790161, 1.8440020084381104, 1.9151520729064941, 1.986302137374878, 2.0574522018432617]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 9.0, 7.0, 10.0, 10.0, 13.0, 16.0, 21.0, 26.0, 35.0, 36.0, 45.0, 67.0, 102.0, 142.0, 130.0, 215.0, 275.0, 355.0, 508.0, 616.0, 892.0, 1111.0, 1515.0, 2084.0, 1033957.0, 2080.0, 1588.0, 1140.0, 879.0, 694.0, 500.0, 381.0, 271.0, 187.0, 156.0, 120.0, 107.0, 82.0, 51.0, 36.0, 25.0, 31.0, 21.0, 20.0, 14.0, 8.0, 5.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0], "bins": [-2.2587437629699707, -2.1933069229125977, -2.1278700828552246, -2.0624332427978516, -1.9969964027404785, -1.9315595626831055, -1.866122841835022, -1.800686001777649, -1.7352491617202759, -1.6698123216629028, -1.6043754816055298, -1.5389386415481567, -1.4735019207000732, -1.4080650806427002, -1.3426282405853271, -1.277191400527954, -1.211754560470581, -1.146317720413208, -1.080880880355835, -1.015444040298462, -0.9500072598457336, -0.8845704197883606, -0.8191336393356323, -0.7536967992782593, -0.6882599592208862, -0.6228231191635132, -0.5573862791061401, -0.49194949865341187, -0.4265126585960388, -0.36107581853866577, -0.2956390082836151, -0.23020219802856445, -0.1647651195526123, -0.09932829439640045, -0.0338914692401886, 0.031545355916023254, 0.09698218107223511, 0.16241902112960815, 0.2278558313846588, 0.2932926416397095, 0.3587294816970825, 0.42416632175445557, 0.4896031320095062, 0.5550399422645569, 0.6204767823219299, 0.685913622379303, 0.7513504028320312, 0.8167872428894043, 0.8822240829467773, 0.9476609230041504, 1.0130977630615234, 1.0785346031188965, 1.1439714431762695, 1.2094082832336426, 1.274845004081726, 1.3402818441390991, 1.4057186841964722, 1.4711555242538452, 1.5365923643112183, 1.6020292043685913, 1.6674659252166748, 1.7329027652740479, 1.798339605331421, 1.863776445388794, 1.929213285446167]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 20.0, 29.0, 36.0, 22.0, 42.0, 70.0, 123.0, 251.0, 517.0, 1363.0, 3337.0, 8114.0, 23150.0, 51392964.0, 23931.0, 9734.0, 4346.0, 1814.0, 783.0, 346.0, 145.0, 76.0, 39.0, 25.0, 21.0, 11.0, 8.0, 1.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.072476387023926, -6.861478805541992, -6.650481700897217, -6.439484119415283, -6.22848653793335, -6.017489433288574, -5.806491851806641, -5.595494270324707, -5.384497165679932, -5.173499584197998, -4.962502479553223, -4.751504898071289, -4.5405073165893555, -4.32951021194458, -4.1185126304626465, -3.907515287399292, -3.6965177059173584, -3.485520362854004, -3.2745227813720703, -3.063525438308716, -2.8525280952453613, -2.6415305137634277, -2.4305331707000732, -2.2195358276367188, -2.008538246154785, -1.7975407838821411, -1.5865434408187866, -1.3755459785461426, -1.164548635482788, -0.953551173210144, -0.7425537109375, -0.5315563678741455, -0.320559024810791, -0.10956160724163055, 0.10143581032752991, 0.31243324279785156, 0.5234306454658508, 0.7344280481338501, 0.9454255104064941, 1.1564228534698486, 1.3674203157424927, 1.5784177780151367, 1.7894151210784912, 2.0004124641418457, 2.2114100456237793, 2.422407388687134, 2.6334047317504883, 2.844402313232422, 3.0553996562957764, 3.266396999359131, 3.4773945808410645, 3.688391923904419, 3.8993892669677734, 4.110386848449707, 4.321384429931641, 4.532381534576416, 4.74337911605835, 4.954376697540283, 5.165373802185059, 5.376371383666992, 5.587368965148926, 5.798366069793701, 6.009363651275635, 6.22036075592041, 6.431358337402344]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 9.0, 11.0, 20.0, 21.0, 25.0, 52.0, 90.0, 119.0, 159.0, 274.0, 369.0, 654.0, 989.0, 1713.0, 2702.0, 4597.0, 7737.0, 13427.0, 23386.0, 41755.0, 75000.0, 130735.0, 215733.0, 328222.0, 521927.0, 3131769.0, 819608.0, 366794.0, 247929.0, 152645.0, 87470.0, 49823.0, 27634.0, 15679.0, 8753.0, 5259.0, 3178.0, 1947.0, 1225.0, 725.0, 443.0, 283.0, 177.0, 137.0, 79.0, 54.0, 28.0, 20.0, 17.0, 15.0, 8.0, 9.0, 6.0, 2.0, 1.0], "bins": [-1.4921875, -1.449127197265625, -1.40606689453125, -1.363006591796875, -1.3199462890625, -1.276885986328125, -1.23382568359375, -1.190765380859375, -1.147705078125, -1.104644775390625, -1.06158447265625, -1.018524169921875, -0.9754638671875, -0.932403564453125, -0.88934326171875, -0.846282958984375, -0.80322265625, -0.760162353515625, -0.71710205078125, -0.674041748046875, -0.6309814453125, -0.587921142578125, -0.54486083984375, -0.501800537109375, -0.458740234375, -0.415679931640625, -0.37261962890625, -0.329559326171875, -0.2864990234375, -0.243438720703125, -0.20037841796875, -0.157318115234375, -0.1142578125, -0.071197509765625, -0.02813720703125, 0.014923095703125, 0.0579833984375, 0.101043701171875, 0.14410400390625, 0.187164306640625, 0.230224609375, 0.273284912109375, 0.31634521484375, 0.359405517578125, 0.4024658203125, 0.445526123046875, 0.48858642578125, 0.531646728515625, 0.57470703125, 0.617767333984375, 0.66082763671875, 0.703887939453125, 0.7469482421875, 0.790008544921875, 0.83306884765625, 0.876129150390625, 0.919189453125, 0.962249755859375, 1.00531005859375, 1.048370361328125, 1.0914306640625, 1.134490966796875, 1.17755126953125, 1.220611572265625, 1.263671875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 9.0, 11.0, 13.0, 10.0, 22.0, 16.0, 24.0, 22.0, 28.0, 25.0, 13.0, 38.0, 38.0, 53.0, 54.0, 54.0, 123.0, 779.0, 245.0, 59.0, 49.0, 42.0, 41.0, 36.0, 33.0, 30.0, 15.0, 20.0, 26.0, 14.0, 12.0, 10.0, 11.0, 8.0, 8.0, 9.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.80078125, -7.55487060546875, -7.3089599609375, -7.06304931640625, -6.817138671875, -6.57122802734375, -6.3253173828125, -6.07940673828125, -5.83349609375, -5.58758544921875, -5.3416748046875, -5.09576416015625, -4.849853515625, -4.60394287109375, -4.3580322265625, -4.11212158203125, -3.8662109375, -3.62030029296875, -3.3743896484375, -3.12847900390625, -2.882568359375, -2.63665771484375, -2.3907470703125, -2.14483642578125, -1.89892578125, -1.65301513671875, -1.4071044921875, -1.16119384765625, -0.915283203125, -0.66937255859375, -0.4234619140625, -0.17755126953125, 0.068359375, 0.31427001953125, 0.5601806640625, 0.80609130859375, 1.052001953125, 1.29791259765625, 1.5438232421875, 1.78973388671875, 2.03564453125, 2.28155517578125, 2.5274658203125, 2.77337646484375, 3.019287109375, 3.26519775390625, 3.5111083984375, 3.75701904296875, 4.0029296875, 4.24884033203125, 4.4947509765625, 4.74066162109375, 4.986572265625, 5.23248291015625, 5.4783935546875, 5.72430419921875, 5.97021484375, 6.21612548828125, 6.4620361328125, 6.70794677734375, 6.953857421875, 7.19976806640625, 7.4456787109375, 7.69158935546875, 7.9375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 9.0, 7.0, 14.0, 20.0, 43.0, 77.0, 138.0, 205.0, 375.0, 616.0, 921.0, 1623.0, 2517.0, 3951.0, 6200.0, 9470.0, 14756.0, 21888.0, 31698.0, 45857.0, 64232.0, 87046.0, 115635.0, 146235.0, 179375.0, 211251.0, 257409.0, 727671.0, 2302403.0, 833116.0, 264815.0, 214065.0, 181660.0, 148634.0, 117885.0, 89314.0, 65568.0, 47631.0, 33031.0, 22369.0, 15004.0, 9839.0, 6316.0, 4126.0, 2461.0, 1607.0, 971.0, 569.0, 351.0, 200.0, 111.0, 63.0, 30.0, 29.0, 13.0, 9.0, 10.0, 4.0, 2.0, 2.0], "bins": [-0.63232421875, -0.6128921508789062, -0.5934600830078125, -0.5740280151367188, -0.554595947265625, -0.5351638793945312, -0.5157318115234375, -0.49629974365234375, -0.47686767578125, -0.45743560791015625, -0.4380035400390625, -0.41857147216796875, -0.399139404296875, -0.37970733642578125, -0.3602752685546875, -0.34084320068359375, -0.3214111328125, -0.30197906494140625, -0.2825469970703125, -0.26311492919921875, -0.243682861328125, -0.22425079345703125, -0.2048187255859375, -0.18538665771484375, -0.16595458984375, -0.14652252197265625, -0.1270904541015625, -0.10765838623046875, -0.088226318359375, -0.06879425048828125, -0.0493621826171875, -0.02993011474609375, -0.010498046875, 0.00893402099609375, 0.0283660888671875, 0.04779815673828125, 0.067230224609375, 0.08666229248046875, 0.1060943603515625, 0.12552642822265625, 0.14495849609375, 0.16439056396484375, 0.1838226318359375, 0.20325469970703125, 0.222686767578125, 0.24211883544921875, 0.2615509033203125, 0.28098297119140625, 0.3004150390625, 0.31984710693359375, 0.3392791748046875, 0.35871124267578125, 0.378143310546875, 0.39757537841796875, 0.4170074462890625, 0.43643951416015625, 0.45587158203125, 0.47530364990234375, 0.4947357177734375, 0.5141677856445312, 0.533599853515625, 0.5530319213867188, 0.5724639892578125, 0.5918960571289062, 0.611328125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 2.0, 10.0, 8.0, 12.0, 13.0, 15.0, 19.0, 31.0, 28.0, 34.0, 34.0, 36.0, 48.0, 47.0, 38.0, 57.0, 109.0, 731.0, 326.0, 48.0, 32.0, 46.0, 42.0, 34.0, 39.0, 22.0, 12.0, 27.0, 22.0, 21.0, 19.0, 14.0, 7.0, 11.0, 10.0, 6.0, 3.0, 2.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.02734375, -4.846435546875, -4.66552734375, -4.484619140625, -4.3037109375, -4.122802734375, -3.94189453125, -3.760986328125, -3.580078125, -3.399169921875, -3.21826171875, -3.037353515625, -2.8564453125, -2.675537109375, -2.49462890625, -2.313720703125, -2.1328125, -1.951904296875, -1.77099609375, -1.590087890625, -1.4091796875, -1.228271484375, -1.04736328125, -0.866455078125, -0.685546875, -0.504638671875, -0.32373046875, -0.142822265625, 0.0380859375, 0.218994140625, 0.39990234375, 0.580810546875, 0.76171875, 0.942626953125, 1.12353515625, 1.304443359375, 1.4853515625, 1.666259765625, 1.84716796875, 2.028076171875, 2.208984375, 2.389892578125, 2.57080078125, 2.751708984375, 2.9326171875, 3.113525390625, 3.29443359375, 3.475341796875, 3.65625, 3.837158203125, 4.01806640625, 4.198974609375, 4.3798828125, 4.560791015625, 4.74169921875, 4.922607421875, 5.103515625, 5.284423828125, 5.46533203125, 5.646240234375, 5.8271484375, 6.008056640625, 6.18896484375, 6.369873046875, 6.55078125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 13.0, 9.0, 18.0, 19.0, 37.0, 27.0, 37.0, 57.0, 77.0, 108.0, 140.0, 201.0, 305.0, 431.0, 558.0, 820.0, 1191.0, 1969.0, 3801.0, 8582.0, 24006.0, 71284.0, 201838.0, 477514.0, 2407099.0, 2307029.0, 474175.0, 198763.0, 69436.0, 23595.0, 8586.0, 3689.0, 1989.0, 1233.0, 848.0, 549.0, 414.0, 257.0, 202.0, 130.0, 117.0, 82.0, 55.0, 47.0, 31.0, 29.0, 11.0, 6.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-1.7333984375, -1.6808624267578125, -1.628326416015625, -1.5757904052734375, -1.52325439453125, -1.4707183837890625, -1.418182373046875, -1.3656463623046875, -1.3131103515625, -1.2605743408203125, -1.208038330078125, -1.1555023193359375, -1.10296630859375, -1.0504302978515625, -0.997894287109375, -0.9453582763671875, -0.892822265625, -0.8402862548828125, -0.787750244140625, -0.7352142333984375, -0.68267822265625, -0.6301422119140625, -0.577606201171875, -0.5250701904296875, -0.4725341796875, -0.4199981689453125, -0.367462158203125, -0.3149261474609375, -0.26239013671875, -0.2098541259765625, -0.157318115234375, -0.1047821044921875, -0.05224609375, 0.0002899169921875, 0.052825927734375, 0.1053619384765625, 0.15789794921875, 0.2104339599609375, 0.262969970703125, 0.3155059814453125, 0.3680419921875, 0.4205780029296875, 0.473114013671875, 0.5256500244140625, 0.57818603515625, 0.6307220458984375, 0.683258056640625, 0.7357940673828125, 0.788330078125, 0.8408660888671875, 0.893402099609375, 0.9459381103515625, 0.99847412109375, 1.0510101318359375, 1.103546142578125, 1.1560821533203125, 1.2086181640625, 1.2611541748046875, 1.313690185546875, 1.3662261962890625, 1.41876220703125, 1.4712982177734375, 1.523834228515625, 1.5763702392578125, 1.62890625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 4.0, 10.0, 14.0, 13.0, 12.0, 18.0, 16.0, 25.0, 21.0, 24.0, 28.0, 31.0, 31.0, 37.0, 31.0, 37.0, 35.0, 41.0, 214.0, 662.0, 266.0, 41.0, 40.0, 40.0, 38.0, 43.0, 37.0, 29.0, 26.0, 27.0, 19.0, 15.0, 19.0, 13.0, 12.0, 11.0, 6.0, 8.0, 9.0, 4.0, 7.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.90234375, -3.786468505859375, -3.67059326171875, -3.554718017578125, -3.4388427734375, -3.322967529296875, -3.20709228515625, -3.091217041015625, -2.975341796875, -2.859466552734375, -2.74359130859375, -2.627716064453125, -2.5118408203125, -2.395965576171875, -2.28009033203125, -2.164215087890625, -2.04833984375, -1.932464599609375, -1.81658935546875, -1.700714111328125, -1.5848388671875, -1.468963623046875, -1.35308837890625, -1.237213134765625, -1.121337890625, -1.005462646484375, -0.88958740234375, -0.773712158203125, -0.6578369140625, -0.541961669921875, -0.42608642578125, -0.310211181640625, -0.1943359375, -0.078460693359375, 0.03741455078125, 0.153289794921875, 0.2691650390625, 0.385040283203125, 0.50091552734375, 0.616790771484375, 0.732666015625, 0.848541259765625, 0.96441650390625, 1.080291748046875, 1.1961669921875, 1.312042236328125, 1.42791748046875, 1.543792724609375, 1.65966796875, 1.775543212890625, 1.89141845703125, 2.007293701171875, 2.1231689453125, 2.239044189453125, 2.35491943359375, 2.470794677734375, 2.586669921875, 2.702545166015625, 2.81842041015625, 2.934295654296875, 3.0501708984375, 3.166046142578125, 3.28192138671875, 3.397796630859375, 3.513671875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 45.0, 102.0, 216.0, 316.0, 192.0, 93.0, 20.0, 12.0, 1.0], "bins": [-38.39568328857422, -37.740325927734375, -37.0849723815918, -36.42961502075195, -35.774261474609375, -35.11890411376953, -34.46355056762695, -33.80819320678711, -33.15283966064453, -32.49748229980469, -31.84212875366211, -31.1867733001709, -30.531417846679688, -29.876060485839844, -29.220705032348633, -28.565349578857422, -27.909992218017578, -27.254636764526367, -26.599281311035156, -25.943925857543945, -25.288570404052734, -24.63321304321289, -23.97785758972168, -23.32250213623047, -22.667146682739258, -22.011791229248047, -21.356435775756836, -20.701080322265625, -20.04572296142578, -19.39036750793457, -18.73501205444336, -18.07965660095215, -17.424301147460938, -16.768945693969727, -16.113590240478516, -15.458233833312988, -14.802878379821777, -14.147522926330566, -13.492166519165039, -12.836811065673828, -12.181456565856934, -11.526101112365723, -10.870744705200195, -10.215389251708984, -9.560033798217773, -8.904678344726562, -8.249322891235352, -7.593966484069824, -6.938611030578613, -6.283255577087402, -5.627899646759033, -4.972543716430664, -4.317188262939453, -3.661832571029663, -3.006476879119873, -2.351120948791504, -1.695765495300293, -1.040409803390503, -0.3850541114807129, 0.27030158042907715, 0.9256572723388672, 1.5810129642486572, 2.2363686561584473, 2.8917245864868164, 3.5470800399780273]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 12.0, 5.0, 10.0, 7.0, 10.0, 21.0, 14.0, 14.0, 22.0, 20.0, 27.0, 38.0, 41.0, 40.0, 40.0, 39.0, 38.0, 39.0, 36.0, 38.0, 42.0, 40.0, 37.0, 40.0, 38.0, 26.0, 20.0, 35.0, 23.0, 25.0, 21.0, 25.0, 17.0, 18.0, 10.0, 10.0, 17.0, 12.0, 8.0, 3.0, 8.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-6.85384464263916, -6.670539379119873, -6.487234115600586, -6.303928375244141, -6.1206231117248535, -5.937317848205566, -5.754012584686279, -5.570707321166992, -5.387401580810547, -5.20409631729126, -5.020791053771973, -4.837485313415527, -4.65418004989624, -4.470874786376953, -4.287569522857666, -4.104264259338379, -3.920958995819092, -3.7376537322998047, -3.5543482303619385, -3.3710429668426514, -3.187737464904785, -3.004432201385498, -2.821126937866211, -2.637821674346924, -2.4545161724090576, -2.2712109088897705, -2.0879054069519043, -1.9046001434326172, -1.7212947607040405, -1.5379893779754639, -1.3546841144561768, -1.1713787317276, -0.9880733489990234, -0.8047679662704468, -0.6214626431465149, -0.438157320022583, -0.25485193729400635, -0.07154655456542969, 0.11175870895385742, 0.2950640916824341, 0.47836947441101074, 0.6616748571395874, 0.8449801802635193, 1.0282855033874512, 1.2115908861160278, 1.3948962688446045, 1.5782015323638916, 1.7615069150924683, 1.944812297821045, 2.128117561340332, 2.3114230632781982, 2.4947283267974854, 2.6780338287353516, 2.8613390922546387, 3.044644355773926, 3.227949619293213, 3.411255121231079, 3.594560384750366, 3.7778658866882324, 3.9611711502075195, 4.144476413726807, 4.327781677246094, 4.511087417602539, 4.694392681121826, 4.877697944641113]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 10.0, 3.0, 10.0, 10.0, 20.0, 22.0, 35.0, 61.0, 133.0, 231.0, 536.0, 1270.0, 2966.0, 7230.0, 22256.0, 102875.0, 1521857.0, 2315876.0, 174180.0, 28973.0, 9390.0, 3561.0, 1448.0, 643.0, 319.0, 151.0, 78.0, 57.0, 27.0, 16.0, 9.0, 13.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2369384765625, -0.2281970977783203, -0.21945571899414062, -0.21071434020996094, -0.20197296142578125, -0.19323158264160156, -0.18449020385742188, -0.1757488250732422, -0.1670074462890625, -0.1582660675048828, -0.14952468872070312, -0.14078330993652344, -0.13204193115234375, -0.12330055236816406, -0.11455917358398438, -0.10581779479980469, -0.097076416015625, -0.08833503723144531, -0.07959365844726562, -0.07085227966308594, -0.06211090087890625, -0.05336952209472656, -0.044628143310546875, -0.03588676452636719, -0.0271453857421875, -0.018404006958007812, -0.009662628173828125, -0.0009212493896484375, 0.00782012939453125, 0.016561508178710938, 0.025302886962890625, 0.03404426574707031, 0.04278564453125, 0.05152702331542969, 0.060268402099609375, 0.06900978088378906, 0.07775115966796875, 0.08649253845214844, 0.09523391723632812, 0.10397529602050781, 0.1127166748046875, 0.12145805358886719, 0.13019943237304688, 0.13894081115722656, 0.14768218994140625, 0.15642356872558594, 0.16516494750976562, 0.1739063262939453, 0.182647705078125, 0.1913890838623047, 0.20013046264648438, 0.20887184143066406, 0.21761322021484375, 0.22635459899902344, 0.23509597778320312, 0.2438373565673828, 0.2525787353515625, 0.2613201141357422, 0.2700614929199219, 0.27880287170410156, 0.28754425048828125, 0.29628562927246094, 0.3050270080566406, 0.3137683868408203, 0.322509765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 7.0, 11.0, 12.0, 11.0, 20.0, 20.0, 27.0, 37.0, 44.0, 50.0, 61.0, 43.0, 81.0, 78.0, 75.0, 53.0, 45.0, 59.0, 45.0, 59.0, 34.0, 27.0, 24.0, 13.0, 21.0, 13.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.12065315246582031, -0.11618423461914062, -0.11171531677246094, -0.10724639892578125, -0.10277748107910156, -0.09830856323242188, -0.09383964538574219, -0.0893707275390625, -0.08490180969238281, -0.08043289184570312, -0.07596397399902344, -0.07149505615234375, -0.06702613830566406, -0.06255722045898438, -0.05808830261230469, -0.053619384765625, -0.04915046691894531, -0.044681549072265625, -0.04021263122558594, -0.03574371337890625, -0.03127479553222656, -0.026805877685546875, -0.022336959838867188, -0.0178680419921875, -0.013399124145507812, -0.008930206298828125, -0.0044612884521484375, 7.62939453125e-06, 0.0044765472412109375, 0.008945465087890625, 0.013414382934570312, 0.01788330078125, 0.022352218627929688, 0.026821136474609375, 0.03129005432128906, 0.03575897216796875, 0.04022789001464844, 0.044696807861328125, 0.04916572570800781, 0.0536346435546875, 0.05810356140136719, 0.06257247924804688, 0.06704139709472656, 0.07151031494140625, 0.07597923278808594, 0.08044815063476562, 0.08491706848144531, 0.089385986328125, 0.09385490417480469, 0.09832382202148438, 0.10279273986816406, 0.10726165771484375, 0.11173057556152344, 0.11619949340820312, 0.12066841125488281, 0.1251373291015625, 0.1296062469482422, 0.13407516479492188, 0.13854408264160156, 0.14301300048828125, 0.14748191833496094, 0.15195083618164062, 0.1564197540283203, 0.160888671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 7.0, 2.0, 4.0, 2.0, 8.0, 5.0, 7.0, 13.0, 23.0, 28.0, 37.0, 54.0, 77.0, 162.0, 260.0, 501.0, 1235.0, 3669.0, 12347.0, 61325.0, 530538.0, 2703471.0, 774085.0, 83944.0, 15354.0, 4281.0, 1524.0, 584.0, 314.0, 144.0, 91.0, 46.0, 33.0, 31.0, 17.0, 11.0, 15.0, 12.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17236328125, -0.1665363311767578, -0.16070938110351562, -0.15488243103027344, -0.14905548095703125, -0.14322853088378906, -0.13740158081054688, -0.1315746307373047, -0.1257476806640625, -0.11992073059082031, -0.11409378051757812, -0.10826683044433594, -0.10243988037109375, -0.09661293029785156, -0.09078598022460938, -0.08495903015136719, -0.079132080078125, -0.07330513000488281, -0.06747817993164062, -0.06165122985839844, -0.05582427978515625, -0.04999732971191406, -0.044170379638671875, -0.03834342956542969, -0.0325164794921875, -0.026689529418945312, -0.020862579345703125, -0.015035629272460938, -0.00920867919921875, -0.0033817291259765625, 0.002445220947265625, 0.008272171020507812, 0.01409912109375, 0.019926071166992188, 0.025753021240234375, 0.03157997131347656, 0.03740692138671875, 0.04323387145996094, 0.049060821533203125, 0.05488777160644531, 0.0607147216796875, 0.06654167175292969, 0.07236862182617188, 0.07819557189941406, 0.08402252197265625, 0.08984947204589844, 0.09567642211914062, 0.10150337219238281, 0.107330322265625, 0.11315727233886719, 0.11898422241210938, 0.12481117248535156, 0.13063812255859375, 0.13646507263183594, 0.14229202270507812, 0.1481189727783203, 0.1539459228515625, 0.1597728729248047, 0.16559982299804688, 0.17142677307128906, 0.17725372314453125, 0.18308067321777344, 0.18890762329101562, 0.1947345733642578, 0.2005615234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 7.0, 13.0, 8.0, 23.0, 35.0, 34.0, 58.0, 87.0, 114.0, 200.0, 240.0, 325.0, 427.0, 447.0, 486.0, 413.0, 323.0, 221.0, 184.0, 114.0, 83.0, 56.0, 37.0, 31.0, 21.0, 23.0, 13.0, 4.0, 5.0, 6.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1318359375, -0.12817859649658203, -0.12452125549316406, -0.1208639144897461, -0.11720657348632812, -0.11354923248291016, -0.10989189147949219, -0.10623455047607422, -0.10257720947265625, -0.09891986846923828, -0.09526252746582031, -0.09160518646240234, -0.08794784545898438, -0.0842905044555664, -0.08063316345214844, -0.07697582244873047, -0.0733184814453125, -0.06966114044189453, -0.06600379943847656, -0.062346458435058594, -0.058689117431640625, -0.055031776428222656, -0.05137443542480469, -0.04771709442138672, -0.04405975341796875, -0.04040241241455078, -0.03674507141113281, -0.033087730407714844, -0.029430389404296875, -0.025773048400878906, -0.022115707397460938, -0.01845836639404297, -0.014801025390625, -0.011143684387207031, -0.0074863433837890625, -0.0038290023803710938, -0.000171661376953125, 0.0034856796264648438, 0.0071430206298828125, 0.010800361633300781, 0.01445770263671875, 0.01811504364013672, 0.021772384643554688, 0.025429725646972656, 0.029087066650390625, 0.032744407653808594, 0.03640174865722656, 0.04005908966064453, 0.0437164306640625, 0.04737377166748047, 0.05103111267089844, 0.054688453674316406, 0.058345794677734375, 0.062003135681152344, 0.06566047668457031, 0.06931781768798828, 0.07297515869140625, 0.07663249969482422, 0.08028984069824219, 0.08394718170166016, 0.08760452270507812, 0.0912618637084961, 0.09491920471191406, 0.09857654571533203, 0.10223388671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 7.0, 16.0, 38.0, 78.0, 122.0, 158.0, 188.0, 161.0, 95.0, 72.0, 30.0, 16.0, 9.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9050458669662476, -0.878834068775177, -0.8526222705841064, -0.8264104723930359, -0.8001986742019653, -0.77398681640625, -0.7477750182151794, -0.7215632200241089, -0.6953514218330383, -0.6691396236419678, -0.6429278254508972, -0.6167160272598267, -0.5905041694641113, -0.5642924308776855, -0.5380805730819702, -0.5118687748908997, -0.4856569766998291, -0.45944517850875854, -0.433233380317688, -0.40702155232429504, -0.3808097541332245, -0.35459795594215393, -0.328386127948761, -0.30217432975769043, -0.2759625315666199, -0.24975073337554932, -0.22353892028331757, -0.19732710719108582, -0.17111530900001526, -0.1449035108089447, -0.11869169771671295, -0.0924798846244812, -0.06626814603805542, -0.040056340396404266, -0.013844534754753113, 0.01236727088689804, 0.038579076528549194, 0.06479087471961975, 0.0910026878118515, 0.11721450090408325, 0.1434262990951538, 0.16963809728622437, 0.19584991037845612, 0.22206172347068787, 0.24827352166175842, 0.274485319852829, 0.3006971478462219, 0.3269089460372925, 0.35312074422836304, 0.3793325424194336, 0.40554434061050415, 0.4317561686038971, 0.45796796679496765, 0.4841797649860382, 0.5103915929794312, 0.5366033911705017, 0.5628151893615723, 0.5890269875526428, 0.6152387857437134, 0.6414505839347839, 0.6676623821258545, 0.6938742399215698, 0.7200860381126404, 0.7462978363037109, 0.7725096344947815]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 1.0, 11.0, 7.0, 10.0, 14.0, 24.0, 16.0, 18.0, 23.0, 29.0, 27.0, 32.0, 47.0, 40.0, 41.0, 61.0, 47.0, 33.0, 40.0, 38.0, 53.0, 54.0, 35.0, 48.0, 33.0, 30.0, 34.0, 25.0, 21.0, 28.0, 16.0, 16.0, 11.0, 8.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.37412774562835693, -0.36378976702690125, -0.35345175862312317, -0.3431137800216675, -0.3327757716178894, -0.3224377930164337, -0.31209978461265564, -0.30176180601119995, -0.2914237976074219, -0.2810858190059662, -0.2707478106021881, -0.2604098320007324, -0.25007182359695435, -0.23973384499549866, -0.22939585149288177, -0.2190578579902649, -0.2087198793888092, -0.19838188588619232, -0.18804389238357544, -0.17770589888095856, -0.16736790537834167, -0.157029926776886, -0.1466919332742691, -0.13635393977165222, -0.12601594626903534, -0.11567795276641846, -0.10533995926380157, -0.09500197321176529, -0.08466397970914841, -0.07432598620653152, -0.06398800015449524, -0.05365000665187836, -0.043312013149261475, -0.03297401964664459, -0.02263602986931801, -0.012298038229346275, -0.0019600465893745422, 0.00837794691324234, 0.018715936690568924, 0.029053926467895508, 0.03939191997051239, 0.04972991347312927, 0.060067903250455856, 0.07040589302778244, 0.08074388653039932, 0.0910818800330162, 0.10141986608505249, 0.11175785958766937, 0.12209585309028625, 0.13243384659290314, 0.14277184009552002, 0.1531098335981369, 0.16344782710075378, 0.17378580570220947, 0.18412379920482635, 0.19446179270744324, 0.20479978621006012, 0.215137779712677, 0.22547577321529388, 0.23581376671791077, 0.24615174531936646, 0.25648975372314453, 0.2668277323246002, 0.2771657109260559, 0.287503719329834]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 2.0, 3.0, 8.0, 5.0, 8.0, 7.0, 8.0, 12.0, 16.0, 19.0, 31.0, 45.0, 68.0, 70.0, 100.0, 163.0, 208.0, 338.0, 494.0, 759.0, 1415.0, 2609.0, 6048.0, 18030.0, 69424.0, 308558.0, 463738.0, 128898.0, 29919.0, 9258.0, 3568.0, 1824.0, 1045.0, 621.0, 348.0, 253.0, 178.0, 125.0, 83.0, 81.0, 38.0, 32.0, 18.0, 24.0, 11.0, 9.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.18650245666503906, -0.17988967895507812, -0.1732769012451172, -0.16666412353515625, -0.1600513458251953, -0.15343856811523438, -0.14682579040527344, -0.1402130126953125, -0.13360023498535156, -0.12698745727539062, -0.12037467956542969, -0.11376190185546875, -0.10714912414550781, -0.10053634643554688, -0.09392356872558594, -0.087310791015625, -0.08069801330566406, -0.07408523559570312, -0.06747245788574219, -0.06085968017578125, -0.05424690246582031, -0.047634124755859375, -0.04102134704589844, -0.0344085693359375, -0.027795791625976562, -0.021183013916015625, -0.014570236206054688, -0.00795745849609375, -0.0013446807861328125, 0.005268096923828125, 0.011880874633789062, 0.01849365234375, 0.025106430053710938, 0.031719207763671875, 0.03833198547363281, 0.04494476318359375, 0.05155754089355469, 0.058170318603515625, 0.06478309631347656, 0.0713958740234375, 0.07800865173339844, 0.08462142944335938, 0.09123420715332031, 0.09784698486328125, 0.10445976257324219, 0.11107254028320312, 0.11768531799316406, 0.124298095703125, 0.13091087341308594, 0.13752365112304688, 0.1441364288330078, 0.15074920654296875, 0.1573619842529297, 0.16397476196289062, 0.17058753967285156, 0.1772003173828125, 0.18381309509277344, 0.19042587280273438, 0.1970386505126953, 0.20365142822265625, 0.2102642059326172, 0.21687698364257812, 0.22348976135253906, 0.2301025390625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 4.0, 9.0, 9.0, 7.0, 9.0, 15.0, 16.0, 20.0, 16.0, 22.0, 29.0, 36.0, 41.0, 44.0, 55.0, 47.0, 54.0, 55.0, 76.0, 48.0, 56.0, 55.0, 32.0, 41.0, 28.0, 35.0, 36.0, 20.0, 20.0, 27.0, 8.0, 5.0, 13.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1318359375, -0.12804889678955078, -0.12426185607910156, -0.12047481536865234, -0.11668777465820312, -0.1129007339477539, -0.10911369323730469, -0.10532665252685547, -0.10153961181640625, -0.09775257110595703, -0.09396553039550781, -0.0901784896850586, -0.08639144897460938, -0.08260440826416016, -0.07881736755371094, -0.07503032684326172, -0.0712432861328125, -0.06745624542236328, -0.06366920471191406, -0.059882164001464844, -0.056095123291015625, -0.052308082580566406, -0.04852104187011719, -0.04473400115966797, -0.04094696044921875, -0.03715991973876953, -0.03337287902832031, -0.029585838317871094, -0.025798797607421875, -0.022011756896972656, -0.018224716186523438, -0.014437675476074219, -0.010650634765625, -0.006863594055175781, -0.0030765533447265625, 0.0007104873657226562, 0.004497528076171875, 0.008284568786621094, 0.012071609497070312, 0.01585865020751953, 0.01964569091796875, 0.02343273162841797, 0.027219772338867188, 0.031006813049316406, 0.034793853759765625, 0.038580894470214844, 0.04236793518066406, 0.04615497589111328, 0.0499420166015625, 0.05372905731201172, 0.05751609802246094, 0.061303138732910156, 0.06509017944335938, 0.0688772201538086, 0.07266426086425781, 0.07645130157470703, 0.08023834228515625, 0.08402538299560547, 0.08781242370605469, 0.0915994644165039, 0.09538650512695312, 0.09917354583740234, 0.10296058654785156, 0.10674762725830078, 0.11053466796875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 2.0, 3.0, 9.0, 12.0, 11.0, 13.0, 13.0, 16.0, 25.0, 30.0, 57.0, 97.0, 202.0, 453.0, 1111.0, 3128.0, 9656.0, 32141.0, 106313.0, 279569.0, 356968.0, 176349.0, 57390.0, 16697.0, 5117.0, 1785.0, 697.0, 292.0, 135.0, 71.0, 49.0, 32.0, 22.0, 22.0, 7.0, 10.0, 17.0, 4.0, 11.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.16057395935058594, -0.15574264526367188, -0.1509113311767578, -0.14608001708984375, -0.1412487030029297, -0.13641738891601562, -0.13158607482910156, -0.1267547607421875, -0.12192344665527344, -0.11709213256835938, -0.11226081848144531, -0.10742950439453125, -0.10259819030761719, -0.09776687622070312, -0.09293556213378906, -0.088104248046875, -0.08327293395996094, -0.07844161987304688, -0.07361030578613281, -0.06877899169921875, -0.06394767761230469, -0.059116363525390625, -0.05428504943847656, -0.0494537353515625, -0.04462242126464844, -0.039791107177734375, -0.03495979309082031, -0.03012847900390625, -0.025297164916992188, -0.020465850830078125, -0.015634536743164062, -0.01080322265625, -0.0059719085693359375, -0.001140594482421875, 0.0036907196044921875, 0.00852203369140625, 0.013353347778320312, 0.018184661865234375, 0.023015975952148438, 0.0278472900390625, 0.03267860412597656, 0.037509918212890625, 0.04234123229980469, 0.04717254638671875, 0.05200386047363281, 0.056835174560546875, 0.06166648864746094, 0.066497802734375, 0.07132911682128906, 0.07616043090820312, 0.08099174499511719, 0.08582305908203125, 0.09065437316894531, 0.09548568725585938, 0.10031700134277344, 0.1051483154296875, 0.10997962951660156, 0.11481094360351562, 0.11964225769042969, 0.12447357177734375, 0.1293048858642578, 0.13413619995117188, 0.13896751403808594, 0.143798828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 4.0, 9.0, 7.0, 10.0, 19.0, 30.0, 18.0, 29.0, 30.0, 25.0, 29.0, 33.0, 35.0, 41.0, 43.0, 49.0, 48.0, 49.0, 48.0, 49.0, 44.0, 51.0, 43.0, 29.0, 39.0, 22.0, 21.0, 21.0, 17.0, 13.0, 16.0, 12.0, 11.0, 12.0, 7.0, 7.0, 5.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2398681640625, -0.23122215270996094, -0.22257614135742188, -0.2139301300048828, -0.20528411865234375, -0.1966381072998047, -0.18799209594726562, -0.17934608459472656, -0.1707000732421875, -0.16205406188964844, -0.15340805053710938, -0.1447620391845703, -0.13611602783203125, -0.1274700164794922, -0.11882400512695312, -0.11017799377441406, -0.101531982421875, -0.09288597106933594, -0.08423995971679688, -0.07559394836425781, -0.06694793701171875, -0.05830192565917969, -0.049655914306640625, -0.04100990295410156, -0.0323638916015625, -0.023717880249023438, -0.015071868896484375, -0.0064258575439453125, 0.00222015380859375, 0.010866165161132812, 0.019512176513671875, 0.028158187866210938, 0.03680419921875, 0.04545021057128906, 0.054096221923828125, 0.06274223327636719, 0.07138824462890625, 0.08003425598144531, 0.08868026733398438, 0.09732627868652344, 0.1059722900390625, 0.11461830139160156, 0.12326431274414062, 0.1319103240966797, 0.14055633544921875, 0.1492023468017578, 0.15784835815429688, 0.16649436950683594, 0.175140380859375, 0.18378639221191406, 0.19243240356445312, 0.2010784149169922, 0.20972442626953125, 0.2183704376220703, 0.22701644897460938, 0.23566246032714844, 0.2443084716796875, 0.25295448303222656, 0.2616004943847656, 0.2702465057373047, 0.27889251708984375, 0.2875385284423828, 0.2961845397949219, 0.30483055114746094, 0.3134765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 3.0, 10.0, 10.0, 16.0, 14.0, 11.0, 18.0, 29.0, 59.0, 81.0, 112.0, 195.0, 304.0, 596.0, 1166.0, 2346.0, 5538.0, 15200.0, 52924.0, 212126.0, 459851.0, 217488.0, 54059.0, 15599.0, 5624.0, 2440.0, 1174.0, 630.0, 319.0, 197.0, 139.0, 94.0, 48.0, 34.0, 18.0, 23.0, 8.0, 12.0, 10.0, 3.0, 8.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07391357421875, -0.0716400146484375, -0.069366455078125, -0.0670928955078125, -0.0648193359375, -0.0625457763671875, -0.060272216796875, -0.0579986572265625, -0.05572509765625, -0.0534515380859375, -0.051177978515625, -0.0489044189453125, -0.046630859375, -0.0443572998046875, -0.042083740234375, -0.0398101806640625, -0.03753662109375, -0.0352630615234375, -0.032989501953125, -0.0307159423828125, -0.0284423828125, -0.0261688232421875, -0.023895263671875, -0.0216217041015625, -0.01934814453125, -0.0170745849609375, -0.014801025390625, -0.0125274658203125, -0.01025390625, -0.0079803466796875, -0.005706787109375, -0.0034332275390625, -0.00115966796875, 0.0011138916015625, 0.003387451171875, 0.0056610107421875, 0.0079345703125, 0.0102081298828125, 0.012481689453125, 0.0147552490234375, 0.01702880859375, 0.0193023681640625, 0.021575927734375, 0.0238494873046875, 0.026123046875, 0.0283966064453125, 0.030670166015625, 0.0329437255859375, 0.03521728515625, 0.0374908447265625, 0.039764404296875, 0.0420379638671875, 0.0443115234375, 0.0465850830078125, 0.048858642578125, 0.0511322021484375, 0.05340576171875, 0.0556793212890625, 0.057952880859375, 0.0602264404296875, 0.0625, 0.0647735595703125, 0.067047119140625, 0.0693206787109375, 0.07159423828125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 9.0, 9.0, 3.0, 11.0, 17.0, 12.0, 21.0, 16.0, 33.0, 47.0, 48.0, 40.0, 60.0, 66.0, 65.0, 73.0, 48.0, 68.0, 57.0, 65.0, 39.0, 35.0, 35.0, 24.0, 14.0, 16.0, 23.0, 16.0, 14.0, 7.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.046627044677734e-06, -7.821246981620789e-06, -7.595866918563843e-06, -7.370486855506897e-06, -7.145106792449951e-06, -6.919726729393005e-06, -6.6943466663360596e-06, -6.468966603279114e-06, -6.243586540222168e-06, -6.018206477165222e-06, -5.792826414108276e-06, -5.5674463510513306e-06, -5.342066287994385e-06, -5.116686224937439e-06, -4.891306161880493e-06, -4.665926098823547e-06, -4.4405460357666016e-06, -4.215165972709656e-06, -3.98978590965271e-06, -3.764405846595764e-06, -3.5390257835388184e-06, -3.3136457204818726e-06, -3.0882656574249268e-06, -2.862885594367981e-06, -2.637505531311035e-06, -2.4121254682540894e-06, -2.1867454051971436e-06, -1.9613653421401978e-06, -1.735985279083252e-06, -1.5106052160263062e-06, -1.2852251529693604e-06, -1.0598450899124146e-06, -8.344650268554688e-07, -6.09084963798523e-07, -3.8370490074157715e-07, -1.5832483768463135e-07, 6.705522537231445e-08, 2.9243528842926025e-07, 5.178153514862061e-07, 7.431954145431519e-07, 9.685754776000977e-07, 1.1939555406570435e-06, 1.4193356037139893e-06, 1.644715666770935e-06, 1.8700957298278809e-06, 2.0954757928848267e-06, 2.3208558559417725e-06, 2.5462359189987183e-06, 2.771615982055664e-06, 2.99699604511261e-06, 3.2223761081695557e-06, 3.4477561712265015e-06, 3.6731362342834473e-06, 3.898516297340393e-06, 4.123896360397339e-06, 4.349276423454285e-06, 4.5746564865112305e-06, 4.800036549568176e-06, 5.025416612625122e-06, 5.250796675682068e-06, 5.476176738739014e-06, 5.7015568017959595e-06, 5.926936864852905e-06, 6.152316927909851e-06, 6.377696990966797e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 20.0, 12.0, 35.0, 40.0, 44.0, 80.0, 143.0, 234.0, 382.0, 724.0, 1413.0, 3079.0, 7777.0, 22614.0, 80988.0, 307167.0, 425935.0, 141203.0, 36335.0, 11747.0, 4451.0, 1979.0, 916.0, 509.0, 289.0, 183.0, 86.0, 52.0, 33.0, 19.0, 20.0, 12.0, 8.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08306884765625, -0.08063983917236328, -0.07821083068847656, -0.07578182220458984, -0.07335281372070312, -0.0709238052368164, -0.06849479675292969, -0.06606578826904297, -0.06363677978515625, -0.06120777130126953, -0.05877876281738281, -0.056349754333496094, -0.053920745849609375, -0.051491737365722656, -0.04906272888183594, -0.04663372039794922, -0.0442047119140625, -0.04177570343017578, -0.03934669494628906, -0.036917686462402344, -0.034488677978515625, -0.032059669494628906, -0.029630661010742188, -0.02720165252685547, -0.02477264404296875, -0.02234363555908203, -0.019914627075195312, -0.017485618591308594, -0.015056610107421875, -0.012627601623535156, -0.010198593139648438, -0.007769584655761719, -0.005340576171875, -0.0029115676879882812, -0.0004825592041015625, 0.0019464492797851562, 0.004375457763671875, 0.006804466247558594, 0.009233474731445312, 0.011662483215332031, 0.01409149169921875, 0.01652050018310547, 0.018949508666992188, 0.021378517150878906, 0.023807525634765625, 0.026236534118652344, 0.028665542602539062, 0.03109455108642578, 0.0335235595703125, 0.03595256805419922, 0.03838157653808594, 0.040810585021972656, 0.043239593505859375, 0.045668601989746094, 0.04809761047363281, 0.05052661895751953, 0.05295562744140625, 0.05538463592529297, 0.05781364440917969, 0.060242652893066406, 0.06267166137695312, 0.06510066986083984, 0.06752967834472656, 0.06995868682861328, 0.0723876953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 5.0, 8.0, 11.0, 14.0, 14.0, 13.0, 27.0, 28.0, 40.0, 41.0, 39.0, 71.0, 70.0, 64.0, 100.0, 75.0, 77.0, 64.0, 42.0, 46.0, 30.0, 29.0, 21.0, 16.0, 8.0, 8.0, 6.0, 4.0, 10.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0677490234375, -0.0656728744506836, -0.06359672546386719, -0.06152057647705078, -0.059444427490234375, -0.05736827850341797, -0.05529212951660156, -0.053215980529785156, -0.05113983154296875, -0.049063682556152344, -0.04698753356933594, -0.04491138458251953, -0.042835235595703125, -0.04075908660888672, -0.03868293762207031, -0.036606788635253906, -0.0345306396484375, -0.032454490661621094, -0.030378341674804688, -0.02830219268798828, -0.026226043701171875, -0.02414989471435547, -0.022073745727539062, -0.019997596740722656, -0.01792144775390625, -0.015845298767089844, -0.013769149780273438, -0.011693000793457031, -0.009616851806640625, -0.007540702819824219, -0.0054645538330078125, -0.0033884048461914062, -0.001312255859375, 0.0007638931274414062, 0.0028400421142578125, 0.004916191101074219, 0.006992340087890625, 0.009068489074707031, 0.011144638061523438, 0.013220787048339844, 0.01529693603515625, 0.017373085021972656, 0.019449234008789062, 0.02152538299560547, 0.023601531982421875, 0.02567768096923828, 0.027753829956054688, 0.029829978942871094, 0.0319061279296875, 0.033982276916503906, 0.03605842590332031, 0.03813457489013672, 0.040210723876953125, 0.04228687286376953, 0.04436302185058594, 0.046439170837402344, 0.04851531982421875, 0.050591468811035156, 0.05266761779785156, 0.05474376678466797, 0.056819915771484375, 0.05889606475830078, 0.06097221374511719, 0.0630483627319336, 0.06512451171875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 15.0, 31.0, 78.0, 148.0, 219.0, 222.0, 155.0, 79.0, 30.0, 17.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7163475751876831, -0.6607193350791931, -0.6050910949707031, -0.5494627952575684, -0.49383458495140076, -0.43820634484291077, -0.3825780749320984, -0.3269498348236084, -0.2713215947151184, -0.21569335460662842, -0.16006509959697723, -0.10443684458732605, -0.04880860447883606, 0.006819635629653931, 0.06244790554046631, 0.1180761456489563, 0.1737043857574463, 0.22933262586593628, 0.28496086597442627, 0.34058913588523865, 0.39621737599372864, 0.45184561610221863, 0.507473886013031, 0.563102126121521, 0.618730366230011, 0.674358606338501, 0.729986846446991, 0.785615086555481, 0.8412433862686157, 0.8968715667724609, 0.9524998664855957, 1.0081281661987305, 1.0637564659118652, 1.119384765625, 1.1750129461288452, 1.23064124584198, 1.2862694263458252, 1.34189772605896, 1.3975260257720947, 1.45315420627594, 1.5087823867797852, 1.56441068649292, 1.6200388669967651, 1.6756671667099, 1.7312953472137451, 1.7869236469268799, 1.8425519466400146, 1.8981801271438599, 1.9538084268569946, 2.00943660736084, 2.0650649070739746, 2.1206932067871094, 2.176321506500244, 2.2319495677948, 2.2875778675079346, 2.3432061672210693, 2.398834466934204, 2.454462766647339, 2.5100910663604736, 2.5657191276550293, 2.621347427368164, 2.676975727081299, 2.7326040267944336, 2.7882323265075684, 2.843860387802124]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 9.0, 10.0, 11.0, 13.0, 11.0, 19.0, 18.0, 18.0, 20.0, 31.0, 31.0, 31.0, 40.0, 30.0, 45.0, 31.0, 58.0, 47.0, 42.0, 33.0, 46.0, 46.0, 46.0, 38.0, 29.0, 42.0, 32.0, 27.0, 23.0, 17.0, 14.0, 15.0, 12.0, 12.0, 10.0, 2.0, 5.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.2559125423431396, -1.2153220176696777, -1.1747313737869263, -1.1341408491134644, -1.0935503244400024, -1.0529597997665405, -1.012369155883789, -0.9717786312103271, -0.9311881065368652, -0.8905975222587585, -0.8500069975852966, -0.8094164133071899, -0.768825888633728, -0.7282353043556213, -0.6876447200775146, -0.6470541954040527, -0.606463611125946, -0.5658730268478394, -0.5252825021743774, -0.48469191789627075, -0.44410139322280884, -0.40351080894470215, -0.36292025446891785, -0.32232969999313354, -0.28173914551734924, -0.24114859104156494, -0.20055803656578064, -0.15996746718883514, -0.11937691271305084, -0.07878635823726654, -0.038195788860321045, 0.002394765615463257, 0.04298532009124756, 0.08357587456703186, 0.12416643649339676, 0.16475699841976166, 0.20534755289554596, 0.24593810737133026, 0.28652867674827576, 0.32711923122406006, 0.36770978569984436, 0.40830034017562866, 0.44889089465141296, 0.48948144912719727, 0.530072033405304, 0.5706625580787659, 0.6112531423568726, 0.6518436670303345, 0.6924342513084412, 0.7330248355865479, 0.7736153602600098, 0.8142059445381165, 0.8547964692115784, 0.8953870534896851, 0.935977578163147, 0.9765681624412537, 1.0171587467193604, 1.0577492713928223, 1.0983399152755737, 1.1389304399490356, 1.1795209646224976, 1.2201114892959595, 1.260702133178711, 1.3012926578521729, 1.3418831825256348]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 7.0, 2.0, 6.0, 8.0, 5.0, 6.0, 14.0, 17.0, 16.0, 21.0, 32.0, 44.0, 57.0, 113.0, 239.0, 533.0, 1512.0, 5487.0, 28820.0, 415632.0, 3564301.0, 155508.0, 16689.0, 3376.0, 990.0, 383.0, 158.0, 74.0, 42.0, 36.0, 29.0, 24.0, 12.0, 18.0, 8.0, 14.0, 8.0, 6.0, 9.0, 1.0, 4.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.6259765625, -0.6082687377929688, -0.5905609130859375, -0.5728530883789062, -0.555145263671875, -0.5374374389648438, -0.5197296142578125, -0.5020217895507812, -0.48431396484375, -0.46660614013671875, -0.4488983154296875, -0.43119049072265625, -0.413482666015625, -0.39577484130859375, -0.3780670166015625, -0.36035919189453125, -0.3426513671875, -0.32494354248046875, -0.3072357177734375, -0.28952789306640625, -0.271820068359375, -0.25411224365234375, -0.2364044189453125, -0.21869659423828125, -0.20098876953125, -0.18328094482421875, -0.1655731201171875, -0.14786529541015625, -0.130157470703125, -0.11244964599609375, -0.0947418212890625, -0.07703399658203125, -0.059326171875, -0.04161834716796875, -0.0239105224609375, -0.00620269775390625, 0.011505126953125, 0.02921295166015625, 0.0469207763671875, 0.06462860107421875, 0.08233642578125, 0.10004425048828125, 0.1177520751953125, 0.13545989990234375, 0.153167724609375, 0.17087554931640625, 0.1885833740234375, 0.20629119873046875, 0.2239990234375, 0.24170684814453125, 0.2594146728515625, 0.27712249755859375, 0.294830322265625, 0.31253814697265625, 0.3302459716796875, 0.34795379638671875, 0.36566162109375, 0.38336944580078125, 0.4010772705078125, 0.41878509521484375, 0.436492919921875, 0.45420074462890625, 0.4719085693359375, 0.48961639404296875, 0.50732421875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 9.0, 10.0, 9.0, 12.0, 16.0, 17.0, 18.0, 15.0, 29.0, 26.0, 38.0, 33.0, 36.0, 50.0, 51.0, 54.0, 61.0, 43.0, 41.0, 43.0, 34.0, 47.0, 41.0, 32.0, 40.0, 28.0, 32.0, 18.0, 14.0, 18.0, 9.0, 17.0, 12.0, 5.0, 9.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.12469482421875, -0.12134075164794922, -0.11798667907714844, -0.11463260650634766, -0.11127853393554688, -0.1079244613647461, -0.10457038879394531, -0.10121631622314453, -0.09786224365234375, -0.09450817108154297, -0.09115409851074219, -0.0878000259399414, -0.08444595336914062, -0.08109188079833984, -0.07773780822753906, -0.07438373565673828, -0.0710296630859375, -0.06767559051513672, -0.06432151794433594, -0.060967445373535156, -0.057613372802734375, -0.054259300231933594, -0.05090522766113281, -0.04755115509033203, -0.04419708251953125, -0.04084300994873047, -0.03748893737792969, -0.034134864807128906, -0.030780792236328125, -0.027426719665527344, -0.024072647094726562, -0.02071857452392578, -0.017364501953125, -0.014010429382324219, -0.010656356811523438, -0.007302284240722656, -0.003948211669921875, -0.0005941390991210938, 0.0027599334716796875, 0.006114006042480469, 0.00946807861328125, 0.012822151184082031, 0.016176223754882812, 0.019530296325683594, 0.022884368896484375, 0.026238441467285156, 0.029592514038085938, 0.03294658660888672, 0.0363006591796875, 0.03965473175048828, 0.04300880432128906, 0.046362876892089844, 0.049716949462890625, 0.053071022033691406, 0.05642509460449219, 0.05977916717529297, 0.06313323974609375, 0.06648731231689453, 0.06984138488769531, 0.0731954574584961, 0.07654953002929688, 0.07990360260009766, 0.08325767517089844, 0.08661174774169922, 0.0899658203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 7.0, 11.0, 7.0, 23.0, 18.0, 35.0, 39.0, 93.0, 128.0, 223.0, 392.0, 757.0, 1545.0, 3039.0, 6858.0, 15832.0, 41137.0, 120240.0, 411574.0, 1532211.0, 1478753.0, 395509.0, 117425.0, 40013.0, 15728.0, 6516.0, 3091.0, 1499.0, 711.0, 353.0, 212.0, 105.0, 81.0, 39.0, 25.0, 20.0, 16.0, 10.0, 3.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.251953125, -0.2445392608642578, -0.23712539672851562, -0.22971153259277344, -0.22229766845703125, -0.21488380432128906, -0.20746994018554688, -0.2000560760498047, -0.1926422119140625, -0.1852283477783203, -0.17781448364257812, -0.17040061950683594, -0.16298675537109375, -0.15557289123535156, -0.14815902709960938, -0.1407451629638672, -0.133331298828125, -0.1259174346923828, -0.11850357055664062, -0.11108970642089844, -0.10367584228515625, -0.09626197814941406, -0.08884811401367188, -0.08143424987792969, -0.0740203857421875, -0.06660652160644531, -0.059192657470703125, -0.05177879333496094, -0.04436492919921875, -0.03695106506347656, -0.029537200927734375, -0.022123336791992188, -0.01470947265625, -0.0072956085205078125, 0.000118255615234375, 0.0075321197509765625, 0.01494598388671875, 0.022359848022460938, 0.029773712158203125, 0.03718757629394531, 0.0446014404296875, 0.05201530456542969, 0.059429168701171875, 0.06684303283691406, 0.07425689697265625, 0.08167076110839844, 0.08908462524414062, 0.09649848937988281, 0.103912353515625, 0.11132621765136719, 0.11874008178710938, 0.12615394592285156, 0.13356781005859375, 0.14098167419433594, 0.14839553833007812, 0.1558094024658203, 0.1632232666015625, 0.1706371307373047, 0.17805099487304688, 0.18546485900878906, 0.19287872314453125, 0.20029258728027344, 0.20770645141601562, 0.2151203155517578, 0.2225341796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 7.0, 3.0, 6.0, 12.0, 13.0, 11.0, 19.0, 32.0, 35.0, 49.0, 90.0, 100.0, 139.0, 227.0, 258.0, 378.0, 503.0, 556.0, 497.0, 320.0, 213.0, 153.0, 133.0, 87.0, 58.0, 37.0, 31.0, 22.0, 19.0, 13.0, 14.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1646728515625, -0.1595745086669922, -0.15447616577148438, -0.14937782287597656, -0.14427947998046875, -0.13918113708496094, -0.13408279418945312, -0.1289844512939453, -0.1238861083984375, -0.11878776550292969, -0.11368942260742188, -0.10859107971191406, -0.10349273681640625, -0.09839439392089844, -0.09329605102539062, -0.08819770812988281, -0.083099365234375, -0.07800102233886719, -0.07290267944335938, -0.06780433654785156, -0.06270599365234375, -0.05760765075683594, -0.052509307861328125, -0.04741096496582031, -0.0423126220703125, -0.03721427917480469, -0.032115936279296875, -0.027017593383789062, -0.02191925048828125, -0.016820907592773438, -0.011722564697265625, -0.0066242218017578125, -0.00152587890625, 0.0035724639892578125, 0.008670806884765625, 0.013769149780273438, 0.01886749267578125, 0.023965835571289062, 0.029064178466796875, 0.03416252136230469, 0.0392608642578125, 0.04435920715332031, 0.049457550048828125, 0.05455589294433594, 0.05965423583984375, 0.06475257873535156, 0.06985092163085938, 0.07494926452636719, 0.080047607421875, 0.08514595031738281, 0.09024429321289062, 0.09534263610839844, 0.10044097900390625, 0.10553932189941406, 0.11063766479492188, 0.11573600769042969, 0.1208343505859375, 0.1259326934814453, 0.13103103637695312, 0.13612937927246094, 0.14122772216796875, 0.14632606506347656, 0.15142440795898438, 0.1565227508544922, 0.16162109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 22.0, 68.0, 155.0, 256.0, 261.0, 140.0, 67.0, 21.0, 7.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3985989093780518, -1.3351898193359375, -1.2717807292938232, -1.2083717584609985, -1.1449626684188843, -1.08155357837677, -1.0181446075439453, -0.954735517501831, -0.8913264274597168, -0.8279173374176025, -0.7645083069801331, -0.7010992765426636, -0.6376901865005493, -0.5742810964584351, -0.5108720660209656, -0.4474630057811737, -0.38405394554138184, -0.32064488530158997, -0.2572358250617981, -0.19382676482200623, -0.13041770458221436, -0.06700864434242249, -0.0035995841026306152, 0.059809476137161255, 0.12321853637695312, 0.186627596616745, 0.25003665685653687, 0.31344571709632874, 0.3768547773361206, 0.4402638375759125, 0.5036728978157043, 0.5670819282531738, 0.630490779876709, 0.6938998699188232, 0.7573089003562927, 0.8207179307937622, 0.8841270208358765, 0.9475361108779907, 1.0109450817108154, 1.0743541717529297, 1.137763261795044, 1.2011723518371582, 1.2645814418792725, 1.3279904127120972, 1.3913995027542114, 1.4548085927963257, 1.5182175636291504, 1.5816266536712646, 1.645035743713379, 1.7084448337554932, 1.7718539237976074, 1.8352628946304321, 1.8986719846725464, 1.9620810747146606, 2.0254900455474854, 2.0888991355895996, 2.152308225631714, 2.215717315673828, 2.2791264057159424, 2.3425354957580566, 2.405944347381592, 2.469353437423706, 2.5327625274658203, 2.5961716175079346, 2.659580707550049]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 3.0, 9.0, 8.0, 8.0, 7.0, 18.0, 19.0, 25.0, 25.0, 32.0, 47.0, 47.0, 32.0, 60.0, 58.0, 55.0, 52.0, 53.0, 52.0, 62.0, 50.0, 36.0, 32.0, 45.0, 31.0, 21.0, 25.0, 23.0, 14.0, 10.0, 11.0, 4.0, 12.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611383855342865, -0.5926598310470581, -0.573935866355896, -0.5552118420600891, -0.536487877368927, -0.5177638530731201, -0.499039888381958, -0.4803158640861511, -0.461591899394989, -0.4428679049015045, -0.42414391040802, -0.4054199159145355, -0.386695921421051, -0.36797192692756653, -0.34924793243408203, -0.33052390813827515, -0.31179991364479065, -0.29307591915130615, -0.27435192465782166, -0.25562793016433716, -0.23690393567085266, -0.21817994117736816, -0.19945593178272247, -0.18073193728923798, -0.16200794279575348, -0.14328394830226898, -0.12455995380878448, -0.10583595186471939, -0.0871119573712349, -0.0683879628777504, -0.0496639609336853, -0.030939966440200806, -0.012215971946716309, 0.006508024409413338, 0.025232020765542984, 0.04395601898431778, 0.06268001347780228, 0.08140400797128677, 0.10012800991535187, 0.11885200440883636, 0.13757599890232086, 0.15629999339580536, 0.17502398788928986, 0.19374799728393555, 0.21247199177742004, 0.23119598627090454, 0.24991998076438904, 0.26864397525787354, 0.28736796975135803, 0.30609196424484253, 0.324815958738327, 0.3435399532318115, 0.362263947725296, 0.3809879422187805, 0.3997119665145874, 0.4184359312057495, 0.4371599555015564, 0.4558839499950409, 0.4746079444885254, 0.4933319389820099, 0.5120559334754944, 0.5307799577713013, 0.5495039224624634, 0.5682279467582703, 0.5869519114494324]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 14.0, 17.0, 11.0, 29.0, 56.0, 67.0, 116.0, 174.0, 293.0, 498.0, 866.0, 1601.0, 3270.0, 6739.0, 14837.0, 34984.0, 86057.0, 204365.0, 323574.0, 212437.0, 90939.0, 37514.0, 15655.0, 7114.0, 3476.0, 1663.0, 887.0, 504.0, 272.0, 176.0, 110.0, 82.0, 49.0, 39.0, 22.0, 10.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.19287109375, -0.1867542266845703, -0.18063735961914062, -0.17452049255371094, -0.16840362548828125, -0.16228675842285156, -0.15616989135742188, -0.1500530242919922, -0.1439361572265625, -0.1378192901611328, -0.13170242309570312, -0.12558555603027344, -0.11946868896484375, -0.11335182189941406, -0.10723495483398438, -0.10111808776855469, -0.095001220703125, -0.08888435363769531, -0.08276748657226562, -0.07665061950683594, -0.07053375244140625, -0.06441688537597656, -0.058300018310546875, -0.05218315124511719, -0.0460662841796875, -0.03994941711425781, -0.033832550048828125, -0.027715682983398438, -0.02159881591796875, -0.015481948852539062, -0.009365081787109375, -0.0032482147216796875, 0.00286865234375, 0.008985519409179688, 0.015102386474609375, 0.021219253540039062, 0.02733612060546875, 0.03345298767089844, 0.039569854736328125, 0.04568672180175781, 0.0518035888671875, 0.05792045593261719, 0.06403732299804688, 0.07015419006347656, 0.07627105712890625, 0.08238792419433594, 0.08850479125976562, 0.09462165832519531, 0.100738525390625, 0.10685539245605469, 0.11297225952148438, 0.11908912658691406, 0.12520599365234375, 0.13132286071777344, 0.13743972778320312, 0.1435565948486328, 0.1496734619140625, 0.1557903289794922, 0.16190719604492188, 0.16802406311035156, 0.17414093017578125, 0.18025779724121094, 0.18637466430664062, 0.1924915313720703, 0.1986083984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 3.0, 3.0, 9.0, 17.0, 9.0, 16.0, 19.0, 22.0, 24.0, 26.0, 18.0, 36.0, 44.0, 36.0, 46.0, 49.0, 55.0, 45.0, 58.0, 50.0, 39.0, 40.0, 39.0, 38.0, 41.0, 38.0, 36.0, 21.0, 20.0, 20.0, 13.0, 7.0, 13.0, 9.0, 7.0, 9.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.12249755859375, -0.11919498443603516, -0.11589241027832031, -0.11258983612060547, -0.10928726196289062, -0.10598468780517578, -0.10268211364746094, -0.0993795394897461, -0.09607696533203125, -0.0927743911743164, -0.08947181701660156, -0.08616924285888672, -0.08286666870117188, -0.07956409454345703, -0.07626152038574219, -0.07295894622802734, -0.0696563720703125, -0.06635379791259766, -0.06305122375488281, -0.05974864959716797, -0.056446075439453125, -0.05314350128173828, -0.04984092712402344, -0.046538352966308594, -0.04323577880859375, -0.039933204650878906, -0.03663063049316406, -0.03332805633544922, -0.030025482177734375, -0.02672290802001953, -0.023420333862304688, -0.020117759704589844, -0.016815185546875, -0.013512611389160156, -0.010210037231445312, -0.006907463073730469, -0.003604888916015625, -0.00030231475830078125, 0.0030002593994140625, 0.006302833557128906, 0.00960540771484375, 0.012907981872558594, 0.016210556030273438, 0.01951313018798828, 0.022815704345703125, 0.02611827850341797, 0.029420852661132812, 0.032723426818847656, 0.0360260009765625, 0.039328575134277344, 0.04263114929199219, 0.04593372344970703, 0.049236297607421875, 0.05253887176513672, 0.05584144592285156, 0.059144020080566406, 0.06244659423828125, 0.0657491683959961, 0.06905174255371094, 0.07235431671142578, 0.07565689086914062, 0.07895946502685547, 0.08226203918457031, 0.08556461334228516, 0.0888671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 9.0, 6.0, 13.0, 8.0, 11.0, 14.0, 11.0, 12.0, 26.0, 36.0, 28.0, 37.0, 60.0, 82.0, 183.0, 624.0, 7171.0, 252236.0, 761437.0, 24430.0, 1444.0, 224.0, 82.0, 55.0, 38.0, 44.0, 35.0, 35.0, 24.0, 16.0, 13.0, 20.0, 11.0, 15.0, 13.0, 14.0, 11.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-1.1572265625, -1.1261138916015625, -1.095001220703125, -1.0638885498046875, -1.03277587890625, -1.0016632080078125, -0.970550537109375, -0.9394378662109375, -0.9083251953125, -0.8772125244140625, -0.846099853515625, -0.8149871826171875, -0.78387451171875, -0.7527618408203125, -0.721649169921875, -0.6905364990234375, -0.659423828125, -0.6283111572265625, -0.597198486328125, -0.5660858154296875, -0.53497314453125, -0.5038604736328125, -0.472747802734375, -0.4416351318359375, -0.4105224609375, -0.3794097900390625, -0.348297119140625, -0.3171844482421875, -0.28607177734375, -0.2549591064453125, -0.223846435546875, -0.1927337646484375, -0.16162109375, -0.1305084228515625, -0.099395751953125, -0.0682830810546875, -0.03717041015625, -0.0060577392578125, 0.025054931640625, 0.0561676025390625, 0.0872802734375, 0.1183929443359375, 0.149505615234375, 0.1806182861328125, 0.21173095703125, 0.2428436279296875, 0.273956298828125, 0.3050689697265625, 0.336181640625, 0.3672943115234375, 0.398406982421875, 0.4295196533203125, 0.46063232421875, 0.4917449951171875, 0.522857666015625, 0.5539703369140625, 0.5850830078125, 0.6161956787109375, 0.647308349609375, 0.6784210205078125, 0.70953369140625, 0.7406463623046875, 0.771759033203125, 0.8028717041015625, 0.833984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 1.0, 12.0, 2.0, 15.0, 9.0, 10.0, 14.0, 13.0, 18.0, 16.0, 37.0, 32.0, 29.0, 55.0, 34.0, 33.0, 40.0, 50.0, 51.0, 51.0, 42.0, 30.0, 49.0, 32.0, 30.0, 28.0, 38.0, 30.0, 33.0, 25.0, 18.0, 15.0, 19.0, 13.0, 13.0, 13.0, 13.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.249755859375, -0.24301910400390625, -0.2362823486328125, -0.22954559326171875, -0.222808837890625, -0.21607208251953125, -0.2093353271484375, -0.20259857177734375, -0.19586181640625, -0.18912506103515625, -0.1823883056640625, -0.17565155029296875, -0.168914794921875, -0.16217803955078125, -0.1554412841796875, -0.14870452880859375, -0.1419677734375, -0.13523101806640625, -0.1284942626953125, -0.12175750732421875, -0.115020751953125, -0.10828399658203125, -0.1015472412109375, -0.09481048583984375, -0.08807373046875, -0.08133697509765625, -0.0746002197265625, -0.06786346435546875, -0.061126708984375, -0.05438995361328125, -0.0476531982421875, -0.04091644287109375, -0.0341796875, -0.02744293212890625, -0.0207061767578125, -0.01396942138671875, -0.007232666015625, -0.00049591064453125, 0.0062408447265625, 0.01297760009765625, 0.01971435546875, 0.02645111083984375, 0.0331878662109375, 0.03992462158203125, 0.046661376953125, 0.05339813232421875, 0.0601348876953125, 0.06687164306640625, 0.0736083984375, 0.08034515380859375, 0.0870819091796875, 0.09381866455078125, 0.100555419921875, 0.10729217529296875, 0.1140289306640625, 0.12076568603515625, 0.12750244140625, 0.13423919677734375, 0.1409759521484375, 0.14771270751953125, 0.154449462890625, 0.16118621826171875, 0.1679229736328125, 0.17465972900390625, 0.181396484375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 7.0, 5.0, 12.0, 14.0, 21.0, 31.0, 63.0, 112.0, 148.0, 267.0, 524.0, 898.0, 1841.0, 3986.0, 8975.0, 23430.0, 70192.0, 236759.0, 427909.0, 184552.0, 55205.0, 19139.0, 7550.0, 3448.0, 1600.0, 784.0, 436.0, 263.0, 125.0, 86.0, 43.0, 46.0, 24.0, 16.0, 9.0, 9.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1546630859375, -0.15003204345703125, -0.1454010009765625, -0.14076995849609375, -0.136138916015625, -0.13150787353515625, -0.1268768310546875, -0.12224578857421875, -0.11761474609375, -0.11298370361328125, -0.1083526611328125, -0.10372161865234375, -0.099090576171875, -0.09445953369140625, -0.0898284912109375, -0.08519744873046875, -0.08056640625, -0.07593536376953125, -0.0713043212890625, -0.06667327880859375, -0.062042236328125, -0.05741119384765625, -0.0527801513671875, -0.04814910888671875, -0.04351806640625, -0.03888702392578125, -0.0342559814453125, -0.02962493896484375, -0.024993896484375, -0.02036285400390625, -0.0157318115234375, -0.01110076904296875, -0.0064697265625, -0.00183868408203125, 0.0027923583984375, 0.00742340087890625, 0.012054443359375, 0.01668548583984375, 0.0213165283203125, 0.02594757080078125, 0.03057861328125, 0.03520965576171875, 0.0398406982421875, 0.04447174072265625, 0.049102783203125, 0.05373382568359375, 0.0583648681640625, 0.06299591064453125, 0.067626953125, 0.07225799560546875, 0.0768890380859375, 0.08152008056640625, 0.086151123046875, 0.09078216552734375, 0.0954132080078125, 0.10004425048828125, 0.10467529296875, 0.10930633544921875, 0.1139373779296875, 0.11856842041015625, 0.123199462890625, 0.12783050537109375, 0.1324615478515625, 0.13709259033203125, 0.1417236328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 10.0, 16.0, 21.0, 23.0, 36.0, 47.0, 63.0, 75.0, 107.0, 112.0, 88.0, 89.0, 72.0, 65.0, 37.0, 33.0, 12.0, 15.0, 13.0, 9.0, 5.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9490718841552734e-05, -1.87847763299942e-05, -1.807883381843567e-05, -1.7372891306877136e-05, -1.6666948795318604e-05, -1.596100628376007e-05, -1.5255063772201538e-05, -1.4549121260643005e-05, -1.3843178749084473e-05, -1.313723623752594e-05, -1.2431293725967407e-05, -1.1725351214408875e-05, -1.1019408702850342e-05, -1.0313466191291809e-05, -9.607523679733276e-06, -8.901581168174744e-06, -8.195638656616211e-06, -7.489696145057678e-06, -6.7837536334991455e-06, -6.077811121940613e-06, -5.37186861038208e-06, -4.665926098823547e-06, -3.959983587265015e-06, -3.254041075706482e-06, -2.5480985641479492e-06, -1.8421560525894165e-06, -1.1362135410308838e-06, -4.302710294723511e-07, 2.7567148208618164e-07, 9.816139936447144e-07, 1.687556505203247e-06, 2.3934990167617798e-06, 3.0994415283203125e-06, 3.8053840398788452e-06, 4.511326551437378e-06, 5.217269062995911e-06, 5.923211574554443e-06, 6.629154086112976e-06, 7.335096597671509e-06, 8.041039109230042e-06, 8.746981620788574e-06, 9.452924132347107e-06, 1.015886664390564e-05, 1.0864809155464172e-05, 1.1570751667022705e-05, 1.2276694178581238e-05, 1.298263669013977e-05, 1.3688579201698303e-05, 1.4394521713256836e-05, 1.5100464224815369e-05, 1.58064067363739e-05, 1.6512349247932434e-05, 1.7218291759490967e-05, 1.79242342710495e-05, 1.8630176782608032e-05, 1.9336119294166565e-05, 2.0042061805725098e-05, 2.074800431728363e-05, 2.1453946828842163e-05, 2.2159889340400696e-05, 2.286583185195923e-05, 2.357177436351776e-05, 2.4277716875076294e-05, 2.4983659386634827e-05, 2.568960189819336e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 3.0, 0.0, 7.0, 11.0, 6.0, 5.0, 9.0, 13.0, 20.0, 24.0, 33.0, 65.0, 158.0, 732.0, 6684.0, 153239.0, 835993.0, 47746.0, 3047.0, 421.0, 108.0, 63.0, 44.0, 26.0, 21.0, 14.0, 11.0, 20.0, 6.0, 6.0, 2.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.414306640625, -0.4034996032714844, -0.39269256591796875, -0.3818855285644531, -0.3710784912109375, -0.3602714538574219, -0.34946441650390625, -0.3386573791503906, -0.327850341796875, -0.3170433044433594, -0.30623626708984375, -0.2954292297363281, -0.2846221923828125, -0.2738151550292969, -0.26300811767578125, -0.2522010803222656, -0.24139404296875, -0.23058700561523438, -0.21977996826171875, -0.20897293090820312, -0.1981658935546875, -0.18735885620117188, -0.17655181884765625, -0.16574478149414062, -0.154937744140625, -0.14413070678710938, -0.13332366943359375, -0.12251663208007812, -0.1117095947265625, -0.10090255737304688, -0.09009552001953125, -0.07928848266601562, -0.0684814453125, -0.057674407958984375, -0.04686737060546875, -0.036060333251953125, -0.0252532958984375, -0.014446258544921875, -0.00363922119140625, 0.007167816162109375, 0.017974853515625, 0.028781890869140625, 0.03958892822265625, 0.050395965576171875, 0.0612030029296875, 0.07201004028320312, 0.08281707763671875, 0.09362411499023438, 0.10443115234375, 0.11523818969726562, 0.12604522705078125, 0.13685226440429688, 0.1476593017578125, 0.15846633911132812, 0.16927337646484375, 0.18008041381835938, 0.190887451171875, 0.20169448852539062, 0.21250152587890625, 0.22330856323242188, 0.2341156005859375, 0.24492263793945312, 0.25572967529296875, 0.2665367126464844, 0.27734375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 10.0, 8.0, 5.0, 11.0, 6.0, 23.0, 22.0, 23.0, 41.0, 59.0, 42.0, 65.0, 80.0, 83.0, 74.0, 106.0, 63.0, 50.0, 41.0, 49.0, 28.0, 22.0, 18.0, 12.0, 19.0, 9.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.08514404296875, -0.0829463005065918, -0.0807485580444336, -0.07855081558227539, -0.07635307312011719, -0.07415533065795898, -0.07195758819580078, -0.06975984573364258, -0.06756210327148438, -0.06536436080932617, -0.06316661834716797, -0.060968875885009766, -0.05877113342285156, -0.05657339096069336, -0.054375648498535156, -0.05217790603637695, -0.04998016357421875, -0.04778242111206055, -0.045584678649902344, -0.04338693618774414, -0.04118919372558594, -0.038991451263427734, -0.03679370880126953, -0.03459596633911133, -0.032398223876953125, -0.030200481414794922, -0.02800273895263672, -0.025804996490478516, -0.023607254028320312, -0.02140951156616211, -0.019211769104003906, -0.017014026641845703, -0.0148162841796875, -0.012618541717529297, -0.010420799255371094, -0.00822305679321289, -0.0060253143310546875, -0.0038275718688964844, -0.0016298294067382812, 0.0005679130554199219, 0.002765655517578125, 0.004963397979736328, 0.007161140441894531, 0.009358882904052734, 0.011556625366210938, 0.01375436782836914, 0.015952110290527344, 0.018149852752685547, 0.02034759521484375, 0.022545337677001953, 0.024743080139160156, 0.02694082260131836, 0.029138565063476562, 0.031336307525634766, 0.03353404998779297, 0.03573179244995117, 0.037929534912109375, 0.04012727737426758, 0.04232501983642578, 0.044522762298583984, 0.04672050476074219, 0.04891824722290039, 0.051115989685058594, 0.0533137321472168, 0.055511474609375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 15.0, 169.0, 752.0, 75.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0834548473358154, -0.8841234445571899, -0.6847920417785645, -0.48546063899993896, -0.2861292362213135, -0.08679783344268799, 0.1125335693359375, 0.311864972114563, 0.5111963748931885, 0.710527777671814, 0.9098591804504395, 1.109190583229065, 1.3085219860076904, 1.507853388786316, 1.7071847915649414, 1.906516194343567, 2.1058475971221924, 2.3051791191101074, 2.5045104026794434, 2.7038416862487793, 2.9031732082366943, 3.1025047302246094, 3.3018360137939453, 3.5011672973632812, 3.7004988193511963, 3.8998303413391113, 4.099161624908447, 4.298492908477783, 4.497824668884277, 4.697155952453613, 4.896487236022949, 5.095818519592285, 5.295149803161621, 5.494481086730957, 5.693812370300293, 5.893144130706787, 6.092475414276123, 6.291806697845459, 6.491138458251953, 6.690469741821289, 6.889801025390625, 7.089132308959961, 7.288463592529297, 7.487795352935791, 7.687126636505127, 7.886457920074463, 8.085789680480957, 8.285120964050293, 8.484452247619629, 8.683783531188965, 8.8831148147583, 9.082446098327637, 9.281778335571289, 9.481109619140625, 9.680440902709961, 9.879772186279297, 10.079103469848633, 10.278434753417969, 10.477766036987305, 10.67709732055664, 10.876428604125977, 11.075760841369629, 11.275092124938965, 11.4744234085083, 11.673754692077637]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 5.0, 10.0, 6.0, 10.0, 10.0, 12.0, 14.0, 26.0, 27.0, 24.0, 21.0, 31.0, 29.0, 44.0, 40.0, 33.0, 50.0, 47.0, 32.0, 55.0, 30.0, 47.0, 40.0, 42.0, 33.0, 37.0, 34.0, 25.0, 22.0, 26.0, 21.0, 17.0, 19.0, 14.0, 9.0, 11.0, 3.0, 6.0, 6.0, 7.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.8769701719284058, -0.8489359021186829, -0.8209016919136047, -0.7928674221038818, -0.7648331522941589, -0.736798882484436, -0.7087646722793579, -0.680730402469635, -0.6526961326599121, -0.6246618628501892, -0.5966276526451111, -0.5685933828353882, -0.5405591130256653, -0.5125248432159424, -0.48449063301086426, -0.45645636320114136, -0.42842215299606323, -0.4003879129886627, -0.3723536431789398, -0.3443194031715393, -0.3162851333618164, -0.2882508933544159, -0.2602166533470154, -0.23218239843845367, -0.20414814352989197, -0.17611388862133026, -0.14807963371276855, -0.12004539370536804, -0.09201113879680634, -0.06397688388824463, -0.035942643880844116, -0.00790838897228241, 0.020125925540924072, 0.04816017672419548, 0.07619442790746689, 0.104228675365448, 0.1322629302740097, 0.1602971851825714, 0.18833142518997192, 0.21636568009853363, 0.24439993500709534, 0.27243417501449585, 0.30046844482421875, 0.32850268483161926, 0.3565369248390198, 0.3845711946487427, 0.4126054346561432, 0.4406396746635437, 0.4686739444732666, 0.4967081844806671, 0.5247424244880676, 0.5527766942977905, 0.5808109641075134, 0.6088452339172363, 0.6368794441223145, 0.6649137139320374, 0.6929479837417603, 0.7209822535514832, 0.7490164637565613, 0.7770507335662842, 0.8050850033760071, 0.83311927318573, 0.8611534833908081, 0.889187753200531, 0.9172219634056091]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 4.0, 7.0, 3.0, 9.0, 5.0, 9.0, 12.0, 21.0, 22.0, 41.0, 40.0, 67.0, 102.0, 135.0, 256.0, 396.0, 632.0, 1232.0, 2245.0, 4588.0, 10214.0, 24890.0, 68859.0, 241632.0, 1391338.0, 1968226.0, 338071.0, 88808.0, 30142.0, 11807.0, 5209.0, 2392.0, 1165.0, 675.0, 359.0, 229.0, 153.0, 101.0, 57.0, 38.0, 41.0, 17.0, 16.0, 10.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.295166015625, -0.28721046447753906, -0.2792549133300781, -0.2712993621826172, -0.26334381103515625, -0.2553882598876953, -0.24743270874023438, -0.23947715759277344, -0.2315216064453125, -0.22356605529785156, -0.21561050415039062, -0.2076549530029297, -0.19969940185546875, -0.1917438507080078, -0.18378829956054688, -0.17583274841308594, -0.167877197265625, -0.15992164611816406, -0.15196609497070312, -0.1440105438232422, -0.13605499267578125, -0.1280994415283203, -0.12014389038085938, -0.11218833923339844, -0.1042327880859375, -0.09627723693847656, -0.08832168579101562, -0.08036613464355469, -0.07241058349609375, -0.06445503234863281, -0.056499481201171875, -0.04854393005371094, -0.04058837890625, -0.03263282775878906, -0.024677276611328125, -0.016721725463867188, -0.00876617431640625, -0.0008106231689453125, 0.007144927978515625, 0.015100479125976562, 0.0230560302734375, 0.031011581420898438, 0.038967132568359375, 0.04692268371582031, 0.05487823486328125, 0.06283378601074219, 0.07078933715820312, 0.07874488830566406, 0.086700439453125, 0.09465599060058594, 0.10261154174804688, 0.11056709289550781, 0.11852264404296875, 0.1264781951904297, 0.13443374633789062, 0.14238929748535156, 0.1503448486328125, 0.15830039978027344, 0.16625595092773438, 0.1742115020751953, 0.18216705322265625, 0.1901226043701172, 0.19807815551757812, 0.20603370666503906, 0.2139892578125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 2.0, 4.0, 6.0, 4.0, 10.0, 8.0, 9.0, 13.0, 13.0, 15.0, 25.0, 29.0, 28.0, 35.0, 33.0, 44.0, 43.0, 57.0, 59.0, 47.0, 60.0, 43.0, 43.0, 57.0, 39.0, 42.0, 40.0, 33.0, 25.0, 29.0, 23.0, 14.0, 20.0, 11.0, 9.0, 9.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.14208984375, -0.13835620880126953, -0.13462257385253906, -0.1308889389038086, -0.12715530395507812, -0.12342166900634766, -0.11968803405761719, -0.11595439910888672, -0.11222076416015625, -0.10848712921142578, -0.10475349426269531, -0.10101985931396484, -0.09728622436523438, -0.0935525894165039, -0.08981895446777344, -0.08608531951904297, -0.0823516845703125, -0.07861804962158203, -0.07488441467285156, -0.0711507797241211, -0.06741714477539062, -0.06368350982666016, -0.05994987487792969, -0.05621623992919922, -0.05248260498046875, -0.04874897003173828, -0.04501533508300781, -0.041281700134277344, -0.037548065185546875, -0.033814430236816406, -0.030080795288085938, -0.02634716033935547, -0.022613525390625, -0.01887989044189453, -0.015146255493164062, -0.011412620544433594, -0.007678985595703125, -0.003945350646972656, -0.0002117156982421875, 0.0035219192504882812, 0.00725555419921875, 0.010989189147949219, 0.014722824096679688, 0.018456459045410156, 0.022190093994140625, 0.025923728942871094, 0.029657363891601562, 0.03339099884033203, 0.0371246337890625, 0.04085826873779297, 0.04459190368652344, 0.048325538635253906, 0.052059173583984375, 0.055792808532714844, 0.05952644348144531, 0.06326007843017578, 0.06699371337890625, 0.07072734832763672, 0.07446098327636719, 0.07819461822509766, 0.08192825317382812, 0.0856618881225586, 0.08939552307128906, 0.09312915802001953, 0.09686279296875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 7.0, 2.0, 6.0, 12.0, 12.0, 33.0, 51.0, 76.0, 166.0, 327.0, 886.0, 3071.0, 16364.0, 123553.0, 1209425.0, 2517439.0, 281468.0, 33595.0, 5546.0, 1366.0, 473.0, 182.0, 95.0, 50.0, 35.0, 24.0, 16.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.5436553955078125, -0.526763916015625, -0.5098724365234375, -0.49298095703125, -0.4760894775390625, -0.459197998046875, -0.4423065185546875, -0.4254150390625, -0.4085235595703125, -0.391632080078125, -0.3747406005859375, -0.35784912109375, -0.3409576416015625, -0.324066162109375, -0.3071746826171875, -0.290283203125, -0.2733917236328125, -0.256500244140625, -0.2396087646484375, -0.22271728515625, -0.2058258056640625, -0.188934326171875, -0.1720428466796875, -0.1551513671875, -0.1382598876953125, -0.121368408203125, -0.1044769287109375, -0.08758544921875, -0.0706939697265625, -0.053802490234375, -0.0369110107421875, -0.02001953125, -0.0031280517578125, 0.013763427734375, 0.0306549072265625, 0.04754638671875, 0.0644378662109375, 0.081329345703125, 0.0982208251953125, 0.1151123046875, 0.1320037841796875, 0.148895263671875, 0.1657867431640625, 0.18267822265625, 0.1995697021484375, 0.216461181640625, 0.2333526611328125, 0.250244140625, 0.2671356201171875, 0.284027099609375, 0.3009185791015625, 0.31781005859375, 0.3347015380859375, 0.351593017578125, 0.3684844970703125, 0.3853759765625, 0.4022674560546875, 0.419158935546875, 0.4360504150390625, 0.45294189453125, 0.4698333740234375, 0.486724853515625, 0.5036163330078125, 0.5205078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 12.0, 15.0, 24.0, 41.0, 63.0, 104.0, 164.0, 237.0, 378.0, 551.0, 821.0, 614.0, 379.0, 259.0, 142.0, 86.0, 60.0, 52.0, 19.0, 13.0, 10.0, 5.0, 10.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18212890625, -0.17276763916015625, -0.1634063720703125, -0.15404510498046875, -0.144683837890625, -0.13532257080078125, -0.1259613037109375, -0.11660003662109375, -0.10723876953125, -0.09787750244140625, -0.0885162353515625, -0.07915496826171875, -0.069793701171875, -0.06043243408203125, -0.0510711669921875, -0.04170989990234375, -0.0323486328125, -0.02298736572265625, -0.0136260986328125, -0.00426483154296875, 0.005096435546875, 0.01445770263671875, 0.0238189697265625, 0.03318023681640625, 0.04254150390625, 0.05190277099609375, 0.0612640380859375, 0.07062530517578125, 0.079986572265625, 0.08934783935546875, 0.0987091064453125, 0.10807037353515625, 0.117431640625, 0.12679290771484375, 0.1361541748046875, 0.14551544189453125, 0.154876708984375, 0.16423797607421875, 0.1735992431640625, 0.18296051025390625, 0.19232177734375, 0.20168304443359375, 0.2110443115234375, 0.22040557861328125, 0.229766845703125, 0.23912811279296875, 0.2484893798828125, 0.25785064697265625, 0.2672119140625, 0.27657318115234375, 0.2859344482421875, 0.29529571533203125, 0.304656982421875, 0.31401824951171875, 0.3233795166015625, 0.33274078369140625, 0.34210205078125, 0.35146331787109375, 0.3608245849609375, 0.37018585205078125, 0.379547119140625, 0.38890838623046875, 0.3982696533203125, 0.40763092041015625, 0.4169921875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 43.0, 281.0, 462.0, 177.0, 29.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2849271297454834, -2.1603193283081055, -2.0357117652893066, -1.9111040830612183, -1.7864964008331299, -1.6618887186050415, -1.5372810363769531, -1.4126733541488647, -1.2880656719207764, -1.163457989692688, -1.0388503074645996, -0.9142426252365112, -0.7896349430084229, -0.6650272607803345, -0.5404195785522461, -0.4158118963241577, -0.29120421409606934, -0.16659653186798096, -0.04198884963989258, 0.0826188325881958, 0.20722651481628418, 0.33183419704437256, 0.45644187927246094, 0.5810495615005493, 0.7056572437286377, 0.8302649259567261, 0.9548726081848145, 1.0794802904129028, 1.2040879726409912, 1.3286956548690796, 1.453303337097168, 1.5779110193252563, 1.7025184631347656, 1.827126145362854, 1.9517338275909424, 2.0763416290283203, 2.200949192047119, 2.325556755065918, 2.450164556503296, 2.574772357940674, 2.6993799209594727, 2.8239874839782715, 2.9485952854156494, 3.0732030868530273, 3.197810649871826, 3.322418212890625, 3.447026014328003, 3.571633815765381, 3.6962413787841797, 3.8208489418029785, 3.9454567432403564, 4.070064544677734, 4.194672107696533, 4.319279670715332, 4.443887710571289, 4.568495273590088, 4.693102836608887, 4.8177103996276855, 4.942317962646484, 5.066926002502441, 5.19153356552124, 5.316141128540039, 5.440749168395996, 5.565356731414795, 5.689964294433594]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 6.0, 7.0, 5.0, 9.0, 9.0, 9.0, 16.0, 18.0, 10.0, 15.0, 23.0, 17.0, 21.0, 28.0, 28.0, 34.0, 48.0, 38.0, 41.0, 41.0, 47.0, 40.0, 35.0, 38.0, 28.0, 30.0, 42.0, 34.0, 39.0, 32.0, 28.0, 31.0, 26.0, 16.0, 20.0, 15.0, 21.0, 15.0, 9.0, 5.0, 6.0, 3.0, 7.0, 8.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5839733481407166, -0.5656446814537048, -0.5473159551620483, -0.5289872884750366, -0.5106586217880249, -0.4923299551010132, -0.4740012586116791, -0.45567256212234497, -0.43734389543533325, -0.41901522874832153, -0.4006865322589874, -0.3823578357696533, -0.3640291690826416, -0.3457005023956299, -0.3273718059062958, -0.30904310941696167, -0.29071444272994995, -0.27238577604293823, -0.2540570795536041, -0.2357283979654312, -0.2173997163772583, -0.1990710347890854, -0.18074235320091248, -0.16241367161273956, -0.14408499002456665, -0.12575630843639374, -0.10742762684822083, -0.08909894526004791, -0.070770263671875, -0.05244158208370209, -0.034112900495529175, -0.015784218907356262, 0.002544403076171875, 0.020873084664344788, 0.0392017662525177, 0.05753044784069061, 0.07585912942886353, 0.09418781101703644, 0.11251649260520935, 0.13084517419338226, 0.14917385578155518, 0.1675025373697281, 0.185831218957901, 0.2041599005460739, 0.22248858213424683, 0.24081726372241974, 0.25914594531059265, 0.27747464179992676, 0.2958033084869385, 0.3141319751739502, 0.3324606716632843, 0.3507893681526184, 0.3691180348396301, 0.38744670152664185, 0.40577539801597595, 0.42410409450531006, 0.4424327611923218, 0.4607614278793335, 0.4790901243686676, 0.4974188208580017, 0.5157474875450134, 0.5340761542320251, 0.5524048805236816, 0.5707335472106934, 0.5890622138977051]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 10.0, 13.0, 12.0, 12.0, 25.0, 42.0, 59.0, 79.0, 132.0, 163.0, 244.0, 322.0, 538.0, 774.0, 1127.0, 1701.0, 2447.0, 3905.0, 5991.0, 9885.0, 18215.0, 35669.0, 75853.0, 162177.0, 264072.0, 228729.0, 118748.0, 54329.0, 26406.0, 14030.0, 7982.0, 5023.0, 3207.0, 2187.0, 1397.0, 921.0, 684.0, 471.0, 276.0, 204.0, 159.0, 106.0, 71.0, 51.0, 34.0, 28.0, 15.0, 10.0, 12.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.229736328125, -0.22250938415527344, -0.21528244018554688, -0.2080554962158203, -0.20082855224609375, -0.1936016082763672, -0.18637466430664062, -0.17914772033691406, -0.1719207763671875, -0.16469383239746094, -0.15746688842773438, -0.1502399444580078, -0.14301300048828125, -0.1357860565185547, -0.12855911254882812, -0.12133216857910156, -0.114105224609375, -0.10687828063964844, -0.09965133666992188, -0.09242439270019531, -0.08519744873046875, -0.07797050476074219, -0.07074356079101562, -0.06351661682128906, -0.0562896728515625, -0.04906272888183594, -0.041835784912109375, -0.03460884094238281, -0.02738189697265625, -0.020154953002929688, -0.012928009033203125, -0.0057010650634765625, 0.00152587890625, 0.008752822875976562, 0.015979766845703125, 0.023206710815429688, 0.03043365478515625, 0.03766059875488281, 0.044887542724609375, 0.05211448669433594, 0.0593414306640625, 0.06656837463378906, 0.07379531860351562, 0.08102226257324219, 0.08824920654296875, 0.09547615051269531, 0.10270309448242188, 0.10993003845214844, 0.117156982421875, 0.12438392639160156, 0.13161087036132812, 0.1388378143310547, 0.14606475830078125, 0.1532917022705078, 0.16051864624023438, 0.16774559020996094, 0.1749725341796875, 0.18219947814941406, 0.18942642211914062, 0.1966533660888672, 0.20388031005859375, 0.2111072540283203, 0.21833419799804688, 0.22556114196777344, 0.2327880859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 5.0, 6.0, 2.0, 7.0, 13.0, 12.0, 27.0, 18.0, 10.0, 14.0, 31.0, 23.0, 34.0, 31.0, 32.0, 42.0, 38.0, 50.0, 39.0, 43.0, 57.0, 53.0, 42.0, 54.0, 44.0, 45.0, 39.0, 28.0, 34.0, 21.0, 17.0, 19.0, 7.0, 16.0, 8.0, 10.0, 6.0, 10.0, 5.0, 8.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.11444091796875, -0.11114501953125, -0.10784912109375, -0.10455322265625, -0.10125732421875, -0.09796142578125, -0.09466552734375, -0.09136962890625, -0.08807373046875, -0.08477783203125, -0.08148193359375, -0.07818603515625, -0.07489013671875, -0.07159423828125, -0.06829833984375, -0.06500244140625, -0.06170654296875, -0.05841064453125, -0.05511474609375, -0.05181884765625, -0.04852294921875, -0.04522705078125, -0.04193115234375, -0.03863525390625, -0.03533935546875, -0.03204345703125, -0.02874755859375, -0.02545166015625, -0.02215576171875, -0.01885986328125, -0.01556396484375, -0.01226806640625, -0.00897216796875, -0.00567626953125, -0.00238037109375, 0.00091552734375, 0.00421142578125, 0.00750732421875, 0.01080322265625, 0.01409912109375, 0.01739501953125, 0.02069091796875, 0.02398681640625, 0.02728271484375, 0.03057861328125, 0.03387451171875, 0.03717041015625, 0.04046630859375, 0.04376220703125, 0.04705810546875, 0.05035400390625, 0.05364990234375, 0.05694580078125, 0.06024169921875, 0.06353759765625, 0.06683349609375, 0.07012939453125, 0.07342529296875, 0.07672119140625, 0.08001708984375, 0.08331298828125, 0.08660888671875, 0.08990478515625, 0.09320068359375, 0.09649658203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 7.0, 16.0, 12.0, 22.0, 27.0, 35.0, 53.0, 75.0, 109.0, 200.0, 330.0, 622.0, 1247.0, 2697.0, 6321.0, 14896.0, 39916.0, 128249.0, 363345.0, 326719.0, 106444.0, 33631.0, 12976.0, 5603.0, 2385.0, 1170.0, 621.0, 275.0, 179.0, 102.0, 73.0, 57.0, 39.0, 26.0, 20.0, 16.0, 12.0, 8.0, 8.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.369384765625, -0.3581657409667969, -0.34694671630859375, -0.3357276916503906, -0.3245086669921875, -0.3132896423339844, -0.30207061767578125, -0.2908515930175781, -0.279632568359375, -0.2684135437011719, -0.25719451904296875, -0.24597549438476562, -0.2347564697265625, -0.22353744506835938, -0.21231842041015625, -0.20109939575195312, -0.18988037109375, -0.17866134643554688, -0.16744232177734375, -0.15622329711914062, -0.1450042724609375, -0.13378524780273438, -0.12256622314453125, -0.11134719848632812, -0.100128173828125, -0.08890914916992188, -0.07769012451171875, -0.06647109985351562, -0.0552520751953125, -0.044033050537109375, -0.03281402587890625, -0.021595001220703125, -0.0103759765625, 0.000843048095703125, 0.01206207275390625, 0.023281097412109375, 0.0345001220703125, 0.045719146728515625, 0.05693817138671875, 0.06815719604492188, 0.079376220703125, 0.09059524536132812, 0.10181427001953125, 0.11303329467773438, 0.1242523193359375, 0.13547134399414062, 0.14669036865234375, 0.15790939331054688, 0.16912841796875, 0.18034744262695312, 0.19156646728515625, 0.20278549194335938, 0.2140045166015625, 0.22522354125976562, 0.23644256591796875, 0.24766159057617188, 0.258880615234375, 0.2700996398925781, 0.28131866455078125, 0.2925376892089844, 0.3037567138671875, 0.3149757385253906, 0.32619476318359375, 0.3374137878417969, 0.3486328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 9.0, 7.0, 5.0, 10.0, 8.0, 12.0, 12.0, 10.0, 28.0, 25.0, 18.0, 30.0, 38.0, 47.0, 42.0, 44.0, 40.0, 47.0, 58.0, 40.0, 41.0, 53.0, 42.0, 29.0, 43.0, 45.0, 33.0, 32.0, 20.0, 17.0, 28.0, 20.0, 20.0, 15.0, 9.0, 10.0, 4.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.25048828125, -0.24302291870117188, -0.23555755615234375, -0.22809219360351562, -0.2206268310546875, -0.21316146850585938, -0.20569610595703125, -0.19823074340820312, -0.190765380859375, -0.18330001831054688, -0.17583465576171875, -0.16836929321289062, -0.1609039306640625, -0.15343856811523438, -0.14597320556640625, -0.13850784301757812, -0.13104248046875, -0.12357711791992188, -0.11611175537109375, -0.10864639282226562, -0.1011810302734375, -0.09371566772460938, -0.08625030517578125, -0.07878494262695312, -0.071319580078125, -0.06385421752929688, -0.05638885498046875, -0.048923492431640625, -0.0414581298828125, -0.033992767333984375, -0.02652740478515625, -0.019062042236328125, -0.0115966796875, -0.004131317138671875, 0.00333404541015625, 0.010799407958984375, 0.0182647705078125, 0.025730133056640625, 0.03319549560546875, 0.040660858154296875, 0.048126220703125, 0.055591583251953125, 0.06305694580078125, 0.07052230834960938, 0.0779876708984375, 0.08545303344726562, 0.09291839599609375, 0.10038375854492188, 0.10784912109375, 0.11531448364257812, 0.12277984619140625, 0.13024520874023438, 0.1377105712890625, 0.14517593383789062, 0.15264129638671875, 0.16010665893554688, 0.167572021484375, 0.17503738403320312, 0.18250274658203125, 0.18996810913085938, 0.1974334716796875, 0.20489883422851562, 0.21236419677734375, 0.21982955932617188, 0.227294921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 12.0, 22.0, 19.0, 36.0, 64.0, 104.0, 171.0, 242.0, 386.0, 699.0, 1212.0, 2289.0, 6570.0, 96157.0, 893616.0, 37822.0, 4626.0, 1842.0, 1047.0, 643.0, 376.0, 246.0, 132.0, 82.0, 53.0, 21.0, 18.0, 12.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.96142578125, -0.936370849609375, -0.91131591796875, -0.886260986328125, -0.8612060546875, -0.836151123046875, -0.81109619140625, -0.786041259765625, -0.760986328125, -0.735931396484375, -0.71087646484375, -0.685821533203125, -0.6607666015625, -0.635711669921875, -0.61065673828125, -0.585601806640625, -0.560546875, -0.535491943359375, -0.51043701171875, -0.485382080078125, -0.4603271484375, -0.435272216796875, -0.41021728515625, -0.385162353515625, -0.360107421875, -0.335052490234375, -0.30999755859375, -0.284942626953125, -0.2598876953125, -0.234832763671875, -0.20977783203125, -0.184722900390625, -0.15966796875, -0.134613037109375, -0.10955810546875, -0.084503173828125, -0.0594482421875, -0.034393310546875, -0.00933837890625, 0.015716552734375, 0.040771484375, 0.065826416015625, 0.09088134765625, 0.115936279296875, 0.1409912109375, 0.166046142578125, 0.19110107421875, 0.216156005859375, 0.2412109375, 0.266265869140625, 0.29132080078125, 0.316375732421875, 0.3414306640625, 0.366485595703125, 0.39154052734375, 0.416595458984375, 0.441650390625, 0.466705322265625, 0.49176025390625, 0.516815185546875, 0.5418701171875, 0.566925048828125, 0.59197998046875, 0.617034912109375, 0.64208984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 8.0, 12.0, 22.0, 100.0, 454.0, 313.0, 48.0, 19.0, 4.0, 8.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014853477478027344, -0.0001448923721909523, -0.00014124996960163116, -0.00013760756701231003, -0.0001339651644229889, -0.00013032276183366776, -0.00012668035924434662, -0.00012303795665502548, -0.00011939555406570435, -0.00011575315147638321, -0.00011211074888706207, -0.00010846834629774094, -0.0001048259437084198, -0.00010118354111909866, -9.754113852977753e-05, -9.389873594045639e-05, -9.025633335113525e-05, -8.661393076181412e-05, -8.297152817249298e-05, -7.932912558317184e-05, -7.568672299385071e-05, -7.204432040452957e-05, -6.840191781520844e-05, -6.47595152258873e-05, -6.111711263656616e-05, -5.7474710047245026e-05, -5.383230745792389e-05, -5.018990486860275e-05, -4.6547502279281616e-05, -4.290509968996048e-05, -3.926269710063934e-05, -3.562029451131821e-05, -3.197789192199707e-05, -2.8335489332675934e-05, -2.4693086743354797e-05, -2.105068415403366e-05, -1.7408281564712524e-05, -1.3765878975391388e-05, -1.0123476386070251e-05, -6.481073796749115e-06, -2.8386712074279785e-06, 8.03731381893158e-07, 4.4461339712142944e-06, 8.088536560535431e-06, 1.1730939149856567e-05, 1.5373341739177704e-05, 1.901574432849884e-05, 2.2658146917819977e-05, 2.6300549507141113e-05, 2.994295209646225e-05, 3.3585354685783386e-05, 3.722775727510452e-05, 4.087015986442566e-05, 4.4512562453746796e-05, 4.815496504306793e-05, 5.179736763238907e-05, 5.5439770221710205e-05, 5.908217281103134e-05, 6.272457540035248e-05, 6.636697798967361e-05, 7.000938057899475e-05, 7.365178316831589e-05, 7.729418575763702e-05, 8.093658834695816e-05, 8.45789909362793e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 13.0, 14.0, 13.0, 21.0, 28.0, 42.0, 54.0, 85.0, 101.0, 177.0, 260.0, 377.0, 744.0, 1211.0, 2143.0, 4044.0, 7678.0, 15528.0, 33179.0, 77820.0, 181143.0, 294902.0, 232895.0, 108498.0, 45631.0, 20426.0, 9811.0, 5201.0, 2779.0, 1426.0, 871.0, 490.0, 302.0, 192.0, 138.0, 81.0, 69.0, 49.0, 38.0, 26.0, 18.0, 8.0, 4.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.127197265625, -0.1233062744140625, -0.119415283203125, -0.1155242919921875, -0.11163330078125, -0.1077423095703125, -0.103851318359375, -0.0999603271484375, -0.0960693359375, -0.0921783447265625, -0.088287353515625, -0.0843963623046875, -0.08050537109375, -0.0766143798828125, -0.072723388671875, -0.0688323974609375, -0.06494140625, -0.0610504150390625, -0.057159423828125, -0.0532684326171875, -0.04937744140625, -0.0454864501953125, -0.041595458984375, -0.0377044677734375, -0.0338134765625, -0.0299224853515625, -0.026031494140625, -0.0221405029296875, -0.01824951171875, -0.0143585205078125, -0.010467529296875, -0.0065765380859375, -0.002685546875, 0.0012054443359375, 0.005096435546875, 0.0089874267578125, 0.01287841796875, 0.0167694091796875, 0.020660400390625, 0.0245513916015625, 0.0284423828125, 0.0323333740234375, 0.036224365234375, 0.0401153564453125, 0.04400634765625, 0.0478973388671875, 0.051788330078125, 0.0556793212890625, 0.0595703125, 0.0634613037109375, 0.067352294921875, 0.0712432861328125, 0.07513427734375, 0.0790252685546875, 0.082916259765625, 0.0868072509765625, 0.0906982421875, 0.0945892333984375, 0.098480224609375, 0.1023712158203125, 0.10626220703125, 0.1101531982421875, 0.114044189453125, 0.1179351806640625, 0.121826171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 3.0, 10.0, 13.0, 12.0, 14.0, 20.0, 37.0, 33.0, 37.0, 39.0, 39.0, 41.0, 64.0, 52.0, 63.0, 58.0, 62.0, 59.0, 47.0, 43.0, 30.0, 34.0, 28.0, 18.0, 19.0, 22.0, 18.0, 15.0, 10.0, 9.0, 7.0, 9.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07611083984375, -0.07369804382324219, -0.07128524780273438, -0.06887245178222656, -0.06645965576171875, -0.06404685974121094, -0.061634063720703125, -0.05922126770019531, -0.0568084716796875, -0.05439567565917969, -0.051982879638671875, -0.04957008361816406, -0.04715728759765625, -0.04474449157714844, -0.042331695556640625, -0.03991889953613281, -0.037506103515625, -0.03509330749511719, -0.032680511474609375, -0.030267715454101562, -0.02785491943359375, -0.025442123413085938, -0.023029327392578125, -0.020616531372070312, -0.0182037353515625, -0.015790939331054688, -0.013378143310546875, -0.010965347290039062, -0.00855255126953125, -0.0061397552490234375, -0.003726959228515625, -0.0013141632080078125, 0.0010986328125, 0.0035114288330078125, 0.005924224853515625, 0.008337020874023438, 0.01074981689453125, 0.013162612915039062, 0.015575408935546875, 0.017988204956054688, 0.0204010009765625, 0.022813796997070312, 0.025226593017578125, 0.027639389038085938, 0.03005218505859375, 0.03246498107910156, 0.034877777099609375, 0.03729057312011719, 0.039703369140625, 0.04211616516113281, 0.044528961181640625, 0.04694175720214844, 0.04935455322265625, 0.05176734924316406, 0.054180145263671875, 0.05659294128417969, 0.0590057373046875, 0.06141853332519531, 0.06383132934570312, 0.06624412536621094, 0.06865692138671875, 0.07106971740722656, 0.07348251342773438, 0.07589530944824219, 0.07830810546875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 14.0, 84.0, 318.0, 424.0, 136.0, 32.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7269718647003174, -2.6042118072509766, -2.4814517498016357, -2.358691692352295, -2.235931634902954, -2.1131715774536133, -1.990411400794983, -1.867651343345642, -1.7448912858963013, -1.6221312284469604, -1.4993711709976196, -1.3766109943389893, -1.2538509368896484, -1.1310908794403076, -1.0083308219909668, -0.885570764541626, -0.7628107070922852, -0.6400506496429443, -0.5172905921936035, -0.3945304751396179, -0.2717704176902771, -0.14901036024093628, -0.026250243186950684, 0.09650981426239014, 0.21926987171173096, 0.3420299291610718, 0.464790016412735, 0.5875501036643982, 0.710310161113739, 0.8330702185630798, 0.9558303356170654, 1.0785903930664062, 1.201350212097168, 1.3241102695465088, 1.4468703269958496, 1.5696303844451904, 1.6923904418945312, 1.815150499343872, 1.9379106760025024, 2.060670852661133, 2.1834306716918945, 2.3061907291412354, 2.428950786590576, 2.551710844039917, 2.674470901489258, 2.7972309589385986, 2.9199910163879395, 3.0427513122558594, 3.1655113697052, 3.288271427154541, 3.411031484603882, 3.5337915420532227, 3.6565515995025635, 3.7793116569519043, 3.902071952819824, 4.024831771850586, 4.147592067718506, 4.270352363586426, 4.3931121826171875, 4.515872478485107, 4.638632297515869, 4.761392593383789, 4.884152412414551, 5.006912708282471, 5.129672527313232]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 4.0, 2.0, 8.0, 13.0, 14.0, 17.0, 20.0, 22.0, 21.0, 26.0, 38.0, 30.0, 40.0, 53.0, 40.0, 58.0, 45.0, 59.0, 39.0, 60.0, 50.0, 46.0, 42.0, 34.0, 35.0, 21.0, 28.0, 22.0, 23.0, 11.0, 19.0, 8.0, 8.0, 8.0, 7.0, 6.0, 1.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7051905393600464, -0.6822935938835144, -0.6593967080116272, -0.6364997625350952, -0.6136028170585632, -0.5907058715820312, -0.567808985710144, -0.5449120402336121, -0.5220150947570801, -0.4991181790828705, -0.4762212336063385, -0.4533243179321289, -0.4304273724555969, -0.40753045678138733, -0.38463354110717773, -0.36173659563064575, -0.33883970975875854, -0.31594279408454895, -0.29304584860801697, -0.2701489329338074, -0.24725200235843658, -0.2243550717830658, -0.2014581561088562, -0.1785612255334854, -0.15566429495811462, -0.13276736438274384, -0.10987044125795364, -0.08697351813316345, -0.06407658755779266, -0.041179656982421875, -0.01828274130821228, 0.004614189267158508, 0.027511179447174072, 0.05040810629725456, 0.07330503314733505, 0.09620195627212524, 0.11909888684749603, 0.14199581742286682, 0.16489273309707642, 0.1877896636724472, 0.210686594247818, 0.23358352482318878, 0.25648045539855957, 0.27937737107276917, 0.30227428674697876, 0.32517123222351074, 0.34806814789772034, 0.37096506357192993, 0.3938620090484619, 0.4167589247226715, 0.4396558701992035, 0.4625527858734131, 0.48544973134994507, 0.508346676826477, 0.5312435626983643, 0.5541405081748962, 0.5770374536514282, 0.5999343991279602, 0.6228312849998474, 0.6457282304763794, 0.6686251759529114, 0.6915221214294434, 0.7144190073013306, 0.7373159527778625, 0.7602128386497498]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 5.0, 10.0, 8.0, 18.0, 18.0, 25.0, 36.0, 47.0, 90.0, 146.0, 280.0, 498.0, 1025.0, 2078.0, 4805.0, 12358.0, 35259.0, 117980.0, 517597.0, 1873977.0, 1245810.0, 273136.0, 71451.0, 23032.0, 8316.0, 3313.0, 1469.0, 697.0, 345.0, 173.0, 101.0, 56.0, 46.0, 29.0, 16.0, 10.0, 8.0, 2.0, 9.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.224365234375, -0.2177257537841797, -0.21108627319335938, -0.20444679260253906, -0.19780731201171875, -0.19116783142089844, -0.18452835083007812, -0.1778888702392578, -0.1712493896484375, -0.1646099090576172, -0.15797042846679688, -0.15133094787597656, -0.14469146728515625, -0.13805198669433594, -0.13141250610351562, -0.12477302551269531, -0.118133544921875, -0.11149406433105469, -0.10485458374023438, -0.09821510314941406, -0.09157562255859375, -0.08493614196777344, -0.07829666137695312, -0.07165718078613281, -0.0650177001953125, -0.05837821960449219, -0.051738739013671875, -0.04509925842285156, -0.03845977783203125, -0.03182029724121094, -0.025180816650390625, -0.018541336059570312, -0.01190185546875, -0.0052623748779296875, 0.001377105712890625, 0.008016586303710938, 0.01465606689453125, 0.021295547485351562, 0.027935028076171875, 0.03457450866699219, 0.0412139892578125, 0.04785346984863281, 0.054492950439453125, 0.06113243103027344, 0.06777191162109375, 0.07441139221191406, 0.08105087280273438, 0.08769035339355469, 0.094329833984375, 0.10096931457519531, 0.10760879516601562, 0.11424827575683594, 0.12088775634765625, 0.12752723693847656, 0.13416671752929688, 0.1408061981201172, 0.1474456787109375, 0.1540851593017578, 0.16072463989257812, 0.16736412048339844, 0.17400360107421875, 0.18064308166503906, 0.18728256225585938, 0.1939220428466797, 0.2005615234375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 8.0, 16.0, 9.0, 18.0, 17.0, 19.0, 24.0, 33.0, 37.0, 28.0, 48.0, 42.0, 39.0, 52.0, 52.0, 40.0, 50.0, 56.0, 53.0, 56.0, 52.0, 28.0, 24.0, 29.0, 17.0, 30.0, 31.0, 11.0, 14.0, 7.0, 17.0, 9.0, 7.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.124755859375, -0.1212615966796875, -0.117767333984375, -0.1142730712890625, -0.11077880859375, -0.1072845458984375, -0.103790283203125, -0.1002960205078125, -0.0968017578125, -0.0933074951171875, -0.089813232421875, -0.0863189697265625, -0.08282470703125, -0.0793304443359375, -0.075836181640625, -0.0723419189453125, -0.06884765625, -0.0653533935546875, -0.061859130859375, -0.0583648681640625, -0.05487060546875, -0.0513763427734375, -0.047882080078125, -0.0443878173828125, -0.0408935546875, -0.0373992919921875, -0.033905029296875, -0.0304107666015625, -0.02691650390625, -0.0234222412109375, -0.019927978515625, -0.0164337158203125, -0.012939453125, -0.0094451904296875, -0.005950927734375, -0.0024566650390625, 0.00103759765625, 0.0045318603515625, 0.008026123046875, 0.0115203857421875, 0.0150146484375, 0.0185089111328125, 0.022003173828125, 0.0254974365234375, 0.02899169921875, 0.0324859619140625, 0.035980224609375, 0.0394744873046875, 0.04296875, 0.0464630126953125, 0.049957275390625, 0.0534515380859375, 0.05694580078125, 0.0604400634765625, 0.063934326171875, 0.0674285888671875, 0.0709228515625, 0.0744171142578125, 0.077911376953125, 0.0814056396484375, 0.08489990234375, 0.0883941650390625, 0.091888427734375, 0.0953826904296875, 0.098876953125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 7.0, 9.0, 15.0, 30.0, 46.0, 54.0, 72.0, 143.0, 302.0, 502.0, 1108.0, 3134.0, 9742.0, 35409.0, 141724.0, 565812.0, 1678470.0, 1276766.0, 358589.0, 89195.0, 22532.0, 6590.0, 2183.0, 899.0, 373.0, 219.0, 114.0, 84.0, 53.0, 36.0, 27.0, 16.0, 8.0, 8.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.314453125, -0.30591583251953125, -0.2973785400390625, -0.28884124755859375, -0.280303955078125, -0.27176666259765625, -0.2632293701171875, -0.25469207763671875, -0.24615478515625, -0.23761749267578125, -0.2290802001953125, -0.22054290771484375, -0.212005615234375, -0.20346832275390625, -0.1949310302734375, -0.18639373779296875, -0.1778564453125, -0.16931915283203125, -0.1607818603515625, -0.15224456787109375, -0.143707275390625, -0.13516998291015625, -0.1266326904296875, -0.11809539794921875, -0.10955810546875, -0.10102081298828125, -0.0924835205078125, -0.08394622802734375, -0.075408935546875, -0.06687164306640625, -0.0583343505859375, -0.04979705810546875, -0.041259765625, -0.03272247314453125, -0.0241851806640625, -0.01564788818359375, -0.007110595703125, 0.00142669677734375, 0.0099639892578125, 0.01850128173828125, 0.02703857421875, 0.03557586669921875, 0.0441131591796875, 0.05265045166015625, 0.061187744140625, 0.06972503662109375, 0.0782623291015625, 0.08679962158203125, 0.0953369140625, 0.10387420654296875, 0.1124114990234375, 0.12094879150390625, 0.129486083984375, 0.13802337646484375, 0.1465606689453125, 0.15509796142578125, 0.16363525390625, 0.17217254638671875, 0.1807098388671875, 0.18924713134765625, 0.197784423828125, 0.20632171630859375, 0.2148590087890625, 0.22339630126953125, 0.23193359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 3.0, 11.0, 18.0, 26.0, 31.0, 45.0, 41.0, 65.0, 85.0, 106.0, 137.0, 185.0, 210.0, 272.0, 345.0, 353.0, 384.0, 370.0, 318.0, 244.0, 224.0, 158.0, 109.0, 87.0, 66.0, 54.0, 26.0, 24.0, 19.0, 14.0, 7.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1429443359375, -0.13652992248535156, -0.13011550903320312, -0.12370109558105469, -0.11728668212890625, -0.11087226867675781, -0.10445785522460938, -0.09804344177246094, -0.0916290283203125, -0.08521461486816406, -0.07880020141601562, -0.07238578796386719, -0.06597137451171875, -0.05955696105957031, -0.053142547607421875, -0.04672813415527344, -0.040313720703125, -0.03389930725097656, -0.027484893798828125, -0.021070480346679688, -0.01465606689453125, -0.008241653442382812, -0.001827239990234375, 0.0045871734619140625, 0.0110015869140625, 0.017416000366210938, 0.023830413818359375, 0.030244827270507812, 0.03665924072265625, 0.04307365417480469, 0.049488067626953125, 0.05590248107910156, 0.06231689453125, 0.06873130798339844, 0.07514572143554688, 0.08156013488769531, 0.08797454833984375, 0.09438896179199219, 0.10080337524414062, 0.10721778869628906, 0.1136322021484375, 0.12004661560058594, 0.12646102905273438, 0.1328754425048828, 0.13928985595703125, 0.1457042694091797, 0.15211868286132812, 0.15853309631347656, 0.164947509765625, 0.17136192321777344, 0.17777633666992188, 0.1841907501220703, 0.19060516357421875, 0.1970195770263672, 0.20343399047851562, 0.20984840393066406, 0.2162628173828125, 0.22267723083496094, 0.22909164428710938, 0.2355060577392578, 0.24192047119140625, 0.2483348846435547, 0.2547492980957031, 0.26116371154785156, 0.267578125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 17.0, 32.0, 79.0, 137.0, 183.0, 211.0, 161.0, 118.0, 41.0, 19.0, 8.0, 2.0, 3.0], "bins": [-4.22857666015625, -4.153481960296631, -4.07838773727417, -4.003293037414551, -3.9281985759735107, -3.8531041145324707, -3.7780096530914307, -3.7029151916503906, -3.6278207302093506, -3.5527262687683105, -3.4776318073272705, -3.4025373458862305, -3.3274426460266113, -3.2523481845855713, -3.1772537231445312, -3.102159261703491, -3.027064800262451, -2.951970338821411, -2.876875877380371, -2.801781177520752, -2.726686716079712, -2.651592254638672, -2.576497793197632, -2.501403331756592, -2.4263086318969727, -2.3512141704559326, -2.2761197090148926, -2.2010250091552734, -2.1259305477142334, -2.0508360862731934, -1.9757416248321533, -1.9006471633911133, -1.8255524635314941, -1.750458002090454, -1.6753634214401245, -1.6002689599990845, -1.5251744985580444, -1.4500799179077148, -1.3749854564666748, -1.2998909950256348, -1.2247965335845947, -1.1497020721435547, -1.074607491493225, -0.9995130300521851, -0.924418568611145, -0.8493240475654602, -0.7742295265197754, -0.6991350650787354, -0.6240405440330505, -0.5489460229873657, -0.4738515615463257, -0.39875704050064087, -0.32366254925727844, -0.24856805801391602, -0.1734735369682312, -0.09837907552719116, -0.023284554481506348, 0.051809944212436676, 0.1269044429063797, 0.20199894905090332, 0.27709344029426575, 0.3521879315376282, 0.427282452583313, 0.502376914024353, 0.5774714350700378]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 10.0, 11.0, 11.0, 4.0, 11.0, 14.0, 22.0, 16.0, 21.0, 18.0, 32.0, 34.0, 40.0, 22.0, 32.0, 48.0, 39.0, 36.0, 47.0, 44.0, 35.0, 30.0, 39.0, 34.0, 41.0, 35.0, 29.0, 35.0, 24.0, 33.0, 23.0, 20.0, 18.0, 18.0, 11.0, 10.0, 3.0, 9.0, 12.0, 8.0, 1.0, 4.0, 6.0, 2.0, 5.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6475735306739807, -0.6264436841011047, -0.6053138971328735, -0.5841840505599976, -0.5630542039871216, -0.5419243574142456, -0.5207945704460144, -0.4996647238731384, -0.47853490710258484, -0.45740509033203125, -0.4362752437591553, -0.4151454269886017, -0.3940156102180481, -0.3728857636451721, -0.35175594687461853, -0.33062613010406494, -0.30949628353118896, -0.2883664667606354, -0.2672366201877594, -0.2461068034172058, -0.22497697174549103, -0.20384714007377625, -0.18271732330322266, -0.16158749163150787, -0.1404576599597931, -0.11932782828807831, -0.09819800406694412, -0.07706817984580994, -0.055938348174095154, -0.03480851650238037, -0.013678699731826782, 0.0074511319398880005, 0.028580963611602783, 0.04971079155802727, 0.07084061950445175, 0.09197044372558594, 0.11310027539730072, 0.1342301070690155, 0.1553599238395691, 0.17648975551128387, 0.19761958718299866, 0.21874941885471344, 0.23987925052642822, 0.2610090672969818, 0.2821388840675354, 0.3032687306404114, 0.32439854741096497, 0.34552836418151855, 0.36665821075439453, 0.3877880275249481, 0.4089178740978241, 0.4300476908683777, 0.45117753744125366, 0.47230735421180725, 0.49343717098236084, 0.5145670175552368, 0.5356968641281128, 0.5568267107009888, 0.57795649766922, 0.599086344242096, 0.6202161908149719, 0.6413459777832031, 0.6624758243560791, 0.6836056709289551, 0.7047354578971863]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 9.0, 12.0, 14.0, 26.0, 30.0, 42.0, 106.0, 147.0, 258.0, 489.0, 1034.0, 1969.0, 4029.0, 8044.0, 16986.0, 34438.0, 68905.0, 131793.0, 212771.0, 232435.0, 160243.0, 87771.0, 44317.0, 21705.0, 10552.0, 5144.0, 2572.0, 1192.0, 631.0, 348.0, 209.0, 129.0, 69.0, 45.0, 34.0, 14.0, 11.0, 13.0, 8.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.220458984375, -0.21263504028320312, -0.20481109619140625, -0.19698715209960938, -0.1891632080078125, -0.18133926391601562, -0.17351531982421875, -0.16569137573242188, -0.157867431640625, -0.15004348754882812, -0.14221954345703125, -0.13439559936523438, -0.1265716552734375, -0.11874771118164062, -0.11092376708984375, -0.10309982299804688, -0.09527587890625, -0.08745193481445312, -0.07962799072265625, -0.07180404663085938, -0.0639801025390625, -0.056156158447265625, -0.04833221435546875, -0.040508270263671875, -0.032684326171875, -0.024860382080078125, -0.01703643798828125, -0.009212493896484375, -0.0013885498046875, 0.006435394287109375, 0.01425933837890625, 0.022083282470703125, 0.0299072265625, 0.037731170654296875, 0.04555511474609375, 0.053379058837890625, 0.0612030029296875, 0.06902694702148438, 0.07685089111328125, 0.08467483520507812, 0.092498779296875, 0.10032272338867188, 0.10814666748046875, 0.11597061157226562, 0.1237945556640625, 0.13161849975585938, 0.13944244384765625, 0.14726638793945312, 0.15509033203125, 0.16291427612304688, 0.17073822021484375, 0.17856216430664062, 0.1863861083984375, 0.19421005249023438, 0.20203399658203125, 0.20985794067382812, 0.217681884765625, 0.22550582885742188, 0.23332977294921875, 0.24115371704101562, 0.2489776611328125, 0.2568016052246094, 0.26462554931640625, 0.2724494934082031, 0.2802734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 10.0, 5.0, 21.0, 14.0, 16.0, 19.0, 22.0, 26.0, 34.0, 23.0, 49.0, 41.0, 62.0, 58.0, 60.0, 64.0, 54.0, 40.0, 55.0, 45.0, 44.0, 28.0, 35.0, 35.0, 22.0, 23.0, 25.0, 15.0, 12.0, 9.0, 9.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.133544921875, -0.12995338439941406, -0.12636184692382812, -0.12277030944824219, -0.11917877197265625, -0.11558723449707031, -0.11199569702148438, -0.10840415954589844, -0.1048126220703125, -0.10122108459472656, -0.09762954711914062, -0.09403800964355469, -0.09044647216796875, -0.08685493469238281, -0.08326339721679688, -0.07967185974121094, -0.076080322265625, -0.07248878479003906, -0.06889724731445312, -0.06530570983886719, -0.06171417236328125, -0.05812263488769531, -0.054531097412109375, -0.05093955993652344, -0.0473480224609375, -0.04375648498535156, -0.040164947509765625, -0.03657341003417969, -0.03298187255859375, -0.029390335083007812, -0.025798797607421875, -0.022207260131835938, -0.01861572265625, -0.015024185180664062, -0.011432647705078125, -0.007841110229492188, -0.00424957275390625, -0.0006580352783203125, 0.002933502197265625, 0.0065250396728515625, 0.0101165771484375, 0.013708114624023438, 0.017299652099609375, 0.020891189575195312, 0.02448272705078125, 0.028074264526367188, 0.031665802001953125, 0.03525733947753906, 0.038848876953125, 0.04244041442871094, 0.046031951904296875, 0.04962348937988281, 0.05321502685546875, 0.05680656433105469, 0.060398101806640625, 0.06398963928222656, 0.0675811767578125, 0.07117271423339844, 0.07476425170898438, 0.07835578918457031, 0.08194732666015625, 0.08553886413574219, 0.08913040161132812, 0.09272193908691406, 0.0963134765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 11.0, 17.0, 23.0, 45.0, 65.0, 101.0, 175.0, 308.0, 519.0, 1000.0, 1974.0, 4355.0, 10259.0, 23958.0, 54793.0, 120487.0, 231894.0, 277755.0, 172822.0, 82286.0, 36552.0, 16124.0, 6877.0, 2991.0, 1451.0, 664.0, 399.0, 228.0, 155.0, 92.0, 66.0, 29.0, 26.0, 11.0, 10.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341796875, -0.33119964599609375, -0.3206024169921875, -0.31000518798828125, -0.299407958984375, -0.28881072998046875, -0.2782135009765625, -0.26761627197265625, -0.25701904296875, -0.24642181396484375, -0.2358245849609375, -0.22522735595703125, -0.214630126953125, -0.20403289794921875, -0.1934356689453125, -0.18283843994140625, -0.1722412109375, -0.16164398193359375, -0.1510467529296875, -0.14044952392578125, -0.129852294921875, -0.11925506591796875, -0.1086578369140625, -0.09806060791015625, -0.08746337890625, -0.07686614990234375, -0.0662689208984375, -0.05567169189453125, -0.045074462890625, -0.03447723388671875, -0.0238800048828125, -0.01328277587890625, -0.002685546875, 0.00791168212890625, 0.0185089111328125, 0.02910614013671875, 0.039703369140625, 0.05030059814453125, 0.0608978271484375, 0.07149505615234375, 0.08209228515625, 0.09268951416015625, 0.1032867431640625, 0.11388397216796875, 0.124481201171875, 0.13507843017578125, 0.1456756591796875, 0.15627288818359375, 0.1668701171875, 0.17746734619140625, 0.1880645751953125, 0.19866180419921875, 0.209259033203125, 0.21985626220703125, 0.2304534912109375, 0.24105072021484375, 0.25164794921875, 0.26224517822265625, 0.2728424072265625, 0.28343963623046875, 0.294036865234375, 0.30463409423828125, 0.3152313232421875, 0.32582855224609375, 0.33642578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 10.0, 12.0, 5.0, 13.0, 9.0, 14.0, 24.0, 18.0, 16.0, 28.0, 37.0, 38.0, 33.0, 35.0, 55.0, 52.0, 48.0, 50.0, 57.0, 49.0, 42.0, 51.0, 43.0, 33.0, 29.0, 31.0, 21.0, 27.0, 28.0, 14.0, 18.0, 12.0, 9.0, 8.0, 13.0, 5.0, 6.0, 2.0, 3.0, 5.0, 1.0, 0.0, 3.0], "bins": [-0.364990234375, -0.35565757751464844, -0.3463249206542969, -0.3369922637939453, -0.32765960693359375, -0.3183269500732422, -0.3089942932128906, -0.29966163635253906, -0.2903289794921875, -0.28099632263183594, -0.2716636657714844, -0.2623310089111328, -0.25299835205078125, -0.2436656951904297, -0.23433303833007812, -0.22500038146972656, -0.215667724609375, -0.20633506774902344, -0.19700241088867188, -0.1876697540283203, -0.17833709716796875, -0.1690044403076172, -0.15967178344726562, -0.15033912658691406, -0.1410064697265625, -0.13167381286621094, -0.12234115600585938, -0.11300849914550781, -0.10367584228515625, -0.09434318542480469, -0.08501052856445312, -0.07567787170410156, -0.06634521484375, -0.05701255798339844, -0.047679901123046875, -0.03834724426269531, -0.02901458740234375, -0.019681930541992188, -0.010349273681640625, -0.0010166168212890625, 0.0083160400390625, 0.017648696899414062, 0.026981353759765625, 0.03631401062011719, 0.04564666748046875, 0.05497932434082031, 0.06431198120117188, 0.07364463806152344, 0.082977294921875, 0.09230995178222656, 0.10164260864257812, 0.11097526550292969, 0.12030792236328125, 0.1296405792236328, 0.13897323608398438, 0.14830589294433594, 0.1576385498046875, 0.16697120666503906, 0.17630386352539062, 0.1856365203857422, 0.19496917724609375, 0.2043018341064453, 0.21363449096679688, 0.22296714782714844, 0.2322998046875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 10.0, 7.0, 21.0, 26.0, 29.0, 35.0, 47.0, 71.0, 106.0, 123.0, 195.0, 309.0, 590.0, 917.0, 1513.0, 2746.0, 5894.0, 76542.0, 918515.0, 29938.0, 4911.0, 2412.0, 1408.0, 788.0, 467.0, 319.0, 167.0, 146.0, 77.0, 69.0, 47.0, 32.0, 27.0, 19.0, 13.0, 12.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.72705078125, -0.7038955688476562, -0.6807403564453125, -0.6575851440429688, -0.634429931640625, -0.6112747192382812, -0.5881195068359375, -0.5649642944335938, -0.54180908203125, -0.5186538696289062, -0.4954986572265625, -0.47234344482421875, -0.449188232421875, -0.42603302001953125, -0.4028778076171875, -0.37972259521484375, -0.3565673828125, -0.33341217041015625, -0.3102569580078125, -0.28710174560546875, -0.263946533203125, -0.24079132080078125, -0.2176361083984375, -0.19448089599609375, -0.17132568359375, -0.14817047119140625, -0.1250152587890625, -0.10186004638671875, -0.078704833984375, -0.05554962158203125, -0.0323944091796875, -0.00923919677734375, 0.013916015625, 0.03707122802734375, 0.0602264404296875, 0.08338165283203125, 0.106536865234375, 0.12969207763671875, 0.1528472900390625, 0.17600250244140625, 0.19915771484375, 0.22231292724609375, 0.2454681396484375, 0.26862335205078125, 0.291778564453125, 0.31493377685546875, 0.3380889892578125, 0.36124420166015625, 0.3843994140625, 0.40755462646484375, 0.4307098388671875, 0.45386505126953125, 0.477020263671875, 0.5001754760742188, 0.5233306884765625, 0.5464859008789062, 0.56964111328125, 0.5927963256835938, 0.6159515380859375, 0.6391067504882812, 0.662261962890625, 0.6854171752929688, 0.7085723876953125, 0.7317276000976562, 0.7548828125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 14.0, 23.0, 51.0, 138.0, 262.0, 271.0, 118.0, 65.0, 28.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.173154830932617e-05, -8.886680006980896e-05, -8.600205183029175e-05, -8.313730359077454e-05, -8.027255535125732e-05, -7.740780711174011e-05, -7.45430588722229e-05, -7.167831063270569e-05, -6.881356239318848e-05, -6.594881415367126e-05, -6.308406591415405e-05, -6.021931767463684e-05, -5.735456943511963e-05, -5.448982119560242e-05, -5.1625072956085205e-05, -4.876032471656799e-05, -4.589557647705078e-05, -4.303082823753357e-05, -4.016607999801636e-05, -3.7301331758499146e-05, -3.4436583518981934e-05, -3.157183527946472e-05, -2.870708703994751e-05, -2.5842338800430298e-05, -2.2977590560913086e-05, -2.0112842321395874e-05, -1.7248094081878662e-05, -1.438334584236145e-05, -1.1518597602844238e-05, -8.653849363327026e-06, -5.7891011238098145e-06, -2.9243528842926025e-06, -5.960464477539063e-08, 2.8051435947418213e-06, 5.669891834259033e-06, 8.534640073776245e-06, 1.1399388313293457e-05, 1.4264136552810669e-05, 1.712888479232788e-05, 1.9993633031845093e-05, 2.2858381271362305e-05, 2.5723129510879517e-05, 2.858787775039673e-05, 3.145262598991394e-05, 3.431737422943115e-05, 3.7182122468948364e-05, 4.0046870708465576e-05, 4.291161894798279e-05, 4.57763671875e-05, 4.864111542701721e-05, 5.1505863666534424e-05, 5.4370611906051636e-05, 5.723536014556885e-05, 6.010010838508606e-05, 6.296485662460327e-05, 6.582960486412048e-05, 6.86943531036377e-05, 7.155910134315491e-05, 7.442384958267212e-05, 7.728859782218933e-05, 8.015334606170654e-05, 8.301809430122375e-05, 8.588284254074097e-05, 8.874759078025818e-05, 9.161233901977539e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 5.0, 12.0, 19.0, 22.0, 50.0, 63.0, 130.0, 200.0, 337.0, 614.0, 1212.0, 2558.0, 5701.0, 13944.0, 33770.0, 80170.0, 164366.0, 246464.0, 235764.0, 144817.0, 68515.0, 28551.0, 11723.0, 4950.0, 2217.0, 1018.0, 586.0, 299.0, 202.0, 111.0, 55.0, 41.0, 20.0, 21.0, 10.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11090087890625, -0.10781192779541016, -0.10472297668457031, -0.10163402557373047, -0.09854507446289062, -0.09545612335205078, -0.09236717224121094, -0.0892782211303711, -0.08618927001953125, -0.0831003189086914, -0.08001136779785156, -0.07692241668701172, -0.07383346557617188, -0.07074451446533203, -0.06765556335449219, -0.06456661224365234, -0.0614776611328125, -0.058388710021972656, -0.05529975891113281, -0.05221080780029297, -0.049121856689453125, -0.04603290557861328, -0.04294395446777344, -0.039855003356933594, -0.03676605224609375, -0.033677101135253906, -0.030588150024414062, -0.02749919891357422, -0.024410247802734375, -0.02132129669189453, -0.018232345581054688, -0.015143394470214844, -0.012054443359375, -0.008965492248535156, -0.0058765411376953125, -0.0027875900268554688, 0.000301361083984375, 0.0033903121948242188, 0.0064792633056640625, 0.009568214416503906, 0.01265716552734375, 0.015746116638183594, 0.018835067749023438, 0.02192401885986328, 0.025012969970703125, 0.02810192108154297, 0.031190872192382812, 0.034279823303222656, 0.0373687744140625, 0.040457725524902344, 0.04354667663574219, 0.04663562774658203, 0.049724578857421875, 0.05281352996826172, 0.05590248107910156, 0.058991432189941406, 0.06208038330078125, 0.0651693344116211, 0.06825828552246094, 0.07134723663330078, 0.07443618774414062, 0.07752513885498047, 0.08061408996582031, 0.08370304107666016, 0.0867919921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 12.0, 12.0, 16.0, 10.0, 20.0, 20.0, 31.0, 29.0, 32.0, 39.0, 45.0, 51.0, 49.0, 70.0, 67.0, 53.0, 53.0, 52.0, 54.0, 46.0, 29.0, 36.0, 25.0, 29.0, 21.0, 20.0, 15.0, 17.0, 11.0, 1.0, 7.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06280517578125, -0.060814857482910156, -0.05882453918457031, -0.05683422088623047, -0.054843902587890625, -0.05285358428955078, -0.05086326599121094, -0.048872947692871094, -0.04688262939453125, -0.044892311096191406, -0.04290199279785156, -0.04091167449951172, -0.038921356201171875, -0.03693103790283203, -0.03494071960449219, -0.032950401306152344, -0.0309600830078125, -0.028969764709472656, -0.026979446411132812, -0.02498912811279297, -0.022998809814453125, -0.02100849151611328, -0.019018173217773438, -0.017027854919433594, -0.01503753662109375, -0.013047218322753906, -0.011056900024414062, -0.009066581726074219, -0.007076263427734375, -0.005085945129394531, -0.0030956268310546875, -0.0011053085327148438, 0.000885009765625, 0.0028753280639648438, 0.0048656463623046875, 0.006855964660644531, 0.008846282958984375, 0.010836601257324219, 0.012826919555664062, 0.014817237854003906, 0.01680755615234375, 0.018797874450683594, 0.020788192749023438, 0.02277851104736328, 0.024768829345703125, 0.02675914764404297, 0.028749465942382812, 0.030739784240722656, 0.0327301025390625, 0.034720420837402344, 0.03671073913574219, 0.03870105743408203, 0.040691375732421875, 0.04268169403076172, 0.04467201232910156, 0.046662330627441406, 0.04865264892578125, 0.050642967224121094, 0.05263328552246094, 0.05462360382080078, 0.056613922119140625, 0.05860424041748047, 0.06059455871582031, 0.06258487701416016, 0.0645751953125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 13.0, 30.0, 64.0, 80.0, 143.0, 182.0, 134.0, 142.0, 91.0, 49.0, 26.0, 18.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9887200593948364, -0.9365886449813843, -0.8844572901725769, -0.8323259353637695, -0.7801945209503174, -0.7280631065368652, -0.6759317517280579, -0.6238003969192505, -0.5716689825057983, -0.5195375680923462, -0.4674062132835388, -0.41527482867240906, -0.3631434440612793, -0.31101205945014954, -0.2588806748390198, -0.20674929022789001, -0.15461790561676025, -0.1024865210056305, -0.05035513639450073, 0.0017762482166290283, 0.05390763282775879, 0.10603901743888855, 0.1581704020500183, 0.21030178666114807, 0.26243317127227783, 0.3145645558834076, 0.36669594049453735, 0.4188273251056671, 0.4709587097167969, 0.523090124130249, 0.5752214789390564, 0.6273528337478638, 0.6794843673706055, 0.7316157817840576, 0.783747136592865, 0.8358784914016724, 0.8880099058151245, 0.9401413202285767, 0.992272675037384, 1.0444040298461914, 1.0965354442596436, 1.1486668586730957, 1.2007982730865479, 1.2529295682907104, 1.3050609827041626, 1.3571923971176147, 1.4093236923217773, 1.4614551067352295, 1.5135865211486816, 1.5657179355621338, 1.617849349975586, 1.6699806451797485, 1.7221120595932007, 1.7742434740066528, 1.8263747692108154, 1.8785061836242676, 1.9306375980377197, 1.9827690124511719, 2.034900426864624, 2.087031841278076, 2.139163017272949, 2.1912944316864014, 2.2434258460998535, 2.2955572605133057, 2.347688674926758]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 6.0, 7.0, 12.0, 10.0, 12.0, 12.0, 11.0, 33.0, 23.0, 27.0, 39.0, 45.0, 37.0, 50.0, 48.0, 57.0, 47.0, 38.0, 49.0, 36.0, 45.0, 50.0, 51.0, 38.0, 32.0, 33.0, 26.0, 28.0, 23.0, 18.0, 13.0, 13.0, 8.0, 8.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9896751046180725, -0.9601157903671265, -0.9305564761161804, -0.9009971618652344, -0.8714378476142883, -0.8418785333633423, -0.8123192191123962, -0.7827599048614502, -0.7532005906105042, -0.7236412763595581, -0.6940819621086121, -0.664522647857666, -0.63496333360672, -0.6054040193557739, -0.5758447051048279, -0.5462853908538818, -0.5167261362075806, -0.4871668219566345, -0.4576075077056885, -0.42804819345474243, -0.3984888792037964, -0.36892956495285034, -0.3393702507019043, -0.30981093645095825, -0.2802516222000122, -0.25069230794906616, -0.22113299369812012, -0.19157367944717407, -0.16201436519622803, -0.13245506584644318, -0.10289575159549713, -0.07333643734455109, -0.04377710819244385, -0.014217795804142952, 0.015341516584157944, 0.04490082710981369, 0.07446014136075974, 0.10401944816112518, 0.13357876241207123, 0.16313807666301727, 0.19269739091396332, 0.22225670516490936, 0.2518160045146942, 0.28137531876564026, 0.3109346330165863, 0.34049394726753235, 0.3700532615184784, 0.39961257576942444, 0.4291718900203705, 0.45873120427131653, 0.4882905185222626, 0.5178498029708862, 0.5474091172218323, 0.5769684314727783, 0.6065277457237244, 0.6360870599746704, 0.6656463742256165, 0.6952056884765625, 0.7247650027275085, 0.7543243169784546, 0.7838836312294006, 0.8134429454803467, 0.8430022597312927, 0.8725615739822388, 0.9021208882331848]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 10.0, 12.0, 13.0, 16.0, 22.0, 37.0, 47.0, 79.0, 127.0, 206.0, 405.0, 800.0, 1784.0, 4461.0, 13277.0, 46535.0, 221525.0, 1513383.0, 1977421.0, 326618.0, 61454.0, 16755.0, 5442.0, 2052.0, 841.0, 413.0, 184.0, 115.0, 54.0, 58.0, 39.0, 22.0, 12.0, 12.0, 8.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.246337890625, -0.2386646270751953, -0.23099136352539062, -0.22331809997558594, -0.21564483642578125, -0.20797157287597656, -0.20029830932617188, -0.1926250457763672, -0.1849517822265625, -0.1772785186767578, -0.16960525512695312, -0.16193199157714844, -0.15425872802734375, -0.14658546447753906, -0.13891220092773438, -0.1312389373779297, -0.123565673828125, -0.11589241027832031, -0.10821914672851562, -0.10054588317871094, -0.09287261962890625, -0.08519935607910156, -0.07752609252929688, -0.06985282897949219, -0.0621795654296875, -0.05450630187988281, -0.046833038330078125, -0.03915977478027344, -0.03148651123046875, -0.023813247680664062, -0.016139984130859375, -0.008466720581054688, -0.00079345703125, 0.0068798065185546875, 0.014553070068359375, 0.022226333618164062, 0.02989959716796875, 0.03757286071777344, 0.045246124267578125, 0.05291938781738281, 0.0605926513671875, 0.06826591491699219, 0.07593917846679688, 0.08361244201660156, 0.09128570556640625, 0.09895896911621094, 0.10663223266601562, 0.11430549621582031, 0.121978759765625, 0.1296520233154297, 0.13732528686523438, 0.14499855041503906, 0.15267181396484375, 0.16034507751464844, 0.16801834106445312, 0.1756916046142578, 0.1833648681640625, 0.1910381317138672, 0.19871139526367188, 0.20638465881347656, 0.21405792236328125, 0.22173118591308594, 0.22940444946289062, 0.2370777130126953, 0.2447509765625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 16.0, 10.0, 9.0, 29.0, 25.0, 32.0, 26.0, 33.0, 31.0, 51.0, 44.0, 39.0, 58.0, 43.0, 44.0, 44.0, 45.0, 50.0, 42.0, 33.0, 41.0, 36.0, 28.0, 31.0, 25.0, 22.0, 15.0, 22.0, 10.0, 9.0, 8.0, 5.0, 8.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11328125, -0.10982418060302734, -0.10636711120605469, -0.10291004180908203, -0.09945297241210938, -0.09599590301513672, -0.09253883361816406, -0.0890817642211914, -0.08562469482421875, -0.0821676254272461, -0.07871055603027344, -0.07525348663330078, -0.07179641723632812, -0.06833934783935547, -0.06488227844238281, -0.061425209045410156, -0.0579681396484375, -0.054511070251464844, -0.05105400085449219, -0.04759693145751953, -0.044139862060546875, -0.04068279266357422, -0.03722572326660156, -0.033768653869628906, -0.03031158447265625, -0.026854515075683594, -0.023397445678710938, -0.01994037628173828, -0.016483306884765625, -0.013026237487792969, -0.009569168090820312, -0.006112098693847656, -0.002655029296875, 0.0008020401000976562, 0.0042591094970703125, 0.007716178894042969, 0.011173248291015625, 0.014630317687988281, 0.018087387084960938, 0.021544456481933594, 0.02500152587890625, 0.028458595275878906, 0.03191566467285156, 0.03537273406982422, 0.038829803466796875, 0.04228687286376953, 0.04574394226074219, 0.049201011657714844, 0.0526580810546875, 0.056115150451660156, 0.05957221984863281, 0.06302928924560547, 0.06648635864257812, 0.06994342803955078, 0.07340049743652344, 0.0768575668334961, 0.08031463623046875, 0.0837717056274414, 0.08722877502441406, 0.09068584442138672, 0.09414291381835938, 0.09759998321533203, 0.10105705261230469, 0.10451412200927734, 0.10797119140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 10.0, 12.0, 22.0, 32.0, 42.0, 60.0, 107.0, 195.0, 319.0, 610.0, 1433.0, 3457.0, 9621.0, 29531.0, 97856.0, 337826.0, 1153466.0, 1690901.0, 615839.0, 175092.0, 51876.0, 16221.0, 5600.0, 2167.0, 967.0, 445.0, 214.0, 120.0, 78.0, 49.0, 36.0, 28.0, 12.0, 9.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.249755859375, -0.24266815185546875, -0.2355804443359375, -0.22849273681640625, -0.221405029296875, -0.21431732177734375, -0.2072296142578125, -0.20014190673828125, -0.19305419921875, -0.18596649169921875, -0.1788787841796875, -0.17179107666015625, -0.164703369140625, -0.15761566162109375, -0.1505279541015625, -0.14344024658203125, -0.1363525390625, -0.12926483154296875, -0.1221771240234375, -0.11508941650390625, -0.108001708984375, -0.10091400146484375, -0.0938262939453125, -0.08673858642578125, -0.07965087890625, -0.07256317138671875, -0.0654754638671875, -0.05838775634765625, -0.051300048828125, -0.04421234130859375, -0.0371246337890625, -0.03003692626953125, -0.02294921875, -0.01586151123046875, -0.0087738037109375, -0.00168609619140625, 0.005401611328125, 0.01248931884765625, 0.0195770263671875, 0.02666473388671875, 0.03375244140625, 0.04084014892578125, 0.0479278564453125, 0.05501556396484375, 0.062103271484375, 0.06919097900390625, 0.0762786865234375, 0.08336639404296875, 0.0904541015625, 0.09754180908203125, 0.1046295166015625, 0.11171722412109375, 0.118804931640625, 0.12589263916015625, 0.1329803466796875, 0.14006805419921875, 0.14715576171875, 0.15424346923828125, 0.1613311767578125, 0.16841888427734375, 0.175506591796875, 0.18259429931640625, 0.1896820068359375, 0.19676971435546875, 0.203857421875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 11.0, 7.0, 12.0, 14.0, 18.0, 25.0, 36.0, 51.0, 48.0, 76.0, 114.0, 124.0, 165.0, 217.0, 270.0, 370.0, 393.0, 402.0, 349.0, 313.0, 257.0, 181.0, 170.0, 137.0, 72.0, 63.0, 44.0, 47.0, 29.0, 19.0, 11.0, 9.0, 7.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1925048828125, -0.18651390075683594, -0.18052291870117188, -0.1745319366455078, -0.16854095458984375, -0.1625499725341797, -0.15655899047851562, -0.15056800842285156, -0.1445770263671875, -0.13858604431152344, -0.13259506225585938, -0.1266040802001953, -0.12061309814453125, -0.11462211608886719, -0.10863113403320312, -0.10264015197753906, -0.096649169921875, -0.09065818786621094, -0.08466720581054688, -0.07867622375488281, -0.07268524169921875, -0.06669425964355469, -0.060703277587890625, -0.05471229553222656, -0.0487213134765625, -0.04273033142089844, -0.036739349365234375, -0.030748367309570312, -0.02475738525390625, -0.018766403198242188, -0.012775421142578125, -0.0067844390869140625, -0.00079345703125, 0.0051975250244140625, 0.011188507080078125, 0.017179489135742188, 0.02317047119140625, 0.029161453247070312, 0.035152435302734375, 0.04114341735839844, 0.0471343994140625, 0.05312538146972656, 0.059116363525390625, 0.06510734558105469, 0.07109832763671875, 0.07708930969238281, 0.08308029174804688, 0.08907127380371094, 0.095062255859375, 0.10105323791503906, 0.10704421997070312, 0.11303520202636719, 0.11902618408203125, 0.1250171661376953, 0.13100814819335938, 0.13699913024902344, 0.1429901123046875, 0.14898109436035156, 0.15497207641601562, 0.1609630584716797, 0.16695404052734375, 0.1729450225830078, 0.17893600463867188, 0.18492698669433594, 0.19091796875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 9.0, 15.0, 52.0, 106.0, 192.0, 223.0, 189.0, 125.0, 61.0, 26.0, 11.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.874919891357422, -3.801196575164795, -3.727473258972168, -3.65375018119812, -3.580026865005493, -3.506303548812866, -3.4325804710388184, -3.3588571548461914, -3.2851338386535645, -3.2114105224609375, -3.1376872062683105, -3.0639641284942627, -2.9902408123016357, -2.916517496109009, -2.842794418334961, -2.769071102142334, -2.695347785949707, -2.62162446975708, -2.547901153564453, -2.4741780757904053, -2.4004547595977783, -2.3267314434051514, -2.2530083656311035, -2.1792850494384766, -2.1055617332458496, -2.0318384170532227, -1.9581152200698853, -1.8843920230865479, -1.810668706893921, -1.736945390701294, -1.6632221937179565, -1.5894989967346191, -1.5157756805419922, -1.4420523643493652, -1.3683291673660278, -1.2946059703826904, -1.2208826541900635, -1.1471593379974365, -1.0734361410140991, -0.9997128844261169, -0.9259896874427795, -0.8522664308547974, -0.7785431742668152, -0.704819917678833, -0.6310966610908508, -0.5573734045028687, -0.4836501479148865, -0.4099268913269043, -0.3362036347389221, -0.26248037815093994, -0.18875712156295776, -0.11503386497497559, -0.04131060838699341, 0.03241264820098877, 0.10613590478897095, 0.17985916137695312, 0.2535824179649353, 0.3273056745529175, 0.40102893114089966, 0.47475218772888184, 0.548475444316864, 0.6221987009048462, 0.6959219574928284, 0.7696452140808105, 0.8433684706687927]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 8.0, 4.0, 4.0, 8.0, 7.0, 8.0, 13.0, 12.0, 12.0, 19.0, 12.0, 24.0, 33.0, 35.0, 36.0, 33.0, 47.0, 39.0, 39.0, 43.0, 36.0, 52.0, 37.0, 30.0, 48.0, 33.0, 29.0, 51.0, 38.0, 38.0, 35.0, 24.0, 19.0, 15.0, 19.0, 7.0, 18.0, 11.0, 5.0, 6.0, 9.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.661861002445221, -0.6409622430801392, -0.6200634837150574, -0.5991647243499756, -0.5782659649848938, -0.557367205619812, -0.5364683866500854, -0.5155696272850037, -0.4946708679199219, -0.4737721085548401, -0.4528733491897583, -0.4319745898246765, -0.41107580065727234, -0.39017704129219055, -0.36927828192710876, -0.3483794927597046, -0.3274807631969452, -0.3065820038318634, -0.2856832444667816, -0.26478445529937744, -0.24388569593429565, -0.22298693656921387, -0.20208817720413208, -0.1811894029378891, -0.1602906435728073, -0.13939188420772552, -0.11849310994148254, -0.09759435057640076, -0.07669558376073837, -0.05579681694507599, -0.0348980575799942, -0.01399928331375122, 0.006899476051330566, 0.0277982410043478, 0.048697005957365036, 0.06959576904773712, 0.0904945358633995, 0.11139330267906189, 0.13229206204414368, 0.15319083631038666, 0.17408959567546844, 0.19498835504055023, 0.2158871293067932, 0.236785888671875, 0.2576846480369568, 0.2785834074020386, 0.29948216676712036, 0.32038095593452454, 0.3412797152996063, 0.3621784746646881, 0.3830772340297699, 0.4039760231971741, 0.42487478256225586, 0.44577354192733765, 0.46667230129241943, 0.4875710606575012, 0.508469820022583, 0.5293685793876648, 0.5502673387527466, 0.5711660981178284, 0.5920648574829102, 0.6129636764526367, 0.6338623762130737, 0.6547611951828003, 0.6756599545478821]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 13.0, 12.0, 25.0, 30.0, 61.0, 91.0, 181.0, 317.0, 561.0, 959.0, 1781.0, 3366.0, 6408.0, 12381.0, 24849.0, 50923.0, 103512.0, 183665.0, 241774.0, 194216.0, 111886.0, 56277.0, 26977.0, 13496.0, 6747.0, 3598.0, 2017.0, 1091.0, 553.0, 302.0, 196.0, 100.0, 65.0, 35.0, 28.0, 21.0, 11.0, 6.0, 5.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2724609375, -0.2638282775878906, -0.25519561767578125, -0.24656295776367188, -0.2379302978515625, -0.22929763793945312, -0.22066497802734375, -0.21203231811523438, -0.203399658203125, -0.19476699829101562, -0.18613433837890625, -0.17750167846679688, -0.1688690185546875, -0.16023635864257812, -0.15160369873046875, -0.14297103881835938, -0.13433837890625, -0.12570571899414062, -0.11707305908203125, -0.10844039916992188, -0.0998077392578125, -0.09117507934570312, -0.08254241943359375, -0.07390975952148438, -0.065277099609375, -0.056644439697265625, -0.04801177978515625, -0.039379119873046875, -0.0307464599609375, -0.022113800048828125, -0.01348114013671875, -0.004848480224609375, 0.0037841796875, 0.012416839599609375, 0.02104949951171875, 0.029682159423828125, 0.0383148193359375, 0.046947479248046875, 0.05558013916015625, 0.06421279907226562, 0.072845458984375, 0.08147811889648438, 0.09011077880859375, 0.09874343872070312, 0.1073760986328125, 0.11600875854492188, 0.12464141845703125, 0.13327407836914062, 0.14190673828125, 0.15053939819335938, 0.15917205810546875, 0.16780471801757812, 0.1764373779296875, 0.18507003784179688, 0.19370269775390625, 0.20233535766601562, 0.210968017578125, 0.21960067749023438, 0.22823333740234375, 0.23686599731445312, 0.2454986572265625, 0.2541313171386719, 0.26276397705078125, 0.2713966369628906, 0.280029296875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 6.0, 1.0, 4.0, 6.0, 12.0, 7.0, 12.0, 25.0, 18.0, 37.0, 42.0, 29.0, 35.0, 39.0, 51.0, 49.0, 50.0, 51.0, 50.0, 47.0, 41.0, 43.0, 35.0, 55.0, 46.0, 38.0, 28.0, 22.0, 36.0, 22.0, 10.0, 15.0, 16.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.133056640625, -0.12950992584228516, -0.1259632110595703, -0.12241649627685547, -0.11886978149414062, -0.11532306671142578, -0.11177635192871094, -0.1082296371459961, -0.10468292236328125, -0.1011362075805664, -0.09758949279785156, -0.09404277801513672, -0.09049606323242188, -0.08694934844970703, -0.08340263366699219, -0.07985591888427734, -0.0763092041015625, -0.07276248931884766, -0.06921577453613281, -0.06566905975341797, -0.062122344970703125, -0.05857563018798828, -0.05502891540527344, -0.051482200622558594, -0.04793548583984375, -0.044388771057128906, -0.04084205627441406, -0.03729534149169922, -0.033748626708984375, -0.03020191192626953, -0.026655197143554688, -0.023108482360839844, -0.019561767578125, -0.016015052795410156, -0.012468338012695312, -0.008921623229980469, -0.005374908447265625, -0.0018281936645507812, 0.0017185211181640625, 0.005265235900878906, 0.00881195068359375, 0.012358665466308594, 0.015905380249023438, 0.01945209503173828, 0.022998809814453125, 0.02654552459716797, 0.030092239379882812, 0.033638954162597656, 0.0371856689453125, 0.040732383728027344, 0.04427909851074219, 0.04782581329345703, 0.051372528076171875, 0.05491924285888672, 0.05846595764160156, 0.062012672424316406, 0.06555938720703125, 0.0691061019897461, 0.07265281677246094, 0.07619953155517578, 0.07974624633789062, 0.08329296112060547, 0.08683967590332031, 0.09038639068603516, 0.09393310546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 6.0, 13.0, 15.0, 40.0, 41.0, 50.0, 66.0, 114.0, 138.0, 202.0, 317.0, 533.0, 920.0, 1659.0, 3438.0, 7167.0, 15560.0, 34657.0, 74910.0, 145387.0, 226879.0, 233116.0, 152508.0, 80570.0, 37772.0, 16770.0, 7591.0, 3632.0, 1805.0, 918.0, 585.0, 326.0, 264.0, 158.0, 116.0, 85.0, 63.0, 53.0, 35.0, 22.0, 17.0, 11.0, 10.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.262939453125, -0.2544708251953125, -0.246002197265625, -0.2375335693359375, -0.22906494140625, -0.2205963134765625, -0.212127685546875, -0.2036590576171875, -0.1951904296875, -0.1867218017578125, -0.178253173828125, -0.1697845458984375, -0.16131591796875, -0.1528472900390625, -0.144378662109375, -0.1359100341796875, -0.12744140625, -0.1189727783203125, -0.110504150390625, -0.1020355224609375, -0.09356689453125, -0.0850982666015625, -0.076629638671875, -0.0681610107421875, -0.0596923828125, -0.0512237548828125, -0.042755126953125, -0.0342864990234375, -0.02581787109375, -0.0173492431640625, -0.008880615234375, -0.0004119873046875, 0.008056640625, 0.0165252685546875, 0.024993896484375, 0.0334625244140625, 0.04193115234375, 0.0503997802734375, 0.058868408203125, 0.0673370361328125, 0.0758056640625, 0.0842742919921875, 0.092742919921875, 0.1012115478515625, 0.10968017578125, 0.1181488037109375, 0.126617431640625, 0.1350860595703125, 0.1435546875, 0.1520233154296875, 0.160491943359375, 0.1689605712890625, 0.17742919921875, 0.1858978271484375, 0.194366455078125, 0.2028350830078125, 0.2113037109375, 0.2197723388671875, 0.228240966796875, 0.2367095947265625, 0.24517822265625, 0.2536468505859375, 0.262115478515625, 0.2705841064453125, 0.279052734375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 6.0, 1.0, 7.0, 10.0, 10.0, 9.0, 10.0, 12.0, 8.0, 11.0, 18.0, 33.0, 23.0, 28.0, 22.0, 34.0, 48.0, 40.0, 25.0, 36.0, 24.0, 26.0, 46.0, 32.0, 40.0, 33.0, 35.0, 46.0, 33.0, 30.0, 27.0, 37.0, 36.0, 21.0, 17.0, 20.0, 23.0, 10.0, 11.0, 4.0, 9.0, 12.0, 6.0, 11.0, 8.0, 3.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0], "bins": [-0.26171875, -0.25424766540527344, -0.24677658081054688, -0.2393054962158203, -0.23183441162109375, -0.2243633270263672, -0.21689224243164062, -0.20942115783691406, -0.2019500732421875, -0.19447898864746094, -0.18700790405273438, -0.1795368194580078, -0.17206573486328125, -0.1645946502685547, -0.15712356567382812, -0.14965248107910156, -0.142181396484375, -0.13471031188964844, -0.12723922729492188, -0.11976814270019531, -0.11229705810546875, -0.10482597351074219, -0.09735488891601562, -0.08988380432128906, -0.0824127197265625, -0.07494163513183594, -0.06747055053710938, -0.05999946594238281, -0.05252838134765625, -0.04505729675292969, -0.037586212158203125, -0.030115127563476562, -0.02264404296875, -0.015172958374023438, -0.007701873779296875, -0.0002307891845703125, 0.00724029541015625, 0.014711380004882812, 0.022182464599609375, 0.029653549194335938, 0.0371246337890625, 0.04459571838378906, 0.052066802978515625, 0.05953788757324219, 0.06700897216796875, 0.07448005676269531, 0.08195114135742188, 0.08942222595214844, 0.096893310546875, 0.10436439514160156, 0.11183547973632812, 0.11930656433105469, 0.12677764892578125, 0.1342487335205078, 0.14171981811523438, 0.14919090270996094, 0.1566619873046875, 0.16413307189941406, 0.17160415649414062, 0.1790752410888672, 0.18654632568359375, 0.1940174102783203, 0.20148849487304688, 0.20895957946777344, 0.2164306640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 16.0, 18.0, 34.0, 68.0, 112.0, 271.0, 700.0, 1880.0, 6061.0, 22966.0, 99122.0, 343345.0, 397231.0, 134111.0, 30716.0, 7995.0, 2377.0, 882.0, 314.0, 162.0, 74.0, 38.0, 25.0, 11.0, 5.0, 2.0, 7.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.150634765625, -0.14594268798828125, -0.1412506103515625, -0.13655853271484375, -0.131866455078125, -0.12717437744140625, -0.1224822998046875, -0.11779022216796875, -0.11309814453125, -0.10840606689453125, -0.1037139892578125, -0.09902191162109375, -0.094329833984375, -0.08963775634765625, -0.0849456787109375, -0.08025360107421875, -0.0755615234375, -0.07086944580078125, -0.0661773681640625, -0.06148529052734375, -0.056793212890625, -0.05210113525390625, -0.0474090576171875, -0.04271697998046875, -0.03802490234375, -0.03333282470703125, -0.0286407470703125, -0.02394866943359375, -0.019256591796875, -0.01456451416015625, -0.0098724365234375, -0.00518035888671875, -0.00048828125, 0.00420379638671875, 0.0088958740234375, 0.01358795166015625, 0.018280029296875, 0.02297210693359375, 0.0276641845703125, 0.03235626220703125, 0.03704833984375, 0.04174041748046875, 0.0464324951171875, 0.05112457275390625, 0.055816650390625, 0.06050872802734375, 0.0652008056640625, 0.06989288330078125, 0.0745849609375, 0.07927703857421875, 0.0839691162109375, 0.08866119384765625, 0.093353271484375, 0.09804534912109375, 0.1027374267578125, 0.10742950439453125, 0.11212158203125, 0.11681365966796875, 0.1215057373046875, 0.12619781494140625, 0.130889892578125, 0.13558197021484375, 0.1402740478515625, 0.14496612548828125, 0.149658203125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 2.0, 7.0, 6.0, 10.0, 8.0, 15.0, 15.0, 23.0, 37.0, 28.0, 49.0, 51.0, 70.0, 78.0, 86.0, 84.0, 69.0, 77.0, 62.0, 48.0, 39.0, 35.0, 18.0, 20.0, 16.0, 7.0, 7.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.288818359375e-05, -2.215523272752762e-05, -2.1422281861305237e-05, -2.0689330995082855e-05, -1.9956380128860474e-05, -1.9223429262638092e-05, -1.849047839641571e-05, -1.775752753019333e-05, -1.7024576663970947e-05, -1.6291625797748566e-05, -1.5558674931526184e-05, -1.4825724065303802e-05, -1.4092773199081421e-05, -1.335982233285904e-05, -1.2626871466636658e-05, -1.1893920600414276e-05, -1.1160969734191895e-05, -1.0428018867969513e-05, -9.695068001747131e-06, -8.96211713552475e-06, -8.229166269302368e-06, -7.4962154030799866e-06, -6.763264536857605e-06, -6.030313670635223e-06, -5.297362804412842e-06, -4.56441193819046e-06, -3.831461071968079e-06, -3.098510205745697e-06, -2.3655593395233154e-06, -1.6326084733009338e-06, -8.996576070785522e-07, -1.6670674085617065e-07, 5.662441253662109e-07, 1.2991949915885925e-06, 2.032145857810974e-06, 2.7650967240333557e-06, 3.4980475902557373e-06, 4.230998456478119e-06, 4.9639493227005005e-06, 5.696900188922882e-06, 6.429851055145264e-06, 7.162801921367645e-06, 7.895752787590027e-06, 8.628703653812408e-06, 9.36165452003479e-06, 1.0094605386257172e-05, 1.0827556252479553e-05, 1.1560507118701935e-05, 1.2293457984924316e-05, 1.3026408851146698e-05, 1.375935971736908e-05, 1.4492310583591461e-05, 1.5225261449813843e-05, 1.5958212316036224e-05, 1.6691163182258606e-05, 1.7424114048480988e-05, 1.815706491470337e-05, 1.889001578092575e-05, 1.9622966647148132e-05, 2.0355917513370514e-05, 2.1088868379592896e-05, 2.1821819245815277e-05, 2.255477011203766e-05, 2.328772097826004e-05, 2.4020671844482422e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 10.0, 14.0, 23.0, 35.0, 50.0, 98.0, 189.0, 312.0, 668.0, 1405.0, 3967.0, 13224.0, 47966.0, 179690.0, 402722.0, 281803.0, 83804.0, 22093.0, 6460.0, 2189.0, 860.0, 419.0, 197.0, 134.0, 79.0, 55.0, 25.0, 17.0, 13.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1534423828125, -0.14937305450439453, -0.14530372619628906, -0.1412343978881836, -0.13716506958007812, -0.13309574127197266, -0.1290264129638672, -0.12495708465576172, -0.12088775634765625, -0.11681842803955078, -0.11274909973144531, -0.10867977142333984, -0.10461044311523438, -0.1005411148071289, -0.09647178649902344, -0.09240245819091797, -0.0883331298828125, -0.08426380157470703, -0.08019447326660156, -0.0761251449584961, -0.07205581665039062, -0.06798648834228516, -0.06391716003417969, -0.05984783172607422, -0.05577850341796875, -0.05170917510986328, -0.04763984680175781, -0.043570518493652344, -0.039501190185546875, -0.035431861877441406, -0.03136253356933594, -0.02729320526123047, -0.023223876953125, -0.01915454864501953, -0.015085220336914062, -0.011015892028808594, -0.006946563720703125, -0.0028772354125976562, 0.0011920928955078125, 0.005261421203613281, 0.00933074951171875, 0.013400077819824219, 0.017469406127929688, 0.021538734436035156, 0.025608062744140625, 0.029677391052246094, 0.03374671936035156, 0.03781604766845703, 0.0418853759765625, 0.04595470428466797, 0.05002403259277344, 0.054093360900878906, 0.058162689208984375, 0.062232017517089844, 0.06630134582519531, 0.07037067413330078, 0.07444000244140625, 0.07850933074951172, 0.08257865905761719, 0.08664798736572266, 0.09071731567382812, 0.0947866439819336, 0.09885597229003906, 0.10292530059814453, 0.10699462890625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 3.0, 8.0, 3.0, 13.0, 10.0, 13.0, 14.0, 13.0, 25.0, 34.0, 39.0, 43.0, 53.0, 60.0, 61.0, 62.0, 60.0, 74.0, 63.0, 68.0, 32.0, 46.0, 49.0, 43.0, 25.0, 14.0, 24.0, 4.0, 8.0, 9.0, 9.0, 5.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.068115234375, -0.06589603424072266, -0.06367683410644531, -0.06145763397216797, -0.059238433837890625, -0.05701923370361328, -0.05480003356933594, -0.052580833435058594, -0.05036163330078125, -0.048142433166503906, -0.04592323303222656, -0.04370403289794922, -0.041484832763671875, -0.03926563262939453, -0.03704643249511719, -0.034827232360839844, -0.0326080322265625, -0.030388832092285156, -0.028169631958007812, -0.02595043182373047, -0.023731231689453125, -0.02151203155517578, -0.019292831420898438, -0.017073631286621094, -0.01485443115234375, -0.012635231018066406, -0.010416030883789062, -0.008196830749511719, -0.005977630615234375, -0.0037584304809570312, -0.0015392303466796875, 0.0006799697875976562, 0.002899169921875, 0.005118370056152344, 0.0073375701904296875, 0.009556770324707031, 0.011775970458984375, 0.013995170593261719, 0.016214370727539062, 0.018433570861816406, 0.02065277099609375, 0.022871971130371094, 0.025091171264648438, 0.02731037139892578, 0.029529571533203125, 0.03174877166748047, 0.03396797180175781, 0.036187171936035156, 0.0384063720703125, 0.040625572204589844, 0.04284477233886719, 0.04506397247314453, 0.047283172607421875, 0.04950237274169922, 0.05172157287597656, 0.053940773010253906, 0.05615997314453125, 0.058379173278808594, 0.06059837341308594, 0.06281757354736328, 0.06503677368164062, 0.06725597381591797, 0.06947517395019531, 0.07169437408447266, 0.07391357421875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 30.0, 111.0, 261.0, 327.0, 181.0, 78.0, 11.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.086669445037842, -2.9812710285186768, -2.875872850418091, -2.770474433898926, -2.6650760173797607, -2.5596776008605957, -2.4542794227600098, -2.3488810062408447, -2.2434825897216797, -2.1380841732025146, -2.0326859951019287, -1.9272875785827637, -1.8218891620635986, -1.7164908647537231, -1.6110925674438477, -1.5056941509246826, -1.4002959728240967, -1.2948976755142212, -1.1894992589950562, -1.0841009616851807, -0.9787026047706604, -0.8733042478561401, -0.7679059505462646, -0.6625075936317444, -0.5571092367172241, -0.45171087980270386, -0.346312552690506, -0.2409142255783081, -0.13551586866378784, -0.030117511749267578, 0.07528078556060791, 0.18067914247512817, 0.28607726097106934, 0.3914756178855896, 0.4968739449977875, 0.6022722721099854, 0.7076706290245056, 0.8130689859390259, 0.9184672832489014, 1.0238656997680664, 1.129263997077942, 1.2346622943878174, 1.3400607109069824, 1.445459008216858, 1.5508573055267334, 1.6562557220458984, 1.761654019355774, 1.8670523166656494, 1.9724507331848145, 2.0778491497039795, 2.1832473278045654, 2.2886457443237305, 2.3940441608428955, 2.4994425773620605, 2.6048407554626465, 2.7102391719818115, 2.8156375885009766, 2.9210360050201416, 3.0264341831207275, 3.1318325996398926, 3.2372310161590576, 3.3426294326782227, 3.4480276107788086, 3.5534260272979736, 3.6588242053985596]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 2.0, 6.0, 3.0, 9.0, 12.0, 12.0, 23.0, 28.0, 28.0, 25.0, 27.0, 47.0, 33.0, 42.0, 49.0, 52.0, 49.0, 40.0, 49.0, 65.0, 41.0, 53.0, 35.0, 39.0, 39.0, 38.0, 28.0, 28.0, 22.0, 15.0, 18.0, 15.0, 6.0, 10.0, 8.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7350797057151794, -0.7062202095985413, -0.6773606538772583, -0.6485011577606201, -0.6196416616439819, -0.5907821655273438, -0.5619226694107056, -0.5330631136894226, -0.5042036175727844, -0.47534412145614624, -0.44648459553718567, -0.4176250696182251, -0.3887655735015869, -0.35990607738494873, -0.33104655146598816, -0.3021870255470276, -0.2733275294303894, -0.24446801841259003, -0.21560850739479065, -0.18674899637699127, -0.1578894853591919, -0.12902997434139252, -0.10017046332359314, -0.07131095230579376, -0.042451441287994385, -0.013591930270195007, 0.01526758074760437, 0.04412709176540375, 0.07298660278320312, 0.1018461138010025, 0.13070562481880188, 0.15956513583660126, 0.18842458724975586, 0.21728409826755524, 0.24614360928535461, 0.2750031352043152, 0.30386263132095337, 0.33272212743759155, 0.3615816533565521, 0.3904411792755127, 0.4193006753921509, 0.44816017150878906, 0.47701969742774963, 0.5058792233467102, 0.5347387194633484, 0.5635982155799866, 0.5924577713012695, 0.6213172674179077, 0.6501767635345459, 0.6790362596511841, 0.7078957557678223, 0.7367553114891052, 0.7656148076057434, 0.7944743037223816, 0.8233338594436646, 0.8521933555603027, 0.8810528516769409, 0.9099123477935791, 0.9387718439102173, 0.9676313996315002, 0.9964908957481384, 1.0253504514694214, 1.0542099475860596, 1.0830694437026978, 1.111928939819336]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 3.0, 3.0, 5.0, 14.0, 7.0, 12.0, 29.0, 35.0, 40.0, 65.0, 78.0, 107.0, 187.0, 233.0, 415.0, 639.0, 993.0, 1567.0, 2776.0, 4446.0, 8431.0, 15537.0, 31299.0, 67415.0, 166003.0, 501450.0, 1272089.0, 1301510.0, 510362.0, 171747.0, 69329.0, 32166.0, 15719.0, 8500.0, 4453.0, 2635.0, 1490.0, 940.0, 568.0, 373.0, 234.0, 154.0, 99.0, 44.0, 27.0, 18.0, 18.0, 9.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1473388671875, -0.14313030242919922, -0.13892173767089844, -0.13471317291259766, -0.13050460815429688, -0.1262960433959961, -0.12208747863769531, -0.11787891387939453, -0.11367034912109375, -0.10946178436279297, -0.10525321960449219, -0.1010446548461914, -0.09683609008789062, -0.09262752532958984, -0.08841896057128906, -0.08421039581298828, -0.0800018310546875, -0.07579326629638672, -0.07158470153808594, -0.06737613677978516, -0.06316757202148438, -0.058959007263183594, -0.05475044250488281, -0.05054187774658203, -0.04633331298828125, -0.04212474822998047, -0.03791618347167969, -0.033707618713378906, -0.029499053955078125, -0.025290489196777344, -0.021081924438476562, -0.01687335968017578, -0.012664794921875, -0.008456230163574219, -0.0042476654052734375, -3.910064697265625e-05, 0.004169464111328125, 0.008378028869628906, 0.012586593627929688, 0.01679515838623047, 0.02100372314453125, 0.02521228790283203, 0.029420852661132812, 0.033629417419433594, 0.037837982177734375, 0.042046546936035156, 0.04625511169433594, 0.05046367645263672, 0.0546722412109375, 0.05888080596923828, 0.06308937072753906, 0.06729793548583984, 0.07150650024414062, 0.0757150650024414, 0.07992362976074219, 0.08413219451904297, 0.08834075927734375, 0.09254932403564453, 0.09675788879394531, 0.1009664535522461, 0.10517501831054688, 0.10938358306884766, 0.11359214782714844, 0.11780071258544922, 0.12200927734375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 9.0, 6.0, 14.0, 13.0, 13.0, 21.0, 13.0, 21.0, 32.0, 30.0, 35.0, 31.0, 41.0, 47.0, 50.0, 52.0, 47.0, 37.0, 44.0, 49.0, 38.0, 40.0, 35.0, 24.0, 35.0, 32.0, 28.0, 30.0, 19.0, 20.0, 11.0, 21.0, 15.0, 14.0, 6.0, 7.0, 2.0, 7.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.104736328125, -0.10153865814208984, -0.09834098815917969, -0.09514331817626953, -0.09194564819335938, -0.08874797821044922, -0.08555030822753906, -0.0823526382446289, -0.07915496826171875, -0.0759572982788086, -0.07275962829589844, -0.06956195831298828, -0.06636428833007812, -0.06316661834716797, -0.05996894836425781, -0.056771278381347656, -0.0535736083984375, -0.050375938415527344, -0.04717826843261719, -0.04398059844970703, -0.040782928466796875, -0.03758525848388672, -0.03438758850097656, -0.031189918518066406, -0.02799224853515625, -0.024794578552246094, -0.021596908569335938, -0.01839923858642578, -0.015201568603515625, -0.012003898620605469, -0.008806228637695312, -0.005608558654785156, -0.002410888671875, 0.0007867813110351562, 0.0039844512939453125, 0.007182121276855469, 0.010379791259765625, 0.013577461242675781, 0.016775131225585938, 0.019972801208496094, 0.02317047119140625, 0.026368141174316406, 0.029565811157226562, 0.03276348114013672, 0.035961151123046875, 0.03915882110595703, 0.04235649108886719, 0.045554161071777344, 0.0487518310546875, 0.051949501037597656, 0.05514717102050781, 0.05834484100341797, 0.061542510986328125, 0.06474018096923828, 0.06793785095214844, 0.0711355209350586, 0.07433319091796875, 0.0775308609008789, 0.08072853088378906, 0.08392620086669922, 0.08712387084960938, 0.09032154083251953, 0.09351921081542969, 0.09671688079833984, 0.09991455078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 7.0, 8.0, 22.0, 24.0, 43.0, 40.0, 103.0, 168.0, 286.0, 667.0, 1836.0, 5293.0, 18770.0, 71141.0, 309187.0, 1385003.0, 1814398.0, 449506.0, 101490.0, 25072.0, 7238.0, 2289.0, 841.0, 377.0, 190.0, 117.0, 45.0, 38.0, 24.0, 10.0, 14.0, 11.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24860382080078125, -0.2406158447265625, -0.23262786865234375, -0.224639892578125, -0.21665191650390625, -0.2086639404296875, -0.20067596435546875, -0.19268798828125, -0.18470001220703125, -0.1767120361328125, -0.16872406005859375, -0.160736083984375, -0.15274810791015625, -0.1447601318359375, -0.13677215576171875, -0.1287841796875, -0.12079620361328125, -0.1128082275390625, -0.10482025146484375, -0.096832275390625, -0.08884429931640625, -0.0808563232421875, -0.07286834716796875, -0.06488037109375, -0.05689239501953125, -0.0489044189453125, -0.04091644287109375, -0.032928466796875, -0.02494049072265625, -0.0169525146484375, -0.00896453857421875, -0.0009765625, 0.00701141357421875, 0.0149993896484375, 0.02298736572265625, 0.030975341796875, 0.03896331787109375, 0.0469512939453125, 0.05493927001953125, 0.06292724609375, 0.07091522216796875, 0.0789031982421875, 0.08689117431640625, 0.094879150390625, 0.10286712646484375, 0.1108551025390625, 0.11884307861328125, 0.1268310546875, 0.13481903076171875, 0.1428070068359375, 0.15079498291015625, 0.158782958984375, 0.16677093505859375, 0.1747589111328125, 0.18274688720703125, 0.19073486328125, 0.19872283935546875, 0.2067108154296875, 0.21469879150390625, 0.222686767578125, 0.23067474365234375, 0.2386627197265625, 0.24665069580078125, 0.254638671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 5.0, 15.0, 15.0, 19.0, 21.0, 33.0, 49.0, 63.0, 76.0, 127.0, 138.0, 157.0, 230.0, 276.0, 331.0, 410.0, 410.0, 351.0, 281.0, 229.0, 187.0, 155.0, 134.0, 88.0, 59.0, 43.0, 38.0, 31.0, 27.0, 21.0, 16.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1898193359375, -0.1842632293701172, -0.17870712280273438, -0.17315101623535156, -0.16759490966796875, -0.16203880310058594, -0.15648269653320312, -0.1509265899658203, -0.1453704833984375, -0.1398143768310547, -0.13425827026367188, -0.12870216369628906, -0.12314605712890625, -0.11758995056152344, -0.11203384399414062, -0.10647773742675781, -0.100921630859375, -0.09536552429199219, -0.08980941772460938, -0.08425331115722656, -0.07869720458984375, -0.07314109802246094, -0.06758499145507812, -0.06202888488769531, -0.0564727783203125, -0.05091667175292969, -0.045360565185546875, -0.03980445861816406, -0.03424835205078125, -0.028692245483398438, -0.023136138916015625, -0.017580032348632812, -0.01202392578125, -0.0064678192138671875, -0.000911712646484375, 0.0046443939208984375, 0.01020050048828125, 0.015756607055664062, 0.021312713623046875, 0.026868820190429688, 0.0324249267578125, 0.03798103332519531, 0.043537139892578125, 0.04909324645996094, 0.05464935302734375, 0.06020545959472656, 0.06576156616210938, 0.07131767272949219, 0.076873779296875, 0.08242988586425781, 0.08798599243164062, 0.09354209899902344, 0.09909820556640625, 0.10465431213378906, 0.11021041870117188, 0.11576652526855469, 0.1213226318359375, 0.1268787384033203, 0.13243484497070312, 0.13799095153808594, 0.14354705810546875, 0.14910316467285156, 0.15465927124023438, 0.1602153778076172, 0.165771484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 16.0, 20.0, 25.0, 38.0, 61.0, 96.0, 111.0, 115.0, 115.0, 120.0, 95.0, 60.0, 46.0, 30.0, 20.0, 12.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8820130825042725, -0.841962456703186, -0.8019118309020996, -0.7618612051010132, -0.7218105792999268, -0.6817599534988403, -0.6417093276977539, -0.6016587018966675, -0.561608076095581, -0.5215574502944946, -0.4815068244934082, -0.4414561986923218, -0.40140557289123535, -0.3613549470901489, -0.3213043212890625, -0.2812536954879761, -0.24120306968688965, -0.20115244388580322, -0.1611018180847168, -0.12105119228363037, -0.08100056648254395, -0.04094994068145752, -0.0008993148803710938, 0.03915131092071533, 0.07920193672180176, 0.11925256252288818, 0.1593031883239746, 0.19935381412506104, 0.23940443992614746, 0.2794550657272339, 0.3195056915283203, 0.35955631732940674, 0.3996068239212036, 0.43965744972229004, 0.47970807552337646, 0.5197587013244629, 0.5598093271255493, 0.5998599529266357, 0.6399105787277222, 0.6799612045288086, 0.720011830329895, 0.7600624561309814, 0.8001130819320679, 0.8401637077331543, 0.8802143335342407, 0.9202649593353271, 0.9603155851364136, 1.0003662109375, 1.0404168367385864, 1.0804674625396729, 1.1205180883407593, 1.1605687141418457, 1.2006193399429321, 1.2406699657440186, 1.280720591545105, 1.3207712173461914, 1.3608218431472778, 1.4008724689483643, 1.4409230947494507, 1.480973720550537, 1.5210243463516235, 1.56107497215271, 1.6011255979537964, 1.6411762237548828, 1.6812268495559692]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 7.0, 5.0, 7.0, 5.0, 12.0, 17.0, 11.0, 15.0, 17.0, 10.0, 21.0, 23.0, 28.0, 22.0, 29.0, 30.0, 43.0, 34.0, 37.0, 37.0, 41.0, 44.0, 39.0, 34.0, 35.0, 33.0, 38.0, 38.0, 33.0, 31.0, 26.0, 25.0, 24.0, 17.0, 21.0, 35.0, 10.0, 10.0, 10.0, 11.0, 9.0, 6.0, 4.0, 10.0, 0.0, 5.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.6030954718589783, -0.5853657126426697, -0.5676358938217163, -0.5499061346054077, -0.5321763157844543, -0.5144465565681458, -0.4967167377471924, -0.4789869785308838, -0.4612571597099304, -0.44352737069129944, -0.42579758167266846, -0.4080677926540375, -0.3903380036354065, -0.3726082146167755, -0.35487842559814453, -0.33714866638183594, -0.31941887736320496, -0.301689088344574, -0.283959299325943, -0.266229510307312, -0.24849972128868103, -0.23076993227005005, -0.21304015815258026, -0.19531036913394928, -0.1775805801153183, -0.15985079109668732, -0.14212100207805634, -0.12439122051000595, -0.10666143149137497, -0.08893164247274399, -0.0712018609046936, -0.05347207188606262, -0.03574228286743164, -0.01801249571144581, -0.0002827085554599762, 0.017447076737880707, 0.03517686575651169, 0.05290665477514267, 0.07063643634319305, 0.08836622536182404, 0.10609601438045502, 0.123825803399086, 0.14155559241771698, 0.15928536653518677, 0.17701515555381775, 0.19474494457244873, 0.2124747335910797, 0.2302045226097107, 0.24793431162834167, 0.26566410064697266, 0.28339388966560364, 0.3011236786842346, 0.3188534677028656, 0.3365832567214966, 0.3543130159378052, 0.37204283475875854, 0.38977259397506714, 0.4075023829936981, 0.4252321720123291, 0.4429619610309601, 0.46069175004959106, 0.47842153906822205, 0.496151328086853, 0.5138810873031616, 0.531610906124115]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 3.0, 7.0, 10.0, 12.0, 19.0, 16.0, 27.0, 41.0, 71.0, 102.0, 173.0, 253.0, 418.0, 708.0, 1254.0, 2132.0, 4076.0, 7234.0, 13056.0, 23778.0, 43876.0, 77518.0, 130588.0, 188748.0, 199790.0, 148343.0, 91025.0, 51599.0, 28677.0, 15411.0, 8616.0, 4700.0, 2537.0, 1511.0, 866.0, 497.0, 301.0, 190.0, 118.0, 85.0, 50.0, 41.0, 27.0, 17.0, 12.0, 8.0, 9.0, 3.0, 0.0, 3.0, 0.0, 3.0], "bins": [-0.22900390625, -0.22266769409179688, -0.21633148193359375, -0.20999526977539062, -0.2036590576171875, -0.19732284545898438, -0.19098663330078125, -0.18465042114257812, -0.178314208984375, -0.17197799682617188, -0.16564178466796875, -0.15930557250976562, -0.1529693603515625, -0.14663314819335938, -0.14029693603515625, -0.13396072387695312, -0.12762451171875, -0.12128829956054688, -0.11495208740234375, -0.10861587524414062, -0.1022796630859375, -0.09594345092773438, -0.08960723876953125, -0.08327102661132812, -0.076934814453125, -0.07059860229492188, -0.06426239013671875, -0.057926177978515625, -0.0515899658203125, -0.045253753662109375, -0.03891754150390625, -0.032581329345703125, -0.0262451171875, -0.019908905029296875, -0.01357269287109375, -0.007236480712890625, -0.0009002685546875, 0.005435943603515625, 0.01177215576171875, 0.018108367919921875, 0.024444580078125, 0.030780792236328125, 0.03711700439453125, 0.043453216552734375, 0.0497894287109375, 0.056125640869140625, 0.06246185302734375, 0.06879806518554688, 0.07513427734375, 0.08147048950195312, 0.08780670166015625, 0.09414291381835938, 0.1004791259765625, 0.10681533813476562, 0.11315155029296875, 0.11948776245117188, 0.125823974609375, 0.13216018676757812, 0.13849639892578125, 0.14483261108398438, 0.1511688232421875, 0.15750503540039062, 0.16384124755859375, 0.17017745971679688, 0.176513671875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 5.0, 15.0, 12.0, 12.0, 30.0, 23.0, 25.0, 29.0, 28.0, 47.0, 37.0, 38.0, 52.0, 46.0, 49.0, 39.0, 57.0, 45.0, 36.0, 39.0, 46.0, 26.0, 22.0, 33.0, 35.0, 27.0, 30.0, 26.0, 18.0, 10.0, 16.0, 8.0, 9.0, 12.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.12005615234375, -0.11682987213134766, -0.11360359191894531, -0.11037731170654297, -0.10715103149414062, -0.10392475128173828, -0.10069847106933594, -0.0974721908569336, -0.09424591064453125, -0.0910196304321289, -0.08779335021972656, -0.08456707000732422, -0.08134078979492188, -0.07811450958251953, -0.07488822937011719, -0.07166194915771484, -0.0684356689453125, -0.06520938873291016, -0.06198310852050781, -0.05875682830810547, -0.055530548095703125, -0.05230426788330078, -0.04907798767089844, -0.045851707458496094, -0.04262542724609375, -0.039399147033691406, -0.03617286682128906, -0.03294658660888672, -0.029720306396484375, -0.02649402618408203, -0.023267745971679688, -0.020041465759277344, -0.016815185546875, -0.013588905334472656, -0.010362625122070312, -0.007136344909667969, -0.003910064697265625, -0.0006837844848632812, 0.0025424957275390625, 0.005768775939941406, 0.00899505615234375, 0.012221336364746094, 0.015447616577148438, 0.01867389678955078, 0.021900177001953125, 0.02512645721435547, 0.028352737426757812, 0.031579017639160156, 0.0348052978515625, 0.038031578063964844, 0.04125785827636719, 0.04448413848876953, 0.047710418701171875, 0.05093669891357422, 0.05416297912597656, 0.057389259338378906, 0.06061553955078125, 0.0638418197631836, 0.06706809997558594, 0.07029438018798828, 0.07352066040039062, 0.07674694061279297, 0.07997322082519531, 0.08319950103759766, 0.08642578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 6.0, 8.0, 7.0, 15.0, 22.0, 28.0, 47.0, 63.0, 97.0, 126.0, 204.0, 342.0, 603.0, 1140.0, 2084.0, 3740.0, 7098.0, 12961.0, 23252.0, 41111.0, 69668.0, 112072.0, 161170.0, 185944.0, 158832.0, 109612.0, 67615.0, 40227.0, 22842.0, 12487.0, 6865.0, 3633.0, 1974.0, 1049.0, 602.0, 341.0, 232.0, 135.0, 102.0, 72.0, 37.0, 25.0, 22.0, 16.0, 10.0, 6.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1966552734375, -0.1905994415283203, -0.18454360961914062, -0.17848777770996094, -0.17243194580078125, -0.16637611389160156, -0.16032028198242188, -0.1542644500732422, -0.1482086181640625, -0.1421527862548828, -0.13609695434570312, -0.13004112243652344, -0.12398529052734375, -0.11792945861816406, -0.11187362670898438, -0.10581779479980469, -0.099761962890625, -0.09370613098144531, -0.08765029907226562, -0.08159446716308594, -0.07553863525390625, -0.06948280334472656, -0.06342697143554688, -0.05737113952636719, -0.0513153076171875, -0.04525947570800781, -0.039203643798828125, -0.03314781188964844, -0.02709197998046875, -0.021036148071289062, -0.014980316162109375, -0.008924484252929688, -0.00286865234375, 0.0031871795654296875, 0.009243011474609375, 0.015298843383789062, 0.02135467529296875, 0.027410507202148438, 0.033466339111328125, 0.03952217102050781, 0.0455780029296875, 0.05163383483886719, 0.057689666748046875, 0.06374549865722656, 0.06980133056640625, 0.07585716247558594, 0.08191299438476562, 0.08796882629394531, 0.094024658203125, 0.10008049011230469, 0.10613632202148438, 0.11219215393066406, 0.11824798583984375, 0.12430381774902344, 0.13035964965820312, 0.1364154815673828, 0.1424713134765625, 0.1485271453857422, 0.15458297729492188, 0.16063880920410156, 0.16669464111328125, 0.17275047302246094, 0.17880630493164062, 0.1848621368408203, 0.19091796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 9.0, 10.0, 7.0, 15.0, 17.0, 19.0, 25.0, 30.0, 23.0, 36.0, 31.0, 42.0, 45.0, 38.0, 47.0, 36.0, 38.0, 37.0, 37.0, 41.0, 57.0, 45.0, 38.0, 31.0, 26.0, 34.0, 30.0, 16.0, 18.0, 22.0, 15.0, 19.0, 16.0, 9.0, 10.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.2529869079589844, -0.24474334716796875, -0.23649978637695312, -0.2282562255859375, -0.22001266479492188, -0.21176910400390625, -0.20352554321289062, -0.195281982421875, -0.18703842163085938, -0.17879486083984375, -0.17055130004882812, -0.1623077392578125, -0.15406417846679688, -0.14582061767578125, -0.13757705688476562, -0.12933349609375, -0.12108993530273438, -0.11284637451171875, -0.10460281372070312, -0.0963592529296875, -0.08811569213867188, -0.07987213134765625, -0.07162857055664062, -0.063385009765625, -0.055141448974609375, -0.04689788818359375, -0.038654327392578125, -0.0304107666015625, -0.022167205810546875, -0.01392364501953125, -0.005680084228515625, 0.0025634765625, 0.010807037353515625, 0.01905059814453125, 0.027294158935546875, 0.0355377197265625, 0.043781280517578125, 0.05202484130859375, 0.060268402099609375, 0.068511962890625, 0.07675552368164062, 0.08499908447265625, 0.09324264526367188, 0.1014862060546875, 0.10972976684570312, 0.11797332763671875, 0.12621688842773438, 0.13446044921875, 0.14270401000976562, 0.15094757080078125, 0.15919113159179688, 0.1674346923828125, 0.17567825317382812, 0.18392181396484375, 0.19216537475585938, 0.200408935546875, 0.20865249633789062, 0.21689605712890625, 0.22513961791992188, 0.2333831787109375, 0.24162673950195312, 0.24987030029296875, 0.2581138610839844, 0.266357421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 2.0, 5.0, 9.0, 13.0, 36.0, 61.0, 85.0, 190.0, 342.0, 711.0, 1883.0, 5156.0, 15195.0, 48061.0, 138654.0, 290525.0, 307345.0, 156813.0, 55826.0, 18020.0, 5860.0, 2111.0, 881.0, 385.0, 165.0, 93.0, 56.0, 31.0, 9.0, 12.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0972900390625, -0.0940542221069336, -0.09081840515136719, -0.08758258819580078, -0.08434677124023438, -0.08111095428466797, -0.07787513732910156, -0.07463932037353516, -0.07140350341796875, -0.06816768646240234, -0.06493186950683594, -0.06169605255126953, -0.058460235595703125, -0.05522441864013672, -0.05198860168457031, -0.048752784729003906, -0.0455169677734375, -0.042281150817871094, -0.03904533386230469, -0.03580951690673828, -0.032573699951171875, -0.02933788299560547, -0.026102066040039062, -0.022866249084472656, -0.01963043212890625, -0.016394615173339844, -0.013158798217773438, -0.009922981262207031, -0.006687164306640625, -0.0034513473510742188, -0.0002155303955078125, 0.0030202865600585938, 0.006256103515625, 0.009491920471191406, 0.012727737426757812, 0.01596355438232422, 0.019199371337890625, 0.02243518829345703, 0.025671005249023438, 0.028906822204589844, 0.03214263916015625, 0.035378456115722656, 0.03861427307128906, 0.04185009002685547, 0.045085906982421875, 0.04832172393798828, 0.05155754089355469, 0.054793357849121094, 0.0580291748046875, 0.061264991760253906, 0.06450080871582031, 0.06773662567138672, 0.07097244262695312, 0.07420825958251953, 0.07744407653808594, 0.08067989349365234, 0.08391571044921875, 0.08715152740478516, 0.09038734436035156, 0.09362316131591797, 0.09685897827148438, 0.10009479522705078, 0.10333061218261719, 0.1065664291381836, 0.10980224609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 6.0, 10.0, 10.0, 12.0, 13.0, 23.0, 28.0, 29.0, 57.0, 45.0, 59.0, 73.0, 69.0, 87.0, 94.0, 85.0, 58.0, 42.0, 40.0, 35.0, 26.0, 27.0, 7.0, 14.0, 6.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.193450927734375e-05, -2.1209940314292908e-05, -2.0485371351242065e-05, -1.9760802388191223e-05, -1.903623342514038e-05, -1.831166446208954e-05, -1.7587095499038696e-05, -1.6862526535987854e-05, -1.6137957572937012e-05, -1.541338860988617e-05, -1.4688819646835327e-05, -1.3964250683784485e-05, -1.3239681720733643e-05, -1.25151127576828e-05, -1.1790543794631958e-05, -1.1065974831581116e-05, -1.0341405868530273e-05, -9.616836905479431e-06, -8.892267942428589e-06, -8.167698979377747e-06, -7.443130016326904e-06, -6.718561053276062e-06, -5.99399209022522e-06, -5.2694231271743774e-06, -4.544854164123535e-06, -3.820285201072693e-06, -3.0957162380218506e-06, -2.3711472749710083e-06, -1.646578311920166e-06, -9.220093488693237e-07, -1.9744038581848145e-07, 5.271285772323608e-07, 1.2516975402832031e-06, 1.9762665033340454e-06, 2.7008354663848877e-06, 3.42540442943573e-06, 4.149973392486572e-06, 4.8745423555374146e-06, 5.599111318588257e-06, 6.323680281639099e-06, 7.048249244689941e-06, 7.772818207740784e-06, 8.497387170791626e-06, 9.221956133842468e-06, 9.94652509689331e-06, 1.0671094059944153e-05, 1.1395663022994995e-05, 1.2120231986045837e-05, 1.284480094909668e-05, 1.3569369912147522e-05, 1.4293938875198364e-05, 1.5018507838249207e-05, 1.574307680130005e-05, 1.646764576435089e-05, 1.7192214727401733e-05, 1.7916783690452576e-05, 1.8641352653503418e-05, 1.936592161655426e-05, 2.0090490579605103e-05, 2.0815059542655945e-05, 2.1539628505706787e-05, 2.226419746875763e-05, 2.298876643180847e-05, 2.3713335394859314e-05, 2.4437904357910156e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 19.0, 19.0, 28.0, 59.0, 95.0, 205.0, 347.0, 632.0, 1182.0, 2652.0, 5883.0, 13263.0, 29954.0, 65498.0, 128343.0, 205318.0, 231091.0, 176303.0, 100217.0, 48284.0, 21298.0, 9488.0, 4198.0, 2036.0, 1018.0, 492.0, 290.0, 141.0, 73.0, 47.0, 25.0, 11.0, 11.0, 3.0, 7.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0614013671875, -0.05937480926513672, -0.05734825134277344, -0.055321693420410156, -0.053295135498046875, -0.051268577575683594, -0.04924201965332031, -0.04721546173095703, -0.04518890380859375, -0.04316234588623047, -0.04113578796386719, -0.039109230041503906, -0.037082672119140625, -0.035056114196777344, -0.03302955627441406, -0.03100299835205078, -0.0289764404296875, -0.02694988250732422, -0.024923324584960938, -0.022896766662597656, -0.020870208740234375, -0.018843650817871094, -0.016817092895507812, -0.014790534973144531, -0.01276397705078125, -0.010737419128417969, -0.008710861206054688, -0.006684303283691406, -0.004657745361328125, -0.0026311874389648438, -0.0006046295166015625, 0.0014219284057617188, 0.003448486328125, 0.005475044250488281, 0.0075016021728515625, 0.009528160095214844, 0.011554718017578125, 0.013581275939941406, 0.015607833862304688, 0.01763439178466797, 0.01966094970703125, 0.02168750762939453, 0.023714065551757812, 0.025740623474121094, 0.027767181396484375, 0.029793739318847656, 0.03182029724121094, 0.03384685516357422, 0.0358734130859375, 0.03789997100830078, 0.03992652893066406, 0.041953086853027344, 0.043979644775390625, 0.046006202697753906, 0.04803276062011719, 0.05005931854248047, 0.05208587646484375, 0.05411243438720703, 0.05613899230957031, 0.058165550231933594, 0.060192108154296875, 0.062218666076660156, 0.06424522399902344, 0.06627178192138672, 0.06829833984375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 12.0, 8.0, 11.0, 29.0, 33.0, 42.0, 42.0, 59.0, 52.0, 57.0, 57.0, 75.0, 69.0, 72.0, 60.0, 51.0, 48.0, 46.0, 32.0, 35.0, 32.0, 19.0, 20.0, 7.0, 9.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0638427734375, -0.06175518035888672, -0.05966758728027344, -0.057579994201660156, -0.055492401123046875, -0.053404808044433594, -0.05131721496582031, -0.04922962188720703, -0.04714202880859375, -0.04505443572998047, -0.04296684265136719, -0.040879249572753906, -0.038791656494140625, -0.036704063415527344, -0.03461647033691406, -0.03252887725830078, -0.0304412841796875, -0.02835369110107422, -0.026266098022460938, -0.024178504943847656, -0.022090911865234375, -0.020003318786621094, -0.017915725708007812, -0.01582813262939453, -0.01374053955078125, -0.011652946472167969, -0.009565353393554688, -0.007477760314941406, -0.005390167236328125, -0.0033025741577148438, -0.0012149810791015625, 0.0008726119995117188, 0.002960205078125, 0.005047798156738281, 0.0071353912353515625, 0.009222984313964844, 0.011310577392578125, 0.013398170471191406, 0.015485763549804688, 0.01757335662841797, 0.01966094970703125, 0.02174854278564453, 0.023836135864257812, 0.025923728942871094, 0.028011322021484375, 0.030098915100097656, 0.03218650817871094, 0.03427410125732422, 0.0363616943359375, 0.03844928741455078, 0.04053688049316406, 0.042624473571777344, 0.044712066650390625, 0.046799659729003906, 0.04888725280761719, 0.05097484588623047, 0.05306243896484375, 0.05515003204345703, 0.05723762512207031, 0.059325218200683594, 0.061412811279296875, 0.06350040435791016, 0.06558799743652344, 0.06767559051513672, 0.06976318359375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 8.0, 16.0, 29.0, 57.0, 112.0, 126.0, 192.0, 174.0, 140.0, 60.0, 37.0, 34.0, 11.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8707690238952637, -0.8124346733093262, -0.7541002631187439, -0.6957659125328064, -0.6374315023422241, -0.5790971517562866, -0.5207628011703491, -0.46242842078208923, -0.40409404039382935, -0.34575966000556946, -0.28742527961730957, -0.22909092903137207, -0.17075654864311218, -0.1124221682548523, -0.054087817668914795, 0.004246562719345093, 0.06258094310760498, 0.12091531604528427, 0.17924968898296356, 0.23758405447006226, 0.29591843485832214, 0.35425281524658203, 0.41258716583251953, 0.4709215462207794, 0.5292559266090393, 0.5875902771949768, 0.6459246873855591, 0.7042590379714966, 0.7625933885574341, 0.8209277987480164, 0.8792621493339539, 0.9375965595245361, 0.9959309101104736, 1.0542652606964111, 1.1125996112823486, 1.1709339618682861, 1.2292684316635132, 1.2876027822494507, 1.3459371328353882, 1.4042714834213257, 1.4626059532165527, 1.5209403038024902, 1.5792746543884277, 1.6376090049743652, 1.6959434747695923, 1.7542778253555298, 1.8126121759414673, 1.8709465265274048, 1.9292808771133423, 1.9876152276992798, 2.045949697494507, 2.1042840480804443, 2.162618398666382, 2.2209527492523193, 2.279287099838257, 2.3376214504241943, 2.395955801010132, 2.4542901515960693, 2.512624502182007, 2.5709588527679443, 2.629293203353882, 2.6876277923583984, 2.745962142944336, 2.8042964935302734, 2.862630844116211]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 1.0, 9.0, 12.0, 8.0, 7.0, 18.0, 12.0, 26.0, 23.0, 35.0, 43.0, 38.0, 36.0, 44.0, 54.0, 53.0, 44.0, 52.0, 58.0, 46.0, 41.0, 43.0, 46.0, 45.0, 16.0, 30.0, 28.0, 18.0, 18.0, 19.0, 13.0, 10.0, 17.0, 9.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.791124165058136, -0.7636244893074036, -0.7361248135566711, -0.7086251378059387, -0.6811254620552063, -0.6536257863044739, -0.6261261105537415, -0.598626434803009, -0.5711267590522766, -0.5436270833015442, -0.5161274075508118, -0.48862773180007935, -0.4611280560493469, -0.4336283802986145, -0.4061287045478821, -0.37862902879714966, -0.35112935304641724, -0.3236296772956848, -0.2961300015449524, -0.26863032579421997, -0.24113065004348755, -0.21363097429275513, -0.1861312985420227, -0.15863162279129028, -0.13113194704055786, -0.10363227128982544, -0.07613259553909302, -0.048632919788360596, -0.021133244037628174, 0.006366431713104248, 0.03386610746383667, 0.06136578321456909, 0.08886545896530151, 0.11636513471603394, 0.14386481046676636, 0.17136448621749878, 0.1988641619682312, 0.22636383771896362, 0.25386351346969604, 0.28136318922042847, 0.3088628649711609, 0.3363625407218933, 0.36386221647262573, 0.39136189222335815, 0.4188615679740906, 0.446361243724823, 0.4738609194755554, 0.5013605952262878, 0.5288602709770203, 0.5563599467277527, 0.5838596224784851, 0.6113592982292175, 0.63885897397995, 0.6663586497306824, 0.6938583254814148, 0.7213580012321472, 0.7488576769828796, 0.7763573527336121, 0.8038570284843445, 0.8313567042350769, 0.8588563799858093, 0.8863560557365417, 0.9138557314872742, 0.9413554072380066, 0.968855082988739]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 7.0, 12.0, 9.0, 12.0, 15.0, 31.0, 44.0, 50.0, 88.0, 120.0, 223.0, 358.0, 706.0, 1343.0, 2673.0, 5980.0, 15207.0, 43388.0, 154964.0, 817244.0, 2199277.0, 738848.0, 146830.0, 42023.0, 14449.0, 5591.0, 2407.0, 1100.0, 563.0, 289.0, 166.0, 101.0, 48.0, 39.0, 22.0, 15.0, 19.0, 6.0, 5.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2181396484375, -0.21142196655273438, -0.20470428466796875, -0.19798660278320312, -0.1912689208984375, -0.18455123901367188, -0.17783355712890625, -0.17111587524414062, -0.164398193359375, -0.15768051147460938, -0.15096282958984375, -0.14424514770507812, -0.1375274658203125, -0.13080978393554688, -0.12409210205078125, -0.11737442016601562, -0.11065673828125, -0.10393905639648438, -0.09722137451171875, -0.09050369262695312, -0.0837860107421875, -0.07706832885742188, -0.07035064697265625, -0.06363296508789062, -0.056915283203125, -0.050197601318359375, -0.04347991943359375, -0.036762237548828125, -0.0300445556640625, -0.023326873779296875, -0.01660919189453125, -0.009891510009765625, -0.003173828125, 0.003543853759765625, 0.01026153564453125, 0.016979217529296875, 0.0236968994140625, 0.030414581298828125, 0.03713226318359375, 0.043849945068359375, 0.050567626953125, 0.057285308837890625, 0.06400299072265625, 0.07072067260742188, 0.0774383544921875, 0.08415603637695312, 0.09087371826171875, 0.09759140014648438, 0.10430908203125, 0.11102676391601562, 0.11774444580078125, 0.12446212768554688, 0.1311798095703125, 0.13789749145507812, 0.14461517333984375, 0.15133285522460938, 0.158050537109375, 0.16476821899414062, 0.17148590087890625, 0.17820358276367188, 0.1849212646484375, 0.19163894653320312, 0.19835662841796875, 0.20507431030273438, 0.2117919921875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 7.0, 5.0, 7.0, 8.0, 12.0, 15.0, 20.0, 26.0, 16.0, 41.0, 39.0, 49.0, 41.0, 44.0, 57.0, 42.0, 49.0, 45.0, 54.0, 53.0, 50.0, 46.0, 39.0, 32.0, 34.0, 44.0, 21.0, 17.0, 23.0, 21.0, 8.0, 7.0, 6.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.117919921875, -0.11414623260498047, -0.11037254333496094, -0.1065988540649414, -0.10282516479492188, -0.09905147552490234, -0.09527778625488281, -0.09150409698486328, -0.08773040771484375, -0.08395671844482422, -0.08018302917480469, -0.07640933990478516, -0.07263565063476562, -0.0688619613647461, -0.06508827209472656, -0.06131458282470703, -0.0575408935546875, -0.05376720428466797, -0.04999351501464844, -0.046219825744628906, -0.042446136474609375, -0.038672447204589844, -0.03489875793457031, -0.03112506866455078, -0.02735137939453125, -0.02357769012451172, -0.019804000854492188, -0.016030311584472656, -0.012256622314453125, -0.008482933044433594, -0.0047092437744140625, -0.0009355545043945312, 0.002838134765625, 0.006611824035644531, 0.010385513305664062, 0.014159202575683594, 0.017932891845703125, 0.021706581115722656, 0.025480270385742188, 0.02925395965576172, 0.03302764892578125, 0.03680133819580078, 0.04057502746582031, 0.044348716735839844, 0.048122406005859375, 0.051896095275878906, 0.05566978454589844, 0.05944347381591797, 0.0632171630859375, 0.06699085235595703, 0.07076454162597656, 0.0745382308959961, 0.07831192016601562, 0.08208560943603516, 0.08585929870605469, 0.08963298797607422, 0.09340667724609375, 0.09718036651611328, 0.10095405578613281, 0.10472774505615234, 0.10850143432617188, 0.1122751235961914, 0.11604881286621094, 0.11982250213623047, 0.12359619140625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 20.0, 27.0, 37.0, 70.0, 193.0, 351.0, 1009.0, 3348.0, 13052.0, 59775.0, 319367.0, 1815096.0, 1632465.0, 280557.0, 52796.0, 11550.0, 3037.0, 919.0, 334.0, 135.0, 65.0, 27.0, 15.0, 15.0, 8.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27099609375, -0.2619514465332031, -0.25290679931640625, -0.24386215209960938, -0.2348175048828125, -0.22577285766601562, -0.21672821044921875, -0.20768356323242188, -0.198638916015625, -0.18959426879882812, -0.18054962158203125, -0.17150497436523438, -0.1624603271484375, -0.15341567993164062, -0.14437103271484375, -0.13532638549804688, -0.12628173828125, -0.11723709106445312, -0.10819244384765625, -0.09914779663085938, -0.0901031494140625, -0.08105850219726562, -0.07201385498046875, -0.06296920776367188, -0.053924560546875, -0.044879913330078125, -0.03583526611328125, -0.026790618896484375, -0.0177459716796875, -0.008701324462890625, 0.00034332275390625, 0.009387969970703125, 0.0184326171875, 0.027477264404296875, 0.03652191162109375, 0.045566558837890625, 0.0546112060546875, 0.06365585327148438, 0.07270050048828125, 0.08174514770507812, 0.090789794921875, 0.09983444213867188, 0.10887908935546875, 0.11792373657226562, 0.1269683837890625, 0.13601303100585938, 0.14505767822265625, 0.15410232543945312, 0.16314697265625, 0.17219161987304688, 0.18123626708984375, 0.19028091430664062, 0.1993255615234375, 0.20837020874023438, 0.21741485595703125, 0.22645950317382812, 0.235504150390625, 0.24454879760742188, 0.25359344482421875, 0.2626380920410156, 0.2716827392578125, 0.2807273864746094, 0.28977203369140625, 0.2988166809082031, 0.307861328125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 8.0, 1.0, 7.0, 18.0, 21.0, 19.0, 37.0, 49.0, 45.0, 57.0, 85.0, 109.0, 130.0, 145.0, 232.0, 279.0, 343.0, 417.0, 427.0, 344.0, 282.0, 219.0, 172.0, 118.0, 119.0, 93.0, 65.0, 55.0, 41.0, 28.0, 23.0, 14.0, 15.0, 11.0, 10.0, 9.0, 5.0, 3.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1552734375, -0.15009307861328125, -0.1449127197265625, -0.13973236083984375, -0.134552001953125, -0.12937164306640625, -0.1241912841796875, -0.11901092529296875, -0.11383056640625, -0.10865020751953125, -0.1034698486328125, -0.09828948974609375, -0.093109130859375, -0.08792877197265625, -0.0827484130859375, -0.07756805419921875, -0.0723876953125, -0.06720733642578125, -0.0620269775390625, -0.05684661865234375, -0.051666259765625, -0.04648590087890625, -0.0413055419921875, -0.03612518310546875, -0.03094482421875, -0.02576446533203125, -0.0205841064453125, -0.01540374755859375, -0.010223388671875, -0.00504302978515625, 0.0001373291015625, 0.00531768798828125, 0.010498046875, 0.01567840576171875, 0.0208587646484375, 0.02603912353515625, 0.031219482421875, 0.03639984130859375, 0.0415802001953125, 0.04676055908203125, 0.05194091796875, 0.05712127685546875, 0.0623016357421875, 0.06748199462890625, 0.072662353515625, 0.07784271240234375, 0.0830230712890625, 0.08820343017578125, 0.0933837890625, 0.09856414794921875, 0.1037445068359375, 0.10892486572265625, 0.114105224609375, 0.11928558349609375, 0.1244659423828125, 0.12964630126953125, 0.13482666015625, 0.14000701904296875, 0.1451873779296875, 0.15036773681640625, 0.155548095703125, 0.16072845458984375, 0.1659088134765625, 0.17108917236328125, 0.17626953125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 9.0, 11.0, 14.0, 27.0, 42.0, 35.0, 67.0, 94.0, 94.0, 107.0, 111.0, 89.0, 91.0, 69.0, 56.0, 29.0, 23.0, 13.0, 17.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5622539520263672, -1.5258125066757202, -1.4893710613250732, -1.4529296159744263, -1.4164881706237793, -1.3800467252731323, -1.3436052799224854, -1.307163953781128, -1.2707223892211914, -1.2342809438705444, -1.1978394985198975, -1.1613980531692505, -1.1249566078186035, -1.0885151624679565, -1.0520737171173096, -1.0156323909759521, -0.9791909456253052, -0.9427495002746582, -0.9063080549240112, -0.8698666095733643, -0.8334251642227173, -0.7969837188720703, -0.7605423331260681, -0.7241008877754211, -0.6876594424247742, -0.6512179970741272, -0.6147765517234802, -0.5783351063728333, -0.541893720626831, -0.5054522752761841, -0.4690108299255371, -0.43256938457489014, -0.3961278796195984, -0.3596864342689514, -0.32324498891830444, -0.28680357336997986, -0.2503621280193329, -0.2139206826686859, -0.17747925221920013, -0.14103782176971436, -0.10459637641906738, -0.06815493851900101, -0.03171350061893463, 0.004727937281131744, 0.04116937518119812, 0.07761082053184509, 0.11405225098133087, 0.15049368143081665, 0.18693512678146362, 0.2233765721321106, 0.25981801748275757, 0.29625943303108215, 0.3327008783817291, 0.3691423237323761, 0.4055837392807007, 0.44202518463134766, 0.47846662998199463, 0.5149080753326416, 0.5513495206832886, 0.5877909660339355, 0.6242324113845825, 0.6606738567352295, 0.6971152424812317, 0.7335566878318787, 0.7699981331825256]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 9.0, 9.0, 3.0, 7.0, 10.0, 10.0, 13.0, 15.0, 10.0, 19.0, 20.0, 16.0, 35.0, 23.0, 29.0, 25.0, 22.0, 34.0, 36.0, 28.0, 44.0, 41.0, 46.0, 35.0, 41.0, 36.0, 25.0, 46.0, 30.0, 32.0, 30.0, 33.0, 31.0, 26.0, 17.0, 17.0, 16.0, 18.0, 16.0, 8.0, 16.0, 5.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.5353688597679138, -0.5183150768280029, -0.5012613534927368, -0.4842075705528259, -0.46715378761291504, -0.45010003447532654, -0.43304628133773804, -0.41599249839782715, -0.39893874526023865, -0.38188499212265015, -0.36483120918273926, -0.34777745604515076, -0.33072370290756226, -0.31366991996765137, -0.29661616683006287, -0.27956241369247437, -0.2625086307525635, -0.24545486271381378, -0.2284010946750641, -0.21134734153747559, -0.1942935734987259, -0.1772398054599762, -0.1601860523223877, -0.143132284283638, -0.1260785162448883, -0.10902474820613861, -0.09197098761796951, -0.07491722702980042, -0.05786345899105072, -0.040809690952301025, -0.023755930364131927, -0.00670216977596283, 0.010351598262786865, 0.02740536257624626, 0.04445912688970566, 0.061512891203165054, 0.07856665551662445, 0.09562042355537415, 0.11267418414354324, 0.12972794473171234, 0.14678171277046204, 0.16383548080921173, 0.18088924884796143, 0.19794300198554993, 0.21499677002429962, 0.23205053806304932, 0.24910429120063782, 0.2661580443382263, 0.2832118272781372, 0.3002655804157257, 0.3173193633556366, 0.3343731164932251, 0.351426899433136, 0.3684806525707245, 0.385534405708313, 0.4025881886482239, 0.4196419417858124, 0.4366956949234009, 0.45374947786331177, 0.47080323100090027, 0.48785698413848877, 0.5049107670783997, 0.5219645500183105, 0.5390182733535767, 0.5560720562934875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 2.0, 5.0, 11.0, 16.0, 17.0, 33.0, 42.0, 74.0, 112.0, 178.0, 377.0, 677.0, 1266.0, 2352.0, 4756.0, 9494.0, 19492.0, 40917.0, 84172.0, 157854.0, 230392.0, 217913.0, 138613.0, 72362.0, 34570.0, 16501.0, 7977.0, 3951.0, 1964.0, 1104.0, 564.0, 316.0, 192.0, 93.0, 71.0, 48.0, 23.0, 25.0, 11.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3212890625, -0.3108863830566406, -0.30048370361328125, -0.2900810241699219, -0.2796783447265625, -0.2692756652832031, -0.25887298583984375, -0.24847030639648438, -0.238067626953125, -0.22766494750976562, -0.21726226806640625, -0.20685958862304688, -0.1964569091796875, -0.18605422973632812, -0.17565155029296875, -0.16524887084960938, -0.15484619140625, -0.14444351196289062, -0.13404083251953125, -0.12363815307617188, -0.1132354736328125, -0.10283279418945312, -0.09243011474609375, -0.08202743530273438, -0.071624755859375, -0.061222076416015625, -0.05081939697265625, -0.040416717529296875, -0.0300140380859375, -0.019611358642578125, -0.00920867919921875, 0.001194000244140625, 0.0115966796875, 0.021999359130859375, 0.03240203857421875, 0.042804718017578125, 0.0532073974609375, 0.06361007690429688, 0.07401275634765625, 0.08441543579101562, 0.094818115234375, 0.10522079467773438, 0.11562347412109375, 0.12602615356445312, 0.1364288330078125, 0.14683151245117188, 0.15723419189453125, 0.16763687133789062, 0.17803955078125, 0.18844223022460938, 0.19884490966796875, 0.20924758911132812, 0.2196502685546875, 0.23005294799804688, 0.24045562744140625, 0.2508583068847656, 0.261260986328125, 0.2716636657714844, 0.28206634521484375, 0.2924690246582031, 0.3028717041015625, 0.3132743835449219, 0.32367706298828125, 0.3340797424316406, 0.344482421875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 6.0, 17.0, 6.0, 16.0, 20.0, 30.0, 29.0, 22.0, 33.0, 29.0, 40.0, 48.0, 35.0, 50.0, 51.0, 48.0, 54.0, 41.0, 48.0, 38.0, 53.0, 51.0, 27.0, 30.0, 32.0, 26.0, 16.0, 20.0, 19.0, 12.0, 13.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11126708984375, -0.1078042984008789, -0.10434150695800781, -0.10087871551513672, -0.09741592407226562, -0.09395313262939453, -0.09049034118652344, -0.08702754974365234, -0.08356475830078125, -0.08010196685791016, -0.07663917541503906, -0.07317638397216797, -0.06971359252929688, -0.06625080108642578, -0.06278800964355469, -0.059325218200683594, -0.0558624267578125, -0.052399635314941406, -0.04893684387207031, -0.04547405242919922, -0.042011260986328125, -0.03854846954345703, -0.03508567810058594, -0.031622886657714844, -0.02816009521484375, -0.024697303771972656, -0.021234512329101562, -0.01777172088623047, -0.014308929443359375, -0.010846138000488281, -0.0073833465576171875, -0.003920555114746094, -0.000457763671875, 0.0030050277709960938, 0.0064678192138671875, 0.009930610656738281, 0.013393402099609375, 0.01685619354248047, 0.020318984985351562, 0.023781776428222656, 0.02724456787109375, 0.030707359313964844, 0.03417015075683594, 0.03763294219970703, 0.041095733642578125, 0.04455852508544922, 0.04802131652832031, 0.051484107971191406, 0.0549468994140625, 0.058409690856933594, 0.06187248229980469, 0.06533527374267578, 0.06879806518554688, 0.07226085662841797, 0.07572364807128906, 0.07918643951416016, 0.08264923095703125, 0.08611202239990234, 0.08957481384277344, 0.09303760528564453, 0.09650039672851562, 0.09996318817138672, 0.10342597961425781, 0.1068887710571289, 0.1103515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 10.0, 12.0, 17.0, 10.0, 27.0, 47.0, 59.0, 80.0, 126.0, 153.0, 226.0, 388.0, 642.0, 1130.0, 1988.0, 3761.0, 7152.0, 14022.0, 27596.0, 52949.0, 93032.0, 144365.0, 185561.0, 183647.0, 140104.0, 87959.0, 49505.0, 25959.0, 12968.0, 6828.0, 3458.0, 1885.0, 1099.0, 637.0, 366.0, 231.0, 166.0, 129.0, 81.0, 47.0, 52.0, 24.0, 11.0, 14.0, 10.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2362060546875, -0.2285747528076172, -0.22094345092773438, -0.21331214904785156, -0.20568084716796875, -0.19804954528808594, -0.19041824340820312, -0.1827869415283203, -0.1751556396484375, -0.1675243377685547, -0.15989303588867188, -0.15226173400878906, -0.14463043212890625, -0.13699913024902344, -0.12936782836914062, -0.12173652648925781, -0.114105224609375, -0.10647392272949219, -0.09884262084960938, -0.09121131896972656, -0.08358001708984375, -0.07594871520996094, -0.06831741333007812, -0.06068611145019531, -0.0530548095703125, -0.04542350769042969, -0.037792205810546875, -0.030160903930664062, -0.02252960205078125, -0.014898300170898438, -0.007266998291015625, 0.0003643035888671875, 0.00799560546875, 0.015626907348632812, 0.023258209228515625, 0.030889511108398438, 0.03852081298828125, 0.04615211486816406, 0.053783416748046875, 0.06141471862792969, 0.0690460205078125, 0.07667732238769531, 0.08430862426757812, 0.09193992614746094, 0.09957122802734375, 0.10720252990722656, 0.11483383178710938, 0.12246513366699219, 0.130096435546875, 0.1377277374267578, 0.14535903930664062, 0.15299034118652344, 0.16062164306640625, 0.16825294494628906, 0.17588424682617188, 0.1835155487060547, 0.1911468505859375, 0.1987781524658203, 0.20640945434570312, 0.21404075622558594, 0.22167205810546875, 0.22930335998535156, 0.23693466186523438, 0.2445659637451172, 0.252197265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 7.0, 4.0, 6.0, 5.0, 4.0, 8.0, 9.0, 12.0, 14.0, 14.0, 29.0, 18.0, 31.0, 33.0, 35.0, 36.0, 32.0, 33.0, 39.0, 40.0, 25.0, 40.0, 55.0, 44.0, 42.0, 52.0, 45.0, 35.0, 30.0, 30.0, 32.0, 23.0, 29.0, 24.0, 15.0, 14.0, 15.0, 4.0, 10.0, 10.0, 4.0, 6.0, 2.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2958984375, -0.28714752197265625, -0.2783966064453125, -0.26964569091796875, -0.260894775390625, -0.25214385986328125, -0.2433929443359375, -0.23464202880859375, -0.22589111328125, -0.21714019775390625, -0.2083892822265625, -0.19963836669921875, -0.190887451171875, -0.18213653564453125, -0.1733856201171875, -0.16463470458984375, -0.1558837890625, -0.14713287353515625, -0.1383819580078125, -0.12963104248046875, -0.120880126953125, -0.11212921142578125, -0.1033782958984375, -0.09462738037109375, -0.08587646484375, -0.07712554931640625, -0.0683746337890625, -0.05962371826171875, -0.050872802734375, -0.04212188720703125, -0.0333709716796875, -0.02462005615234375, -0.015869140625, -0.00711822509765625, 0.0016326904296875, 0.01038360595703125, 0.019134521484375, 0.02788543701171875, 0.0366363525390625, 0.04538726806640625, 0.05413818359375, 0.06288909912109375, 0.0716400146484375, 0.08039093017578125, 0.089141845703125, 0.09789276123046875, 0.1066436767578125, 0.11539459228515625, 0.1241455078125, 0.13289642333984375, 0.1416473388671875, 0.15039825439453125, 0.159149169921875, 0.16790008544921875, 0.1766510009765625, 0.18540191650390625, 0.19415283203125, 0.20290374755859375, 0.2116546630859375, 0.22040557861328125, 0.229156494140625, 0.23790740966796875, 0.2466583251953125, 0.25540924072265625, 0.26416015625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 15.0, 12.0, 29.0, 38.0, 57.0, 109.0, 161.0, 305.0, 510.0, 869.0, 1671.0, 3116.0, 5958.0, 11731.0, 23691.0, 50187.0, 105027.0, 192436.0, 248800.0, 195280.0, 107635.0, 51300.0, 24393.0, 11939.0, 6090.0, 3222.0, 1717.0, 925.0, 522.0, 298.0, 206.0, 114.0, 71.0, 45.0, 30.0, 12.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09979248046875, -0.09672355651855469, -0.09365463256835938, -0.09058570861816406, -0.08751678466796875, -0.08444786071777344, -0.08137893676757812, -0.07831001281738281, -0.0752410888671875, -0.07217216491699219, -0.06910324096679688, -0.06603431701660156, -0.06296539306640625, -0.05989646911621094, -0.056827545166015625, -0.05375862121582031, -0.050689697265625, -0.04762077331542969, -0.044551849365234375, -0.04148292541503906, -0.03841400146484375, -0.03534507751464844, -0.032276153564453125, -0.029207229614257812, -0.0261383056640625, -0.023069381713867188, -0.020000457763671875, -0.016931533813476562, -0.01386260986328125, -0.010793685913085938, -0.007724761962890625, -0.0046558380126953125, -0.0015869140625, 0.0014820098876953125, 0.004550933837890625, 0.0076198577880859375, 0.01068878173828125, 0.013757705688476562, 0.016826629638671875, 0.019895553588867188, 0.0229644775390625, 0.026033401489257812, 0.029102325439453125, 0.03217124938964844, 0.03524017333984375, 0.03830909729003906, 0.041378021240234375, 0.04444694519042969, 0.047515869140625, 0.05058479309082031, 0.053653717041015625, 0.05672264099121094, 0.05979156494140625, 0.06286048889160156, 0.06592941284179688, 0.06899833679199219, 0.0720672607421875, 0.07513618469238281, 0.07820510864257812, 0.08127403259277344, 0.08434295654296875, 0.08741188049316406, 0.09048080444335938, 0.09354972839355469, 0.09661865234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 11.0, 2.0, 9.0, 12.0, 16.0, 16.0, 20.0, 37.0, 37.0, 49.0, 50.0, 66.0, 69.0, 87.0, 87.0, 70.0, 64.0, 63.0, 49.0, 32.0, 34.0, 32.0, 26.0, 13.0, 10.0, 7.0, 11.0, 3.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.17692756652832e-05, -3.0782073736190796e-05, -2.979487180709839e-05, -2.880766987800598e-05, -2.7820467948913574e-05, -2.6833266019821167e-05, -2.584606409072876e-05, -2.4858862161636353e-05, -2.3871660232543945e-05, -2.2884458303451538e-05, -2.189725637435913e-05, -2.0910054445266724e-05, -1.9922852516174316e-05, -1.893565058708191e-05, -1.7948448657989502e-05, -1.6961246728897095e-05, -1.5974044799804688e-05, -1.498684287071228e-05, -1.3999640941619873e-05, -1.3012439012527466e-05, -1.2025237083435059e-05, -1.1038035154342651e-05, -1.0050833225250244e-05, -9.063631296157837e-06, -8.07642936706543e-06, -7.0892274379730225e-06, -6.102025508880615e-06, -5.114823579788208e-06, -4.127621650695801e-06, -3.1404197216033936e-06, -2.1532177925109863e-06, -1.166015863418579e-06, -1.7881393432617188e-07, 8.083879947662354e-07, 1.7955899238586426e-06, 2.78279185295105e-06, 3.769993782043457e-06, 4.757195711135864e-06, 5.7443976402282715e-06, 6.731599569320679e-06, 7.718801498413086e-06, 8.706003427505493e-06, 9.6932053565979e-06, 1.0680407285690308e-05, 1.1667609214782715e-05, 1.2654811143875122e-05, 1.364201307296753e-05, 1.4629215002059937e-05, 1.5616416931152344e-05, 1.660361886024475e-05, 1.7590820789337158e-05, 1.8578022718429565e-05, 1.9565224647521973e-05, 2.055242657661438e-05, 2.1539628505706787e-05, 2.2526830434799194e-05, 2.35140323638916e-05, 2.450123429298401e-05, 2.5488436222076416e-05, 2.6475638151168823e-05, 2.746284008026123e-05, 2.8450042009353638e-05, 2.9437243938446045e-05, 3.0424445867538452e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 12.0, 15.0, 14.0, 24.0, 32.0, 66.0, 97.0, 158.0, 237.0, 382.0, 732.0, 1250.0, 2413.0, 4740.0, 10606.0, 28131.0, 83558.0, 228165.0, 350553.0, 214649.0, 77145.0, 25787.0, 10041.0, 4559.0, 2194.0, 1277.0, 676.0, 370.0, 253.0, 130.0, 87.0, 57.0, 42.0, 32.0, 23.0, 13.0, 13.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11920166015625, -0.11528873443603516, -0.11137580871582031, -0.10746288299560547, -0.10354995727539062, -0.09963703155517578, -0.09572410583496094, -0.0918111801147461, -0.08789825439453125, -0.0839853286743164, -0.08007240295410156, -0.07615947723388672, -0.07224655151367188, -0.06833362579345703, -0.06442070007324219, -0.060507774353027344, -0.0565948486328125, -0.052681922912597656, -0.04876899719238281, -0.04485607147216797, -0.040943145751953125, -0.03703022003173828, -0.03311729431152344, -0.029204368591308594, -0.02529144287109375, -0.021378517150878906, -0.017465591430664062, -0.013552665710449219, -0.009639739990234375, -0.005726814270019531, -0.0018138885498046875, 0.0020990371704101562, 0.006011962890625, 0.009924888610839844, 0.013837814331054688, 0.01775074005126953, 0.021663665771484375, 0.02557659149169922, 0.029489517211914062, 0.033402442932128906, 0.03731536865234375, 0.041228294372558594, 0.04514122009277344, 0.04905414581298828, 0.052967071533203125, 0.05687999725341797, 0.06079292297363281, 0.06470584869384766, 0.0686187744140625, 0.07253170013427734, 0.07644462585449219, 0.08035755157470703, 0.08427047729492188, 0.08818340301513672, 0.09209632873535156, 0.0960092544555664, 0.09992218017578125, 0.1038351058959961, 0.10774803161621094, 0.11166095733642578, 0.11557388305664062, 0.11948680877685547, 0.12339973449707031, 0.12731266021728516, 0.1312255859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 9.0, 13.0, 11.0, 22.0, 22.0, 31.0, 32.0, 42.0, 56.0, 70.0, 85.0, 69.0, 84.0, 80.0, 61.0, 59.0, 53.0, 36.0, 32.0, 31.0, 17.0, 18.0, 14.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09039306640625, -0.08748340606689453, -0.08457374572753906, -0.0816640853881836, -0.07875442504882812, -0.07584476470947266, -0.07293510437011719, -0.07002544403076172, -0.06711578369140625, -0.06420612335205078, -0.06129646301269531, -0.058386802673339844, -0.055477142333984375, -0.052567481994628906, -0.04965782165527344, -0.04674816131591797, -0.0438385009765625, -0.04092884063720703, -0.03801918029785156, -0.035109519958496094, -0.032199859619140625, -0.029290199279785156, -0.026380538940429688, -0.02347087860107422, -0.02056121826171875, -0.01765155792236328, -0.014741897583007812, -0.011832237243652344, -0.008922576904296875, -0.006012916564941406, -0.0031032562255859375, -0.00019359588623046875, 0.002716064453125, 0.005625724792480469, 0.008535385131835938, 0.011445045471191406, 0.014354705810546875, 0.017264366149902344, 0.020174026489257812, 0.02308368682861328, 0.02599334716796875, 0.02890300750732422, 0.03181266784667969, 0.034722328186035156, 0.037631988525390625, 0.040541648864746094, 0.04345130920410156, 0.04636096954345703, 0.0492706298828125, 0.05218029022216797, 0.05508995056152344, 0.057999610900878906, 0.060909271240234375, 0.06381893157958984, 0.06672859191894531, 0.06963825225830078, 0.07254791259765625, 0.07545757293701172, 0.07836723327636719, 0.08127689361572266, 0.08418655395507812, 0.0870962142944336, 0.09000587463378906, 0.09291553497314453, 0.0958251953125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 12.0, 18.0, 19.0, 31.0, 46.0, 59.0, 85.0, 113.0, 116.0, 116.0, 101.0, 95.0, 59.0, 56.0, 28.0, 19.0, 8.0, 8.0, 9.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1217647790908813, -1.0725327730178833, -1.0233006477355957, -0.9740686416625977, -0.9248365759849548, -0.875604510307312, -0.826372504234314, -0.7771404385566711, -0.7279083728790283, -0.6786763072013855, -0.6294442415237427, -0.5802122354507446, -0.5309801697731018, -0.481748104095459, -0.43251606822013855, -0.3832840323448181, -0.3340519666671753, -0.28481990098953247, -0.23558786511421204, -0.1863558143377304, -0.13712376356124878, -0.08789171278476715, -0.03865966200828552, 0.010572373867034912, 0.059804439544677734, 0.10903649032115936, 0.158268541097641, 0.20750059187412262, 0.25673264265060425, 0.30596470832824707, 0.3551967442035675, 0.40442878007888794, 0.4536607265472412, 0.502892792224884, 0.5521248579025269, 0.6013568639755249, 0.6505889296531677, 0.6998209953308105, 0.7490530014038086, 0.7982850670814514, 0.8475171327590942, 0.8967491984367371, 0.9459812641143799, 0.9952132701873779, 1.044445276260376, 1.0936774015426636, 1.1429094076156616, 1.1921415328979492, 1.2413735389709473, 1.2906055450439453, 1.339837670326233, 1.389069676399231, 1.4383018016815186, 1.4875338077545166, 1.5367658138275146, 1.5859978199005127, 1.6352299451828003, 1.6844619512557983, 1.733694076538086, 1.782926082611084, 1.832158088684082, 1.8813902139663696, 1.9306222200393677, 1.9798543453216553, 2.0290863513946533]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 9.0, 8.0, 6.0, 15.0, 23.0, 12.0, 23.0, 23.0, 37.0, 27.0, 27.0, 40.0, 38.0, 47.0, 47.0, 46.0, 55.0, 51.0, 46.0, 41.0, 38.0, 47.0, 43.0, 36.0, 26.0, 29.0, 23.0, 32.0, 24.0, 18.0, 16.0, 13.0, 13.0, 1.0, 4.0, 3.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.1989262104034424, -1.166624903678894, -1.1343235969543457, -1.102022409439087, -1.0697211027145386, -1.0374197959899902, -1.0051186084747314, -0.9728173017501831, -0.9405159950256348, -0.9082146883010864, -0.8759134411811829, -0.8436121940612793, -0.811310887336731, -0.7790095806121826, -0.746708333492279, -0.7144070863723755, -0.6821057796478271, -0.6498044729232788, -0.6175032258033752, -0.5852019786834717, -0.5529006719589233, -0.520599365234375, -0.48829811811447144, -0.4559968411922455, -0.42369556427001953, -0.3913942873477936, -0.3590930104255676, -0.3267917335033417, -0.2944904565811157, -0.26218917965888977, -0.22988790273666382, -0.19758662581443787, -0.16528522968292236, -0.1329839527606964, -0.10068267583847046, -0.0683813989162445, -0.036080121994018555, -0.0037788450717926025, 0.02852243185043335, 0.0608237087726593, 0.09312498569488525, 0.1254262626171112, 0.15772753953933716, 0.1900288164615631, 0.22233009338378906, 0.254631370306015, 0.28693264722824097, 0.3192339241504669, 0.35153520107269287, 0.3838364779949188, 0.4161377549171448, 0.4484390318393707, 0.4807403087615967, 0.513041615486145, 0.5453428626060486, 0.5776441097259521, 0.6099454164505005, 0.6422467231750488, 0.6745479702949524, 0.706849217414856, 0.7391505241394043, 0.7714518308639526, 0.8037530779838562, 0.8360543251037598, 0.8683556318283081]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 8.0, 4.0, 7.0, 9.0, 16.0, 22.0, 23.0, 46.0, 57.0, 94.0, 133.0, 198.0, 295.0, 439.0, 756.0, 1152.0, 1984.0, 3547.0, 6527.0, 13102.0, 27169.0, 62468.0, 170870.0, 574417.0, 1488432.0, 1223699.0, 395118.0, 127072.0, 49615.0, 22674.0, 11126.0, 5780.0, 3086.0, 1754.0, 976.0, 609.0, 356.0, 242.0, 153.0, 98.0, 53.0, 36.0, 24.0, 15.0, 9.0, 3.0, 6.0, 5.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.1669921875, -0.16205978393554688, -0.15712738037109375, -0.15219497680664062, -0.1472625732421875, -0.14233016967773438, -0.13739776611328125, -0.13246536254882812, -0.127532958984375, -0.12260055541992188, -0.11766815185546875, -0.11273574829101562, -0.1078033447265625, -0.10287094116210938, -0.09793853759765625, -0.09300613403320312, -0.08807373046875, -0.08314132690429688, -0.07820892333984375, -0.07327651977539062, -0.0683441162109375, -0.06341171264648438, -0.05847930908203125, -0.053546905517578125, -0.048614501953125, -0.043682098388671875, -0.03874969482421875, -0.033817291259765625, -0.0288848876953125, -0.023952484130859375, -0.01902008056640625, -0.014087677001953125, -0.0091552734375, -0.004222869873046875, 0.00070953369140625, 0.005641937255859375, 0.0105743408203125, 0.015506744384765625, 0.02043914794921875, 0.025371551513671875, 0.030303955078125, 0.035236358642578125, 0.04016876220703125, 0.045101165771484375, 0.0500335693359375, 0.054965972900390625, 0.05989837646484375, 0.06483078002929688, 0.06976318359375, 0.07469558715820312, 0.07962799072265625, 0.08456039428710938, 0.0894927978515625, 0.09442520141601562, 0.09935760498046875, 0.10429000854492188, 0.109222412109375, 0.11415481567382812, 0.11908721923828125, 0.12401962280273438, 0.1289520263671875, 0.13388442993164062, 0.13881683349609375, 0.14374923706054688, 0.148681640625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 6.0, 2.0, 5.0, 9.0, 10.0, 14.0, 13.0, 13.0, 18.0, 25.0, 26.0, 27.0, 42.0, 37.0, 32.0, 40.0, 41.0, 44.0, 37.0, 51.0, 39.0, 44.0, 40.0, 42.0, 38.0, 32.0, 39.0, 36.0, 32.0, 17.0, 27.0, 16.0, 15.0, 23.0, 12.0, 14.0, 9.0, 12.0, 4.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1258544921875, -0.12205219268798828, -0.11824989318847656, -0.11444759368896484, -0.11064529418945312, -0.1068429946899414, -0.10304069519042969, -0.09923839569091797, -0.09543609619140625, -0.09163379669189453, -0.08783149719238281, -0.0840291976928711, -0.08022689819335938, -0.07642459869384766, -0.07262229919433594, -0.06881999969482422, -0.0650177001953125, -0.06121540069580078, -0.05741310119628906, -0.053610801696777344, -0.049808502197265625, -0.046006202697753906, -0.04220390319824219, -0.03840160369873047, -0.03459930419921875, -0.03079700469970703, -0.026994705200195312, -0.023192405700683594, -0.019390106201171875, -0.015587806701660156, -0.011785507202148438, -0.007983207702636719, -0.004180908203125, -0.00037860870361328125, 0.0034236907958984375, 0.007225990295410156, 0.011028289794921875, 0.014830589294433594, 0.018632888793945312, 0.02243518829345703, 0.02623748779296875, 0.03003978729248047, 0.03384208679199219, 0.037644386291503906, 0.041446685791015625, 0.045248985290527344, 0.04905128479003906, 0.05285358428955078, 0.0566558837890625, 0.06045818328857422, 0.06426048278808594, 0.06806278228759766, 0.07186508178710938, 0.0756673812866211, 0.07946968078613281, 0.08327198028564453, 0.08707427978515625, 0.09087657928466797, 0.09467887878417969, 0.0984811782836914, 0.10228347778320312, 0.10608577728271484, 0.10988807678222656, 0.11369037628173828, 0.11749267578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 16.0, 11.0, 29.0, 36.0, 53.0, 87.0, 139.0, 248.0, 488.0, 900.0, 1858.0, 3793.0, 8889.0, 21211.0, 56031.0, 159324.0, 483393.0, 1481617.0, 1333008.0, 420411.0, 139335.0, 49470.0, 18872.0, 7896.0, 3555.0, 1738.0, 809.0, 455.0, 241.0, 142.0, 83.0, 49.0, 32.0, 17.0, 16.0, 9.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.22216796875, -0.2159862518310547, -0.20980453491210938, -0.20362281799316406, -0.19744110107421875, -0.19125938415527344, -0.18507766723632812, -0.1788959503173828, -0.1727142333984375, -0.1665325164794922, -0.16035079956054688, -0.15416908264160156, -0.14798736572265625, -0.14180564880371094, -0.13562393188476562, -0.1294422149658203, -0.123260498046875, -0.11707878112792969, -0.11089706420898438, -0.10471534729003906, -0.09853363037109375, -0.09235191345214844, -0.08617019653320312, -0.07998847961425781, -0.0738067626953125, -0.06762504577636719, -0.061443328857421875, -0.05526161193847656, -0.04907989501953125, -0.04289817810058594, -0.036716461181640625, -0.030534744262695312, -0.02435302734375, -0.018171310424804688, -0.011989593505859375, -0.0058078765869140625, 0.00037384033203125, 0.0065555572509765625, 0.012737274169921875, 0.018918991088867188, 0.0251007080078125, 0.03128242492675781, 0.037464141845703125, 0.04364585876464844, 0.04982757568359375, 0.05600929260253906, 0.062191009521484375, 0.06837272644042969, 0.074554443359375, 0.08073616027832031, 0.08691787719726562, 0.09309959411621094, 0.09928131103515625, 0.10546302795410156, 0.11164474487304688, 0.11782646179199219, 0.1240081787109375, 0.1301898956298828, 0.13637161254882812, 0.14255332946777344, 0.14873504638671875, 0.15491676330566406, 0.16109848022460938, 0.1672801971435547, 0.1734619140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 11.0, 6.0, 11.0, 13.0, 9.0, 19.0, 31.0, 23.0, 45.0, 49.0, 61.0, 93.0, 112.0, 129.0, 162.0, 231.0, 276.0, 400.0, 399.0, 404.0, 350.0, 276.0, 198.0, 174.0, 124.0, 101.0, 90.0, 61.0, 51.0, 21.0, 30.0, 23.0, 15.0, 17.0, 14.0, 6.0, 9.0, 8.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.199951171875, -0.19408416748046875, -0.1882171630859375, -0.18235015869140625, -0.176483154296875, -0.17061614990234375, -0.1647491455078125, -0.15888214111328125, -0.15301513671875, -0.14714813232421875, -0.1412811279296875, -0.13541412353515625, -0.129547119140625, -0.12368011474609375, -0.1178131103515625, -0.11194610595703125, -0.1060791015625, -0.10021209716796875, -0.0943450927734375, -0.08847808837890625, -0.082611083984375, -0.07674407958984375, -0.0708770751953125, -0.06501007080078125, -0.05914306640625, -0.05327606201171875, -0.0474090576171875, -0.04154205322265625, -0.035675048828125, -0.02980804443359375, -0.0239410400390625, -0.01807403564453125, -0.01220703125, -0.00634002685546875, -0.0004730224609375, 0.00539398193359375, 0.011260986328125, 0.01712799072265625, 0.0229949951171875, 0.02886199951171875, 0.03472900390625, 0.04059600830078125, 0.0464630126953125, 0.05233001708984375, 0.058197021484375, 0.06406402587890625, 0.0699310302734375, 0.07579803466796875, 0.0816650390625, 0.08753204345703125, 0.0933990478515625, 0.09926605224609375, 0.105133056640625, 0.11100006103515625, 0.1168670654296875, 0.12273406982421875, 0.12860107421875, 0.13446807861328125, 0.1403350830078125, 0.14620208740234375, 0.152069091796875, 0.15793609619140625, 0.1638031005859375, 0.16967010498046875, 0.175537109375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 8.0, 22.0, 26.0, 35.0, 49.0, 61.0, 76.0, 75.0, 115.0, 111.0, 95.0, 74.0, 63.0, 45.0, 45.0, 34.0, 14.0, 15.0, 9.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4031206369400024, -1.3667858839035034, -1.330451250076294, -1.294116497039795, -1.2577818632125854, -1.2214471101760864, -1.185112476348877, -1.148777723312378, -1.112442970275879, -1.0761082172393799, -1.0397735834121704, -1.0034388303756714, -0.9671041965484619, -0.9307694435119629, -0.8944347500801086, -0.8581000566482544, -0.8217654228210449, -0.7854307293891907, -0.7490960359573364, -0.7127613425254822, -0.6764266490936279, -0.6400918960571289, -0.6037572026252747, -0.5674225091934204, -0.5310878157615662, -0.4947531223297119, -0.45841842889785767, -0.42208370566368103, -0.3857490122318268, -0.34941431879997253, -0.3130795955657959, -0.27674490213394165, -0.2404102087020874, -0.20407551527023315, -0.1677408069372177, -0.13140609860420227, -0.09507140517234802, -0.058736711740493774, -0.022402003407478333, 0.01393270492553711, 0.05026739835739136, 0.0866020992398262, 0.12293680012226105, 0.1592715084552765, 0.19560620188713074, 0.23194089531898499, 0.2682756185531616, 0.30461031198501587, 0.3409450054168701, 0.37727969884872437, 0.4136143922805786, 0.44994911551475525, 0.4862838089466095, 0.5226185321807861, 0.5589532256126404, 0.5952879190444946, 0.6316226124763489, 0.6679573059082031, 0.7042919993400574, 0.7406266927719116, 0.7769614458084106, 0.8132960796356201, 0.8496308326721191, 0.8859655261039734, 0.9223002195358276]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 3.0, 4.0, 7.0, 10.0, 10.0, 9.0, 10.0, 8.0, 14.0, 19.0, 17.0, 15.0, 30.0, 22.0, 38.0, 30.0, 27.0, 35.0, 26.0, 39.0, 35.0, 53.0, 45.0, 40.0, 40.0, 45.0, 24.0, 42.0, 37.0, 23.0, 30.0, 26.0, 17.0, 29.0, 21.0, 18.0, 16.0, 14.0, 12.0, 11.0, 7.0, 9.0, 10.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.6756497621536255, -0.6547505855560303, -0.6338513493537903, -0.6129521727561951, -0.5920529365539551, -0.5711537599563599, -0.5502545833587646, -0.5293553471565247, -0.5084561109542847, -0.48755690455436707, -0.46665769815444946, -0.44575852155685425, -0.42485928535461426, -0.40396010875701904, -0.38306090235710144, -0.36216169595718384, -0.3412625193595886, -0.320363312959671, -0.2994641065597534, -0.2785649299621582, -0.2576656937599182, -0.2367665022611618, -0.2158673107624054, -0.1949681043624878, -0.1740688979625702, -0.1531696915626526, -0.13227048516273499, -0.11137129366397858, -0.09047208726406097, -0.06957288086414337, -0.04867368936538696, -0.02777448296546936, -0.006875216960906982, 0.014023985713720322, 0.034923188388347626, 0.05582238733768463, 0.07672159373760223, 0.09762080013751984, 0.11851999163627625, 0.13941919803619385, 0.16031840443611145, 0.18121761083602905, 0.20211681723594666, 0.22301600873470306, 0.24391521513462067, 0.26481443643569946, 0.2857136130332947, 0.3066128194332123, 0.3275120258331299, 0.3484112322330475, 0.3693104386329651, 0.3902096152305603, 0.4111088514328003, 0.4320080280303955, 0.4529072344303131, 0.4738064408302307, 0.4947056472301483, 0.5156048536300659, 0.5365040302276611, 0.5574032664299011, 0.5783024430274963, 0.5992016792297363, 0.6201008558273315, 0.6410000324249268, 0.6618992686271667]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 6.0, 10.0, 17.0, 9.0, 20.0, 43.0, 46.0, 64.0, 112.0, 157.0, 233.0, 382.0, 605.0, 1075.0, 1659.0, 3090.0, 5297.0, 9340.0, 16183.0, 28120.0, 47789.0, 82249.0, 137493.0, 200356.0, 196614.0, 131657.0, 77457.0, 45329.0, 26534.0, 15529.0, 8808.0, 5208.0, 2855.0, 1661.0, 977.0, 569.0, 349.0, 220.0, 139.0, 75.0, 64.0, 39.0, 22.0, 23.0, 18.0, 21.0, 4.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.2235107421875, -0.21628952026367188, -0.20906829833984375, -0.20184707641601562, -0.1946258544921875, -0.18740463256835938, -0.18018341064453125, -0.17296218872070312, -0.165740966796875, -0.15851974487304688, -0.15129852294921875, -0.14407730102539062, -0.1368560791015625, -0.12963485717773438, -0.12241363525390625, -0.11519241333007812, -0.10797119140625, -0.10074996948242188, -0.09352874755859375, -0.08630752563476562, -0.0790863037109375, -0.07186508178710938, -0.06464385986328125, -0.057422637939453125, -0.050201416015625, -0.042980194091796875, -0.03575897216796875, -0.028537750244140625, -0.0213165283203125, -0.014095306396484375, -0.00687408447265625, 0.000347137451171875, 0.007568359375, 0.014789581298828125, 0.02201080322265625, 0.029232025146484375, 0.0364532470703125, 0.043674468994140625, 0.05089569091796875, 0.058116912841796875, 0.065338134765625, 0.07255935668945312, 0.07978057861328125, 0.08700180053710938, 0.0942230224609375, 0.10144424438476562, 0.10866546630859375, 0.11588668823242188, 0.12310791015625, 0.13032913208007812, 0.13755035400390625, 0.14477157592773438, 0.1519927978515625, 0.15921401977539062, 0.16643524169921875, 0.17365646362304688, 0.180877685546875, 0.18809890747070312, 0.19532012939453125, 0.20254135131835938, 0.2097625732421875, 0.21698379516601562, 0.22420501708984375, 0.23142623901367188, 0.2386474609375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 11.0, 5.0, 11.0, 5.0, 8.0, 22.0, 11.0, 13.0, 19.0, 30.0, 22.0, 27.0, 29.0, 35.0, 37.0, 37.0, 47.0, 38.0, 56.0, 46.0, 48.0, 38.0, 44.0, 43.0, 41.0, 32.0, 26.0, 29.0, 31.0, 26.0, 27.0, 15.0, 15.0, 19.0, 16.0, 9.0, 9.0, 9.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.124267578125, -0.12069225311279297, -0.11711692810058594, -0.1135416030883789, -0.10996627807617188, -0.10639095306396484, -0.10281562805175781, -0.09924030303955078, -0.09566497802734375, -0.09208965301513672, -0.08851432800292969, -0.08493900299072266, -0.08136367797851562, -0.0777883529663086, -0.07421302795410156, -0.07063770294189453, -0.0670623779296875, -0.06348705291748047, -0.05991172790527344, -0.056336402893066406, -0.052761077880859375, -0.049185752868652344, -0.04561042785644531, -0.04203510284423828, -0.03845977783203125, -0.03488445281982422, -0.03130912780761719, -0.027733802795410156, -0.024158477783203125, -0.020583152770996094, -0.017007827758789062, -0.013432502746582031, -0.009857177734375, -0.006281852722167969, -0.0027065277099609375, 0.0008687973022460938, 0.004444122314453125, 0.008019447326660156, 0.011594772338867188, 0.015170097351074219, 0.01874542236328125, 0.02232074737548828, 0.025896072387695312, 0.029471397399902344, 0.033046722412109375, 0.036622047424316406, 0.04019737243652344, 0.04377269744873047, 0.0473480224609375, 0.05092334747314453, 0.05449867248535156, 0.058073997497558594, 0.061649322509765625, 0.06522464752197266, 0.06879997253417969, 0.07237529754638672, 0.07595062255859375, 0.07952594757080078, 0.08310127258300781, 0.08667659759521484, 0.09025192260742188, 0.0938272476196289, 0.09740257263183594, 0.10097789764404297, 0.10455322265625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 4.0, 9.0, 10.0, 19.0, 35.0, 50.0, 82.0, 105.0, 177.0, 310.0, 700.0, 1718.0, 5153.0, 16969.0, 56681.0, 168839.0, 356665.0, 282997.0, 107798.0, 34140.0, 10468.0, 3244.0, 1170.0, 504.0, 276.0, 159.0, 104.0, 57.0, 43.0, 26.0, 12.0, 12.0, 5.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39599609375, -0.38391876220703125, -0.3718414306640625, -0.35976409912109375, -0.347686767578125, -0.33560943603515625, -0.3235321044921875, -0.31145477294921875, -0.29937744140625, -0.28730010986328125, -0.2752227783203125, -0.26314544677734375, -0.251068115234375, -0.23899078369140625, -0.2269134521484375, -0.21483612060546875, -0.2027587890625, -0.19068145751953125, -0.1786041259765625, -0.16652679443359375, -0.154449462890625, -0.14237213134765625, -0.1302947998046875, -0.11821746826171875, -0.10614013671875, -0.09406280517578125, -0.0819854736328125, -0.06990814208984375, -0.057830810546875, -0.04575347900390625, -0.0336761474609375, -0.02159881591796875, -0.009521484375, 0.00255584716796875, 0.0146331787109375, 0.02671051025390625, 0.038787841796875, 0.05086517333984375, 0.0629425048828125, 0.07501983642578125, 0.08709716796875, 0.09917449951171875, 0.1112518310546875, 0.12332916259765625, 0.135406494140625, 0.14748382568359375, 0.1595611572265625, 0.17163848876953125, 0.1837158203125, 0.19579315185546875, 0.2078704833984375, 0.21994781494140625, 0.232025146484375, 0.24410247802734375, 0.2561798095703125, 0.26825714111328125, 0.28033447265625, 0.29241180419921875, 0.3044891357421875, 0.31656646728515625, 0.328643798828125, 0.34072113037109375, 0.3527984619140625, 0.36487579345703125, 0.376953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 9.0, 6.0, 11.0, 13.0, 18.0, 16.0, 16.0, 22.0, 19.0, 36.0, 32.0, 30.0, 37.0, 34.0, 45.0, 56.0, 37.0, 52.0, 38.0, 44.0, 53.0, 52.0, 37.0, 42.0, 41.0, 41.0, 23.0, 20.0, 17.0, 22.0, 17.0, 11.0, 12.0, 13.0, 9.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280517578125, -0.27014923095703125, -0.2597808837890625, -0.24941253662109375, -0.239044189453125, -0.22867584228515625, -0.2183074951171875, -0.20793914794921875, -0.19757080078125, -0.18720245361328125, -0.1768341064453125, -0.16646575927734375, -0.156097412109375, -0.14572906494140625, -0.1353607177734375, -0.12499237060546875, -0.1146240234375, -0.10425567626953125, -0.0938873291015625, -0.08351898193359375, -0.073150634765625, -0.06278228759765625, -0.0524139404296875, -0.04204559326171875, -0.03167724609375, -0.02130889892578125, -0.0109405517578125, -0.00057220458984375, 0.009796142578125, 0.02016448974609375, 0.0305328369140625, 0.04090118408203125, 0.05126953125, 0.06163787841796875, 0.0720062255859375, 0.08237457275390625, 0.092742919921875, 0.10311126708984375, 0.1134796142578125, 0.12384796142578125, 0.13421630859375, 0.14458465576171875, 0.1549530029296875, 0.16532135009765625, 0.175689697265625, 0.18605804443359375, 0.1964263916015625, 0.20679473876953125, 0.2171630859375, 0.22753143310546875, 0.2378997802734375, 0.24826812744140625, 0.258636474609375, 0.26900482177734375, 0.2793731689453125, 0.28974151611328125, 0.30010986328125, 0.31047821044921875, 0.3208465576171875, 0.33121490478515625, 0.341583251953125, 0.35195159912109375, 0.3623199462890625, 0.37268829345703125, 0.383056640625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 5.0, 4.0, 4.0, 14.0, 27.0, 39.0, 68.0, 115.0, 216.0, 454.0, 815.0, 1660.0, 3428.0, 7411.0, 15822.0, 33211.0, 75328.0, 186174.0, 324384.0, 228208.0, 94229.0, 40803.0, 18978.0, 8971.0, 4160.0, 1896.0, 984.0, 523.0, 249.0, 144.0, 81.0, 59.0, 26.0, 22.0, 13.0, 10.0, 8.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.131591796875, -0.1277914047241211, -0.12399101257324219, -0.12019062042236328, -0.11639022827148438, -0.11258983612060547, -0.10878944396972656, -0.10498905181884766, -0.10118865966796875, -0.09738826751708984, -0.09358787536621094, -0.08978748321533203, -0.08598709106445312, -0.08218669891357422, -0.07838630676269531, -0.0745859146118164, -0.0707855224609375, -0.0669851303100586, -0.06318473815917969, -0.05938434600830078, -0.055583953857421875, -0.05178356170654297, -0.04798316955566406, -0.044182777404785156, -0.04038238525390625, -0.036581993103027344, -0.03278160095214844, -0.02898120880126953, -0.025180816650390625, -0.02138042449951172, -0.017580032348632812, -0.013779640197753906, -0.009979248046875, -0.006178855895996094, -0.0023784637451171875, 0.0014219284057617188, 0.005222320556640625, 0.009022712707519531, 0.012823104858398438, 0.016623497009277344, 0.02042388916015625, 0.024224281311035156, 0.028024673461914062, 0.03182506561279297, 0.035625457763671875, 0.03942584991455078, 0.04322624206542969, 0.047026634216308594, 0.0508270263671875, 0.054627418518066406, 0.05842781066894531, 0.06222820281982422, 0.06602859497070312, 0.06982898712158203, 0.07362937927246094, 0.07742977142333984, 0.08123016357421875, 0.08503055572509766, 0.08883094787597656, 0.09263134002685547, 0.09643173217773438, 0.10023212432861328, 0.10403251647949219, 0.1078329086303711, 0.11163330078125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 4.0, 3.0, 13.0, 12.0, 15.0, 15.0, 18.0, 17.0, 31.0, 42.0, 41.0, 60.0, 85.0, 108.0, 81.0, 92.0, 69.0, 53.0, 55.0, 28.0, 30.0, 31.0, 20.0, 22.0, 9.0, 10.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9385089874267578e-05, -2.838950604200363e-05, -2.7393922209739685e-05, -2.639833837747574e-05, -2.5402754545211792e-05, -2.4407170712947845e-05, -2.34115868806839e-05, -2.2416003048419952e-05, -2.1420419216156006e-05, -2.042483538389206e-05, -1.9429251551628113e-05, -1.8433667719364166e-05, -1.743808388710022e-05, -1.6442500054836273e-05, -1.5446916222572327e-05, -1.445133239030838e-05, -1.3455748558044434e-05, -1.2460164725780487e-05, -1.146458089351654e-05, -1.0468997061252594e-05, -9.473413228988647e-06, -8.477829396724701e-06, -7.482245564460754e-06, -6.486661732196808e-06, -5.491077899932861e-06, -4.495494067668915e-06, -3.4999102354049683e-06, -2.5043264031410217e-06, -1.5087425708770752e-06, -5.131587386131287e-07, 4.824250936508179e-07, 1.4780089259147644e-06, 2.473592758178711e-06, 3.4691765904426575e-06, 4.464760422706604e-06, 5.4603442549705505e-06, 6.455928087234497e-06, 7.451511919498444e-06, 8.44709575176239e-06, 9.442679584026337e-06, 1.0438263416290283e-05, 1.143384724855423e-05, 1.2429431080818176e-05, 1.3425014913082123e-05, 1.442059874534607e-05, 1.5416182577610016e-05, 1.6411766409873962e-05, 1.740735024213791e-05, 1.8402934074401855e-05, 1.9398517906665802e-05, 2.039410173892975e-05, 2.1389685571193695e-05, 2.238526940345764e-05, 2.3380853235721588e-05, 2.4376437067985535e-05, 2.537202090024948e-05, 2.6367604732513428e-05, 2.7363188564777374e-05, 2.835877239704132e-05, 2.9354356229305267e-05, 3.0349940061569214e-05, 3.134552389383316e-05, 3.234110772609711e-05, 3.3336691558361053e-05, 3.4332275390625e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 13.0, 8.0, 8.0, 24.0, 22.0, 31.0, 38.0, 55.0, 74.0, 112.0, 166.0, 244.0, 431.0, 841.0, 1546.0, 3588.0, 7715.0, 17941.0, 39491.0, 97033.0, 271888.0, 353975.0, 151329.0, 56211.0, 24692.0, 11246.0, 4940.0, 2241.0, 1103.0, 625.0, 332.0, 214.0, 118.0, 69.0, 48.0, 45.0, 26.0, 13.0, 10.0, 12.0, 14.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.12164306640625, -0.11786651611328125, -0.1140899658203125, -0.11031341552734375, -0.106536865234375, -0.10276031494140625, -0.0989837646484375, -0.09520721435546875, -0.0914306640625, -0.08765411376953125, -0.0838775634765625, -0.08010101318359375, -0.076324462890625, -0.07254791259765625, -0.0687713623046875, -0.06499481201171875, -0.06121826171875, -0.05744171142578125, -0.0536651611328125, -0.04988861083984375, -0.046112060546875, -0.04233551025390625, -0.0385589599609375, -0.03478240966796875, -0.031005859375, -0.02722930908203125, -0.0234527587890625, -0.01967620849609375, -0.015899658203125, -0.01212310791015625, -0.0083465576171875, -0.00457000732421875, -0.00079345703125, 0.00298309326171875, 0.0067596435546875, 0.01053619384765625, 0.014312744140625, 0.01808929443359375, 0.0218658447265625, 0.02564239501953125, 0.0294189453125, 0.03319549560546875, 0.0369720458984375, 0.04074859619140625, 0.044525146484375, 0.04830169677734375, 0.0520782470703125, 0.05585479736328125, 0.05963134765625, 0.06340789794921875, 0.0671844482421875, 0.07096099853515625, 0.074737548828125, 0.07851409912109375, 0.0822906494140625, 0.08606719970703125, 0.08984375, 0.09362030029296875, 0.0973968505859375, 0.10117340087890625, 0.104949951171875, 0.10872650146484375, 0.1125030517578125, 0.11627960205078125, 0.12005615234375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 4.0, 12.0, 9.0, 13.0, 22.0, 38.0, 59.0, 53.0, 86.0, 115.0, 103.0, 105.0, 80.0, 77.0, 66.0, 43.0, 27.0, 28.0, 11.0, 13.0, 3.0, 13.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135498046875, -0.130950927734375, -0.12640380859375, -0.121856689453125, -0.1173095703125, -0.112762451171875, -0.10821533203125, -0.103668212890625, -0.09912109375, -0.094573974609375, -0.09002685546875, -0.085479736328125, -0.0809326171875, -0.076385498046875, -0.07183837890625, -0.067291259765625, -0.062744140625, -0.058197021484375, -0.05364990234375, -0.049102783203125, -0.0445556640625, -0.040008544921875, -0.03546142578125, -0.030914306640625, -0.0263671875, -0.021820068359375, -0.01727294921875, -0.012725830078125, -0.0081787109375, -0.003631591796875, 0.00091552734375, 0.005462646484375, 0.010009765625, 0.014556884765625, 0.01910400390625, 0.023651123046875, 0.0281982421875, 0.032745361328125, 0.03729248046875, 0.041839599609375, 0.04638671875, 0.050933837890625, 0.05548095703125, 0.060028076171875, 0.0645751953125, 0.069122314453125, 0.07366943359375, 0.078216552734375, 0.082763671875, 0.087310791015625, 0.09185791015625, 0.096405029296875, 0.1009521484375, 0.105499267578125, 0.11004638671875, 0.114593505859375, 0.119140625, 0.123687744140625, 0.12823486328125, 0.132781982421875, 0.1373291015625, 0.141876220703125, 0.14642333984375, 0.150970458984375, 0.155517578125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 14.0, 40.0, 85.0, 150.0, 216.0, 202.0, 154.0, 78.0, 40.0, 16.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9534810781478882, -1.8747016191482544, -1.7959221601486206, -1.7171427011489868, -1.6383633613586426, -1.5595839023590088, -1.480804443359375, -1.4020249843597412, -1.3232455253601074, -1.2444660663604736, -1.1656866073608398, -1.086907148361206, -1.0081276893615723, -0.9293482899665833, -0.8505688905715942, -0.7717894315719604, -0.6930099725723267, -0.6142305135726929, -0.5354510545730591, -0.45667165517807007, -0.3778921961784363, -0.2991127371788025, -0.2203333079814911, -0.1415538787841797, -0.0627744197845459, 0.016005024313926697, 0.09478446841239929, 0.1735639125108719, 0.2523433566093445, 0.33112281560897827, 0.4099022448062897, 0.4886816740036011, 0.5674610137939453, 0.6462404727935791, 0.7250199317932129, 0.8037993311882019, 0.8825787901878357, 0.9613582491874695, 1.0401376485824585, 1.1189171075820923, 1.197696566581726, 1.2764760255813599, 1.3552554845809937, 1.4340349435806274, 1.5128142833709717, 1.5915937423706055, 1.6703732013702393, 1.749152660369873, 1.8279321193695068, 1.9067115783691406, 1.9854910373687744, 2.064270496368408, 2.143049955368042, 2.221829414367676, 2.3006088733673096, 2.3793883323669434, 2.458167552947998, 2.536947011947632, 2.6157264709472656, 2.6945059299468994, 2.773285388946533, 2.852064847946167, 2.930844306945801, 3.0096235275268555, 3.0884032249450684]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 2.0, 5.0, 11.0, 16.0, 10.0, 12.0, 21.0, 24.0, 29.0, 36.0, 42.0, 38.0, 38.0, 40.0, 38.0, 31.0, 46.0, 34.0, 42.0, 42.0, 34.0, 44.0, 42.0, 39.0, 37.0, 23.0, 36.0, 30.0, 27.0, 24.0, 18.0, 13.0, 19.0, 11.0, 9.0, 10.0, 5.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9091084599494934, -0.8811596035957336, -0.8532107472419739, -0.8252619504928589, -0.7973130941390991, -0.7693642377853394, -0.7414153814315796, -0.7134665250778198, -0.6855176687240601, -0.6575688123703003, -0.6296199560165405, -0.6016710996627808, -0.5737223029136658, -0.545773446559906, -0.5178245902061462, -0.4898757338523865, -0.4619269371032715, -0.4339780807495117, -0.40602925419807434, -0.3780803978443146, -0.3501315712928772, -0.32218271493911743, -0.29423385858535767, -0.2662850022315979, -0.23833617568016052, -0.21038733422756195, -0.18243849277496338, -0.1544896364212036, -0.12654079496860504, -0.09859195351600647, -0.0706430971622467, -0.04269425570964813, -0.014745473861694336, 0.013203371316194534, 0.041152216494083405, 0.06910106539726257, 0.09704990684986115, 0.12499874830245972, 0.15294760465621948, 0.18089644610881805, 0.20884528756141663, 0.2367941290140152, 0.26474297046661377, 0.29269182682037354, 0.3206406831741333, 0.3485895097255707, 0.37653836607933044, 0.4044871926307678, 0.4324360489845276, 0.46038490533828735, 0.48833373188972473, 0.5162825584411621, 0.5442314147949219, 0.5721802711486816, 0.6001291275024414, 0.6280779838562012, 0.6560268402099609, 0.6839756965637207, 0.7119245529174805, 0.7398734092712402, 0.7678222060203552, 0.795771062374115, 0.8237199187278748, 0.8516687750816345, 0.8796175718307495]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 14.0, 18.0, 24.0, 35.0, 52.0, 67.0, 116.0, 198.0, 302.0, 542.0, 1095.0, 2104.0, 4443.0, 9853.0, 23771.0, 64329.0, 204638.0, 838113.0, 1980389.0, 769270.0, 191383.0, 62000.0, 23449.0, 9524.0, 4301.0, 2011.0, 996.0, 562.0, 286.0, 155.0, 94.0, 50.0, 36.0, 17.0, 10.0, 5.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.25146484375, -0.24492835998535156, -0.23839187622070312, -0.2318553924560547, -0.22531890869140625, -0.2187824249267578, -0.21224594116210938, -0.20570945739746094, -0.1991729736328125, -0.19263648986816406, -0.18610000610351562, -0.1795635223388672, -0.17302703857421875, -0.1664905548095703, -0.15995407104492188, -0.15341758728027344, -0.146881103515625, -0.14034461975097656, -0.13380813598632812, -0.1272716522216797, -0.12073516845703125, -0.11419868469238281, -0.10766220092773438, -0.10112571716308594, -0.0945892333984375, -0.08805274963378906, -0.08151626586914062, -0.07497978210449219, -0.06844329833984375, -0.06190681457519531, -0.055370330810546875, -0.04883384704589844, -0.04229736328125, -0.03576087951660156, -0.029224395751953125, -0.022687911987304688, -0.01615142822265625, -0.009614944458007812, -0.003078460693359375, 0.0034580230712890625, 0.0099945068359375, 0.016530990600585938, 0.023067474365234375, 0.029603958129882812, 0.03614044189453125, 0.04267692565917969, 0.049213409423828125, 0.05574989318847656, 0.062286376953125, 0.06882286071777344, 0.07535934448242188, 0.08189582824707031, 0.08843231201171875, 0.09496879577636719, 0.10150527954101562, 0.10804176330566406, 0.1145782470703125, 0.12111473083496094, 0.12765121459960938, 0.1341876983642578, 0.14072418212890625, 0.1472606658935547, 0.15379714965820312, 0.16033363342285156, 0.1668701171875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 7.0, 7.0, 7.0, 11.0, 16.0, 19.0, 20.0, 23.0, 16.0, 21.0, 30.0, 28.0, 35.0, 30.0, 41.0, 38.0, 43.0, 43.0, 37.0, 41.0, 45.0, 45.0, 55.0, 38.0, 33.0, 41.0, 27.0, 23.0, 25.0, 24.0, 25.0, 13.0, 24.0, 9.0, 3.0, 8.0, 8.0, 8.0, 6.0, 4.0, 9.0, 1.0, 7.0, 2.0, 4.0, 1.0], "bins": [-0.1402587890625, -0.13648509979248047, -0.13271141052246094, -0.1289377212524414, -0.12516403198242188, -0.12139034271240234, -0.11761665344238281, -0.11384296417236328, -0.11006927490234375, -0.10629558563232422, -0.10252189636230469, -0.09874820709228516, -0.09497451782226562, -0.0912008285522461, -0.08742713928222656, -0.08365345001220703, -0.0798797607421875, -0.07610607147216797, -0.07233238220214844, -0.0685586929321289, -0.06478500366210938, -0.061011314392089844, -0.05723762512207031, -0.05346393585205078, -0.04969024658203125, -0.04591655731201172, -0.04214286804199219, -0.038369178771972656, -0.034595489501953125, -0.030821800231933594, -0.027048110961914062, -0.02327442169189453, -0.019500732421875, -0.01572704315185547, -0.011953353881835938, -0.008179664611816406, -0.004405975341796875, -0.0006322860717773438, 0.0031414031982421875, 0.006915092468261719, 0.01068878173828125, 0.014462471008300781, 0.018236160278320312, 0.022009849548339844, 0.025783538818359375, 0.029557228088378906, 0.03333091735839844, 0.03710460662841797, 0.0408782958984375, 0.04465198516845703, 0.04842567443847656, 0.052199363708496094, 0.055973052978515625, 0.059746742248535156, 0.06352043151855469, 0.06729412078857422, 0.07106781005859375, 0.07484149932861328, 0.07861518859863281, 0.08238887786865234, 0.08616256713867188, 0.0899362564086914, 0.09370994567871094, 0.09748363494873047, 0.10125732421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 7.0, 10.0, 25.0, 17.0, 28.0, 50.0, 78.0, 115.0, 152.0, 262.0, 421.0, 827.0, 1393.0, 2736.0, 5472.0, 10964.0, 23738.0, 53686.0, 124371.0, 299705.0, 758373.0, 1468235.0, 856040.0, 337399.0, 138758.0, 60081.0, 26680.0, 12200.0, 5774.0, 2878.0, 1549.0, 899.0, 491.0, 289.0, 183.0, 130.0, 67.0, 63.0, 46.0, 27.0, 18.0, 16.0, 8.0, 5.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1688232421875, -0.16363906860351562, -0.15845489501953125, -0.15327072143554688, -0.1480865478515625, -0.14290237426757812, -0.13771820068359375, -0.13253402709960938, -0.127349853515625, -0.12216567993164062, -0.11698150634765625, -0.11179733276367188, -0.1066131591796875, -0.10142898559570312, -0.09624481201171875, -0.09106063842773438, -0.08587646484375, -0.08069229125976562, -0.07550811767578125, -0.07032394409179688, -0.0651397705078125, -0.059955596923828125, -0.05477142333984375, -0.049587249755859375, -0.044403076171875, -0.039218902587890625, -0.03403472900390625, -0.028850555419921875, -0.0236663818359375, -0.018482208251953125, -0.01329803466796875, -0.008113861083984375, -0.0029296875, 0.002254486083984375, 0.00743865966796875, 0.012622833251953125, 0.0178070068359375, 0.022991180419921875, 0.02817535400390625, 0.033359527587890625, 0.038543701171875, 0.043727874755859375, 0.04891204833984375, 0.054096221923828125, 0.0592803955078125, 0.06446456909179688, 0.06964874267578125, 0.07483291625976562, 0.08001708984375, 0.08520126342773438, 0.09038543701171875, 0.09556961059570312, 0.1007537841796875, 0.10593795776367188, 0.11112213134765625, 0.11630630493164062, 0.121490478515625, 0.12667465209960938, 0.13185882568359375, 0.13704299926757812, 0.1422271728515625, 0.14741134643554688, 0.15259552001953125, 0.15777969360351562, 0.1629638671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 4.0, 6.0, 11.0, 13.0, 19.0, 31.0, 21.0, 42.0, 54.0, 52.0, 106.0, 157.0, 221.0, 301.0, 450.0, 540.0, 551.0, 427.0, 287.0, 198.0, 149.0, 123.0, 73.0, 67.0, 54.0, 32.0, 31.0, 12.0, 16.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.201904296875, -0.19412994384765625, -0.1863555908203125, -0.17858123779296875, -0.170806884765625, -0.16303253173828125, -0.1552581787109375, -0.14748382568359375, -0.13970947265625, -0.13193511962890625, -0.1241607666015625, -0.11638641357421875, -0.108612060546875, -0.10083770751953125, -0.0930633544921875, -0.08528900146484375, -0.0775146484375, -0.06974029541015625, -0.0619659423828125, -0.05419158935546875, -0.046417236328125, -0.03864288330078125, -0.0308685302734375, -0.02309417724609375, -0.01531982421875, -0.00754547119140625, 0.0002288818359375, 0.00800323486328125, 0.015777587890625, 0.02355194091796875, 0.0313262939453125, 0.03910064697265625, 0.046875, 0.05464935302734375, 0.0624237060546875, 0.07019805908203125, 0.077972412109375, 0.08574676513671875, 0.0935211181640625, 0.10129547119140625, 0.10906982421875, 0.11684417724609375, 0.1246185302734375, 0.13239288330078125, 0.140167236328125, 0.14794158935546875, 0.1557159423828125, 0.16349029541015625, 0.1712646484375, 0.17903900146484375, 0.1868133544921875, 0.19458770751953125, 0.202362060546875, 0.21013641357421875, 0.2179107666015625, 0.22568511962890625, 0.23345947265625, 0.24123382568359375, 0.2490081787109375, 0.25678253173828125, 0.264556884765625, 0.27233123779296875, 0.2801055908203125, 0.28787994384765625, 0.295654296875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 9.0, 9.0, 9.0, 18.0, 20.0, 25.0, 33.0, 37.0, 61.0, 72.0, 75.0, 73.0, 79.0, 76.0, 74.0, 67.0, 52.0, 40.0, 52.0, 31.0, 29.0, 20.0, 13.0, 12.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9013108611106873, -0.8709077835083008, -0.8405046463012695, -0.8101015686988831, -0.7796984314918518, -0.7492953538894653, -0.7188922166824341, -0.6884891390800476, -0.6580860614776611, -0.6276829838752747, -0.5972798466682434, -0.5668767690658569, -0.5364736318588257, -0.5060705542564392, -0.47566744685173035, -0.4452643394470215, -0.41486120223999023, -0.38445809483528137, -0.3540549874305725, -0.32365190982818604, -0.2932487726211548, -0.2628456950187683, -0.23244258761405945, -0.20203948020935059, -0.17163637280464172, -0.14123326539993286, -0.1108301654458046, -0.08042706549167633, -0.05002395808696747, -0.019620850682258606, 0.010782241821289062, 0.041185349225997925, 0.07158839702606201, 0.10199150443077087, 0.13239461183547974, 0.1627977043390274, 0.19320081174373627, 0.22360391914844513, 0.2540070116519928, 0.28441011905670166, 0.3148132264614105, 0.3452163338661194, 0.37561944127082825, 0.4060225486755371, 0.4364256262779236, 0.46682876348495483, 0.4972318410873413, 0.5276349782943726, 0.558038055896759, 0.5884411334991455, 0.6188442707061768, 0.6492473483085632, 0.6796504855155945, 0.710053563117981, 0.7404567003250122, 0.7708597779273987, 0.8012628555297852, 0.8316659331321716, 0.8620690703392029, 0.8924721479415894, 0.9228752851486206, 0.9532783627510071, 0.9836814403533936, 1.0140845775604248, 1.044487714767456]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 10.0, 12.0, 11.0, 9.0, 15.0, 19.0, 31.0, 24.0, 32.0, 30.0, 32.0, 40.0, 42.0, 38.0, 42.0, 38.0, 46.0, 43.0, 52.0, 42.0, 33.0, 32.0, 44.0, 45.0, 29.0, 32.0, 31.0, 21.0, 21.0, 28.0, 13.0, 8.0, 11.0, 12.0, 4.0, 5.0, 8.0, 6.0, 1.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6664804816246033, -0.6417678594589233, -0.6170551776885986, -0.5923425555229187, -0.5676299333572388, -0.5429172515869141, -0.5182046294212341, -0.4934920072555542, -0.4687793552875519, -0.44406670331954956, -0.41935408115386963, -0.3946414291858673, -0.369928777217865, -0.34521615505218506, -0.32050350308418274, -0.2957908511161804, -0.2710782289505005, -0.24636559188365936, -0.22165295481681824, -0.19694030284881592, -0.1722276657819748, -0.14751502871513367, -0.12280237674713135, -0.09808973968029022, -0.0733771026134491, -0.04866446182131767, -0.02395182102918625, 0.0007608234882354736, 0.0254734605550766, 0.050186097621917725, 0.07489874958992004, 0.09961138665676117, 0.12432408332824707, 0.1490367203950882, 0.17374935746192932, 0.19846200942993164, 0.22317464649677277, 0.2478872835636139, 0.2725999355316162, 0.29731255769729614, 0.32202520966529846, 0.3467378616333008, 0.3714504837989807, 0.39616313576698303, 0.42087578773498535, 0.4455884099006653, 0.4703010618686676, 0.4950137138366699, 0.5197263360023499, 0.5444389581680298, 0.5691516399383545, 0.5938642621040344, 0.6185768842697144, 0.6432895660400391, 0.668002188205719, 0.6927148103713989, 0.7174274921417236, 0.7421401143074036, 0.7668527960777283, 0.7915654182434082, 0.8162780404090881, 0.8409906625747681, 0.8657033443450928, 0.8904159665107727, 0.9151285886764526]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 20.0, 15.0, 25.0, 29.0, 35.0, 47.0, 103.0, 135.0, 224.0, 325.0, 585.0, 972.0, 1795.0, 3131.0, 5548.0, 9845.0, 17481.0, 29939.0, 49923.0, 81526.0, 123659.0, 171249.0, 180242.0, 138900.0, 92431.0, 58222.0, 34889.0, 20297.0, 11817.0, 6517.0, 3643.0, 2128.0, 1115.0, 655.0, 376.0, 262.0, 152.0, 105.0, 56.0, 39.0, 26.0, 25.0, 13.0, 8.0, 6.0, 5.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2490234375, -0.24151039123535156, -0.23399734497070312, -0.2264842987060547, -0.21897125244140625, -0.2114582061767578, -0.20394515991210938, -0.19643211364746094, -0.1889190673828125, -0.18140602111816406, -0.17389297485351562, -0.1663799285888672, -0.15886688232421875, -0.1513538360595703, -0.14384078979492188, -0.13632774353027344, -0.128814697265625, -0.12130165100097656, -0.11378860473632812, -0.10627555847167969, -0.09876251220703125, -0.09124946594238281, -0.08373641967773438, -0.07622337341308594, -0.0687103271484375, -0.06119728088378906, -0.053684234619140625, -0.04617118835449219, -0.03865814208984375, -0.031145095825195312, -0.023632049560546875, -0.016119003295898438, -0.00860595703125, -0.0010929107666015625, 0.006420135498046875, 0.013933181762695312, 0.02144622802734375, 0.028959274291992188, 0.036472320556640625, 0.04398536682128906, 0.0514984130859375, 0.05901145935058594, 0.06652450561523438, 0.07403755187988281, 0.08155059814453125, 0.08906364440917969, 0.09657669067382812, 0.10408973693847656, 0.111602783203125, 0.11911582946777344, 0.12662887573242188, 0.1341419219970703, 0.14165496826171875, 0.1491680145263672, 0.15668106079101562, 0.16419410705566406, 0.1717071533203125, 0.17922019958496094, 0.18673324584960938, 0.1942462921142578, 0.20175933837890625, 0.2092723846435547, 0.21678543090820312, 0.22429847717285156, 0.2318115234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 4.0, 8.0, 3.0, 4.0, 9.0, 12.0, 7.0, 14.0, 12.0, 23.0, 18.0, 25.0, 21.0, 25.0, 31.0, 34.0, 32.0, 41.0, 36.0, 38.0, 40.0, 34.0, 53.0, 49.0, 35.0, 42.0, 40.0, 31.0, 25.0, 32.0, 24.0, 37.0, 26.0, 24.0, 17.0, 13.0, 18.0, 8.0, 7.0, 11.0, 8.0, 9.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1112060546875, -0.10775566101074219, -0.10430526733398438, -0.10085487365722656, -0.09740447998046875, -0.09395408630371094, -0.09050369262695312, -0.08705329895019531, -0.0836029052734375, -0.08015251159667969, -0.07670211791992188, -0.07325172424316406, -0.06980133056640625, -0.06635093688964844, -0.06290054321289062, -0.05945014953613281, -0.055999755859375, -0.05254936218261719, -0.049098968505859375, -0.04564857482910156, -0.04219818115234375, -0.03874778747558594, -0.035297393798828125, -0.03184700012207031, -0.0283966064453125, -0.024946212768554688, -0.021495819091796875, -0.018045425415039062, -0.01459503173828125, -0.011144638061523438, -0.007694244384765625, -0.0042438507080078125, -0.00079345703125, 0.0026569366455078125, 0.006107330322265625, 0.009557723999023438, 0.01300811767578125, 0.016458511352539062, 0.019908905029296875, 0.023359298706054688, 0.0268096923828125, 0.030260086059570312, 0.033710479736328125, 0.03716087341308594, 0.04061126708984375, 0.04406166076660156, 0.047512054443359375, 0.05096244812011719, 0.054412841796875, 0.05786323547363281, 0.061313629150390625, 0.06476402282714844, 0.06821441650390625, 0.07166481018066406, 0.07511520385742188, 0.07856559753417969, 0.0820159912109375, 0.08546638488769531, 0.08891677856445312, 0.09236717224121094, 0.09581756591796875, 0.09926795959472656, 0.10271835327148438, 0.10616874694824219, 0.109619140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 10.0, 9.0, 18.0, 31.0, 33.0, 51.0, 60.0, 88.0, 121.0, 251.0, 420.0, 804.0, 1662.0, 3546.0, 7510.0, 16413.0, 34450.0, 70856.0, 131476.0, 210870.0, 231887.0, 161376.0, 90058.0, 45448.0, 21772.0, 10165.0, 4667.0, 2103.0, 1037.0, 524.0, 285.0, 187.0, 102.0, 57.0, 55.0, 45.0, 20.0, 16.0, 14.0, 9.0, 8.0, 6.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24803543090820312, -0.23923492431640625, -0.23043441772460938, -0.2216339111328125, -0.21283340454101562, -0.20403289794921875, -0.19523239135742188, -0.186431884765625, -0.17763137817382812, -0.16883087158203125, -0.16003036499023438, -0.1512298583984375, -0.14242935180664062, -0.13362884521484375, -0.12482833862304688, -0.11602783203125, -0.10722732543945312, -0.09842681884765625, -0.08962631225585938, -0.0808258056640625, -0.07202529907226562, -0.06322479248046875, -0.054424285888671875, -0.045623779296875, -0.036823272705078125, -0.02802276611328125, -0.019222259521484375, -0.0104217529296875, -0.001621246337890625, 0.00717926025390625, 0.015979766845703125, 0.0247802734375, 0.033580780029296875, 0.04238128662109375, 0.051181793212890625, 0.0599822998046875, 0.06878280639648438, 0.07758331298828125, 0.08638381958007812, 0.095184326171875, 0.10398483276367188, 0.11278533935546875, 0.12158584594726562, 0.1303863525390625, 0.13918685913085938, 0.14798736572265625, 0.15678787231445312, 0.16558837890625, 0.17438888549804688, 0.18318939208984375, 0.19198989868164062, 0.2007904052734375, 0.20959091186523438, 0.21839141845703125, 0.22719192504882812, 0.235992431640625, 0.24479293823242188, 0.25359344482421875, 0.2623939514160156, 0.2711944580078125, 0.2799949645996094, 0.28879547119140625, 0.2975959777832031, 0.306396484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 10.0, 11.0, 17.0, 12.0, 13.0, 25.0, 24.0, 38.0, 36.0, 29.0, 41.0, 40.0, 47.0, 38.0, 31.0, 45.0, 38.0, 46.0, 39.0, 51.0, 45.0, 36.0, 27.0, 31.0, 32.0, 29.0, 24.0, 24.0, 16.0, 17.0, 16.0, 14.0, 7.0, 7.0, 6.0, 8.0, 3.0, 1.0, 5.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371826171875, -0.3612098693847656, -0.35059356689453125, -0.3399772644042969, -0.3293609619140625, -0.3187446594238281, -0.30812835693359375, -0.2975120544433594, -0.286895751953125, -0.2762794494628906, -0.26566314697265625, -0.2550468444824219, -0.2444305419921875, -0.23381423950195312, -0.22319793701171875, -0.21258163452148438, -0.20196533203125, -0.19134902954101562, -0.18073272705078125, -0.17011642456054688, -0.1595001220703125, -0.14888381958007812, -0.13826751708984375, -0.12765121459960938, -0.117034912109375, -0.10641860961914062, -0.09580230712890625, -0.08518600463867188, -0.0745697021484375, -0.06395339965820312, -0.05333709716796875, -0.042720794677734375, -0.0321044921875, -0.021488189697265625, -0.01087188720703125, -0.000255584716796875, 0.0103607177734375, 0.020977020263671875, 0.03159332275390625, 0.042209625244140625, 0.052825927734375, 0.06344223022460938, 0.07405853271484375, 0.08467483520507812, 0.0952911376953125, 0.10590744018554688, 0.11652374267578125, 0.12714004516601562, 0.13775634765625, 0.14837265014648438, 0.15898895263671875, 0.16960525512695312, 0.1802215576171875, 0.19083786010742188, 0.20145416259765625, 0.21207046508789062, 0.222686767578125, 0.23330307006835938, 0.24391937255859375, 0.2545356750488281, 0.2651519775390625, 0.2757682800292969, 0.28638458251953125, 0.2970008850097656, 0.3076171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 13.0, 11.0, 14.0, 24.0, 33.0, 55.0, 111.0, 152.0, 255.0, 413.0, 700.0, 1305.0, 2378.0, 4249.0, 7600.0, 13902.0, 25046.0, 43501.0, 73482.0, 117287.0, 164099.0, 182994.0, 153573.0, 105560.0, 65078.0, 37969.0, 21792.0, 11990.0, 6699.0, 3571.0, 2042.0, 1089.0, 615.0, 357.0, 225.0, 128.0, 77.0, 62.0, 32.0, 18.0, 17.0, 16.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.08966064453125, -0.0869741439819336, -0.08428764343261719, -0.08160114288330078, -0.07891464233398438, -0.07622814178466797, -0.07354164123535156, -0.07085514068603516, -0.06816864013671875, -0.06548213958740234, -0.06279563903808594, -0.06010913848876953, -0.057422637939453125, -0.05473613739013672, -0.05204963684082031, -0.049363136291503906, -0.0466766357421875, -0.043990135192871094, -0.04130363464355469, -0.03861713409423828, -0.035930633544921875, -0.03324413299560547, -0.030557632446289062, -0.027871131896972656, -0.02518463134765625, -0.022498130798339844, -0.019811630249023438, -0.01712512969970703, -0.014438629150390625, -0.011752128601074219, -0.009065628051757812, -0.006379127502441406, -0.003692626953125, -0.0010061264038085938, 0.0016803741455078125, 0.004366874694824219, 0.007053375244140625, 0.009739875793457031, 0.012426376342773438, 0.015112876892089844, 0.01779937744140625, 0.020485877990722656, 0.023172378540039062, 0.02585887908935547, 0.028545379638671875, 0.03123188018798828, 0.03391838073730469, 0.036604881286621094, 0.0392913818359375, 0.041977882385253906, 0.04466438293457031, 0.04735088348388672, 0.050037384033203125, 0.05272388458251953, 0.05541038513183594, 0.058096885681152344, 0.06078338623046875, 0.06346988677978516, 0.06615638732910156, 0.06884288787841797, 0.07152938842773438, 0.07421588897705078, 0.07690238952636719, 0.0795888900756836, 0.082275390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 7.0, 4.0, 8.0, 9.0, 14.0, 12.0, 21.0, 25.0, 31.0, 32.0, 29.0, 42.0, 62.0, 77.0, 73.0, 87.0, 94.0, 50.0, 60.0, 48.0, 38.0, 29.0, 31.0, 16.0, 20.0, 12.0, 7.0, 11.0, 12.0, 12.0, 6.0, 2.0, 8.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.641843795776367e-05, -3.539677709341049e-05, -3.437511622905731e-05, -3.335345536470413e-05, -3.233179450035095e-05, -3.131013363599777e-05, -3.0288472771644592e-05, -2.9266811907291412e-05, -2.8245151042938232e-05, -2.7223490178585052e-05, -2.6201829314231873e-05, -2.5180168449878693e-05, -2.4158507585525513e-05, -2.3136846721172333e-05, -2.2115185856819153e-05, -2.1093524992465973e-05, -2.0071864128112793e-05, -1.9050203263759613e-05, -1.8028542399406433e-05, -1.7006881535053253e-05, -1.5985220670700073e-05, -1.4963559806346893e-05, -1.3941898941993713e-05, -1.2920238077640533e-05, -1.1898577213287354e-05, -1.0876916348934174e-05, -9.855255484580994e-06, -8.833594620227814e-06, -7.811933755874634e-06, -6.790272891521454e-06, -5.768612027168274e-06, -4.746951162815094e-06, -3.725290298461914e-06, -2.703629434108734e-06, -1.6819685697555542e-06, -6.603077054023743e-07, 3.6135315895080566e-07, 1.3830140233039856e-06, 2.4046748876571655e-06, 3.4263357520103455e-06, 4.447996616363525e-06, 5.469657480716705e-06, 6.491318345069885e-06, 7.512979209423065e-06, 8.534640073776245e-06, 9.556300938129425e-06, 1.0577961802482605e-05, 1.1599622666835785e-05, 1.2621283531188965e-05, 1.3642944395542145e-05, 1.4664605259895325e-05, 1.5686266124248505e-05, 1.6707926988601685e-05, 1.7729587852954865e-05, 1.8751248717308044e-05, 1.9772909581661224e-05, 2.0794570446014404e-05, 2.1816231310367584e-05, 2.2837892174720764e-05, 2.3859553039073944e-05, 2.4881213903427124e-05, 2.5902874767780304e-05, 2.6924535632133484e-05, 2.7946196496486664e-05, 2.8967857360839844e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0, 12.0, 6.0, 13.0, 19.0, 39.0, 53.0, 54.0, 94.0, 153.0, 290.0, 535.0, 1237.0, 2597.0, 5428.0, 11988.0, 26274.0, 57560.0, 118648.0, 209842.0, 254092.0, 180138.0, 95778.0, 45455.0, 20616.0, 9444.0, 4235.0, 1933.0, 987.0, 455.0, 222.0, 136.0, 67.0, 46.0, 34.0, 23.0, 9.0, 15.0, 8.0, 8.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10662841796875, -0.1032266616821289, -0.09982490539550781, -0.09642314910888672, -0.09302139282226562, -0.08961963653564453, -0.08621788024902344, -0.08281612396240234, -0.07941436767578125, -0.07601261138916016, -0.07261085510253906, -0.06920909881591797, -0.06580734252929688, -0.06240558624267578, -0.05900382995605469, -0.055602073669433594, -0.0522003173828125, -0.048798561096191406, -0.04539680480957031, -0.04199504852294922, -0.038593292236328125, -0.03519153594970703, -0.03178977966308594, -0.028388023376464844, -0.02498626708984375, -0.021584510803222656, -0.018182754516601562, -0.014780998229980469, -0.011379241943359375, -0.007977485656738281, -0.0045757293701171875, -0.0011739730834960938, 0.002227783203125, 0.005629539489746094, 0.009031295776367188, 0.012433052062988281, 0.015834808349609375, 0.01923656463623047, 0.022638320922851562, 0.026040077209472656, 0.02944183349609375, 0.032843589782714844, 0.03624534606933594, 0.03964710235595703, 0.043048858642578125, 0.04645061492919922, 0.04985237121582031, 0.053254127502441406, 0.0566558837890625, 0.060057640075683594, 0.06345939636230469, 0.06686115264892578, 0.07026290893554688, 0.07366466522216797, 0.07706642150878906, 0.08046817779541016, 0.08386993408203125, 0.08727169036865234, 0.09067344665527344, 0.09407520294189453, 0.09747695922851562, 0.10087871551513672, 0.10428047180175781, 0.1076822280883789, 0.111083984375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 5.0, 7.0, 7.0, 16.0, 18.0, 14.0, 26.0, 25.0, 26.0, 27.0, 32.0, 62.0, 42.0, 66.0, 58.0, 55.0, 62.0, 56.0, 60.0, 54.0, 36.0, 41.0, 34.0, 20.0, 26.0, 16.0, 22.0, 10.0, 10.0, 16.0, 10.0, 7.0, 9.0, 2.0, 5.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09613037109375, -0.09320926666259766, -0.09028816223144531, -0.08736705780029297, -0.08444595336914062, -0.08152484893798828, -0.07860374450683594, -0.0756826400756836, -0.07276153564453125, -0.0698404312133789, -0.06691932678222656, -0.06399822235107422, -0.061077117919921875, -0.05815601348876953, -0.05523490905761719, -0.052313804626464844, -0.0493927001953125, -0.046471595764160156, -0.04355049133300781, -0.04062938690185547, -0.037708282470703125, -0.03478717803955078, -0.03186607360839844, -0.028944969177246094, -0.02602386474609375, -0.023102760314941406, -0.020181655883789062, -0.01726055145263672, -0.014339447021484375, -0.011418342590332031, -0.008497238159179688, -0.005576133728027344, -0.002655029296875, 0.00026607513427734375, 0.0031871795654296875, 0.006108283996582031, 0.009029388427734375, 0.011950492858886719, 0.014871597290039062, 0.017792701721191406, 0.02071380615234375, 0.023634910583496094, 0.026556015014648438, 0.02947711944580078, 0.032398223876953125, 0.03531932830810547, 0.03824043273925781, 0.041161537170410156, 0.0440826416015625, 0.047003746032714844, 0.04992485046386719, 0.05284595489501953, 0.055767059326171875, 0.05868816375732422, 0.06160926818847656, 0.0645303726196289, 0.06745147705078125, 0.0703725814819336, 0.07329368591308594, 0.07621479034423828, 0.07913589477539062, 0.08205699920654297, 0.08497810363769531, 0.08789920806884766, 0.0908203125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 7.0, 6.0, 14.0, 29.0, 37.0, 45.0, 70.0, 78.0, 107.0, 111.0, 105.0, 107.0, 82.0, 60.0, 50.0, 39.0, 22.0, 12.0, 17.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.929495096206665, -1.8840177059173584, -1.8385404348373413, -1.7930631637573242, -1.7475857734680176, -1.702108383178711, -1.6566311120986938, -1.6111538410186768, -1.5656764507293701, -1.5201990604400635, -1.4747217893600464, -1.4292445182800293, -1.3837671279907227, -1.338289737701416, -1.292812466621399, -1.2473351955413818, -1.2018578052520752, -1.1563804149627686, -1.1109031438827515, -1.0654258728027344, -1.0199484825134277, -0.9744711518287659, -0.928993821144104, -0.8835164904594421, -0.8380391597747803, -0.7925618290901184, -0.7470844984054565, -0.7016071677207947, -0.6561298370361328, -0.610652506351471, -0.5651751756668091, -0.5196978449821472, -0.4742205739021301, -0.42874324321746826, -0.3832659125328064, -0.33778858184814453, -0.29231125116348267, -0.2468339204788208, -0.20135658979415894, -0.15587925910949707, -0.1104019284248352, -0.06492459774017334, -0.019447267055511475, 0.02603006362915039, 0.07150739431381226, 0.11698472499847412, 0.162462055683136, 0.20793938636779785, 0.2534167170524597, 0.2988940477371216, 0.34437137842178345, 0.3898487091064453, 0.4353260397911072, 0.48080337047576904, 0.5262807011604309, 0.5717580318450928, 0.6172353625297546, 0.6627126932144165, 0.7081900238990784, 0.7536673545837402, 0.7991446852684021, 0.844622015953064, 0.8900993466377258, 0.9355766773223877, 0.9810540080070496]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 6.0, 12.0, 10.0, 12.0, 11.0, 14.0, 17.0, 23.0, 17.0, 26.0, 15.0, 17.0, 33.0, 26.0, 33.0, 25.0, 41.0, 52.0, 46.0, 53.0, 35.0, 36.0, 43.0, 42.0, 28.0, 27.0, 29.0, 36.0, 27.0, 28.0, 23.0, 20.0, 21.0, 15.0, 15.0, 8.0, 18.0, 12.0, 8.0, 8.0, 8.0, 6.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.8066449761390686, -0.7823349833488464, -0.758025050163269, -0.7337150573730469, -0.7094050645828247, -0.6850950717926025, -0.6607850790023804, -0.636475145816803, -0.6121651530265808, -0.5878551602363586, -0.5635452270507812, -0.5392352342605591, -0.5149252414703369, -0.49061524868011475, -0.46630528569221497, -0.4419953227043152, -0.417685329914093, -0.39337533712387085, -0.36906537413597107, -0.3447554111480713, -0.3204454183578491, -0.29613542556762695, -0.2718254625797272, -0.2475154846906662, -0.22320550680160522, -0.19889552891254425, -0.17458555102348328, -0.1502755731344223, -0.12596559524536133, -0.10165561735630035, -0.07734563946723938, -0.053035661578178406, -0.028725624084472656, -0.004415646195411682, 0.019894331693649292, 0.044204309582710266, 0.06851428747177124, 0.09282426536083221, 0.11713424324989319, 0.14144422113895416, 0.16575419902801514, 0.1900641769170761, 0.21437415480613708, 0.23868413269519806, 0.26299411058425903, 0.2873041033744812, 0.311614066362381, 0.33592402935028076, 0.36023402214050293, 0.3845440149307251, 0.4088539779186249, 0.43316394090652466, 0.4574739336967468, 0.481783926486969, 0.5060938596725464, 0.5304038524627686, 0.5547138452529907, 0.5790238380432129, 0.6033338308334351, 0.6276437640190125, 0.6519537568092346, 0.6762637495994568, 0.7005736827850342, 0.7248836755752563, 0.7491936683654785]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 16.0, 16.0, 22.0, 26.0, 53.0, 78.0, 131.0, 184.0, 286.0, 464.0, 826.0, 1488.0, 3095.0, 6647.0, 14566.0, 35309.0, 94261.0, 305403.0, 1251536.0, 1800266.0, 466303.0, 131737.0, 46763.0, 18613.0, 8122.0, 3851.0, 1883.0, 997.0, 517.0, 311.0, 202.0, 118.0, 60.0, 31.0, 33.0, 21.0, 10.0, 8.0, 4.0, 10.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2054443359375, -0.19905471801757812, -0.19266510009765625, -0.18627548217773438, -0.1798858642578125, -0.17349624633789062, -0.16710662841796875, -0.16071701049804688, -0.154327392578125, -0.14793777465820312, -0.14154815673828125, -0.13515853881835938, -0.1287689208984375, -0.12237930297851562, -0.11598968505859375, -0.10960006713867188, -0.10321044921875, -0.09682083129882812, -0.09043121337890625, -0.08404159545898438, -0.0776519775390625, -0.07126235961914062, -0.06487274169921875, -0.058483123779296875, -0.052093505859375, -0.045703887939453125, -0.03931427001953125, -0.032924652099609375, -0.0265350341796875, -0.020145416259765625, -0.01375579833984375, -0.007366180419921875, -0.0009765625, 0.005413055419921875, 0.01180267333984375, 0.018192291259765625, 0.0245819091796875, 0.030971527099609375, 0.03736114501953125, 0.043750762939453125, 0.050140380859375, 0.056529998779296875, 0.06291961669921875, 0.06930923461914062, 0.0756988525390625, 0.08208847045898438, 0.08847808837890625, 0.09486770629882812, 0.10125732421875, 0.10764694213867188, 0.11403656005859375, 0.12042617797851562, 0.1268157958984375, 0.13320541381835938, 0.13959503173828125, 0.14598464965820312, 0.152374267578125, 0.15876388549804688, 0.16515350341796875, 0.17154312133789062, 0.1779327392578125, 0.18432235717773438, 0.19071197509765625, 0.19710159301757812, 0.2034912109375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 7.0, 6.0, 9.0, 22.0, 16.0, 20.0, 26.0, 23.0, 20.0, 26.0, 35.0, 32.0, 29.0, 38.0, 32.0, 36.0, 48.0, 48.0, 41.0, 44.0, 51.0, 36.0, 36.0, 35.0, 46.0, 28.0, 33.0, 21.0, 21.0, 23.0, 10.0, 15.0, 12.0, 9.0, 12.0, 11.0, 6.0, 3.0, 2.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.1309814453125, -0.12713909149169922, -0.12329673767089844, -0.11945438385009766, -0.11561203002929688, -0.1117696762084961, -0.10792732238769531, -0.10408496856689453, -0.10024261474609375, -0.09640026092529297, -0.09255790710449219, -0.0887155532836914, -0.08487319946289062, -0.08103084564208984, -0.07718849182128906, -0.07334613800048828, -0.0695037841796875, -0.06566143035888672, -0.06181907653808594, -0.057976722717285156, -0.054134368896484375, -0.050292015075683594, -0.04644966125488281, -0.04260730743408203, -0.03876495361328125, -0.03492259979248047, -0.031080245971679688, -0.027237892150878906, -0.023395538330078125, -0.019553184509277344, -0.015710830688476562, -0.011868476867675781, -0.008026123046875, -0.004183769226074219, -0.0003414154052734375, 0.0035009384155273438, 0.007343292236328125, 0.011185646057128906, 0.015027999877929688, 0.01887035369873047, 0.02271270751953125, 0.02655506134033203, 0.030397415161132812, 0.034239768981933594, 0.038082122802734375, 0.041924476623535156, 0.04576683044433594, 0.04960918426513672, 0.0534515380859375, 0.05729389190673828, 0.06113624572753906, 0.06497859954833984, 0.06882095336914062, 0.0726633071899414, 0.07650566101074219, 0.08034801483154297, 0.08419036865234375, 0.08803272247314453, 0.09187507629394531, 0.0957174301147461, 0.09955978393554688, 0.10340213775634766, 0.10724449157714844, 0.11108684539794922, 0.11492919921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 10.0, 17.0, 24.0, 36.0, 38.0, 68.0, 82.0, 141.0, 208.0, 310.0, 459.0, 767.0, 1307.0, 2386.0, 4371.0, 8912.0, 18282.0, 40476.0, 93554.0, 233689.0, 621566.0, 1478330.0, 1039192.0, 384765.0, 148838.0, 61930.0, 27503.0, 12884.0, 6262.0, 3220.0, 1802.0, 1013.0, 623.0, 429.0, 227.0, 165.0, 103.0, 74.0, 55.0, 44.0, 24.0, 19.0, 19.0, 13.0, 7.0, 9.0, 8.0, 0.0, 3.0, 3.0, 2.0], "bins": [-0.2030029296875, -0.19716262817382812, -0.19132232666015625, -0.18548202514648438, -0.1796417236328125, -0.17380142211914062, -0.16796112060546875, -0.16212081909179688, -0.156280517578125, -0.15044021606445312, -0.14459991455078125, -0.13875961303710938, -0.1329193115234375, -0.12707901000976562, -0.12123870849609375, -0.11539840698242188, -0.10955810546875, -0.10371780395507812, -0.09787750244140625, -0.09203720092773438, -0.0861968994140625, -0.08035659790039062, -0.07451629638671875, -0.06867599487304688, -0.062835693359375, -0.056995391845703125, -0.05115509033203125, -0.045314788818359375, -0.0394744873046875, -0.033634185791015625, -0.02779388427734375, -0.021953582763671875, -0.01611328125, -0.010272979736328125, -0.00443267822265625, 0.001407623291015625, 0.0072479248046875, 0.013088226318359375, 0.01892852783203125, 0.024768829345703125, 0.030609130859375, 0.036449432373046875, 0.04228973388671875, 0.048130035400390625, 0.0539703369140625, 0.059810638427734375, 0.06565093994140625, 0.07149124145507812, 0.07733154296875, 0.08317184448242188, 0.08901214599609375, 0.09485244750976562, 0.1006927490234375, 0.10653305053710938, 0.11237335205078125, 0.11821365356445312, 0.124053955078125, 0.12989425659179688, 0.13573455810546875, 0.14157485961914062, 0.1474151611328125, 0.15325546264648438, 0.15909576416015625, 0.16493606567382812, 0.1707763671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 13.0, 14.0, 10.0, 8.0, 20.0, 21.0, 31.0, 47.0, 74.0, 102.0, 112.0, 164.0, 233.0, 339.0, 430.0, 558.0, 537.0, 415.0, 271.0, 197.0, 128.0, 93.0, 68.0, 49.0, 29.0, 25.0, 20.0, 16.0, 14.0, 10.0, 5.0, 8.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1912841796875, -0.18386268615722656, -0.17644119262695312, -0.1690196990966797, -0.16159820556640625, -0.1541767120361328, -0.14675521850585938, -0.13933372497558594, -0.1319122314453125, -0.12449073791503906, -0.11706924438476562, -0.10964775085449219, -0.10222625732421875, -0.09480476379394531, -0.08738327026367188, -0.07996177673339844, -0.072540283203125, -0.06511878967285156, -0.057697296142578125, -0.05027580261230469, -0.04285430908203125, -0.03543281555175781, -0.028011322021484375, -0.020589828491210938, -0.0131683349609375, -0.0057468414306640625, 0.001674652099609375, 0.009096145629882812, 0.01651763916015625, 0.023939132690429688, 0.031360626220703125, 0.03878211975097656, 0.04620361328125, 0.05362510681152344, 0.061046600341796875, 0.06846809387207031, 0.07588958740234375, 0.08331108093261719, 0.09073257446289062, 0.09815406799316406, 0.1055755615234375, 0.11299705505371094, 0.12041854858398438, 0.1278400421142578, 0.13526153564453125, 0.1426830291748047, 0.15010452270507812, 0.15752601623535156, 0.164947509765625, 0.17236900329589844, 0.17979049682617188, 0.1872119903564453, 0.19463348388671875, 0.2020549774169922, 0.20947647094726562, 0.21689796447753906, 0.2243194580078125, 0.23174095153808594, 0.23916244506835938, 0.2465839385986328, 0.25400543212890625, 0.2614269256591797, 0.2688484191894531, 0.27626991271972656, 0.28369140625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 5.0, 9.0, 12.0, 15.0, 21.0, 32.0, 29.0, 38.0, 50.0, 61.0, 78.0, 84.0, 74.0, 84.0, 74.0, 67.0, 66.0, 53.0, 47.0, 39.0, 22.0, 10.0, 6.0, 6.0, 4.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.221909999847412, -1.1901782751083374, -1.1584465503692627, -1.126714825630188, -1.0949831008911133, -1.0632513761520386, -1.0315196514129639, -0.9997879862785339, -0.9680562615394592, -0.9363245368003845, -0.9045928120613098, -0.8728610873222351, -0.8411294221878052, -0.8093976974487305, -0.7776659727096558, -0.745934247970581, -0.7142025232315063, -0.6824707984924316, -0.6507390737533569, -0.6190073490142822, -0.5872756242752075, -0.5555438995361328, -0.5238122344017029, -0.4920805096626282, -0.46034878492355347, -0.42861706018447876, -0.39688533544540405, -0.36515364050865173, -0.333421915769577, -0.3016901910305023, -0.26995849609375, -0.2382267713546753, -0.20649516582489014, -0.17476344108581543, -0.14303173124790192, -0.1113000139594078, -0.0795682966709137, -0.04783657193183899, -0.016104862093925476, 0.015626847743988037, 0.047358572483062744, 0.07909028977155685, 0.11082200706005096, 0.14255371689796448, 0.17428544163703918, 0.2060171663761139, 0.2377488762140274, 0.2694805860519409, 0.3012123107910156, 0.33294403553009033, 0.36467576026916504, 0.39640745520591736, 0.42813917994499207, 0.4598709046840668, 0.4916025996208191, 0.5233343243598938, 0.5550660490989685, 0.5867977738380432, 0.6185294985771179, 0.6502612233161926, 0.6819928884506226, 0.7137246131896973, 0.745456337928772, 0.7771880626678467, 0.8089197874069214]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 6.0, 8.0, 6.0, 10.0, 8.0, 8.0, 18.0, 15.0, 23.0, 24.0, 19.0, 31.0, 30.0, 26.0, 31.0, 39.0, 27.0, 32.0, 45.0, 38.0, 38.0, 42.0, 46.0, 39.0, 38.0, 45.0, 27.0, 24.0, 33.0, 26.0, 38.0, 27.0, 20.0, 10.0, 21.0, 16.0, 6.0, 10.0, 15.0, 6.0, 7.0, 5.0, 5.0, 1.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5798817873001099, -0.5607486963272095, -0.5416156053543091, -0.5224825143814087, -0.5033494234085083, -0.4842163324356079, -0.46508321166038513, -0.44595012068748474, -0.42681702971458435, -0.40768393874168396, -0.38855084776878357, -0.3694177567958832, -0.3502846360206604, -0.33115154504776, -0.3120184540748596, -0.29288536310195923, -0.27375227212905884, -0.25461918115615845, -0.23548609018325806, -0.21635298430919647, -0.19721989333629608, -0.1780868023633957, -0.1589536964893341, -0.13982060551643372, -0.12068751454353333, -0.10155442357063293, -0.08242132514715195, -0.06328822672367096, -0.04415513575077057, -0.025022044777870178, -0.005888946354389191, 0.013244152069091797, 0.03237724304199219, 0.05151033774018288, 0.07064343243837357, 0.08977653086185455, 0.10890962183475494, 0.12804271280765533, 0.14717581868171692, 0.1663089096546173, 0.1854420006275177, 0.2045750916004181, 0.22370818257331848, 0.24284128844738007, 0.26197439432144165, 0.28110748529434204, 0.30024057626724243, 0.3193736672401428, 0.3385067582130432, 0.3576398491859436, 0.376772940158844, 0.3959060311317444, 0.4150391221046448, 0.43417221307754517, 0.45330533385276794, 0.47243842482566833, 0.4915715157985687, 0.5107046365737915, 0.5298377275466919, 0.5489708185195923, 0.5681039094924927, 0.5872370004653931, 0.6063700914382935, 0.6255031824111938, 0.6446362733840942]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 11.0, 19.0, 20.0, 42.0, 47.0, 66.0, 102.0, 175.0, 275.0, 512.0, 802.0, 1310.0, 2291.0, 3973.0, 6465.0, 10770.0, 18264.0, 30796.0, 53986.0, 96231.0, 165452.0, 218230.0, 182256.0, 109484.0, 61618.0, 34942.0, 20328.0, 12193.0, 7184.0, 4297.0, 2627.0, 1536.0, 860.0, 523.0, 322.0, 214.0, 116.0, 73.0, 46.0, 30.0, 15.0, 12.0, 6.0, 5.0, 5.0, 7.0, 3.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2275390625, -0.22034072875976562, -0.21314239501953125, -0.20594406127929688, -0.1987457275390625, -0.19154739379882812, -0.18434906005859375, -0.17715072631835938, -0.169952392578125, -0.16275405883789062, -0.15555572509765625, -0.14835739135742188, -0.1411590576171875, -0.13396072387695312, -0.12676239013671875, -0.11956405639648438, -0.11236572265625, -0.10516738891601562, -0.09796905517578125, -0.09077072143554688, -0.0835723876953125, -0.07637405395507812, -0.06917572021484375, -0.061977386474609375, -0.054779052734375, -0.047580718994140625, -0.04038238525390625, -0.033184051513671875, -0.0259857177734375, -0.018787384033203125, -0.01158905029296875, -0.004390716552734375, 0.0028076171875, 0.010005950927734375, 0.01720428466796875, 0.024402618408203125, 0.0316009521484375, 0.038799285888671875, 0.04599761962890625, 0.053195953369140625, 0.060394287109375, 0.06759262084960938, 0.07479095458984375, 0.08198928833007812, 0.0891876220703125, 0.09638595581054688, 0.10358428955078125, 0.11078262329101562, 0.11798095703125, 0.12517929077148438, 0.13237762451171875, 0.13957595825195312, 0.1467742919921875, 0.15397262573242188, 0.16117095947265625, 0.16836929321289062, 0.175567626953125, 0.18276596069335938, 0.18996429443359375, 0.19716262817382812, 0.2043609619140625, 0.21155929565429688, 0.21875762939453125, 0.22595596313476562, 0.233154296875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 3.0, 8.0, 6.0, 6.0, 20.0, 14.0, 13.0, 15.0, 25.0, 25.0, 28.0, 31.0, 19.0, 36.0, 22.0, 33.0, 42.0, 43.0, 57.0, 33.0, 41.0, 49.0, 37.0, 40.0, 40.0, 32.0, 43.0, 31.0, 30.0, 29.0, 31.0, 11.0, 18.0, 13.0, 12.0, 8.0, 13.0, 9.0, 6.0, 11.0, 4.0, 5.0, 0.0, 6.0, 2.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.13410091400146484, -0.1303844451904297, -0.12666797637939453, -0.12295150756835938, -0.11923503875732422, -0.11551856994628906, -0.1118021011352539, -0.10808563232421875, -0.1043691635131836, -0.10065269470214844, -0.09693622589111328, -0.09321975708007812, -0.08950328826904297, -0.08578681945800781, -0.08207035064697266, -0.0783538818359375, -0.07463741302490234, -0.07092094421386719, -0.06720447540283203, -0.06348800659179688, -0.05977153778076172, -0.05605506896972656, -0.052338600158691406, -0.04862213134765625, -0.044905662536621094, -0.04118919372558594, -0.03747272491455078, -0.033756256103515625, -0.03003978729248047, -0.026323318481445312, -0.022606849670410156, -0.018890380859375, -0.015173912048339844, -0.011457443237304688, -0.007740974426269531, -0.004024505615234375, -0.00030803680419921875, 0.0034084320068359375, 0.007124900817871094, 0.01084136962890625, 0.014557838439941406, 0.018274307250976562, 0.02199077606201172, 0.025707244873046875, 0.02942371368408203, 0.03314018249511719, 0.036856651306152344, 0.0405731201171875, 0.044289588928222656, 0.04800605773925781, 0.05172252655029297, 0.055438995361328125, 0.05915546417236328, 0.06287193298339844, 0.0665884017944336, 0.07030487060546875, 0.0740213394165039, 0.07773780822753906, 0.08145427703857422, 0.08517074584960938, 0.08888721466064453, 0.09260368347167969, 0.09632015228271484, 0.10003662109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 8.0, 6.0, 11.0, 19.0, 20.0, 29.0, 42.0, 51.0, 87.0, 124.0, 216.0, 332.0, 676.0, 1433.0, 3312.0, 7643.0, 19223.0, 49847.0, 137064.0, 328339.0, 304614.0, 121281.0, 44446.0, 17233.0, 6889.0, 2901.0, 1238.0, 628.0, 306.0, 179.0, 127.0, 66.0, 59.0, 43.0, 22.0, 7.0, 18.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.356201171875, -0.34468841552734375, -0.3331756591796875, -0.32166290283203125, -0.310150146484375, -0.29863739013671875, -0.2871246337890625, -0.27561187744140625, -0.26409912109375, -0.25258636474609375, -0.2410736083984375, -0.22956085205078125, -0.218048095703125, -0.20653533935546875, -0.1950225830078125, -0.18350982666015625, -0.1719970703125, -0.16048431396484375, -0.1489715576171875, -0.13745880126953125, -0.125946044921875, -0.11443328857421875, -0.1029205322265625, -0.09140777587890625, -0.07989501953125, -0.06838226318359375, -0.0568695068359375, -0.04535675048828125, -0.033843994140625, -0.02233123779296875, -0.0108184814453125, 0.00069427490234375, 0.01220703125, 0.02371978759765625, 0.0352325439453125, 0.04674530029296875, 0.058258056640625, 0.06977081298828125, 0.0812835693359375, 0.09279632568359375, 0.10430908203125, 0.11582183837890625, 0.1273345947265625, 0.13884735107421875, 0.150360107421875, 0.16187286376953125, 0.1733856201171875, 0.18489837646484375, 0.1964111328125, 0.20792388916015625, 0.2194366455078125, 0.23094940185546875, 0.242462158203125, 0.25397491455078125, 0.2654876708984375, 0.27700042724609375, 0.28851318359375, 0.30002593994140625, 0.3115386962890625, 0.32305145263671875, 0.334564208984375, 0.34607696533203125, 0.3575897216796875, 0.36910247802734375, 0.380615234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 5.0, 16.0, 13.0, 17.0, 29.0, 33.0, 26.0, 32.0, 45.0, 58.0, 46.0, 48.0, 48.0, 50.0, 56.0, 50.0, 53.0, 54.0, 50.0, 47.0, 44.0, 36.0, 25.0, 19.0, 24.0, 18.0, 15.0, 9.0, 10.0, 3.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.42333984375, -0.4097023010253906, -0.39606475830078125, -0.3824272155761719, -0.3687896728515625, -0.3551521301269531, -0.34151458740234375, -0.3278770446777344, -0.314239501953125, -0.3006019592285156, -0.28696441650390625, -0.2733268737792969, -0.2596893310546875, -0.24605178833007812, -0.23241424560546875, -0.21877670288085938, -0.20513916015625, -0.19150161743164062, -0.17786407470703125, -0.16422653198242188, -0.1505889892578125, -0.13695144653320312, -0.12331390380859375, -0.10967636108398438, -0.096038818359375, -0.08240127563476562, -0.06876373291015625, -0.055126190185546875, -0.0414886474609375, -0.027851104736328125, -0.01421356201171875, -0.000576019287109375, 0.0130615234375, 0.026699066162109375, 0.04033660888671875, 0.053974151611328125, 0.0676116943359375, 0.08124923706054688, 0.09488677978515625, 0.10852432250976562, 0.122161865234375, 0.13579940795898438, 0.14943695068359375, 0.16307449340820312, 0.1767120361328125, 0.19034957885742188, 0.20398712158203125, 0.21762466430664062, 0.23126220703125, 0.24489974975585938, 0.25853729248046875, 0.2721748352050781, 0.2858123779296875, 0.2994499206542969, 0.31308746337890625, 0.3267250061035156, 0.340362548828125, 0.3540000915527344, 0.36763763427734375, 0.3812751770019531, 0.3949127197265625, 0.4085502624511719, 0.42218780517578125, 0.4358253479003906, 0.449462890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 13.0, 14.0, 20.0, 35.0, 36.0, 57.0, 84.0, 121.0, 203.0, 281.0, 412.0, 591.0, 898.0, 1394.0, 2109.0, 3222.0, 5058.0, 8361.0, 13888.0, 23944.0, 43136.0, 84008.0, 165840.0, 248412.0, 206098.0, 110240.0, 55602.0, 29592.0, 17096.0, 10114.0, 6383.0, 3904.0, 2516.0, 1609.0, 1091.0, 727.0, 473.0, 320.0, 219.0, 156.0, 79.0, 61.0, 49.0, 36.0, 13.0, 17.0, 7.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09161376953125, -0.08852863311767578, -0.08544349670410156, -0.08235836029052734, -0.07927322387695312, -0.0761880874633789, -0.07310295104980469, -0.07001781463623047, -0.06693267822265625, -0.06384754180908203, -0.06076240539550781, -0.057677268981933594, -0.054592132568359375, -0.051506996154785156, -0.04842185974121094, -0.04533672332763672, -0.0422515869140625, -0.03916645050048828, -0.03608131408691406, -0.032996177673339844, -0.029911041259765625, -0.026825904846191406, -0.023740768432617188, -0.02065563201904297, -0.01757049560546875, -0.014485359191894531, -0.011400222778320312, -0.008315086364746094, -0.005229949951171875, -0.0021448135375976562, 0.0009403228759765625, 0.004025459289550781, 0.007110595703125, 0.010195732116699219, 0.013280868530273438, 0.016366004943847656, 0.019451141357421875, 0.022536277770996094, 0.025621414184570312, 0.02870655059814453, 0.03179168701171875, 0.03487682342529297, 0.03796195983886719, 0.041047096252441406, 0.044132232666015625, 0.047217369079589844, 0.05030250549316406, 0.05338764190673828, 0.0564727783203125, 0.05955791473388672, 0.06264305114746094, 0.06572818756103516, 0.06881332397460938, 0.0718984603881836, 0.07498359680175781, 0.07806873321533203, 0.08115386962890625, 0.08423900604248047, 0.08732414245605469, 0.0904092788696289, 0.09349441528320312, 0.09657955169677734, 0.09966468811035156, 0.10274982452392578, 0.1058349609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 4.0, 4.0, 8.0, 3.0, 4.0, 10.0, 12.0, 13.0, 21.0, 21.0, 26.0, 30.0, 45.0, 72.0, 94.0, 92.0, 116.0, 93.0, 82.0, 59.0, 44.0, 26.0, 20.0, 21.0, 14.0, 19.0, 7.0, 4.0, 4.0, 5.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.266334533691406e-05, -3.161188215017319e-05, -3.056041896343231e-05, -2.9508955776691437e-05, -2.845749258995056e-05, -2.7406029403209686e-05, -2.635456621646881e-05, -2.5303103029727936e-05, -2.425163984298706e-05, -2.3200176656246185e-05, -2.214871346950531e-05, -2.1097250282764435e-05, -2.004578709602356e-05, -1.8994323909282684e-05, -1.794286072254181e-05, -1.6891397535800934e-05, -1.583993434906006e-05, -1.4788471162319183e-05, -1.3737007975578308e-05, -1.2685544788837433e-05, -1.1634081602096558e-05, -1.0582618415355682e-05, -9.531155228614807e-06, -8.479692041873932e-06, -7.428228855133057e-06, -6.376765668392181e-06, -5.325302481651306e-06, -4.273839294910431e-06, -3.2223761081695557e-06, -2.1709129214286804e-06, -1.1194497346878052e-06, -6.798654794692993e-08, 9.834766387939453e-07, 2.0349398255348206e-06, 3.086403012275696e-06, 4.137866199016571e-06, 5.189329385757446e-06, 6.2407925724983215e-06, 7.292255759239197e-06, 8.343718945980072e-06, 9.395182132720947e-06, 1.0446645319461823e-05, 1.1498108506202698e-05, 1.2549571692943573e-05, 1.3601034879684448e-05, 1.4652498066425323e-05, 1.57039612531662e-05, 1.6755424439907074e-05, 1.780688762664795e-05, 1.8858350813388824e-05, 1.99098140001297e-05, 2.0961277186870575e-05, 2.201274037361145e-05, 2.3064203560352325e-05, 2.41156667470932e-05, 2.5167129933834076e-05, 2.621859312057495e-05, 2.7270056307315826e-05, 2.83215194940567e-05, 2.9372982680797577e-05, 3.0424445867538452e-05, 3.147590905427933e-05, 3.25273722410202e-05, 3.357883542776108e-05, 3.463029861450195e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 14.0, 6.0, 13.0, 18.0, 31.0, 52.0, 97.0, 136.0, 327.0, 624.0, 1386.0, 3218.0, 7961.0, 21456.0, 66396.0, 230578.0, 436293.0, 192961.0, 56193.0, 18620.0, 6877.0, 2816.0, 1258.0, 577.0, 282.0, 137.0, 92.0, 50.0, 32.0, 20.0, 11.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1492919921875, -0.14384841918945312, -0.13840484619140625, -0.13296127319335938, -0.1275177001953125, -0.12207412719726562, -0.11663055419921875, -0.11118698120117188, -0.105743408203125, -0.10029983520507812, -0.09485626220703125, -0.08941268920898438, -0.0839691162109375, -0.07852554321289062, -0.07308197021484375, -0.06763839721679688, -0.06219482421875, -0.056751251220703125, -0.05130767822265625, -0.045864105224609375, -0.0404205322265625, -0.034976959228515625, -0.02953338623046875, -0.024089813232421875, -0.018646240234375, -0.013202667236328125, -0.00775909423828125, -0.002315521240234375, 0.0031280517578125, 0.008571624755859375, 0.01401519775390625, 0.019458770751953125, 0.02490234375, 0.030345916748046875, 0.03578948974609375, 0.041233062744140625, 0.0466766357421875, 0.052120208740234375, 0.05756378173828125, 0.06300735473632812, 0.068450927734375, 0.07389450073242188, 0.07933807373046875, 0.08478164672851562, 0.0902252197265625, 0.09566879272460938, 0.10111236572265625, 0.10655593872070312, 0.11199951171875, 0.11744308471679688, 0.12288665771484375, 0.12833023071289062, 0.1337738037109375, 0.13921737670898438, 0.14466094970703125, 0.15010452270507812, 0.155548095703125, 0.16099166870117188, 0.16643524169921875, 0.17187881469726562, 0.1773223876953125, 0.18276596069335938, 0.18820953369140625, 0.19365310668945312, 0.1990966796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 2.0, 4.0, 7.0, 9.0, 20.0, 26.0, 31.0, 36.0, 56.0, 72.0, 72.0, 92.0, 84.0, 97.0, 82.0, 62.0, 54.0, 46.0, 40.0, 24.0, 20.0, 15.0, 10.0, 6.0, 6.0, 7.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.156982421875, -0.15264415740966797, -0.14830589294433594, -0.1439676284790039, -0.13962936401367188, -0.13529109954833984, -0.1309528350830078, -0.12661457061767578, -0.12227630615234375, -0.11793804168701172, -0.11359977722167969, -0.10926151275634766, -0.10492324829101562, -0.1005849838256836, -0.09624671936035156, -0.09190845489501953, -0.0875701904296875, -0.08323192596435547, -0.07889366149902344, -0.0745553970336914, -0.07021713256835938, -0.06587886810302734, -0.06154060363769531, -0.05720233917236328, -0.05286407470703125, -0.04852581024169922, -0.04418754577636719, -0.039849281311035156, -0.035511016845703125, -0.031172752380371094, -0.026834487915039062, -0.02249622344970703, -0.018157958984375, -0.013819694519042969, -0.009481430053710938, -0.005143165588378906, -0.000804901123046875, 0.0035333633422851562, 0.007871627807617188, 0.012209892272949219, 0.01654815673828125, 0.02088642120361328, 0.025224685668945312, 0.029562950134277344, 0.033901214599609375, 0.038239479064941406, 0.04257774353027344, 0.04691600799560547, 0.0512542724609375, 0.05559253692626953, 0.05993080139160156, 0.0642690658569336, 0.06860733032226562, 0.07294559478759766, 0.07728385925292969, 0.08162212371826172, 0.08596038818359375, 0.09029865264892578, 0.09463691711425781, 0.09897518157958984, 0.10331344604492188, 0.1076517105102539, 0.11198997497558594, 0.11632823944091797, 0.12066650390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 8.0, 6.0, 13.0, 17.0, 15.0, 24.0, 27.0, 24.0, 48.0, 44.0, 53.0, 61.0, 69.0, 73.0, 71.0, 69.0, 63.0, 51.0, 51.0, 32.0, 40.0, 31.0, 30.0, 14.0, 20.0, 12.0, 11.0, 11.0, 7.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8308272957801819, -0.8008356690406799, -0.770844042301178, -0.740852415561676, -0.7108608484268188, -0.6808692216873169, -0.6508775949478149, -0.620885968208313, -0.590894341468811, -0.5609027147293091, -0.5309110879898071, -0.5009194612503052, -0.4709278643131256, -0.44093623757362366, -0.4109446406364441, -0.38095301389694214, -0.3509613871574402, -0.32096976041793823, -0.2909781336784363, -0.2609865367412567, -0.23099491000175476, -0.2010032832622528, -0.17101167142391205, -0.1410200595855713, -0.11102843284606934, -0.08103681355714798, -0.051045194268226624, -0.021053574979305267, 0.008938044309616089, 0.03892967104911804, 0.0689212828874588, 0.09891289472579956, 0.1289045810699463, 0.15889620780944824, 0.188887819647789, 0.21887943148612976, 0.2488710582256317, 0.27886268496513367, 0.30885428190231323, 0.3388459086418152, 0.36883753538131714, 0.3988291621208191, 0.42882078886032104, 0.4588123857975006, 0.48880401253700256, 0.5187956094741821, 0.5487872362136841, 0.578778862953186, 0.608770489692688, 0.6387621164321899, 0.6687537431716919, 0.6987453699111938, 0.7287369966506958, 0.7587286233901978, 0.7887201905250549, 0.8187118172645569, 0.8487034440040588, 0.8786950707435608, 0.9086866974830627, 0.9386783242225647, 0.9686698913574219, 0.9986615180969238, 1.0286531448364258, 1.0586447715759277, 1.0886363983154297]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 5.0, 7.0, 8.0, 13.0, 15.0, 11.0, 14.0, 21.0, 21.0, 30.0, 31.0, 35.0, 30.0, 42.0, 29.0, 30.0, 35.0, 40.0, 41.0, 49.0, 38.0, 50.0, 38.0, 34.0, 30.0, 28.0, 28.0, 31.0, 28.0, 23.0, 23.0, 24.0, 16.0, 17.0, 12.0, 12.0, 14.0, 6.0, 5.0, 7.0, 2.0, 6.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8224474191665649, -0.7953444719314575, -0.7682415246963501, -0.7411385774612427, -0.7140356302261353, -0.6869326829910278, -0.6598297953605652, -0.6327268481254578, -0.6056239008903503, -0.5785209536552429, -0.5514180064201355, -0.5243150591850281, -0.49721214175224304, -0.4701091945171356, -0.4430062770843506, -0.41590332984924316, -0.38880038261413574, -0.3616974353790283, -0.3345944881439209, -0.30749157071113586, -0.28038862347602844, -0.253285676240921, -0.2261827439069748, -0.19907981157302856, -0.17197686433792114, -0.14487391710281372, -0.11777098476886749, -0.09066804498434067, -0.06356510519981384, -0.03646215796470642, -0.009359225630760193, 0.017743706703186035, 0.04484671354293823, 0.07194965332746506, 0.09905259311199188, 0.1261555254459381, 0.15325847268104553, 0.18036141991615295, 0.20746435225009918, 0.2345672845840454, 0.26167023181915283, 0.28877317905426025, 0.3158761262893677, 0.3429790437221527, 0.37008199095726013, 0.39718493819236755, 0.4242878556251526, 0.45139080286026, 0.47849375009536743, 0.5055966973304749, 0.5326996445655823, 0.5598025918006897, 0.5869054794311523, 0.6140084266662598, 0.6411113739013672, 0.6682143211364746, 0.695317268371582, 0.7224202156066895, 0.7495231628417969, 0.7766261100769043, 0.8037290573120117, 0.8308320045471191, 0.8579348921775818, 0.8850378394126892, 0.9121407866477966]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 12.0, 5.0, 11.0, 18.0, 19.0, 30.0, 53.0, 71.0, 122.0, 199.0, 337.0, 821.0, 2073.0, 6638.0, 25211.0, 128680.0, 1186571.0, 2535768.0, 251543.0, 41604.0, 9815.0, 2810.0, 1014.0, 345.0, 196.0, 103.0, 74.0, 40.0, 29.0, 20.0, 22.0, 7.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.48291015625, -0.4711799621582031, -0.45944976806640625, -0.4477195739746094, -0.4359893798828125, -0.4242591857910156, -0.41252899169921875, -0.4007987976074219, -0.389068603515625, -0.3773384094238281, -0.36560821533203125, -0.3538780212402344, -0.3421478271484375, -0.3304176330566406, -0.31868743896484375, -0.3069572448730469, -0.29522705078125, -0.2834968566894531, -0.27176666259765625, -0.2600364685058594, -0.2483062744140625, -0.23657608032226562, -0.22484588623046875, -0.21311569213867188, -0.201385498046875, -0.18965530395507812, -0.17792510986328125, -0.16619491577148438, -0.1544647216796875, -0.14273452758789062, -0.13100433349609375, -0.11927413940429688, -0.1075439453125, -0.09581375122070312, -0.08408355712890625, -0.07235336303710938, -0.0606231689453125, -0.048892974853515625, -0.03716278076171875, -0.025432586669921875, -0.013702392578125, -0.001972198486328125, 0.00975799560546875, 0.021488189697265625, 0.0332183837890625, 0.044948577880859375, 0.05667877197265625, 0.06840896606445312, 0.08013916015625, 0.09186935424804688, 0.10359954833984375, 0.11532974243164062, 0.1270599365234375, 0.13879013061523438, 0.15052032470703125, 0.16225051879882812, 0.173980712890625, 0.18571090698242188, 0.19744110107421875, 0.20917129516601562, 0.2209014892578125, 0.23263168334960938, 0.24436187744140625, 0.2560920715332031, 0.267822265625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 1.0, 7.0, 3.0, 4.0, 8.0, 10.0, 8.0, 12.0, 13.0, 13.0, 17.0, 10.0, 20.0, 20.0, 30.0, 28.0, 24.0, 36.0, 33.0, 36.0, 40.0, 51.0, 50.0, 43.0, 46.0, 45.0, 28.0, 36.0, 36.0, 33.0, 27.0, 39.0, 18.0, 33.0, 25.0, 23.0, 14.0, 9.0, 12.0, 15.0, 9.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1292724609375, -0.12526702880859375, -0.1212615966796875, -0.11725616455078125, -0.113250732421875, -0.10924530029296875, -0.1052398681640625, -0.10123443603515625, -0.09722900390625, -0.09322357177734375, -0.0892181396484375, -0.08521270751953125, -0.081207275390625, -0.07720184326171875, -0.0731964111328125, -0.06919097900390625, -0.065185546875, -0.06118011474609375, -0.0571746826171875, -0.05316925048828125, -0.049163818359375, -0.04515838623046875, -0.0411529541015625, -0.03714752197265625, -0.03314208984375, -0.02913665771484375, -0.0251312255859375, -0.02112579345703125, -0.017120361328125, -0.01311492919921875, -0.0091094970703125, -0.00510406494140625, -0.0010986328125, 0.00290679931640625, 0.0069122314453125, 0.01091766357421875, 0.014923095703125, 0.01892852783203125, 0.0229339599609375, 0.02693939208984375, 0.03094482421875, 0.03495025634765625, 0.0389556884765625, 0.04296112060546875, 0.046966552734375, 0.05097198486328125, 0.0549774169921875, 0.05898284912109375, 0.06298828125, 0.06699371337890625, 0.0709991455078125, 0.07500457763671875, 0.079010009765625, 0.08301544189453125, 0.0870208740234375, 0.09102630615234375, 0.09503173828125, 0.09903717041015625, 0.1030426025390625, 0.10704803466796875, 0.111053466796875, 0.11505889892578125, 0.1190643310546875, 0.12306976318359375, 0.1270751953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 8.0, 12.0, 21.0, 18.0, 41.0, 49.0, 62.0, 104.0, 166.0, 215.0, 425.0, 784.0, 1569.0, 3431.0, 8146.0, 22223.0, 71210.0, 257656.0, 1083535.0, 2012095.0, 532972.0, 136185.0, 39783.0, 13461.0, 5250.0, 2302.0, 1069.0, 561.0, 340.0, 219.0, 122.0, 75.0, 49.0, 36.0, 16.0, 15.0, 25.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.331787109375, -0.3218116760253906, -0.31183624267578125, -0.3018608093261719, -0.2918853759765625, -0.2819099426269531, -0.27193450927734375, -0.2619590759277344, -0.251983642578125, -0.24200820922851562, -0.23203277587890625, -0.22205734252929688, -0.2120819091796875, -0.20210647583007812, -0.19213104248046875, -0.18215560913085938, -0.17218017578125, -0.16220474243164062, -0.15222930908203125, -0.14225387573242188, -0.1322784423828125, -0.12230300903320312, -0.11232757568359375, -0.10235214233398438, -0.092376708984375, -0.08240127563476562, -0.07242584228515625, -0.062450408935546875, -0.0524749755859375, -0.042499542236328125, -0.03252410888671875, -0.022548675537109375, -0.0125732421875, -0.002597808837890625, 0.00737762451171875, 0.017353057861328125, 0.0273284912109375, 0.037303924560546875, 0.04727935791015625, 0.057254791259765625, 0.067230224609375, 0.07720565795898438, 0.08718109130859375, 0.09715652465820312, 0.1071319580078125, 0.11710739135742188, 0.12708282470703125, 0.13705825805664062, 0.14703369140625, 0.15700912475585938, 0.16698455810546875, 0.17695999145507812, 0.1869354248046875, 0.19691085815429688, 0.20688629150390625, 0.21686172485351562, 0.226837158203125, 0.23681259155273438, 0.24678802490234375, 0.2567634582519531, 0.2667388916015625, 0.2767143249511719, 0.28668975830078125, 0.2966651916503906, 0.306640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 9.0, 7.0, 14.0, 12.0, 14.0, 15.0, 44.0, 57.0, 68.0, 112.0, 130.0, 200.0, 281.0, 422.0, 605.0, 654.0, 435.0, 323.0, 230.0, 142.0, 97.0, 62.0, 42.0, 27.0, 24.0, 13.0, 11.0, 7.0, 7.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.299072265625, -0.2902984619140625, -0.281524658203125, -0.2727508544921875, -0.26397705078125, -0.2552032470703125, -0.246429443359375, -0.2376556396484375, -0.2288818359375, -0.2201080322265625, -0.211334228515625, -0.2025604248046875, -0.19378662109375, -0.1850128173828125, -0.176239013671875, -0.1674652099609375, -0.15869140625, -0.1499176025390625, -0.141143798828125, -0.1323699951171875, -0.12359619140625, -0.1148223876953125, -0.106048583984375, -0.0972747802734375, -0.0885009765625, -0.0797271728515625, -0.070953369140625, -0.0621795654296875, -0.05340576171875, -0.0446319580078125, -0.035858154296875, -0.0270843505859375, -0.018310546875, -0.0095367431640625, -0.000762939453125, 0.0080108642578125, 0.01678466796875, 0.0255584716796875, 0.034332275390625, 0.0431060791015625, 0.0518798828125, 0.0606536865234375, 0.069427490234375, 0.0782012939453125, 0.08697509765625, 0.0957489013671875, 0.104522705078125, 0.1132965087890625, 0.1220703125, 0.1308441162109375, 0.139617919921875, 0.1483917236328125, 0.15716552734375, 0.1659393310546875, 0.174713134765625, 0.1834869384765625, 0.1922607421875, 0.2010345458984375, 0.209808349609375, 0.2185821533203125, 0.22735595703125, 0.2361297607421875, 0.244903564453125, 0.2536773681640625, 0.262451171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 6.0, 17.0, 22.0, 22.0, 28.0, 42.0, 57.0, 57.0, 66.0, 69.0, 85.0, 80.0, 76.0, 59.0, 74.0, 46.0, 45.0, 34.0, 37.0, 29.0, 12.0, 13.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3001172542572021, -1.2667630910873413, -1.2334089279174805, -1.2000547647476196, -1.1667006015777588, -1.133346438407898, -1.099992275238037, -1.0666382312774658, -1.0332839488983154, -0.9999297857284546, -0.9665756225585938, -0.9332214593887329, -0.8998672962188721, -0.8665131330490112, -0.8331590294837952, -0.7998048663139343, -0.7664507627487183, -0.7330965995788574, -0.6997424364089966, -0.6663882732391357, -0.6330341100692749, -0.5996799468994141, -0.566325843334198, -0.5329716801643372, -0.4996175169944763, -0.4662633538246155, -0.43290919065475464, -0.3995550572872162, -0.36620089411735535, -0.3328467309474945, -0.29949259757995605, -0.2661384344100952, -0.2327842116355896, -0.19943004846572876, -0.1660759001970291, -0.13272175192832947, -0.09936758875846863, -0.06601342558860779, -0.03265927731990814, 0.0006948709487915039, 0.034049034118652344, 0.06740318983793259, 0.10075734555721283, 0.13411149382591248, 0.16746565699577332, 0.20081982016563416, 0.2341739684343338, 0.26752811670303345, 0.3008822798728943, 0.3342364430427551, 0.36759060621261597, 0.4009447395801544, 0.43429890275001526, 0.4676530659198761, 0.5010071992874146, 0.5343613624572754, 0.5677155256271362, 0.6010696887969971, 0.6344238519668579, 0.6677780151367188, 0.7011321783065796, 0.7344863414764404, 0.7678404450416565, 0.8011946082115173, 0.8345487713813782]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 2.0, 8.0, 5.0, 7.0, 5.0, 12.0, 12.0, 5.0, 25.0, 17.0, 18.0, 29.0, 33.0, 27.0, 28.0, 28.0, 28.0, 31.0, 47.0, 36.0, 30.0, 39.0, 37.0, 38.0, 41.0, 36.0, 41.0, 28.0, 44.0, 21.0, 28.0, 28.0, 29.0, 18.0, 14.0, 15.0, 19.0, 22.0, 11.0, 10.0, 11.0, 6.0, 9.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5925029516220093, -0.5726257562637329, -0.5527485609054565, -0.5328713655471802, -0.512994110584259, -0.49311691522598267, -0.4732397198677063, -0.45336252450942993, -0.43348532915115356, -0.4136081337928772, -0.39373090863227844, -0.3738537132740021, -0.3539765179157257, -0.33409929275512695, -0.3142220973968506, -0.2943449020385742, -0.27446767687797546, -0.2545904815196991, -0.23471327126026154, -0.21483606100082397, -0.1949588656425476, -0.17508165538311005, -0.15520444512367249, -0.13532724976539612, -0.11545003950595856, -0.09557283669710159, -0.07569563388824463, -0.05581842362880707, -0.035941220819950104, -0.01606401801109314, 0.0038131922483444214, 0.02369038760662079, 0.04356759786605835, 0.06344480067491531, 0.08332200348377228, 0.10319921374320984, 0.1230764165520668, 0.14295361936092377, 0.16283082962036133, 0.1827080249786377, 0.20258523523807526, 0.22246244549751282, 0.24233964085578918, 0.26221686601638794, 0.2820940613746643, 0.3019712567329407, 0.32184845209121704, 0.3417256474494934, 0.36160287261009216, 0.38148006796836853, 0.4013572931289673, 0.42123448848724365, 0.44111168384552, 0.4609888792037964, 0.48086610436439514, 0.5007432699203491, 0.5206205248832703, 0.5404977202415466, 0.560374915599823, 0.5802521705627441, 0.6001293659210205, 0.6200065612792969, 0.6398837566375732, 0.6597609519958496, 0.679638147354126]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 10.0, 7.0, 14.0, 25.0, 42.0, 69.0, 120.0, 169.0, 299.0, 491.0, 827.0, 1430.0, 2322.0, 3779.0, 5709.0, 9240.0, 14391.0, 22810.0, 37097.0, 63884.0, 120000.0, 219574.0, 234024.0, 133905.0, 70849.0, 40334.0, 24764.0, 15692.0, 9821.0, 6432.0, 3995.0, 2488.0, 1559.0, 975.0, 564.0, 343.0, 184.0, 106.0, 77.0, 43.0, 34.0, 17.0, 12.0, 13.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.209716796875, -0.20318031311035156, -0.19664382934570312, -0.1901073455810547, -0.18357086181640625, -0.1770343780517578, -0.17049789428710938, -0.16396141052246094, -0.1574249267578125, -0.15088844299316406, -0.14435195922851562, -0.1378154754638672, -0.13127899169921875, -0.12474250793457031, -0.11820602416992188, -0.11166954040527344, -0.105133056640625, -0.09859657287597656, -0.09206008911132812, -0.08552360534667969, -0.07898712158203125, -0.07245063781738281, -0.06591415405273438, -0.05937767028808594, -0.0528411865234375, -0.04630470275878906, -0.039768218994140625, -0.03323173522949219, -0.02669525146484375, -0.020158767700195312, -0.013622283935546875, -0.0070858001708984375, -0.00054931640625, 0.0059871673583984375, 0.012523651123046875, 0.019060134887695312, 0.02559661865234375, 0.03213310241699219, 0.038669586181640625, 0.04520606994628906, 0.0517425537109375, 0.05827903747558594, 0.06481552124023438, 0.07135200500488281, 0.07788848876953125, 0.08442497253417969, 0.09096145629882812, 0.09749794006347656, 0.104034423828125, 0.11057090759277344, 0.11710739135742188, 0.12364387512207031, 0.13018035888671875, 0.1367168426513672, 0.14325332641601562, 0.14978981018066406, 0.1563262939453125, 0.16286277770996094, 0.16939926147460938, 0.1759357452392578, 0.18247222900390625, 0.1890087127685547, 0.19554519653320312, 0.20208168029785156, 0.2086181640625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 8.0, 5.0, 11.0, 8.0, 13.0, 13.0, 15.0, 18.0, 15.0, 32.0, 17.0, 25.0, 23.0, 29.0, 36.0, 29.0, 43.0, 43.0, 37.0, 46.0, 48.0, 53.0, 38.0, 31.0, 49.0, 27.0, 41.0, 26.0, 30.0, 28.0, 33.0, 24.0, 14.0, 12.0, 12.0, 18.0, 8.0, 13.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.149169921875, -0.14483261108398438, -0.14049530029296875, -0.13615798950195312, -0.1318206787109375, -0.12748336791992188, -0.12314605712890625, -0.11880874633789062, -0.114471435546875, -0.11013412475585938, -0.10579681396484375, -0.10145950317382812, -0.0971221923828125, -0.09278488159179688, -0.08844757080078125, -0.08411026000976562, -0.07977294921875, -0.07543563842773438, -0.07109832763671875, -0.06676101684570312, -0.0624237060546875, -0.058086395263671875, -0.05374908447265625, -0.049411773681640625, -0.045074462890625, -0.040737152099609375, -0.03639984130859375, -0.032062530517578125, -0.0277252197265625, -0.023387908935546875, -0.01905059814453125, -0.014713287353515625, -0.0103759765625, -0.006038665771484375, -0.00170135498046875, 0.002635955810546875, 0.0069732666015625, 0.011310577392578125, 0.01564788818359375, 0.019985198974609375, 0.024322509765625, 0.028659820556640625, 0.03299713134765625, 0.037334442138671875, 0.0416717529296875, 0.046009063720703125, 0.05034637451171875, 0.054683685302734375, 0.05902099609375, 0.06335830688476562, 0.06769561767578125, 0.07203292846679688, 0.0763702392578125, 0.08070755004882812, 0.08504486083984375, 0.08938217163085938, 0.093719482421875, 0.09805679321289062, 0.10239410400390625, 0.10673141479492188, 0.1110687255859375, 0.11540603637695312, 0.11974334716796875, 0.12408065795898438, 0.12841796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 16.0, 10.0, 16.0, 20.0, 17.0, 37.0, 30.0, 44.0, 55.0, 82.0, 135.0, 172.0, 302.0, 559.0, 1146.0, 2731.0, 6849.0, 17915.0, 47704.0, 159104.0, 519493.0, 200673.0, 56664.0, 20649.0, 7998.0, 3195.0, 1377.0, 603.0, 334.0, 153.0, 115.0, 98.0, 55.0, 45.0, 33.0, 21.0, 28.0, 15.0, 13.0, 10.0, 16.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45654296875, -0.44161224365234375, -0.4266815185546875, -0.41175079345703125, -0.396820068359375, -0.38188934326171875, -0.3669586181640625, -0.35202789306640625, -0.33709716796875, -0.32216644287109375, -0.3072357177734375, -0.29230499267578125, -0.277374267578125, -0.26244354248046875, -0.2475128173828125, -0.23258209228515625, -0.2176513671875, -0.20272064208984375, -0.1877899169921875, -0.17285919189453125, -0.157928466796875, -0.14299774169921875, -0.1280670166015625, -0.11313629150390625, -0.09820556640625, -0.08327484130859375, -0.0683441162109375, -0.05341339111328125, -0.038482666015625, -0.02355194091796875, -0.0086212158203125, 0.00630950927734375, 0.021240234375, 0.03617095947265625, 0.0511016845703125, 0.06603240966796875, 0.080963134765625, 0.09589385986328125, 0.1108245849609375, 0.12575531005859375, 0.14068603515625, 0.15561676025390625, 0.1705474853515625, 0.18547821044921875, 0.200408935546875, 0.21533966064453125, 0.2302703857421875, 0.24520111083984375, 0.2601318359375, 0.27506256103515625, 0.2899932861328125, 0.30492401123046875, 0.319854736328125, 0.33478546142578125, 0.3497161865234375, 0.36464691162109375, 0.37957763671875, 0.39450836181640625, 0.4094390869140625, 0.42436981201171875, 0.439300537109375, 0.45423126220703125, 0.4691619873046875, 0.48409271240234375, 0.4990234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 6.0, 8.0, 10.0, 12.0, 20.0, 20.0, 20.0, 33.0, 41.0, 46.0, 66.0, 69.0, 67.0, 64.0, 64.0, 60.0, 73.0, 61.0, 54.0, 37.0, 34.0, 30.0, 25.0, 18.0, 16.0, 9.0, 15.0, 6.0, 6.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.74755859375, -0.7274169921875, -0.707275390625, -0.6871337890625, -0.6669921875, -0.6468505859375, -0.626708984375, -0.6065673828125, -0.58642578125, -0.5662841796875, -0.546142578125, -0.5260009765625, -0.505859375, -0.4857177734375, -0.465576171875, -0.4454345703125, -0.42529296875, -0.4051513671875, -0.385009765625, -0.3648681640625, -0.3447265625, -0.3245849609375, -0.304443359375, -0.2843017578125, -0.26416015625, -0.2440185546875, -0.223876953125, -0.2037353515625, -0.18359375, -0.1634521484375, -0.143310546875, -0.1231689453125, -0.10302734375, -0.0828857421875, -0.062744140625, -0.0426025390625, -0.0224609375, -0.0023193359375, 0.017822265625, 0.0379638671875, 0.05810546875, 0.0782470703125, 0.098388671875, 0.1185302734375, 0.138671875, 0.1588134765625, 0.178955078125, 0.1990966796875, 0.21923828125, 0.2393798828125, 0.259521484375, 0.2796630859375, 0.2998046875, 0.3199462890625, 0.340087890625, 0.3602294921875, 0.38037109375, 0.4005126953125, 0.420654296875, 0.4407958984375, 0.4609375, 0.4810791015625, 0.501220703125, 0.5213623046875, 0.54150390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 12.0, 13.0, 25.0, 45.0, 53.0, 75.0, 171.0, 294.0, 678.0, 1441.0, 3303.0, 7413.0, 17737.0, 50561.0, 337079.0, 524063.0, 67592.0, 21835.0, 8778.0, 3882.0, 1747.0, 827.0, 376.0, 226.0, 119.0, 62.0, 38.0, 27.0, 19.0, 14.0, 10.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34375, -0.33367156982421875, -0.3235931396484375, -0.31351470947265625, -0.303436279296875, -0.29335784912109375, -0.2832794189453125, -0.27320098876953125, -0.26312255859375, -0.25304412841796875, -0.2429656982421875, -0.23288726806640625, -0.222808837890625, -0.21273040771484375, -0.2026519775390625, -0.19257354736328125, -0.1824951171875, -0.17241668701171875, -0.1623382568359375, -0.15225982666015625, -0.142181396484375, -0.13210296630859375, -0.1220245361328125, -0.11194610595703125, -0.10186767578125, -0.09178924560546875, -0.0817108154296875, -0.07163238525390625, -0.061553955078125, -0.05147552490234375, -0.0413970947265625, -0.03131866455078125, -0.021240234375, -0.01116180419921875, -0.0010833740234375, 0.00899505615234375, 0.019073486328125, 0.02915191650390625, 0.0392303466796875, 0.04930877685546875, 0.05938720703125, 0.06946563720703125, 0.0795440673828125, 0.08962249755859375, 0.099700927734375, 0.10977935791015625, 0.1198577880859375, 0.12993621826171875, 0.1400146484375, 0.15009307861328125, 0.1601715087890625, 0.17024993896484375, 0.180328369140625, 0.19040679931640625, 0.2004852294921875, 0.21056365966796875, 0.22064208984375, 0.23072052001953125, 0.2407989501953125, 0.25087738037109375, 0.260955810546875, 0.27103424072265625, 0.2811126708984375, 0.29119110107421875, 0.30126953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 1.0, 7.0, 4.0, 3.0, 6.0, 7.0, 10.0, 11.0, 12.0, 13.0, 22.0, 35.0, 52.0, 79.0, 101.0, 137.0, 125.0, 109.0, 71.0, 44.0, 35.0, 22.0, 13.0, 16.0, 2.0, 9.0, 8.0, 9.0, 8.0, 6.0, 3.0, 1.0, 5.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.464387893676758e-05, -4.336237907409668e-05, -4.208087921142578e-05, -4.079937934875488e-05, -3.9517879486083984e-05, -3.8236379623413086e-05, -3.695487976074219e-05, -3.567337989807129e-05, -3.439188003540039e-05, -3.311038017272949e-05, -3.1828880310058594e-05, -3.0547380447387695e-05, -2.9265880584716797e-05, -2.79843807220459e-05, -2.6702880859375e-05, -2.54213809967041e-05, -2.4139881134033203e-05, -2.2858381271362305e-05, -2.1576881408691406e-05, -2.0295381546020508e-05, -1.901388168334961e-05, -1.773238182067871e-05, -1.6450881958007812e-05, -1.5169382095336914e-05, -1.3887882232666016e-05, -1.2606382369995117e-05, -1.1324882507324219e-05, -1.004338264465332e-05, -8.761882781982422e-06, -7.4803829193115234e-06, -6.198883056640625e-06, -4.9173831939697266e-06, -3.635883331298828e-06, -2.3543834686279297e-06, -1.0728836059570312e-06, 2.086162567138672e-07, 1.4901161193847656e-06, 2.771615982055664e-06, 4.0531158447265625e-06, 5.334615707397461e-06, 6.616115570068359e-06, 7.897615432739258e-06, 9.179115295410156e-06, 1.0460615158081055e-05, 1.1742115020751953e-05, 1.3023614883422852e-05, 1.430511474609375e-05, 1.558661460876465e-05, 1.6868114471435547e-05, 1.8149614334106445e-05, 1.9431114196777344e-05, 2.0712614059448242e-05, 2.199411392211914e-05, 2.327561378479004e-05, 2.4557113647460938e-05, 2.5838613510131836e-05, 2.7120113372802734e-05, 2.8401613235473633e-05, 2.968311309814453e-05, 3.096461296081543e-05, 3.224611282348633e-05, 3.3527612686157227e-05, 3.4809112548828125e-05, 3.6090612411499023e-05, 3.737211227416992e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 7.0, 11.0, 15.0, 9.0, 21.0, 28.0, 38.0, 61.0, 91.0, 158.0, 323.0, 620.0, 1568.0, 3919.0, 10656.0, 30482.0, 119600.0, 618824.0, 198519.0, 40988.0, 13920.0, 4979.0, 1985.0, 843.0, 363.0, 167.0, 127.0, 78.0, 50.0, 37.0, 16.0, 11.0, 12.0, 3.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.259521484375, -0.250762939453125, -0.24200439453125, -0.233245849609375, -0.2244873046875, -0.215728759765625, -0.20697021484375, -0.198211669921875, -0.189453125, -0.180694580078125, -0.17193603515625, -0.163177490234375, -0.1544189453125, -0.145660400390625, -0.13690185546875, -0.128143310546875, -0.119384765625, -0.110626220703125, -0.10186767578125, -0.093109130859375, -0.0843505859375, -0.075592041015625, -0.06683349609375, -0.058074951171875, -0.04931640625, -0.040557861328125, -0.03179931640625, -0.023040771484375, -0.0142822265625, -0.005523681640625, 0.00323486328125, 0.011993408203125, 0.020751953125, 0.029510498046875, 0.03826904296875, 0.047027587890625, 0.0557861328125, 0.064544677734375, 0.07330322265625, 0.082061767578125, 0.0908203125, 0.099578857421875, 0.10833740234375, 0.117095947265625, 0.1258544921875, 0.134613037109375, 0.14337158203125, 0.152130126953125, 0.160888671875, 0.169647216796875, 0.17840576171875, 0.187164306640625, 0.1959228515625, 0.204681396484375, 0.21343994140625, 0.222198486328125, 0.23095703125, 0.239715576171875, 0.24847412109375, 0.257232666015625, 0.2659912109375, 0.274749755859375, 0.28350830078125, 0.292266845703125, 0.301025390625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 3.0, 4.0, 6.0, 8.0, 10.0, 15.0, 15.0, 19.0, 41.0, 53.0, 82.0, 138.0, 168.0, 126.0, 105.0, 50.0, 39.0, 33.0, 19.0, 15.0, 9.0, 7.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1971435546875, -0.18942832946777344, -0.18171310424804688, -0.1739978790283203, -0.16628265380859375, -0.1585674285888672, -0.15085220336914062, -0.14313697814941406, -0.1354217529296875, -0.12770652770996094, -0.11999130249023438, -0.11227607727050781, -0.10456085205078125, -0.09684562683105469, -0.08913040161132812, -0.08141517639160156, -0.073699951171875, -0.06598472595214844, -0.058269500732421875, -0.05055427551269531, -0.04283905029296875, -0.03512382507324219, -0.027408599853515625, -0.019693374633789062, -0.0119781494140625, -0.0042629241943359375, 0.003452301025390625, 0.011167526245117188, 0.01888275146484375, 0.026597976684570312, 0.034313201904296875, 0.04202842712402344, 0.04974365234375, 0.05745887756347656, 0.06517410278320312, 0.07288932800292969, 0.08060455322265625, 0.08831977844238281, 0.09603500366210938, 0.10375022888183594, 0.1114654541015625, 0.11918067932128906, 0.12689590454101562, 0.1346111297607422, 0.14232635498046875, 0.1500415802001953, 0.15775680541992188, 0.16547203063964844, 0.173187255859375, 0.18090248107910156, 0.18861770629882812, 0.1963329315185547, 0.20404815673828125, 0.2117633819580078, 0.21947860717773438, 0.22719383239746094, 0.2349090576171875, 0.24262428283691406, 0.2503395080566406, 0.2580547332763672, 0.26576995849609375, 0.2734851837158203, 0.2812004089355469, 0.28891563415527344, 0.296630859375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 4.0, 7.0, 15.0, 35.0, 37.0, 62.0, 81.0, 95.0, 95.0, 108.0, 97.0, 124.0, 77.0, 53.0, 45.0, 25.0, 13.0, 13.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.670444369316101, -1.6092681884765625, -1.548092007637024, -1.4869158267974854, -1.4257397651672363, -1.3645634651184082, -1.3033874034881592, -1.2422112226486206, -1.181035041809082, -1.1198588609695435, -1.0586826801300049, -0.9975065588951111, -0.9363303780555725, -0.8751541972160339, -0.8139780759811401, -0.7528018951416016, -0.691625714302063, -0.6304495334625244, -0.5692733526229858, -0.508097231388092, -0.44692105054855347, -0.3857448697090149, -0.3245687186717987, -0.2633925676345825, -0.20221638679504395, -0.14104022085666656, -0.07986405491828918, -0.018687888979911804, 0.042488276958465576, 0.10366445779800415, 0.16484060883522034, 0.22601675987243652, 0.28719305992126465, 0.3483692407608032, 0.4095453917980194, 0.4707215428352356, 0.5318977236747742, 0.5930739045143127, 0.6542500257492065, 0.7154262065887451, 0.7766023874282837, 0.8377785682678223, 0.8989547491073608, 0.9601308703422546, 1.0213069915771484, 1.0824832916259766, 1.1436593532562256, 1.2048355340957642, 1.2660117149353027, 1.3271878957748413, 1.3883640766143799, 1.4495402574539185, 1.510716438293457, 1.571892499923706, 1.6330686807632446, 1.6942448616027832, 1.7554210424423218, 1.8165972232818604, 1.877773404121399, 1.9389495849609375, 2.0001256465911865, 2.0613019466400146, 2.1224780082702637, 2.183654308319092, 2.244830369949341]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 8.0, 7.0, 7.0, 12.0, 8.0, 17.0, 19.0, 25.0, 24.0, 25.0, 28.0, 26.0, 43.0, 31.0, 44.0, 37.0, 32.0, 38.0, 37.0, 48.0, 46.0, 35.0, 37.0, 36.0, 42.0, 33.0, 38.0, 21.0, 16.0, 25.0, 27.0, 19.0, 11.0, 20.0, 10.0, 12.0, 14.0, 4.0, 10.0, 8.0, 4.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1940932273864746, -1.158704161643982, -1.1233150959014893, -1.0879260301589966, -1.052536964416504, -1.0171478986740112, -0.9817587733268738, -0.9463697075843811, -0.9109806418418884, -0.8755915760993958, -0.8402025103569031, -0.8048134446144104, -0.769424319267273, -0.7340352535247803, -0.6986461877822876, -0.6632571220397949, -0.6278680562973022, -0.5924789905548096, -0.5570899248123169, -0.5217008590698242, -0.48631176352500916, -0.4509226977825165, -0.4155336022377014, -0.38014453649520874, -0.34475547075271606, -0.3093664050102234, -0.2739773392677307, -0.23858824372291565, -0.20319917798042297, -0.1678101122379303, -0.13242103159427643, -0.09703195095062256, -0.061643004417419434, -0.02625393122434616, 0.009135141968727112, 0.044524215161800385, 0.07991328835487366, 0.11530235409736633, 0.1506914347410202, 0.18608051538467407, 0.22146958112716675, 0.2568586468696594, 0.2922477126121521, 0.32763680815696716, 0.36302587389945984, 0.3984149396419525, 0.4338040351867676, 0.46919310092926025, 0.5045821666717529, 0.5399712324142456, 0.5753602981567383, 0.610749363899231, 0.6461384296417236, 0.6815274953842163, 0.7169166207313538, 0.7523056864738464, 0.7876947522163391, 0.8230838179588318, 0.8584728837013245, 0.8938619494438171, 0.9292510747909546, 0.9646401405334473, 1.00002920627594, 1.0354182720184326, 1.0708073377609253]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 9.0, 17.0, 22.0, 37.0, 41.0, 75.0, 126.0, 199.0, 355.0, 573.0, 1051.0, 1873.0, 3558.0, 6933.0, 13668.0, 29102.0, 63329.0, 147165.0, 379257.0, 1245951.0, 1542764.0, 450125.0, 170834.0, 72489.0, 32850.0, 15658.0, 7738.0, 3832.0, 2072.0, 1073.0, 623.0, 338.0, 196.0, 106.0, 94.0, 57.0, 35.0, 22.0, 12.0, 10.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2113037109375, -0.20528030395507812, -0.19925689697265625, -0.19323348999023438, -0.1872100830078125, -0.18118667602539062, -0.17516326904296875, -0.16913986206054688, -0.163116455078125, -0.15709304809570312, -0.15106964111328125, -0.14504623413085938, -0.1390228271484375, -0.13299942016601562, -0.12697601318359375, -0.12095260620117188, -0.11492919921875, -0.10890579223632812, -0.10288238525390625, -0.09685897827148438, -0.0908355712890625, -0.08481216430664062, -0.07878875732421875, -0.07276535034179688, -0.066741943359375, -0.060718536376953125, -0.05469512939453125, -0.048671722412109375, -0.0426483154296875, -0.036624908447265625, -0.03060150146484375, -0.024578094482421875, -0.0185546875, -0.012531280517578125, -0.00650787353515625, -0.000484466552734375, 0.0055389404296875, 0.011562347412109375, 0.01758575439453125, 0.023609161376953125, 0.029632568359375, 0.035655975341796875, 0.04167938232421875, 0.047702789306640625, 0.0537261962890625, 0.059749603271484375, 0.06577301025390625, 0.07179641723632812, 0.07781982421875, 0.08384323120117188, 0.08986663818359375, 0.09589004516601562, 0.1019134521484375, 0.10793685913085938, 0.11396026611328125, 0.11998367309570312, 0.126007080078125, 0.13203048706054688, 0.13805389404296875, 0.14407730102539062, 0.1501007080078125, 0.15612411499023438, 0.16214752197265625, 0.16817092895507812, 0.1741943359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 8.0, 3.0, 8.0, 10.0, 6.0, 7.0, 17.0, 16.0, 18.0, 18.0, 23.0, 26.0, 26.0, 29.0, 30.0, 38.0, 44.0, 42.0, 38.0, 49.0, 56.0, 46.0, 50.0, 55.0, 32.0, 43.0, 31.0, 33.0, 29.0, 28.0, 27.0, 23.0, 14.0, 15.0, 15.0, 13.0, 8.0, 9.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.171630859375, -0.16605377197265625, -0.1604766845703125, -0.15489959716796875, -0.149322509765625, -0.14374542236328125, -0.1381683349609375, -0.13259124755859375, -0.12701416015625, -0.12143707275390625, -0.1158599853515625, -0.11028289794921875, -0.104705810546875, -0.09912872314453125, -0.0935516357421875, -0.08797454833984375, -0.0823974609375, -0.07682037353515625, -0.0712432861328125, -0.06566619873046875, -0.060089111328125, -0.05451202392578125, -0.0489349365234375, -0.04335784912109375, -0.03778076171875, -0.03220367431640625, -0.0266265869140625, -0.02104949951171875, -0.015472412109375, -0.00989532470703125, -0.0043182373046875, 0.00125885009765625, 0.0068359375, 0.01241302490234375, 0.0179901123046875, 0.02356719970703125, 0.029144287109375, 0.03472137451171875, 0.0402984619140625, 0.04587554931640625, 0.05145263671875, 0.05702972412109375, 0.0626068115234375, 0.06818389892578125, 0.073760986328125, 0.07933807373046875, 0.0849151611328125, 0.09049224853515625, 0.0960693359375, 0.10164642333984375, 0.1072235107421875, 0.11280059814453125, 0.118377685546875, 0.12395477294921875, 0.1295318603515625, 0.13510894775390625, 0.14068603515625, 0.14626312255859375, 0.1518402099609375, 0.15741729736328125, 0.162994384765625, 0.16857147216796875, 0.1741485595703125, 0.17972564697265625, 0.185302734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 7.0, 9.0, 18.0, 17.0, 27.0, 46.0, 49.0, 68.0, 98.0, 142.0, 181.0, 286.0, 457.0, 804.0, 1573.0, 3158.0, 7431.0, 19474.0, 57065.0, 185844.0, 718559.0, 2143822.0, 763113.0, 197014.0, 59579.0, 20385.0, 7880.0, 3275.0, 1529.0, 849.0, 504.0, 284.0, 220.0, 125.0, 118.0, 69.0, 44.0, 32.0, 22.0, 26.0, 17.0, 14.0, 4.0, 10.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.36962890625, -0.35790252685546875, -0.3461761474609375, -0.33444976806640625, -0.322723388671875, -0.31099700927734375, -0.2992706298828125, -0.28754425048828125, -0.27581787109375, -0.26409149169921875, -0.2523651123046875, -0.24063873291015625, -0.228912353515625, -0.21718597412109375, -0.2054595947265625, -0.19373321533203125, -0.1820068359375, -0.17028045654296875, -0.1585540771484375, -0.14682769775390625, -0.135101318359375, -0.12337493896484375, -0.1116485595703125, -0.09992218017578125, -0.08819580078125, -0.07646942138671875, -0.0647430419921875, -0.05301666259765625, -0.041290283203125, -0.02956390380859375, -0.0178375244140625, -0.00611114501953125, 0.005615234375, 0.01734161376953125, 0.0290679931640625, 0.04079437255859375, 0.052520751953125, 0.06424713134765625, 0.0759735107421875, 0.08769989013671875, 0.09942626953125, 0.11115264892578125, 0.1228790283203125, 0.13460540771484375, 0.146331787109375, 0.15805816650390625, 0.1697845458984375, 0.18151092529296875, 0.1932373046875, 0.20496368408203125, 0.2166900634765625, 0.22841644287109375, 0.240142822265625, 0.25186920166015625, 0.2635955810546875, 0.27532196044921875, 0.28704833984375, 0.29877471923828125, 0.3105010986328125, 0.32222747802734375, 0.333953857421875, 0.34568023681640625, 0.3574066162109375, 0.36913299560546875, 0.380859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 13.0, 23.0, 23.0, 46.0, 65.0, 84.0, 140.0, 207.0, 376.0, 557.0, 738.0, 597.0, 426.0, 270.0, 155.0, 120.0, 72.0, 57.0, 22.0, 24.0, 18.0, 11.0, 5.0, 5.0, 1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.312744140625, -0.3010520935058594, -0.28936004638671875, -0.2776679992675781, -0.2659759521484375, -0.2542839050292969, -0.24259185791015625, -0.23089981079101562, -0.219207763671875, -0.20751571655273438, -0.19582366943359375, -0.18413162231445312, -0.1724395751953125, -0.16074752807617188, -0.14905548095703125, -0.13736343383789062, -0.12567138671875, -0.11397933959960938, -0.10228729248046875, -0.09059524536132812, -0.0789031982421875, -0.06721115112304688, -0.05551910400390625, -0.043827056884765625, -0.032135009765625, -0.020442962646484375, -0.00875091552734375, 0.002941131591796875, 0.0146331787109375, 0.026325225830078125, 0.03801727294921875, 0.049709320068359375, 0.0614013671875, 0.07309341430664062, 0.08478546142578125, 0.09647750854492188, 0.1081695556640625, 0.11986160278320312, 0.13155364990234375, 0.14324569702148438, 0.154937744140625, 0.16662979125976562, 0.17832183837890625, 0.19001388549804688, 0.2017059326171875, 0.21339797973632812, 0.22509002685546875, 0.23678207397460938, 0.24847412109375, 0.2601661682128906, 0.27185821533203125, 0.2835502624511719, 0.2952423095703125, 0.3069343566894531, 0.31862640380859375, 0.3303184509277344, 0.342010498046875, 0.3537025451660156, 0.36539459228515625, 0.3770866394042969, 0.3887786865234375, 0.4004707336425781, 0.41216278076171875, 0.4238548278808594, 0.435546875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 6.0, 6.0, 5.0, 11.0, 16.0, 23.0, 36.0, 38.0, 58.0, 64.0, 74.0, 80.0, 80.0, 79.0, 89.0, 78.0, 61.0, 48.0, 39.0, 30.0, 25.0, 13.0, 16.0, 10.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1421663761138916, -1.1003005504608154, -1.0584347248077393, -1.016568899154663, -0.9747030735015869, -0.9328372478485107, -0.8909713625907898, -0.8491055369377136, -0.8072397112846375, -0.7653738856315613, -0.7235080599784851, -0.6816421747207642, -0.639776349067688, -0.5979105234146118, -0.5560446977615356, -0.5141788721084595, -0.4723130464553833, -0.43044722080230713, -0.38858139514923096, -0.3467155396938324, -0.3048497140407562, -0.26298388838768005, -0.2211180329322815, -0.17925220727920532, -0.13738638162612915, -0.09552054852247238, -0.05365471541881561, -0.011788874864578247, 0.030076950788497925, 0.0719427764415741, 0.11380863189697266, 0.15567445755004883, 0.19754040241241455, 0.23940622806549072, 0.2812720537185669, 0.32313790917396545, 0.3650037348270416, 0.4068695604801178, 0.44873541593551636, 0.49060124158859253, 0.5324670672416687, 0.5743328928947449, 0.616198718547821, 0.658064603805542, 0.6999304294586182, 0.7417962551116943, 0.7836620807647705, 0.8255279064178467, 0.8673937320709229, 0.909259557723999, 0.9511253833770752, 0.9929912090301514, 1.0348570346832275, 1.0767228603363037, 1.1185886859893799, 1.160454511642456, 1.2023203372955322, 1.2441861629486084, 1.2860519886016846, 1.3279178142547607, 1.369783639907837, 1.411649465560913, 1.4535152912139893, 1.4953811168670654, 1.5372470617294312]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 6.0, 3.0, 3.0, 4.0, 6.0, 6.0, 15.0, 15.0, 10.0, 17.0, 18.0, 19.0, 19.0, 18.0, 24.0, 32.0, 42.0, 33.0, 43.0, 41.0, 31.0, 53.0, 44.0, 40.0, 37.0, 41.0, 38.0, 46.0, 44.0, 34.0, 28.0, 30.0, 32.0, 18.0, 11.0, 18.0, 16.0, 10.0, 17.0, 11.0, 7.0, 7.0, 8.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.9363552927970886, -0.9088358879089355, -0.8813164830207825, -0.8537970781326294, -0.8262777328491211, -0.7987582683563232, -0.7712389230728149, -0.7437195181846619, -0.7162001132965088, -0.6886807084083557, -0.6611613035202026, -0.6336418986320496, -0.6061224937438965, -0.5786031484603882, -0.5510837435722351, -0.523564338684082, -0.49604493379592896, -0.4685255289077759, -0.4410061240196228, -0.4134867489337921, -0.38596734404563904, -0.35844793915748596, -0.3309285640716553, -0.3034091591835022, -0.2758897542953491, -0.24837034940719604, -0.22085095942020416, -0.19333156943321228, -0.1658121645450592, -0.13829275965690613, -0.11077336966991425, -0.08325397968292236, -0.05573451519012451, -0.028215117752552032, -0.0006957203149795532, 0.026823677122592926, 0.054343074560165405, 0.08186247944831848, 0.10938186943531036, 0.13690125942230225, 0.16442066431045532, 0.1919400691986084, 0.21945945918560028, 0.24697884917259216, 0.27449825406074524, 0.3020176589488983, 0.329537034034729, 0.3570564389228821, 0.38457584381103516, 0.41209524869918823, 0.4396146535873413, 0.467134028673172, 0.4946534335613251, 0.5221728086471558, 0.5496922135353088, 0.5772116184234619, 0.604731023311615, 0.6322504281997681, 0.6597698330879211, 0.6872892379760742, 0.7148085832595825, 0.7423280477523804, 0.7698473930358887, 0.7973667979240417, 0.8248862028121948]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 9.0, 5.0, 9.0, 13.0, 20.0, 46.0, 69.0, 85.0, 145.0, 306.0, 561.0, 925.0, 1659.0, 3179.0, 5592.0, 10356.0, 18828.0, 34198.0, 65468.0, 131509.0, 262631.0, 253103.0, 124701.0, 62351.0, 32655.0, 18019.0, 9920.0, 5457.0, 2936.0, 1677.0, 929.0, 506.0, 262.0, 177.0, 96.0, 56.0, 36.0, 24.0, 10.0, 13.0, 6.0, 4.0, 8.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228271484375, -0.22039031982421875, -0.2125091552734375, -0.20462799072265625, -0.196746826171875, -0.18886566162109375, -0.1809844970703125, -0.17310333251953125, -0.16522216796875, -0.15734100341796875, -0.1494598388671875, -0.14157867431640625, -0.133697509765625, -0.12581634521484375, -0.1179351806640625, -0.11005401611328125, -0.1021728515625, -0.09429168701171875, -0.0864105224609375, -0.07852935791015625, -0.070648193359375, -0.06276702880859375, -0.0548858642578125, -0.04700469970703125, -0.03912353515625, -0.03124237060546875, -0.0233612060546875, -0.01548004150390625, -0.007598876953125, 0.00028228759765625, 0.0081634521484375, 0.01604461669921875, 0.02392578125, 0.03180694580078125, 0.0396881103515625, 0.04756927490234375, 0.055450439453125, 0.06333160400390625, 0.0712127685546875, 0.07909393310546875, 0.08697509765625, 0.09485626220703125, 0.1027374267578125, 0.11061859130859375, 0.118499755859375, 0.12638092041015625, 0.1342620849609375, 0.14214324951171875, 0.1500244140625, 0.15790557861328125, 0.1657867431640625, 0.17366790771484375, 0.181549072265625, 0.18943023681640625, 0.1973114013671875, 0.20519256591796875, 0.21307373046875, 0.22095489501953125, 0.2288360595703125, 0.23671722412109375, 0.244598388671875, 0.25247955322265625, 0.2603607177734375, 0.26824188232421875, 0.276123046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 8.0, 3.0, 7.0, 13.0, 12.0, 17.0, 19.0, 12.0, 17.0, 21.0, 26.0, 33.0, 27.0, 46.0, 47.0, 42.0, 38.0, 69.0, 49.0, 48.0, 49.0, 36.0, 43.0, 42.0, 39.0, 26.0, 27.0, 25.0, 29.0, 20.0, 23.0, 15.0, 20.0, 11.0, 10.0, 8.0, 3.0, 2.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1783447265625, -0.17239761352539062, -0.16645050048828125, -0.16050338745117188, -0.1545562744140625, -0.14860916137695312, -0.14266204833984375, -0.13671493530273438, -0.130767822265625, -0.12482070922851562, -0.11887359619140625, -0.11292648315429688, -0.1069793701171875, -0.10103225708007812, -0.09508514404296875, -0.08913803100585938, -0.08319091796875, -0.07724380493164062, -0.07129669189453125, -0.06534957885742188, -0.0594024658203125, -0.053455352783203125, -0.04750823974609375, -0.041561126708984375, -0.035614013671875, -0.029666900634765625, -0.02371978759765625, -0.017772674560546875, -0.0118255615234375, -0.005878448486328125, 6.866455078125e-05, 0.006015777587890625, 0.011962890625, 0.017910003662109375, 0.02385711669921875, 0.029804229736328125, 0.0357513427734375, 0.041698455810546875, 0.04764556884765625, 0.053592681884765625, 0.059539794921875, 0.06548690795898438, 0.07143402099609375, 0.07738113403320312, 0.0833282470703125, 0.08927536010742188, 0.09522247314453125, 0.10116958618164062, 0.10711669921875, 0.11306381225585938, 0.11901092529296875, 0.12495803833007812, 0.1309051513671875, 0.13685226440429688, 0.14279937744140625, 0.14874649047851562, 0.154693603515625, 0.16064071655273438, 0.16658782958984375, 0.17253494262695312, 0.1784820556640625, 0.18442916870117188, 0.19037628173828125, 0.19632339477539062, 0.2022705078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 8.0, 14.0, 11.0, 22.0, 18.0, 32.0, 41.0, 52.0, 74.0, 82.0, 133.0, 200.0, 329.0, 647.0, 1720.0, 4316.0, 12248.0, 35916.0, 113185.0, 475149.0, 294799.0, 71736.0, 24091.0, 8202.0, 3003.0, 1164.0, 506.0, 244.0, 176.0, 93.0, 83.0, 47.0, 41.0, 40.0, 35.0, 14.0, 26.0, 12.0, 13.0, 8.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.65283203125, -0.6346054077148438, -0.6163787841796875, -0.5981521606445312, -0.579925537109375, -0.5616989135742188, -0.5434722900390625, -0.5252456665039062, -0.50701904296875, -0.48879241943359375, -0.4705657958984375, -0.45233917236328125, -0.434112548828125, -0.41588592529296875, -0.3976593017578125, -0.37943267822265625, -0.3612060546875, -0.34297943115234375, -0.3247528076171875, -0.30652618408203125, -0.288299560546875, -0.27007293701171875, -0.2518463134765625, -0.23361968994140625, -0.21539306640625, -0.19716644287109375, -0.1789398193359375, -0.16071319580078125, -0.142486572265625, -0.12425994873046875, -0.1060333251953125, -0.08780670166015625, -0.069580078125, -0.05135345458984375, -0.0331268310546875, -0.01490020751953125, 0.003326416015625, 0.02155303955078125, 0.0397796630859375, 0.05800628662109375, 0.07623291015625, 0.09445953369140625, 0.1126861572265625, 0.13091278076171875, 0.149139404296875, 0.16736602783203125, 0.1855926513671875, 0.20381927490234375, 0.2220458984375, 0.24027252197265625, 0.2584991455078125, 0.27672576904296875, 0.294952392578125, 0.31317901611328125, 0.3314056396484375, 0.34963226318359375, 0.36785888671875, 0.38608551025390625, 0.4043121337890625, 0.42253875732421875, 0.440765380859375, 0.45899200439453125, 0.4772186279296875, 0.49544525146484375, 0.513671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 8.0, 13.0, 15.0, 13.0, 17.0, 19.0, 30.0, 23.0, 39.0, 45.0, 47.0, 43.0, 59.0, 41.0, 52.0, 52.0, 55.0, 40.0, 37.0, 50.0, 35.0, 37.0, 43.0, 29.0, 25.0, 27.0, 15.0, 17.0, 7.0, 10.0, 6.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.56787109375, -0.5475997924804688, -0.5273284912109375, -0.5070571899414062, -0.486785888671875, -0.46651458740234375, -0.4462432861328125, -0.42597198486328125, -0.40570068359375, -0.38542938232421875, -0.3651580810546875, -0.34488677978515625, -0.324615478515625, -0.30434417724609375, -0.2840728759765625, -0.26380157470703125, -0.2435302734375, -0.22325897216796875, -0.2029876708984375, -0.18271636962890625, -0.162445068359375, -0.14217376708984375, -0.1219024658203125, -0.10163116455078125, -0.08135986328125, -0.06108856201171875, -0.0408172607421875, -0.02054595947265625, -0.000274658203125, 0.01999664306640625, 0.0402679443359375, 0.06053924560546875, 0.080810546875, 0.10108184814453125, 0.1213531494140625, 0.14162445068359375, 0.161895751953125, 0.18216705322265625, 0.2024383544921875, 0.22270965576171875, 0.24298095703125, 0.26325225830078125, 0.2835235595703125, 0.30379486083984375, 0.324066162109375, 0.34433746337890625, 0.3646087646484375, 0.38488006591796875, 0.4051513671875, 0.42542266845703125, 0.4456939697265625, 0.46596527099609375, 0.486236572265625, 0.5065078735351562, 0.5267791748046875, 0.5470504760742188, 0.56732177734375, 0.5875930786132812, 0.6078643798828125, 0.6281356811523438, 0.648406982421875, 0.6686782836914062, 0.6889495849609375, 0.7092208862304688, 0.7294921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 20.0, 29.0, 43.0, 73.0, 110.0, 236.0, 432.0, 1027.0, 2525.0, 7524.0, 23405.0, 72063.0, 330633.0, 471225.0, 94133.0, 29818.0, 9699.0, 3190.0, 1222.0, 549.0, 243.0, 144.0, 87.0, 40.0, 31.0, 17.0, 12.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280029296875, -0.27072906494140625, -0.2614288330078125, -0.25212860107421875, -0.242828369140625, -0.23352813720703125, -0.2242279052734375, -0.21492767333984375, -0.20562744140625, -0.19632720947265625, -0.1870269775390625, -0.17772674560546875, -0.168426513671875, -0.15912628173828125, -0.1498260498046875, -0.14052581787109375, -0.1312255859375, -0.12192535400390625, -0.1126251220703125, -0.10332489013671875, -0.094024658203125, -0.08472442626953125, -0.0754241943359375, -0.06612396240234375, -0.05682373046875, -0.04752349853515625, -0.0382232666015625, -0.02892303466796875, -0.019622802734375, -0.01032257080078125, -0.0010223388671875, 0.00827789306640625, 0.017578125, 0.02687835693359375, 0.0361785888671875, 0.04547882080078125, 0.054779052734375, 0.06407928466796875, 0.0733795166015625, 0.08267974853515625, 0.09197998046875, 0.10128021240234375, 0.1105804443359375, 0.11988067626953125, 0.129180908203125, 0.13848114013671875, 0.1477813720703125, 0.15708160400390625, 0.1663818359375, 0.17568206787109375, 0.1849822998046875, 0.19428253173828125, 0.203582763671875, 0.21288299560546875, 0.2221832275390625, 0.23148345947265625, 0.24078369140625, 0.25008392333984375, 0.2593841552734375, 0.26868438720703125, 0.277984619140625, 0.28728485107421875, 0.2965850830078125, 0.30588531494140625, 0.315185546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 10.0, 4.0, 8.0, 8.0, 15.0, 22.0, 17.0, 38.0, 42.0, 64.0, 113.0, 104.0, 148.0, 138.0, 90.0, 55.0, 31.0, 23.0, 21.0, 11.0, 8.0, 5.0, 6.0, 3.0, 6.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.410743713378906e-05, -4.2426399886608124e-05, -4.0745362639427185e-05, -3.9064325392246246e-05, -3.738328814506531e-05, -3.570225089788437e-05, -3.402121365070343e-05, -3.234017640352249e-05, -3.065913915634155e-05, -2.8978101909160614e-05, -2.7297064661979675e-05, -2.5616027414798737e-05, -2.3934990167617798e-05, -2.225395292043686e-05, -2.057291567325592e-05, -1.889187842607498e-05, -1.7210841178894043e-05, -1.5529803931713104e-05, -1.3848766684532166e-05, -1.2167729437351227e-05, -1.0486692190170288e-05, -8.80565494298935e-06, -7.124617695808411e-06, -5.443580448627472e-06, -3.762543201446533e-06, -2.0815059542655945e-06, -4.0046870708465576e-07, 1.280568540096283e-06, 2.9616057872772217e-06, 4.64264303445816e-06, 6.323680281639099e-06, 8.004717528820038e-06, 9.685754776000977e-06, 1.1366792023181915e-05, 1.3047829270362854e-05, 1.4728866517543793e-05, 1.640990376472473e-05, 1.809094101190567e-05, 1.977197825908661e-05, 2.1453015506267548e-05, 2.3134052753448486e-05, 2.4815090000629425e-05, 2.6496127247810364e-05, 2.8177164494991302e-05, 2.985820174217224e-05, 3.153923898935318e-05, 3.322027623653412e-05, 3.490131348371506e-05, 3.6582350730895996e-05, 3.8263387978076935e-05, 3.9944425225257874e-05, 4.162546247243881e-05, 4.330649971961975e-05, 4.498753696680069e-05, 4.666857421398163e-05, 4.834961146116257e-05, 5.0030648708343506e-05, 5.1711685955524445e-05, 5.339272320270538e-05, 5.507376044988632e-05, 5.675479769706726e-05, 5.84358349442482e-05, 6.011687219142914e-05, 6.179790943861008e-05, 6.347894668579102e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 8.0, 9.0, 7.0, 15.0, 30.0, 31.0, 48.0, 62.0, 87.0, 113.0, 163.0, 261.0, 529.0, 1391.0, 4457.0, 16199.0, 57652.0, 242910.0, 544108.0, 130813.0, 35218.0, 9610.0, 2758.0, 980.0, 398.0, 208.0, 142.0, 84.0, 74.0, 43.0, 38.0, 31.0, 22.0, 15.0, 7.0, 5.0, 5.0, 3.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.251953125, -0.24335479736328125, -0.2347564697265625, -0.22615814208984375, -0.217559814453125, -0.20896148681640625, -0.2003631591796875, -0.19176483154296875, -0.18316650390625, -0.17456817626953125, -0.1659698486328125, -0.15737152099609375, -0.148773193359375, -0.14017486572265625, -0.1315765380859375, -0.12297821044921875, -0.1143798828125, -0.10578155517578125, -0.0971832275390625, -0.08858489990234375, -0.079986572265625, -0.07138824462890625, -0.0627899169921875, -0.05419158935546875, -0.04559326171875, -0.03699493408203125, -0.0283966064453125, -0.01979827880859375, -0.011199951171875, -0.00260162353515625, 0.0059967041015625, 0.01459503173828125, 0.023193359375, 0.03179168701171875, 0.0403900146484375, 0.04898834228515625, 0.057586669921875, 0.06618499755859375, 0.0747833251953125, 0.08338165283203125, 0.09197998046875, 0.10057830810546875, 0.1091766357421875, 0.11777496337890625, 0.126373291015625, 0.13497161865234375, 0.1435699462890625, 0.15216827392578125, 0.1607666015625, 0.16936492919921875, 0.1779632568359375, 0.18656158447265625, 0.195159912109375, 0.20375823974609375, 0.2123565673828125, 0.22095489501953125, 0.22955322265625, 0.23815155029296875, 0.2467498779296875, 0.25534820556640625, 0.263946533203125, 0.27254486083984375, 0.2811431884765625, 0.28974151611328125, 0.29833984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 12.0, 7.0, 15.0, 16.0, 24.0, 23.0, 37.0, 59.0, 89.0, 139.0, 167.0, 142.0, 85.0, 46.0, 35.0, 22.0, 20.0, 20.0, 11.0, 10.0, 5.0, 4.0, 1.0, 5.0, 3.0, 2.0, 6.0, 0.0, 0.0, 3.0], "bins": [-0.408203125, -0.3990459442138672, -0.3898887634277344, -0.38073158264160156, -0.37157440185546875, -0.36241722106933594, -0.3532600402832031, -0.3441028594970703, -0.3349456787109375, -0.3257884979248047, -0.3166313171386719, -0.30747413635253906, -0.29831695556640625, -0.28915977478027344, -0.2800025939941406, -0.2708454132080078, -0.261688232421875, -0.2525310516357422, -0.24337387084960938, -0.23421669006347656, -0.22505950927734375, -0.21590232849121094, -0.20674514770507812, -0.1975879669189453, -0.1884307861328125, -0.1792736053466797, -0.17011642456054688, -0.16095924377441406, -0.15180206298828125, -0.14264488220214844, -0.13348770141601562, -0.12433052062988281, -0.11517333984375, -0.10601615905761719, -0.09685897827148438, -0.08770179748535156, -0.07854461669921875, -0.06938743591308594, -0.060230255126953125, -0.05107307434082031, -0.0419158935546875, -0.03275871276855469, -0.023601531982421875, -0.014444351196289062, -0.00528717041015625, 0.0038700103759765625, 0.013027191162109375, 0.022184371948242188, 0.031341552734375, 0.04049873352050781, 0.049655914306640625, 0.05881309509277344, 0.06797027587890625, 0.07712745666503906, 0.08628463745117188, 0.09544181823730469, 0.1045989990234375, 0.11375617980957031, 0.12291336059570312, 0.13207054138183594, 0.14122772216796875, 0.15038490295410156, 0.15954208374023438, 0.1686992645263672, 0.1778564453125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 20.0, 37.0, 64.0, 136.0, 200.0, 196.0, 151.0, 101.0, 59.0, 15.0, 14.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.455748558044434, -4.339577674865723, -4.22340726852417, -4.107236385345459, -3.991065740585327, -3.8748950958251953, -3.7587244510650635, -3.6425538063049316, -3.5263829231262207, -3.410212278366089, -3.294041633605957, -3.177870750427246, -3.0617001056671143, -2.9455294609069824, -2.8293588161468506, -2.7131881713867188, -2.597017526626587, -2.480846881866455, -2.3646762371063232, -2.2485055923461914, -2.1323347091674805, -2.0161640644073486, -1.8999934196472168, -1.783822774887085, -1.6676520109176636, -1.5514813661575317, -1.4353106021881104, -1.3191399574279785, -1.2029693126678467, -1.0867985486984253, -0.9706279039382935, -0.8544571995735168, -0.7382864952087402, -0.6221157908439636, -0.505945086479187, -0.3897744417190552, -0.27360373735427856, -0.15743303298950195, -0.04126238822937012, 0.0749083161354065, 0.1910790205001831, 0.3072497248649597, 0.42342039942741394, 0.5395910739898682, 0.6557617783546448, 0.7719324827194214, 0.8881031274795532, 1.0042738914489746, 1.1204445362091064, 1.2366151809692383, 1.3527859449386597, 1.4689565896987915, 1.585127353668213, 1.7012979984283447, 1.8174686431884766, 1.9336392879486084, 2.0498099327087402, 2.165980577468872, 2.282151222229004, 2.398322105407715, 2.5144927501678467, 2.6306633949279785, 2.7468340396881104, 2.863004684448242, 2.979175567626953]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 12.0, 10.0, 10.0, 12.0, 14.0, 14.0, 13.0, 21.0, 36.0, 33.0, 27.0, 32.0, 29.0, 39.0, 34.0, 46.0, 34.0, 45.0, 36.0, 55.0, 41.0, 38.0, 36.0, 35.0, 34.0, 33.0, 33.0, 30.0, 31.0, 17.0, 20.0, 17.0, 12.0, 15.0, 11.0, 7.0, 5.0, 7.0, 8.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3328157663345337, -1.2871006727218628, -1.241385579109192, -1.195670485496521, -1.1499555110931396, -1.1042404174804688, -1.0585253238677979, -1.012810230255127, -0.967095136642456, -0.9213800430297852, -0.8756649494171143, -0.8299499154090881, -0.7842348217964172, -0.7385197281837463, -0.6928046941757202, -0.6470896005630493, -0.6013745069503784, -0.5556594133377075, -0.5099443197250366, -0.4642292857170105, -0.4185141921043396, -0.3727990984916687, -0.3270840346813202, -0.2813689708709717, -0.23565387725830078, -0.18993879854679108, -0.14422371983528137, -0.09850864112377167, -0.05279356241226196, -0.007078483700752258, 0.038636595010757446, 0.08435165882110596, 0.1300668716430664, 0.1757819503545761, 0.22149702906608582, 0.2672120928764343, 0.3129271864891052, 0.3586422801017761, 0.40435734391212463, 0.45007240772247314, 0.49578750133514404, 0.5415025949478149, 0.5872176885604858, 0.632932722568512, 0.6786478161811829, 0.7243629097938538, 0.7700779438018799, 0.8157930374145508, 0.8615081310272217, 0.9072232246398926, 0.9529383182525635, 0.9986533522605896, 1.0443685054779053, 1.0900834798812866, 1.1357985734939575, 1.1815136671066284, 1.2272287607192993, 1.2729438543319702, 1.3186589479446411, 1.364374041557312, 1.4100890159606934, 1.4558041095733643, 1.5015192031860352, 1.547234296798706, 1.592949390411377]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 5.0, 7.0, 8.0, 15.0, 34.0, 37.0, 54.0, 74.0, 124.0, 211.0, 311.0, 431.0, 731.0, 1103.0, 1777.0, 2951.0, 4770.0, 8232.0, 13789.0, 24391.0, 43849.0, 82592.0, 164262.0, 356059.0, 850955.0, 1340528.0, 689899.0, 301127.0, 142512.0, 73008.0, 38895.0, 21646.0, 12054.0, 7051.0, 4179.0, 2500.0, 1534.0, 931.0, 620.0, 365.0, 235.0, 151.0, 108.0, 52.0, 43.0, 23.0, 23.0, 10.0, 8.0, 9.0, 2.0, 3.0, 2.0], "bins": [-0.1968994140625, -0.19148826599121094, -0.18607711791992188, -0.1806659698486328, -0.17525482177734375, -0.1698436737060547, -0.16443252563476562, -0.15902137756347656, -0.1536102294921875, -0.14819908142089844, -0.14278793334960938, -0.1373767852783203, -0.13196563720703125, -0.1265544891357422, -0.12114334106445312, -0.11573219299316406, -0.110321044921875, -0.10490989685058594, -0.09949874877929688, -0.09408760070800781, -0.08867645263671875, -0.08326530456542969, -0.07785415649414062, -0.07244300842285156, -0.0670318603515625, -0.06162071228027344, -0.056209564208984375, -0.05079841613769531, -0.04538726806640625, -0.03997611999511719, -0.034564971923828125, -0.029153823852539062, -0.02374267578125, -0.018331527709960938, -0.012920379638671875, -0.0075092315673828125, -0.00209808349609375, 0.0033130645751953125, 0.008724212646484375, 0.014135360717773438, 0.0195465087890625, 0.024957656860351562, 0.030368804931640625, 0.03577995300292969, 0.04119110107421875, 0.04660224914550781, 0.052013397216796875, 0.05742454528808594, 0.062835693359375, 0.06824684143066406, 0.07365798950195312, 0.07906913757324219, 0.08448028564453125, 0.08989143371582031, 0.09530258178710938, 0.10071372985839844, 0.1061248779296875, 0.11153602600097656, 0.11694717407226562, 0.12235832214355469, 0.12776947021484375, 0.1331806182861328, 0.13859176635742188, 0.14400291442871094, 0.1494140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 3.0, 4.0, 1.0, 5.0, 1.0, 4.0, 4.0, 7.0, 14.0, 9.0, 16.0, 16.0, 22.0, 20.0, 25.0, 22.0, 27.0, 32.0, 29.0, 29.0, 50.0, 37.0, 42.0, 41.0, 39.0, 38.0, 43.0, 42.0, 41.0, 47.0, 41.0, 44.0, 27.0, 25.0, 28.0, 28.0, 18.0, 12.0, 18.0, 6.0, 14.0, 10.0, 10.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1710205078125, -0.16487503051757812, -0.15872955322265625, -0.15258407592773438, -0.1464385986328125, -0.14029312133789062, -0.13414764404296875, -0.12800216674804688, -0.121856689453125, -0.11571121215820312, -0.10956573486328125, -0.10342025756835938, -0.0972747802734375, -0.09112930297851562, -0.08498382568359375, -0.07883834838867188, -0.07269287109375, -0.06654739379882812, -0.06040191650390625, -0.054256439208984375, -0.0481109619140625, -0.041965484619140625, -0.03582000732421875, -0.029674530029296875, -0.023529052734375, -0.017383575439453125, -0.01123809814453125, -0.005092620849609375, 0.0010528564453125, 0.007198333740234375, 0.01334381103515625, 0.019489288330078125, 0.025634765625, 0.031780242919921875, 0.03792572021484375, 0.044071197509765625, 0.0502166748046875, 0.056362152099609375, 0.06250762939453125, 0.06865310668945312, 0.074798583984375, 0.08094406127929688, 0.08708953857421875, 0.09323501586914062, 0.0993804931640625, 0.10552597045898438, 0.11167144775390625, 0.11781692504882812, 0.12396240234375, 0.13010787963867188, 0.13625335693359375, 0.14239883422851562, 0.1485443115234375, 0.15468978881835938, 0.16083526611328125, 0.16698074340820312, 0.173126220703125, 0.17927169799804688, 0.18541717529296875, 0.19156265258789062, 0.1977081298828125, 0.20385360717773438, 0.20999908447265625, 0.21614456176757812, 0.2222900390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 9.0, 10.0, 8.0, 11.0, 11.0, 17.0, 35.0, 32.0, 32.0, 66.0, 69.0, 83.0, 123.0, 191.0, 342.0, 581.0, 1035.0, 2104.0, 5127.0, 14529.0, 47196.0, 190048.0, 1082841.0, 2308938.0, 410806.0, 89892.0, 25169.0, 8298.0, 3253.0, 1404.0, 759.0, 418.0, 236.0, 161.0, 110.0, 74.0, 71.0, 50.0, 32.0, 29.0, 21.0, 22.0, 8.0, 12.0, 6.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.57861328125, -0.5617141723632812, -0.5448150634765625, -0.5279159545898438, -0.511016845703125, -0.49411773681640625, -0.4772186279296875, -0.46031951904296875, -0.44342041015625, -0.42652130126953125, -0.4096221923828125, -0.39272308349609375, -0.375823974609375, -0.35892486572265625, -0.3420257568359375, -0.32512664794921875, -0.3082275390625, -0.29132843017578125, -0.2744293212890625, -0.25753021240234375, -0.240631103515625, -0.22373199462890625, -0.2068328857421875, -0.18993377685546875, -0.17303466796875, -0.15613555908203125, -0.1392364501953125, -0.12233734130859375, -0.105438232421875, -0.08853912353515625, -0.0716400146484375, -0.05474090576171875, -0.037841796875, -0.02094268798828125, -0.0040435791015625, 0.01285552978515625, 0.029754638671875, 0.04665374755859375, 0.0635528564453125, 0.08045196533203125, 0.09735107421875, 0.11425018310546875, 0.1311492919921875, 0.14804840087890625, 0.164947509765625, 0.18184661865234375, 0.1987457275390625, 0.21564483642578125, 0.2325439453125, 0.24944305419921875, 0.2663421630859375, 0.28324127197265625, 0.300140380859375, 0.31703948974609375, 0.3339385986328125, 0.35083770751953125, 0.36773681640625, 0.38463592529296875, 0.4015350341796875, 0.41843414306640625, 0.435333251953125, 0.45223236083984375, 0.4691314697265625, 0.48603057861328125, 0.5029296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 2.0, 6.0, 10.0, 16.0, 22.0, 29.0, 39.0, 67.0, 108.0, 166.0, 291.0, 480.0, 781.0, 821.0, 498.0, 280.0, 172.0, 96.0, 61.0, 41.0, 32.0, 20.0, 8.0, 11.0, 7.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.73779296875, -0.7184371948242188, -0.6990814208984375, -0.6797256469726562, -0.660369873046875, -0.6410140991210938, -0.6216583251953125, -0.6023025512695312, -0.58294677734375, -0.5635910034179688, -0.5442352294921875, -0.5248794555664062, -0.505523681640625, -0.48616790771484375, -0.4668121337890625, -0.44745635986328125, -0.4281005859375, -0.40874481201171875, -0.3893890380859375, -0.37003326416015625, -0.350677490234375, -0.33132171630859375, -0.3119659423828125, -0.29261016845703125, -0.27325439453125, -0.25389862060546875, -0.2345428466796875, -0.21518707275390625, -0.195831298828125, -0.17647552490234375, -0.1571197509765625, -0.13776397705078125, -0.118408203125, -0.09905242919921875, -0.0796966552734375, -0.06034088134765625, -0.040985107421875, -0.02162933349609375, -0.0022735595703125, 0.01708221435546875, 0.03643798828125, 0.05579376220703125, 0.0751495361328125, 0.09450531005859375, 0.113861083984375, 0.13321685791015625, 0.1525726318359375, 0.17192840576171875, 0.1912841796875, 0.21063995361328125, 0.2299957275390625, 0.24935150146484375, 0.268707275390625, 0.28806304931640625, 0.3074188232421875, 0.32677459716796875, 0.34613037109375, 0.36548614501953125, 0.3848419189453125, 0.40419769287109375, 0.423553466796875, 0.44290924072265625, 0.4622650146484375, 0.48162078857421875, 0.5009765625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 14.0, 22.0, 28.0, 40.0, 47.0, 78.0, 83.0, 117.0, 108.0, 95.0, 107.0, 82.0, 57.0, 51.0, 25.0, 16.0, 8.0, 4.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.010375499725342, -2.927600383758545, -2.844825029373169, -2.762049913406372, -2.679274797439575, -2.596499443054199, -2.5137243270874023, -2.4309492111206055, -2.3481738567352295, -2.2653987407684326, -2.1826233863830566, -2.0998482704162598, -2.017073154449463, -1.934297800064087, -1.85152268409729, -1.7687474489212036, -1.6859723329544067, -1.6031970977783203, -1.5204219818115234, -1.437646746635437, -1.3548715114593506, -1.2720963954925537, -1.1893211603164673, -1.1065459251403809, -1.023770809173584, -0.9409956336021423, -0.8582203984260559, -0.7754452228546143, -0.6926699876785278, -0.6098948121070862, -0.5271196365356445, -0.4443444013595581, -0.3615691661834717, -0.27879396080970764, -0.1960187703371048, -0.11324357986450195, -0.030468374490737915, 0.05230683088302612, 0.13508200645446777, 0.2178572416305542, 0.30063241720199585, 0.3834076225757599, 0.4661828279495239, 0.5489580035209656, 0.6317331790924072, 0.7145084142684937, 0.7972835898399353, 0.8800588250160217, 0.9628340005874634, 1.0456092357635498, 1.1283843517303467, 1.211159586906433, 1.2939348220825195, 1.3767099380493164, 1.4594851732254028, 1.5422604084014893, 1.6250355243682861, 1.7078107595443726, 1.7905858755111694, 1.8733611106872559, 1.9561363458633423, 2.0389115810394287, 2.1216866970062256, 2.2044620513916016, 2.2872371673583984]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 3.0, 11.0, 7.0, 3.0, 14.0, 17.0, 16.0, 17.0, 19.0, 17.0, 30.0, 30.0, 25.0, 36.0, 34.0, 51.0, 41.0, 29.0, 46.0, 50.0, 46.0, 52.0, 45.0, 39.0, 47.0, 34.0, 47.0, 29.0, 28.0, 17.0, 17.0, 23.0, 17.0, 20.0, 16.0, 7.0, 8.0, 4.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2766914367675781, -1.2308825254440308, -1.185073733329773, -1.1392648220062256, -1.0934559106826782, -1.0476469993591309, -1.001838207244873, -0.9560292959213257, -0.9102203845977783, -0.8644115328788757, -0.8186026215553284, -0.7727937698364258, -0.7269848585128784, -0.6811760067939758, -0.6353671550750732, -0.5895582437515259, -0.5437493920326233, -0.4979405105113983, -0.45213162899017334, -0.40632277727127075, -0.3605138659477234, -0.3147050142288208, -0.2688961327075958, -0.22308725118637085, -0.17727836966514587, -0.1314694881439209, -0.08566061407327652, -0.03985174000263214, 0.0059571415185928345, 0.05176602303981781, 0.09757488965988159, 0.14338377118110657, 0.18919265270233154, 0.23500153422355652, 0.2808104157447815, 0.3266192674636841, 0.37242817878723145, 0.41823703050613403, 0.464045912027359, 0.509854793548584, 0.5556637048721313, 0.6014725565910339, 0.6472814679145813, 0.6930903196334839, 0.7388992309570312, 0.7847080826759338, 0.8305169343948364, 0.8763258457183838, 0.9221346974372864, 0.967943549156189, 1.0137524604797363, 1.0595613718032837, 1.1053701639175415, 1.1511790752410889, 1.1969879865646362, 1.2427968978881836, 1.2886056900024414, 1.3344146013259888, 1.3802233934402466, 1.426032304763794, 1.4718412160873413, 1.5176501274108887, 1.5634589195251465, 1.6092678308486938, 1.6550767421722412]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 5.0, 4.0, 11.0, 22.0, 28.0, 45.0, 61.0, 84.0, 140.0, 216.0, 341.0, 516.0, 808.0, 1346.0, 1931.0, 3061.0, 4649.0, 7013.0, 10407.0, 16070.0, 25176.0, 40532.0, 68103.0, 116395.0, 190196.0, 209944.0, 139378.0, 81115.0, 47527.0, 29253.0, 18830.0, 12256.0, 7961.0, 5284.0, 3426.0, 2264.0, 1450.0, 965.0, 609.0, 419.0, 256.0, 169.0, 93.0, 66.0, 41.0, 29.0, 21.0, 15.0, 10.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.22998046875, -0.22260093688964844, -0.21522140502929688, -0.2078418731689453, -0.20046234130859375, -0.1930828094482422, -0.18570327758789062, -0.17832374572753906, -0.1709442138671875, -0.16356468200683594, -0.15618515014648438, -0.1488056182861328, -0.14142608642578125, -0.1340465545654297, -0.12666702270507812, -0.11928749084472656, -0.111907958984375, -0.10452842712402344, -0.09714889526367188, -0.08976936340332031, -0.08238983154296875, -0.07501029968261719, -0.06763076782226562, -0.06025123596191406, -0.0528717041015625, -0.04549217224121094, -0.038112640380859375, -0.030733108520507812, -0.02335357666015625, -0.015974044799804688, -0.008594512939453125, -0.0012149810791015625, 0.00616455078125, 0.013544082641601562, 0.020923614501953125, 0.028303146362304688, 0.03568267822265625, 0.04306221008300781, 0.050441741943359375, 0.05782127380371094, 0.0652008056640625, 0.07258033752441406, 0.07995986938476562, 0.08733940124511719, 0.09471893310546875, 0.10209846496582031, 0.10947799682617188, 0.11685752868652344, 0.124237060546875, 0.13161659240722656, 0.13899612426757812, 0.1463756561279297, 0.15375518798828125, 0.1611347198486328, 0.16851425170898438, 0.17589378356933594, 0.1832733154296875, 0.19065284729003906, 0.19803237915039062, 0.2054119110107422, 0.21279144287109375, 0.2201709747314453, 0.22755050659179688, 0.23493003845214844, 0.2423095703125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 2.0, 7.0, 8.0, 13.0, 13.0, 15.0, 15.0, 14.0, 21.0, 25.0, 22.0, 28.0, 27.0, 35.0, 26.0, 29.0, 33.0, 42.0, 33.0, 36.0, 34.0, 43.0, 54.0, 38.0, 32.0, 46.0, 36.0, 44.0, 37.0, 23.0, 24.0, 17.0, 25.0, 11.0, 14.0, 20.0, 14.0, 8.0, 12.0, 3.0, 4.0, 5.0, 0.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2021484375, -0.19617843627929688, -0.19020843505859375, -0.18423843383789062, -0.1782684326171875, -0.17229843139648438, -0.16632843017578125, -0.16035842895507812, -0.154388427734375, -0.14841842651367188, -0.14244842529296875, -0.13647842407226562, -0.1305084228515625, -0.12453842163085938, -0.11856842041015625, -0.11259841918945312, -0.10662841796875, -0.10065841674804688, -0.09468841552734375, -0.08871841430664062, -0.0827484130859375, -0.07677841186523438, -0.07080841064453125, -0.06483840942382812, -0.058868408203125, -0.052898406982421875, -0.04692840576171875, -0.040958404541015625, -0.0349884033203125, -0.029018402099609375, -0.02304840087890625, -0.017078399658203125, -0.0111083984375, -0.005138397216796875, 0.00083160400390625, 0.006801605224609375, 0.0127716064453125, 0.018741607666015625, 0.02471160888671875, 0.030681610107421875, 0.036651611328125, 0.042621612548828125, 0.04859161376953125, 0.054561614990234375, 0.0605316162109375, 0.06650161743164062, 0.07247161865234375, 0.07844161987304688, 0.08441162109375, 0.09038162231445312, 0.09635162353515625, 0.10232162475585938, 0.1082916259765625, 0.11426162719726562, 0.12023162841796875, 0.12620162963867188, 0.132171630859375, 0.13814163208007812, 0.14411163330078125, 0.15008163452148438, 0.1560516357421875, 0.16202163696289062, 0.16799163818359375, 0.17396163940429688, 0.179931640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 10.0, 8.0, 11.0, 20.0, 31.0, 38.0, 55.0, 106.0, 193.0, 259.0, 563.0, 1659.0, 8460.0, 56322.0, 421969.0, 480558.0, 65236.0, 9810.0, 1817.0, 598.0, 332.0, 190.0, 90.0, 85.0, 41.0, 32.0, 19.0, 19.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.0225982666015625, -0.988555908203125, -0.9545135498046875, -0.92047119140625, -0.8864288330078125, -0.852386474609375, -0.8183441162109375, -0.7843017578125, -0.7502593994140625, -0.716217041015625, -0.6821746826171875, -0.64813232421875, -0.6140899658203125, -0.580047607421875, -0.5460052490234375, -0.511962890625, -0.4779205322265625, -0.443878173828125, -0.4098358154296875, -0.37579345703125, -0.3417510986328125, -0.307708740234375, -0.2736663818359375, -0.2396240234375, -0.2055816650390625, -0.171539306640625, -0.1374969482421875, -0.10345458984375, -0.0694122314453125, -0.035369873046875, -0.0013275146484375, 0.03271484375, 0.0667572021484375, 0.100799560546875, 0.1348419189453125, 0.16888427734375, 0.2029266357421875, 0.236968994140625, 0.2710113525390625, 0.3050537109375, 0.3390960693359375, 0.373138427734375, 0.4071807861328125, 0.44122314453125, 0.4752655029296875, 0.509307861328125, 0.5433502197265625, 0.577392578125, 0.6114349365234375, 0.645477294921875, 0.6795196533203125, 0.71356201171875, 0.7476043701171875, 0.781646728515625, 0.8156890869140625, 0.8497314453125, 0.8837738037109375, 0.917816162109375, 0.9518585205078125, 0.98590087890625, 1.0199432373046875, 1.053985595703125, 1.0880279541015625, 1.1220703125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 6.0, 10.0, 5.0, 10.0, 12.0, 11.0, 14.0, 18.0, 23.0, 26.0, 25.0, 27.0, 29.0, 40.0, 35.0, 45.0, 40.0, 44.0, 53.0, 37.0, 34.0, 36.0, 40.0, 51.0, 51.0, 43.0, 39.0, 33.0, 28.0, 20.0, 25.0, 16.0, 13.0, 7.0, 12.0, 11.0, 6.0, 5.0, 7.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.81396484375, -0.7909622192382812, -0.7679595947265625, -0.7449569702148438, -0.721954345703125, -0.6989517211914062, -0.6759490966796875, -0.6529464721679688, -0.62994384765625, -0.6069412231445312, -0.5839385986328125, -0.5609359741210938, -0.537933349609375, -0.5149307250976562, -0.4919281005859375, -0.46892547607421875, -0.4459228515625, -0.42292022705078125, -0.3999176025390625, -0.37691497802734375, -0.353912353515625, -0.33090972900390625, -0.3079071044921875, -0.28490447998046875, -0.26190185546875, -0.23889923095703125, -0.2158966064453125, -0.19289398193359375, -0.169891357421875, -0.14688873291015625, -0.1238861083984375, -0.10088348388671875, -0.077880859375, -0.05487823486328125, -0.0318756103515625, -0.00887298583984375, 0.014129638671875, 0.03713226318359375, 0.0601348876953125, 0.08313751220703125, 0.10614013671875, 0.12914276123046875, 0.1521453857421875, 0.17514801025390625, 0.198150634765625, 0.22115325927734375, 0.2441558837890625, 0.26715850830078125, 0.2901611328125, 0.31316375732421875, 0.3361663818359375, 0.35916900634765625, 0.382171630859375, 0.40517425537109375, 0.4281768798828125, 0.45117950439453125, 0.47418212890625, 0.49718475341796875, 0.5201873779296875, 0.5431900024414062, 0.566192626953125, 0.5891952514648438, 0.6121978759765625, 0.6352005004882812, 0.658203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 5.0, 9.0, 10.0, 20.0, 19.0, 37.0, 46.0, 85.0, 149.0, 203.0, 289.0, 569.0, 1095.0, 2323.0, 5615.0, 14296.0, 38078.0, 101270.0, 276831.0, 372793.0, 145922.0, 54070.0, 20588.0, 7893.0, 3212.0, 1393.0, 714.0, 353.0, 231.0, 124.0, 73.0, 68.0, 61.0, 32.0, 12.0, 16.0, 14.0, 9.0, 4.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.268798828125, -0.2613697052001953, -0.2539405822753906, -0.24651145935058594, -0.23908233642578125, -0.23165321350097656, -0.22422409057617188, -0.2167949676513672, -0.2093658447265625, -0.2019367218017578, -0.19450759887695312, -0.18707847595214844, -0.17964935302734375, -0.17222023010253906, -0.16479110717773438, -0.1573619842529297, -0.149932861328125, -0.1425037384033203, -0.13507461547851562, -0.12764549255371094, -0.12021636962890625, -0.11278724670410156, -0.10535812377929688, -0.09792900085449219, -0.0904998779296875, -0.08307075500488281, -0.07564163208007812, -0.06821250915527344, -0.06078338623046875, -0.05335426330566406, -0.045925140380859375, -0.03849601745605469, -0.03106689453125, -0.023637771606445312, -0.016208648681640625, -0.008779525756835938, -0.00135040283203125, 0.0060787200927734375, 0.013507843017578125, 0.020936965942382812, 0.0283660888671875, 0.03579521179199219, 0.043224334716796875, 0.05065345764160156, 0.05808258056640625, 0.06551170349121094, 0.07294082641601562, 0.08036994934082031, 0.087799072265625, 0.09522819519042969, 0.10265731811523438, 0.11008644104003906, 0.11751556396484375, 0.12494468688964844, 0.13237380981445312, 0.1398029327392578, 0.1472320556640625, 0.1546611785888672, 0.16209030151367188, 0.16951942443847656, 0.17694854736328125, 0.18437767028808594, 0.19180679321289062, 0.1992359161376953, 0.2066650390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 2.0, 4.0, 9.0, 5.0, 10.0, 16.0, 14.0, 26.0, 31.0, 34.0, 41.0, 58.0, 90.0, 102.0, 101.0, 96.0, 75.0, 64.0, 44.0, 38.0, 25.0, 24.0, 16.0, 8.0, 17.0, 5.0, 10.0, 8.0, 8.0, 2.0, 9.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.780292510986328e-05, -4.628114402294159e-05, -4.47593629360199e-05, -4.3237581849098206e-05, -4.1715800762176514e-05, -4.019401967525482e-05, -3.867223858833313e-05, -3.715045750141144e-05, -3.5628676414489746e-05, -3.4106895327568054e-05, -3.258511424064636e-05, -3.106333315372467e-05, -2.954155206680298e-05, -2.8019770979881287e-05, -2.6497989892959595e-05, -2.4976208806037903e-05, -2.345442771911621e-05, -2.193264663219452e-05, -2.0410865545272827e-05, -1.8889084458351135e-05, -1.7367303371429443e-05, -1.584552228450775e-05, -1.432374119758606e-05, -1.2801960110664368e-05, -1.1280179023742676e-05, -9.758397936820984e-06, -8.236616849899292e-06, -6.7148357629776e-06, -5.193054676055908e-06, -3.6712735891342163e-06, -2.1494925022125244e-06, -6.277114152908325e-07, 8.940696716308594e-07, 2.4158507585525513e-06, 3.937631845474243e-06, 5.459412932395935e-06, 6.981194019317627e-06, 8.502975106239319e-06, 1.002475619316101e-05, 1.1546537280082703e-05, 1.3068318367004395e-05, 1.4590099453926086e-05, 1.611188054084778e-05, 1.763366162776947e-05, 1.9155442714691162e-05, 2.0677223801612854e-05, 2.2199004888534546e-05, 2.3720785975456238e-05, 2.524256706237793e-05, 2.676434814929962e-05, 2.8286129236221313e-05, 2.9807910323143005e-05, 3.13296914100647e-05, 3.285147249698639e-05, 3.437325358390808e-05, 3.589503467082977e-05, 3.7416815757751465e-05, 3.893859684467316e-05, 4.046037793159485e-05, 4.198215901851654e-05, 4.350394010543823e-05, 4.5025721192359924e-05, 4.6547502279281616e-05, 4.806928336620331e-05, 4.9591064453125e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 9.0, 7.0, 11.0, 23.0, 14.0, 47.0, 57.0, 79.0, 98.0, 158.0, 294.0, 662.0, 1493.0, 4430.0, 15705.0, 57710.0, 210430.0, 469899.0, 207879.0, 56757.0, 15461.0, 4428.0, 1531.0, 583.0, 283.0, 144.0, 113.0, 72.0, 39.0, 39.0, 27.0, 10.0, 13.0, 7.0, 7.0, 7.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.31201171875, -0.30269622802734375, -0.2933807373046875, -0.28406524658203125, -0.274749755859375, -0.26543426513671875, -0.2561187744140625, -0.24680328369140625, -0.23748779296875, -0.22817230224609375, -0.2188568115234375, -0.20954132080078125, -0.200225830078125, -0.19091033935546875, -0.1815948486328125, -0.17227935791015625, -0.1629638671875, -0.15364837646484375, -0.1443328857421875, -0.13501739501953125, -0.125701904296875, -0.11638641357421875, -0.1070709228515625, -0.09775543212890625, -0.08843994140625, -0.07912445068359375, -0.0698089599609375, -0.06049346923828125, -0.051177978515625, -0.04186248779296875, -0.0325469970703125, -0.02323150634765625, -0.013916015625, -0.00460052490234375, 0.0047149658203125, 0.01403045654296875, 0.023345947265625, 0.03266143798828125, 0.0419769287109375, 0.05129241943359375, 0.06060791015625, 0.06992340087890625, 0.0792388916015625, 0.08855438232421875, 0.097869873046875, 0.10718536376953125, 0.1165008544921875, 0.12581634521484375, 0.1351318359375, 0.14444732666015625, 0.1537628173828125, 0.16307830810546875, 0.172393798828125, 0.18170928955078125, 0.1910247802734375, 0.20034027099609375, 0.20965576171875, 0.21897125244140625, 0.2282867431640625, 0.23760223388671875, 0.246917724609375, 0.25623321533203125, 0.2655487060546875, 0.27486419677734375, 0.2841796875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 12.0, 14.0, 17.0, 14.0, 22.0, 21.0, 25.0, 35.0, 26.0, 39.0, 47.0, 61.0, 73.0, 56.0, 60.0, 64.0, 47.0, 42.0, 54.0, 31.0, 42.0, 31.0, 23.0, 17.0, 14.0, 14.0, 15.0, 12.0, 10.0, 6.0, 10.0, 6.0, 4.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1826171875, -0.17694854736328125, -0.1712799072265625, -0.16561126708984375, -0.159942626953125, -0.15427398681640625, -0.1486053466796875, -0.14293670654296875, -0.13726806640625, -0.13159942626953125, -0.1259307861328125, -0.12026214599609375, -0.114593505859375, -0.10892486572265625, -0.1032562255859375, -0.09758758544921875, -0.0919189453125, -0.08625030517578125, -0.0805816650390625, -0.07491302490234375, -0.069244384765625, -0.06357574462890625, -0.0579071044921875, -0.05223846435546875, -0.04656982421875, -0.04090118408203125, -0.0352325439453125, -0.02956390380859375, -0.023895263671875, -0.01822662353515625, -0.0125579833984375, -0.00688934326171875, -0.001220703125, 0.00444793701171875, 0.0101165771484375, 0.01578521728515625, 0.021453857421875, 0.02712249755859375, 0.0327911376953125, 0.03845977783203125, 0.04412841796875, 0.04979705810546875, 0.0554656982421875, 0.06113433837890625, 0.066802978515625, 0.07247161865234375, 0.0781402587890625, 0.08380889892578125, 0.0894775390625, 0.09514617919921875, 0.1008148193359375, 0.10648345947265625, 0.112152099609375, 0.11782073974609375, 0.1234893798828125, 0.12915802001953125, 0.13482666015625, 0.14049530029296875, 0.1461639404296875, 0.15183258056640625, 0.157501220703125, 0.16316986083984375, 0.1688385009765625, 0.17450714111328125, 0.18017578125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 3.0, 5.0, 11.0, 12.0, 34.0, 64.0, 128.0, 148.0, 178.0, 189.0, 120.0, 70.0, 28.0, 7.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.685758113861084, -1.539783239364624, -1.393808364868164, -1.2478336095809937, -1.1018587350845337, -0.9558838605880737, -0.8099090456962585, -0.6639342308044434, -0.5179593563079834, -0.3719845116138458, -0.22600966691970825, -0.08003482222557068, 0.0659400224685669, 0.21191489696502686, 0.35788971185684204, 0.5038645267486572, 0.6498394012451172, 0.7958142757415771, 0.9417890906333923, 1.0877639055252075, 1.2337387800216675, 1.3797136545181274, 1.5256884098052979, 1.6716632843017578, 1.8176381587982178, 1.9636130332946777, 2.1095879077911377, 2.2555627822875977, 2.4015374183654785, 2.5475125312805176, 2.6934871673583984, 2.8394620418548584, 2.9854373931884766, 3.1314122676849365, 3.2773871421813965, 3.4233620166778564, 3.5693368911743164, 3.7153115272521973, 3.8612864017486572, 4.007261276245117, 4.153236389160156, 4.299211025238037, 4.445186138153076, 4.591160774230957, 4.737135887145996, 4.883110523223877, 5.029085636138916, 5.175060272216797, 5.321034908294678, 5.467009544372559, 5.612984657287598, 5.7589592933654785, 5.904934406280518, 6.050909042358398, 6.1968841552734375, 6.342858791351318, 6.488833427429199, 6.63480806350708, 6.780783176422119, 6.9267578125, 7.072732925415039, 7.21870756149292, 7.364682674407959, 7.51065731048584, 7.656632423400879]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 8.0, 3.0, 6.0, 8.0, 5.0, 11.0, 20.0, 13.0, 11.0, 15.0, 29.0, 34.0, 14.0, 30.0, 34.0, 33.0, 35.0, 27.0, 32.0, 41.0, 38.0, 48.0, 31.0, 33.0, 31.0, 33.0, 39.0, 38.0, 36.0, 21.0, 31.0, 20.0, 29.0, 29.0, 10.0, 12.0, 15.0, 12.0, 16.0, 21.0, 10.0, 5.0, 8.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0], "bins": [-1.900040626525879, -1.8429653644561768, -1.7858901023864746, -1.7288148403167725, -1.6717395782470703, -1.6146643161773682, -1.5575891733169556, -1.5005139112472534, -1.4434386491775513, -1.3863633871078491, -1.329288125038147, -1.2722128629684448, -1.2151377201080322, -1.15806245803833, -1.100987195968628, -1.0439119338989258, -0.9868366718292236, -0.9297614097595215, -0.8726861476898193, -0.815610945224762, -0.7585356831550598, -0.7014604210853577, -0.6443852186203003, -0.5873099565505981, -0.530234694480896, -0.47315943241119385, -0.4160842001438141, -0.3590089678764343, -0.3019337058067322, -0.24485844373703003, -0.18778321146965027, -0.1307079792022705, -0.07363271713256836, -0.016557469964027405, 0.04051777720451355, 0.0975930243730545, 0.15466827154159546, 0.2117435336112976, 0.26881876587867737, 0.32589399814605713, 0.3829692602157593, 0.4400445222854614, 0.4971197545528412, 0.554194986820221, 0.6112702488899231, 0.6683455109596252, 0.7254207134246826, 0.7824959754943848, 0.8395712375640869, 0.8966464996337891, 0.9537217617034912, 1.0107970237731934, 1.0678722858428955, 1.1249475479125977, 1.1820226907730103, 1.2390979528427124, 1.2961732149124146, 1.3532484769821167, 1.4103237390518188, 1.467399001121521, 1.5244741439819336, 1.5815494060516357, 1.638624668121338, 1.69569993019104, 1.7527751922607422]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 8.0, 9.0, 6.0, 5.0, 16.0, 31.0, 42.0, 61.0, 93.0, 145.0, 239.0, 375.0, 610.0, 1042.0, 1816.0, 3158.0, 5713.0, 10698.0, 20597.0, 40688.0, 83411.0, 184666.0, 468752.0, 1278393.0, 1275893.0, 466154.0, 183399.0, 82956.0, 40553.0, 20778.0, 10731.0, 5710.0, 3208.0, 1763.0, 961.0, 615.0, 372.0, 229.0, 133.0, 86.0, 54.0, 36.0, 33.0, 19.0, 14.0, 7.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.277099609375, -0.26940155029296875, -0.2617034912109375, -0.25400543212890625, -0.246307373046875, -0.23860931396484375, -0.2309112548828125, -0.22321319580078125, -0.21551513671875, -0.20781707763671875, -0.2001190185546875, -0.19242095947265625, -0.184722900390625, -0.17702484130859375, -0.1693267822265625, -0.16162872314453125, -0.1539306640625, -0.14623260498046875, -0.1385345458984375, -0.13083648681640625, -0.123138427734375, -0.11544036865234375, -0.1077423095703125, -0.10004425048828125, -0.09234619140625, -0.08464813232421875, -0.0769500732421875, -0.06925201416015625, -0.061553955078125, -0.05385589599609375, -0.0461578369140625, -0.03845977783203125, -0.03076171875, -0.02306365966796875, -0.0153656005859375, -0.00766754150390625, 3.0517578125e-05, 0.00772857666015625, 0.0154266357421875, 0.02312469482421875, 0.03082275390625, 0.03852081298828125, 0.0462188720703125, 0.05391693115234375, 0.061614990234375, 0.06931304931640625, 0.0770111083984375, 0.08470916748046875, 0.0924072265625, 0.10010528564453125, 0.1078033447265625, 0.11550140380859375, 0.123199462890625, 0.13089752197265625, 0.1385955810546875, 0.14629364013671875, 0.15399169921875, 0.16168975830078125, 0.1693878173828125, 0.17708587646484375, 0.184783935546875, 0.19248199462890625, 0.2001800537109375, 0.20787811279296875, 0.215576171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 16.0, 14.0, 8.0, 15.0, 16.0, 22.0, 23.0, 29.0, 24.0, 24.0, 38.0, 35.0, 37.0, 30.0, 47.0, 31.0, 43.0, 35.0, 33.0, 54.0, 40.0, 44.0, 31.0, 36.0, 29.0, 29.0, 22.0, 27.0, 25.0, 17.0, 21.0, 17.0, 9.0, 9.0, 9.0, 8.0, 9.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.23486328125, -0.22769737243652344, -0.22053146362304688, -0.2133655548095703, -0.20619964599609375, -0.1990337371826172, -0.19186782836914062, -0.18470191955566406, -0.1775360107421875, -0.17037010192871094, -0.16320419311523438, -0.1560382843017578, -0.14887237548828125, -0.1417064666748047, -0.13454055786132812, -0.12737464904785156, -0.120208740234375, -0.11304283142089844, -0.10587692260742188, -0.09871101379394531, -0.09154510498046875, -0.08437919616699219, -0.07721328735351562, -0.07004737854003906, -0.0628814697265625, -0.05571556091308594, -0.048549652099609375, -0.04138374328613281, -0.03421783447265625, -0.027051925659179688, -0.019886016845703125, -0.012720108032226562, -0.00555419921875, 0.0016117095947265625, 0.008777618408203125, 0.015943527221679688, 0.02310943603515625, 0.030275344848632812, 0.037441253662109375, 0.04460716247558594, 0.0517730712890625, 0.05893898010253906, 0.06610488891601562, 0.07327079772949219, 0.08043670654296875, 0.08760261535644531, 0.09476852416992188, 0.10193443298339844, 0.109100341796875, 0.11626625061035156, 0.12343215942382812, 0.1305980682373047, 0.13776397705078125, 0.1449298858642578, 0.15209579467773438, 0.15926170349121094, 0.1664276123046875, 0.17359352111816406, 0.18075942993164062, 0.1879253387451172, 0.19509124755859375, 0.2022571563720703, 0.20942306518554688, 0.21658897399902344, 0.2237548828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 15.0, 12.0, 31.0, 38.0, 50.0, 60.0, 81.0, 126.0, 208.0, 328.0, 547.0, 912.0, 1765.0, 3688.0, 8643.0, 21244.0, 55631.0, 156396.0, 494934.0, 1772566.0, 1184726.0, 318051.0, 107297.0, 38719.0, 15371.0, 6466.0, 2879.0, 1388.0, 805.0, 428.0, 260.0, 179.0, 126.0, 83.0, 74.0, 42.0, 31.0, 28.0, 18.0, 9.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39794921875, -0.38364410400390625, -0.3693389892578125, -0.35503387451171875, -0.340728759765625, -0.32642364501953125, -0.3121185302734375, -0.29781341552734375, -0.28350830078125, -0.26920318603515625, -0.2548980712890625, -0.24059295654296875, -0.226287841796875, -0.21198272705078125, -0.1976776123046875, -0.18337249755859375, -0.1690673828125, -0.15476226806640625, -0.1404571533203125, -0.12615203857421875, -0.111846923828125, -0.09754180908203125, -0.0832366943359375, -0.06893157958984375, -0.05462646484375, -0.04032135009765625, -0.0260162353515625, -0.01171112060546875, 0.002593994140625, 0.01689910888671875, 0.0312042236328125, 0.04550933837890625, 0.059814453125, 0.07411956787109375, 0.0884246826171875, 0.10272979736328125, 0.117034912109375, 0.13134002685546875, 0.1456451416015625, 0.15995025634765625, 0.17425537109375, 0.18856048583984375, 0.2028656005859375, 0.21717071533203125, 0.231475830078125, 0.24578094482421875, 0.2600860595703125, 0.27439117431640625, 0.2886962890625, 0.30300140380859375, 0.3173065185546875, 0.33161163330078125, 0.345916748046875, 0.36022186279296875, 0.3745269775390625, 0.38883209228515625, 0.40313720703125, 0.41744232177734375, 0.4317474365234375, 0.44605255126953125, 0.460357666015625, 0.47466278076171875, 0.4889678955078125, 0.5032730102539062, 0.517578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 10.0, 7.0, 21.0, 34.0, 40.0, 79.0, 136.0, 209.0, 370.0, 602.0, 850.0, 667.0, 375.0, 234.0, 129.0, 105.0, 61.0, 38.0, 39.0, 21.0, 13.0, 10.0, 3.0, 2.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.505859375, -0.4825439453125, -0.459228515625, -0.4359130859375, -0.41259765625, -0.3892822265625, -0.365966796875, -0.3426513671875, -0.3193359375, -0.2960205078125, -0.272705078125, -0.2493896484375, -0.22607421875, -0.2027587890625, -0.179443359375, -0.1561279296875, -0.1328125, -0.1094970703125, -0.086181640625, -0.0628662109375, -0.03955078125, -0.0162353515625, 0.007080078125, 0.0303955078125, 0.0537109375, 0.0770263671875, 0.100341796875, 0.1236572265625, 0.14697265625, 0.1702880859375, 0.193603515625, 0.2169189453125, 0.240234375, 0.2635498046875, 0.286865234375, 0.3101806640625, 0.33349609375, 0.3568115234375, 0.380126953125, 0.4034423828125, 0.4267578125, 0.4500732421875, 0.473388671875, 0.4967041015625, 0.52001953125, 0.5433349609375, 0.566650390625, 0.5899658203125, 0.61328125, 0.6365966796875, 0.659912109375, 0.6832275390625, 0.70654296875, 0.7298583984375, 0.753173828125, 0.7764892578125, 0.7998046875, 0.8231201171875, 0.846435546875, 0.8697509765625, 0.89306640625, 0.9163818359375, 0.939697265625, 0.9630126953125, 0.986328125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 7.0, 7.0, 11.0, 15.0, 11.0, 39.0, 45.0, 55.0, 65.0, 80.0, 92.0, 93.0, 87.0, 87.0, 85.0, 50.0, 62.0, 27.0, 30.0, 12.0, 12.0, 13.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.943532705307007, -2.8673970699310303, -2.791261672973633, -2.7151260375976562, -2.6389904022216797, -2.562854766845703, -2.4867191314697266, -2.410583734512329, -2.3344480991363525, -2.258312463760376, -2.1821770668029785, -2.106041431427002, -2.0299057960510254, -1.9537701606750488, -1.8776346445083618, -1.8014991283416748, -1.7253634929656982, -1.6492278575897217, -1.5730923414230347, -1.4969568252563477, -1.420821189880371, -1.3446855545043945, -1.2685500383377075, -1.1924145221710205, -1.116278886795044, -1.0401432514190674, -0.9640077352523804, -0.8878721594810486, -0.8117365837097168, -0.735601007938385, -0.6594654321670532, -0.5833298563957214, -0.5071942806243896, -0.43105870485305786, -0.3549231290817261, -0.2787875533103943, -0.2026519775390625, -0.1265164017677307, -0.050380825996398926, 0.02575474977493286, 0.10189032554626465, 0.17802590131759644, 0.2541614770889282, 0.33029705286026, 0.4064326286315918, 0.4825682044029236, 0.5587037801742554, 0.6348393559455872, 0.710974931716919, 0.7871105074882507, 0.8632460832595825, 0.9393816590309143, 1.015517234802246, 1.0916528701782227, 1.1677883863449097, 1.2439239025115967, 1.3200595378875732, 1.3961951732635498, 1.4723306894302368, 1.5484662055969238, 1.6246018409729004, 1.700737476348877, 1.776872992515564, 1.853008508682251, 1.9291441440582275]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 3.0, 7.0, 6.0, 7.0, 8.0, 15.0, 12.0, 11.0, 20.0, 16.0, 28.0, 28.0, 27.0, 34.0, 40.0, 37.0, 39.0, 41.0, 42.0, 49.0, 35.0, 35.0, 39.0, 34.0, 42.0, 34.0, 42.0, 44.0, 24.0, 26.0, 33.0, 23.0, 25.0, 16.0, 14.0, 8.0, 11.0, 8.0, 3.0, 5.0, 5.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6516945362091064, -1.5991718769073486, -1.5466490983963013, -1.4941264390945435, -1.4416037797927856, -1.3890810012817383, -1.3365583419799805, -1.2840356826782227, -1.2315130233764648, -1.178990364074707, -1.1264675855636597, -1.0739449262619019, -1.021422266960144, -0.9688995480537415, -0.9163768291473389, -0.863854169845581, -0.8113313913345337, -0.7588086724281311, -0.7062860131263733, -0.6537632942199707, -0.6012406349182129, -0.5487179160118103, -0.4961951971054077, -0.4436725080013275, -0.3911498188972473, -0.3386271297931671, -0.2861044406890869, -0.23358172178268433, -0.18105903267860413, -0.12853634357452393, -0.07601362466812134, -0.023490935564041138, 0.029031753540039062, 0.08155445009469986, 0.13407714664936066, 0.18659985065460205, 0.23912253975868225, 0.29164522886276245, 0.34416794776916504, 0.39669063687324524, 0.44921332597732544, 0.501736044883728, 0.5542587041854858, 0.6067814230918884, 0.659304141998291, 0.7118268013000488, 0.7643495202064514, 0.816872239112854, 0.8693948984146118, 0.9219176173210144, 0.9744402766227722, 1.0269629955291748, 1.0794856548309326, 1.1320083141326904, 1.1845310926437378, 1.2370537519454956, 1.289576530456543, 1.3420991897583008, 1.3946219682693481, 1.447144627571106, 1.4996672868728638, 1.5521900653839111, 1.604712724685669, 1.6572353839874268, 1.7097580432891846]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 13.0, 24.0, 36.0, 38.0, 51.0, 92.0, 135.0, 162.0, 242.0, 336.0, 519.0, 689.0, 963.0, 1382.0, 2038.0, 2832.0, 4048.0, 5811.0, 8235.0, 11989.0, 17376.0, 26442.0, 42261.0, 75081.0, 155818.0, 259413.0, 193594.0, 94127.0, 49895.0, 30597.0, 19953.0, 13534.0, 9223.0, 6476.0, 4457.0, 3132.0, 2269.0, 1583.0, 1054.0, 781.0, 553.0, 389.0, 285.0, 162.0, 146.0, 99.0, 71.0, 40.0, 34.0, 18.0, 9.0, 10.0, 12.0, 6.0, 11.0, 0.0, 1.0], "bins": [-0.248291015625, -0.24068832397460938, -0.23308563232421875, -0.22548294067382812, -0.2178802490234375, -0.21027755737304688, -0.20267486572265625, -0.19507217407226562, -0.187469482421875, -0.17986679077148438, -0.17226409912109375, -0.16466140747070312, -0.1570587158203125, -0.14945602416992188, -0.14185333251953125, -0.13425064086914062, -0.12664794921875, -0.11904525756835938, -0.11144256591796875, -0.10383987426757812, -0.0962371826171875, -0.08863449096679688, -0.08103179931640625, -0.07342910766601562, -0.065826416015625, -0.058223724365234375, -0.05062103271484375, -0.043018341064453125, -0.0354156494140625, -0.027812957763671875, -0.02021026611328125, -0.012607574462890625, -0.0050048828125, 0.002597808837890625, 0.01020050048828125, 0.017803192138671875, 0.0254058837890625, 0.033008575439453125, 0.04061126708984375, 0.048213958740234375, 0.055816650390625, 0.06341934204101562, 0.07102203369140625, 0.07862472534179688, 0.0862274169921875, 0.09383010864257812, 0.10143280029296875, 0.10903549194335938, 0.11663818359375, 0.12424087524414062, 0.13184356689453125, 0.13944625854492188, 0.1470489501953125, 0.15465164184570312, 0.16225433349609375, 0.16985702514648438, 0.177459716796875, 0.18506240844726562, 0.19266510009765625, 0.20026779174804688, 0.2078704833984375, 0.21547317504882812, 0.22307586669921875, 0.23067855834960938, 0.23828125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 4.0, 3.0, 6.0, 4.0, 5.0, 10.0, 7.0, 13.0, 11.0, 13.0, 9.0, 23.0, 14.0, 20.0, 19.0, 30.0, 26.0, 30.0, 30.0, 43.0, 34.0, 36.0, 30.0, 37.0, 37.0, 38.0, 24.0, 40.0, 36.0, 35.0, 29.0, 40.0, 36.0, 35.0, 24.0, 27.0, 26.0, 17.0, 17.0, 9.0, 18.0, 15.0, 11.0, 7.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19544219970703125, -0.1891021728515625, -0.18276214599609375, -0.176422119140625, -0.17008209228515625, -0.1637420654296875, -0.15740203857421875, -0.15106201171875, -0.14472198486328125, -0.1383819580078125, -0.13204193115234375, -0.125701904296875, -0.11936187744140625, -0.1130218505859375, -0.10668182373046875, -0.100341796875, -0.09400177001953125, -0.0876617431640625, -0.08132171630859375, -0.074981689453125, -0.06864166259765625, -0.0623016357421875, -0.05596160888671875, -0.04962158203125, -0.04328155517578125, -0.0369415283203125, -0.03060150146484375, -0.024261474609375, -0.01792144775390625, -0.0115814208984375, -0.00524139404296875, 0.0010986328125, 0.00743865966796875, 0.0137786865234375, 0.02011871337890625, 0.026458740234375, 0.03279876708984375, 0.0391387939453125, 0.04547882080078125, 0.05181884765625, 0.05815887451171875, 0.0644989013671875, 0.07083892822265625, 0.077178955078125, 0.08351898193359375, 0.0898590087890625, 0.09619903564453125, 0.1025390625, 0.10887908935546875, 0.1152191162109375, 0.12155914306640625, 0.127899169921875, 0.13423919677734375, 0.1405792236328125, 0.14691925048828125, 0.15325927734375, 0.15959930419921875, 0.1659393310546875, 0.17227935791015625, 0.178619384765625, 0.18495941162109375, 0.1912994384765625, 0.19763946533203125, 0.2039794921875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 13.0, 11.0, 21.0, 26.0, 31.0, 39.0, 56.0, 75.0, 86.0, 183.0, 290.0, 636.0, 1530.0, 4092.0, 11298.0, 31426.0, 95737.0, 459574.0, 330922.0, 72147.0, 25302.0, 9216.0, 3275.0, 1271.0, 547.0, 277.0, 150.0, 96.0, 69.0, 45.0, 35.0, 23.0, 16.0, 10.0, 7.0, 9.0, 2.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5340576171875, -0.513427734375, -0.4927978515625, -0.47216796875, -0.4515380859375, -0.430908203125, -0.4102783203125, -0.3896484375, -0.3690185546875, -0.348388671875, -0.3277587890625, -0.30712890625, -0.2864990234375, -0.265869140625, -0.2452392578125, -0.224609375, -0.2039794921875, -0.183349609375, -0.1627197265625, -0.14208984375, -0.1214599609375, -0.100830078125, -0.0802001953125, -0.0595703125, -0.0389404296875, -0.018310546875, 0.0023193359375, 0.02294921875, 0.0435791015625, 0.064208984375, 0.0848388671875, 0.10546875, 0.1260986328125, 0.146728515625, 0.1673583984375, 0.18798828125, 0.2086181640625, 0.229248046875, 0.2498779296875, 0.2705078125, 0.2911376953125, 0.311767578125, 0.3323974609375, 0.35302734375, 0.3736572265625, 0.394287109375, 0.4149169921875, 0.435546875, 0.4561767578125, 0.476806640625, 0.4974365234375, 0.51806640625, 0.5386962890625, 0.559326171875, 0.5799560546875, 0.6005859375, 0.6212158203125, 0.641845703125, 0.6624755859375, 0.68310546875, 0.7037353515625, 0.724365234375, 0.7449951171875, 0.765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 10.0, 8.0, 16.0, 9.0, 15.0, 8.0, 14.0, 14.0, 18.0, 14.0, 23.0, 29.0, 27.0, 35.0, 36.0, 31.0, 35.0, 32.0, 29.0, 45.0, 48.0, 43.0, 30.0, 38.0, 40.0, 43.0, 28.0, 29.0, 27.0, 26.0, 27.0, 19.0, 27.0, 13.0, 18.0, 12.0, 12.0, 12.0, 5.0, 6.0, 6.0, 7.0, 4.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.583984375, -0.5655059814453125, -0.547027587890625, -0.5285491943359375, -0.51007080078125, -0.4915924072265625, -0.473114013671875, -0.4546356201171875, -0.4361572265625, -0.4176788330078125, -0.399200439453125, -0.3807220458984375, -0.36224365234375, -0.3437652587890625, -0.325286865234375, -0.3068084716796875, -0.288330078125, -0.2698516845703125, -0.251373291015625, -0.2328948974609375, -0.21441650390625, -0.1959381103515625, -0.177459716796875, -0.1589813232421875, -0.1405029296875, -0.1220245361328125, -0.103546142578125, -0.0850677490234375, -0.06658935546875, -0.0481109619140625, -0.029632568359375, -0.0111541748046875, 0.00732421875, 0.0258026123046875, 0.044281005859375, 0.0627593994140625, 0.08123779296875, 0.0997161865234375, 0.118194580078125, 0.1366729736328125, 0.1551513671875, 0.1736297607421875, 0.192108154296875, 0.2105865478515625, 0.22906494140625, 0.2475433349609375, 0.266021728515625, 0.2845001220703125, 0.302978515625, 0.3214569091796875, 0.339935302734375, 0.3584136962890625, 0.37689208984375, 0.3953704833984375, 0.413848876953125, 0.4323272705078125, 0.4508056640625, 0.4692840576171875, 0.487762451171875, 0.5062408447265625, 0.52471923828125, 0.5431976318359375, 0.561676025390625, 0.5801544189453125, 0.5986328125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 9.0, 11.0, 20.0, 24.0, 39.0, 57.0, 121.0, 180.0, 260.0, 459.0, 810.0, 1528.0, 2818.0, 5388.0, 10245.0, 20042.0, 39621.0, 79952.0, 187037.0, 360622.0, 180861.0, 78585.0, 38827.0, 19698.0, 9878.0, 5193.0, 2686.0, 1528.0, 818.0, 479.0, 298.0, 171.0, 102.0, 58.0, 43.0, 28.0, 15.0, 12.0, 11.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1639404296875, -0.1590442657470703, -0.15414810180664062, -0.14925193786621094, -0.14435577392578125, -0.13945960998535156, -0.13456344604492188, -0.1296672821044922, -0.1247711181640625, -0.11987495422363281, -0.11497879028320312, -0.11008262634277344, -0.10518646240234375, -0.10029029846191406, -0.09539413452148438, -0.09049797058105469, -0.085601806640625, -0.08070564270019531, -0.07580947875976562, -0.07091331481933594, -0.06601715087890625, -0.06112098693847656, -0.056224822998046875, -0.05132865905761719, -0.0464324951171875, -0.04153633117675781, -0.036640167236328125, -0.03174400329589844, -0.02684783935546875, -0.021951675415039062, -0.017055511474609375, -0.012159347534179688, -0.00726318359375, -0.0023670196533203125, 0.002529144287109375, 0.0074253082275390625, 0.01232147216796875, 0.017217636108398438, 0.022113800048828125, 0.027009963989257812, 0.0319061279296875, 0.03680229187011719, 0.041698455810546875, 0.04659461975097656, 0.05149078369140625, 0.05638694763183594, 0.061283111572265625, 0.06617927551269531, 0.071075439453125, 0.07597160339355469, 0.08086776733398438, 0.08576393127441406, 0.09066009521484375, 0.09555625915527344, 0.10045242309570312, 0.10534858703613281, 0.1102447509765625, 0.11514091491699219, 0.12003707885742188, 0.12493324279785156, 0.12982940673828125, 0.13472557067871094, 0.13962173461914062, 0.1445178985595703, 0.1494140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 8.0, 5.0, 4.0, 11.0, 11.0, 12.0, 8.0, 11.0, 30.0, 38.0, 45.0, 80.0, 103.0, 154.0, 155.0, 106.0, 53.0, 40.0, 27.0, 24.0, 17.0, 7.0, 7.0, 12.0, 4.0, 5.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.55055046081543e-05, -6.376765668392181e-05, -6.202980875968933e-05, -6.029196083545685e-05, -5.8554112911224365e-05, -5.681626498699188e-05, -5.50784170627594e-05, -5.3340569138526917e-05, -5.1602721214294434e-05, -4.986487329006195e-05, -4.812702536582947e-05, -4.6389177441596985e-05, -4.46513295173645e-05, -4.291348159313202e-05, -4.1175633668899536e-05, -3.943778574466705e-05, -3.769993782043457e-05, -3.596208989620209e-05, -3.4224241971969604e-05, -3.248639404773712e-05, -3.074854612350464e-05, -2.9010698199272156e-05, -2.7272850275039673e-05, -2.553500235080719e-05, -2.3797154426574707e-05, -2.2059306502342224e-05, -2.032145857810974e-05, -1.8583610653877258e-05, -1.6845762729644775e-05, -1.5107914805412292e-05, -1.337006688117981e-05, -1.1632218956947327e-05, -9.894371032714844e-06, -8.15652310848236e-06, -6.418675184249878e-06, -4.680827260017395e-06, -2.942979335784912e-06, -1.2051314115524292e-06, 5.327165126800537e-07, 2.2705644369125366e-06, 4.0084123611450195e-06, 5.7462602853775024e-06, 7.484108209609985e-06, 9.221956133842468e-06, 1.0959804058074951e-05, 1.2697651982307434e-05, 1.4435499906539917e-05, 1.61733478307724e-05, 1.7911195755004883e-05, 1.9649043679237366e-05, 2.138689160346985e-05, 2.312473952770233e-05, 2.4862587451934814e-05, 2.6600435376167297e-05, 2.833828330039978e-05, 3.0076131224632263e-05, 3.1813979148864746e-05, 3.355182707309723e-05, 3.528967499732971e-05, 3.7027522921562195e-05, 3.876537084579468e-05, 4.050321877002716e-05, 4.2241066694259644e-05, 4.3978914618492126e-05, 4.571676254272461e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 8.0, 6.0, 9.0, 13.0, 22.0, 26.0, 45.0, 46.0, 87.0, 122.0, 196.0, 330.0, 619.0, 1142.0, 2881.0, 8019.0, 29385.0, 121543.0, 511979.0, 285464.0, 61898.0, 16002.0, 4943.0, 1829.0, 801.0, 404.0, 266.0, 164.0, 103.0, 58.0, 39.0, 43.0, 15.0, 16.0, 15.0, 10.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.322998046875, -0.313140869140625, -0.30328369140625, -0.293426513671875, -0.2835693359375, -0.273712158203125, -0.26385498046875, -0.253997802734375, -0.244140625, -0.234283447265625, -0.22442626953125, -0.214569091796875, -0.2047119140625, -0.194854736328125, -0.18499755859375, -0.175140380859375, -0.165283203125, -0.155426025390625, -0.14556884765625, -0.135711669921875, -0.1258544921875, -0.115997314453125, -0.10614013671875, -0.096282958984375, -0.08642578125, -0.076568603515625, -0.06671142578125, -0.056854248046875, -0.0469970703125, -0.037139892578125, -0.02728271484375, -0.017425537109375, -0.007568359375, 0.002288818359375, 0.01214599609375, 0.022003173828125, 0.0318603515625, 0.041717529296875, 0.05157470703125, 0.061431884765625, 0.0712890625, 0.081146240234375, 0.09100341796875, 0.100860595703125, 0.1107177734375, 0.120574951171875, 0.13043212890625, 0.140289306640625, 0.150146484375, 0.160003662109375, 0.16986083984375, 0.179718017578125, 0.1895751953125, 0.199432373046875, 0.20928955078125, 0.219146728515625, 0.22900390625, 0.238861083984375, 0.24871826171875, 0.258575439453125, 0.2684326171875, 0.278289794921875, 0.28814697265625, 0.298004150390625, 0.307861328125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 10.0, 9.0, 10.0, 18.0, 17.0, 19.0, 25.0, 51.0, 53.0, 62.0, 93.0, 95.0, 110.0, 108.0, 73.0, 52.0, 46.0, 35.0, 25.0, 28.0, 12.0, 8.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1937255859375, -0.18535423278808594, -0.17698287963867188, -0.1686115264892578, -0.16024017333984375, -0.1518688201904297, -0.14349746704101562, -0.13512611389160156, -0.1267547607421875, -0.11838340759277344, -0.11001205444335938, -0.10164070129394531, -0.09326934814453125, -0.08489799499511719, -0.07652664184570312, -0.06815528869628906, -0.059783935546875, -0.05141258239746094, -0.043041229248046875, -0.03466987609863281, -0.02629852294921875, -0.017927169799804688, -0.009555816650390625, -0.0011844635009765625, 0.0071868896484375, 0.015558242797851562, 0.023929595947265625, 0.03230094909667969, 0.04067230224609375, 0.04904365539550781, 0.057415008544921875, 0.06578636169433594, 0.07415771484375, 0.08252906799316406, 0.09090042114257812, 0.09927177429199219, 0.10764312744140625, 0.11601448059082031, 0.12438583374023438, 0.13275718688964844, 0.1411285400390625, 0.14949989318847656, 0.15787124633789062, 0.1662425994873047, 0.17461395263671875, 0.1829853057861328, 0.19135665893554688, 0.19972801208496094, 0.208099365234375, 0.21647071838378906, 0.22484207153320312, 0.2332134246826172, 0.24158477783203125, 0.2499561309814453, 0.2583274841308594, 0.26669883728027344, 0.2750701904296875, 0.28344154357910156, 0.2918128967285156, 0.3001842498779297, 0.30855560302734375, 0.3169269561767578, 0.3252983093261719, 0.33366966247558594, 0.342041015625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 11.0, 17.0, 24.0, 39.0, 74.0, 114.0, 132.0, 160.0, 134.0, 116.0, 76.0, 56.0, 26.0, 14.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6895956993103027, -2.5931897163391113, -2.49678373336792, -2.4003775119781494, -2.303971529006958, -2.2075655460357666, -2.111159563064575, -2.0147533416748047, -1.9183473587036133, -1.8219413757324219, -1.725535273551941, -1.6291292905807495, -1.5327231884002686, -1.4363172054290771, -1.3399112224578857, -1.2435051202774048, -1.1470991373062134, -1.050693154335022, -0.954287052154541, -0.8578810691833496, -0.7614749670028687, -0.6650689840316772, -0.5686629414558411, -0.4722568988800049, -0.3758508563041687, -0.2794448137283325, -0.18303878605365753, -0.08663275837898254, 0.009773284196853638, 0.10617932677268982, 0.2025853395462036, 0.2989913821220398, 0.395397424697876, 0.49180346727371216, 0.5882095098495483, 0.6846154928207397, 0.7810215950012207, 0.8774275779724121, 0.9738336205482483, 1.0702396631240845, 1.1666457653045654, 1.2630517482757568, 1.3594578504562378, 1.4558638334274292, 1.5522699356079102, 1.6486759185791016, 1.745081901550293, 1.841488003730774, 1.9378939867019653, 2.0343000888824463, 2.1307060718536377, 2.227112054824829, 2.3235180377960205, 2.419924259185791, 2.5163302421569824, 2.612736225128174, 2.7091422080993652, 2.8055481910705566, 2.901954174041748, 2.9983603954315186, 3.09476637840271, 3.1911723613739014, 3.2875783443450928, 3.3839845657348633, 3.4803905487060547]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 2.0, 10.0, 2.0, 14.0, 15.0, 8.0, 14.0, 14.0, 20.0, 20.0, 25.0, 28.0, 15.0, 35.0, 37.0, 29.0, 37.0, 35.0, 36.0, 33.0, 42.0, 44.0, 46.0, 40.0, 33.0, 30.0, 38.0, 35.0, 34.0, 27.0, 25.0, 31.0, 35.0, 16.0, 17.0, 13.0, 15.0, 10.0, 5.0, 11.0, 8.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6608526706695557, -1.6099472045898438, -1.5590416193008423, -1.5081361532211304, -1.4572306871414185, -1.406325101852417, -1.355419635772705, -1.3045141696929932, -1.2536087036132812, -1.2027032375335693, -1.1517976522445679, -1.100892186164856, -1.049986720085144, -0.9990811944007874, -0.9481756687164307, -0.8972702026367188, -0.8463646173477173, -0.7954590916633606, -0.7445536255836487, -0.693648099899292, -0.6427426338195801, -0.5918371081352234, -0.5409315824508667, -0.4900260865688324, -0.4391205906867981, -0.3882150948047638, -0.3373095989227295, -0.2864040732383728, -0.2354985773563385, -0.1845930814743042, -0.1336875557899475, -0.08278205990791321, -0.031876564025878906, 0.019028939306735992, 0.06993444263935089, 0.12083995342254639, 0.1717454493045807, 0.222650945186615, 0.2735564708709717, 0.324461966753006, 0.3753674626350403, 0.4262729585170746, 0.4771784543991089, 0.5280839800834656, 0.5789895057678223, 0.6298949718475342, 0.6808004975318909, 0.7317060232162476, 0.7826114892959595, 0.8335170149803162, 0.8844224810600281, 0.9353280067443848, 0.9862334728240967, 1.0371389389038086, 1.08804452419281, 1.138949990272522, 1.1898555755615234, 1.2407610416412354, 1.2916666269302368, 1.3425720930099487, 1.3934775590896606, 1.444383144378662, 1.495288610458374, 1.546194076538086, 1.5970995426177979]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 4.0, 10.0, 11.0, 16.0, 17.0, 39.0, 72.0, 113.0, 200.0, 353.0, 640.0, 1121.0, 2100.0, 4094.0, 7596.0, 15377.0, 31978.0, 66776.0, 155947.0, 436657.0, 1515159.0, 1320887.0, 377192.0, 138161.0, 61332.0, 28884.0, 14202.0, 7183.0, 3779.0, 1979.0, 1072.0, 587.0, 320.0, 179.0, 102.0, 58.0, 35.0, 18.0, 11.0, 7.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31640625, -0.30735015869140625, -0.2982940673828125, -0.28923797607421875, -0.280181884765625, -0.27112579345703125, -0.2620697021484375, -0.25301361083984375, -0.24395751953125, -0.23490142822265625, -0.2258453369140625, -0.21678924560546875, -0.207733154296875, -0.19867706298828125, -0.1896209716796875, -0.18056488037109375, -0.1715087890625, -0.16245269775390625, -0.1533966064453125, -0.14434051513671875, -0.135284423828125, -0.12622833251953125, -0.1171722412109375, -0.10811614990234375, -0.09906005859375, -0.09000396728515625, -0.0809478759765625, -0.07189178466796875, -0.062835693359375, -0.05377960205078125, -0.0447235107421875, -0.03566741943359375, -0.026611328125, -0.01755523681640625, -0.0084991455078125, 0.00055694580078125, 0.009613037109375, 0.01866912841796875, 0.0277252197265625, 0.03678131103515625, 0.04583740234375, 0.05489349365234375, 0.0639495849609375, 0.07300567626953125, 0.082061767578125, 0.09111785888671875, 0.1001739501953125, 0.10923004150390625, 0.1182861328125, 0.12734222412109375, 0.1363983154296875, 0.14545440673828125, 0.154510498046875, 0.16356658935546875, 0.1726226806640625, 0.18167877197265625, 0.19073486328125, 0.19979095458984375, 0.2088470458984375, 0.21790313720703125, 0.226959228515625, 0.23601531982421875, 0.2450714111328125, 0.25412750244140625, 0.26318359375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 7.0, 8.0, 11.0, 11.0, 12.0, 12.0, 16.0, 20.0, 25.0, 17.0, 25.0, 25.0, 40.0, 37.0, 35.0, 39.0, 44.0, 36.0, 32.0, 42.0, 40.0, 33.0, 28.0, 36.0, 45.0, 41.0, 36.0, 28.0, 28.0, 18.0, 29.0, 23.0, 16.0, 17.0, 14.0, 10.0, 10.0, 10.0, 1.0, 3.0, 5.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2269287109375, -0.22019386291503906, -0.21345901489257812, -0.2067241668701172, -0.19998931884765625, -0.1932544708251953, -0.18651962280273438, -0.17978477478027344, -0.1730499267578125, -0.16631507873535156, -0.15958023071289062, -0.1528453826904297, -0.14611053466796875, -0.1393756866455078, -0.13264083862304688, -0.12590599060058594, -0.119171142578125, -0.11243629455566406, -0.10570144653320312, -0.09896659851074219, -0.09223175048828125, -0.08549690246582031, -0.07876205444335938, -0.07202720642089844, -0.0652923583984375, -0.05855751037597656, -0.051822662353515625, -0.04508781433105469, -0.03835296630859375, -0.03161811828613281, -0.024883270263671875, -0.018148422241210938, -0.01141357421875, -0.0046787261962890625, 0.002056121826171875, 0.008790969848632812, 0.01552581787109375, 0.022260665893554688, 0.028995513916015625, 0.03573036193847656, 0.0424652099609375, 0.04920005798339844, 0.055934906005859375, 0.06266975402832031, 0.06940460205078125, 0.07613945007324219, 0.08287429809570312, 0.08960914611816406, 0.096343994140625, 0.10307884216308594, 0.10981369018554688, 0.11654853820800781, 0.12328338623046875, 0.1300182342529297, 0.13675308227539062, 0.14348793029785156, 0.1502227783203125, 0.15695762634277344, 0.16369247436523438, 0.1704273223876953, 0.17716217041015625, 0.1838970184326172, 0.19063186645507812, 0.19736671447753906, 0.2041015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 8.0, 9.0, 9.0, 9.0, 17.0, 23.0, 44.0, 48.0, 71.0, 95.0, 122.0, 190.0, 268.0, 388.0, 625.0, 950.0, 1554.0, 2669.0, 4606.0, 8302.0, 15351.0, 29333.0, 57764.0, 121274.0, 277970.0, 800134.0, 1672764.0, 715280.0, 255389.0, 112547.0, 54770.0, 27820.0, 14615.0, 7646.0, 4430.0, 2664.0, 1543.0, 1027.0, 617.0, 424.0, 302.0, 191.0, 126.0, 92.0, 64.0, 44.0, 23.0, 30.0, 22.0, 8.0, 6.0, 8.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0], "bins": [-0.33203125, -0.32180023193359375, -0.3115692138671875, -0.30133819580078125, -0.291107177734375, -0.28087615966796875, -0.2706451416015625, -0.26041412353515625, -0.25018310546875, -0.23995208740234375, -0.2297210693359375, -0.21949005126953125, -0.209259033203125, -0.19902801513671875, -0.1887969970703125, -0.17856597900390625, -0.1683349609375, -0.15810394287109375, -0.1478729248046875, -0.13764190673828125, -0.127410888671875, -0.11717987060546875, -0.1069488525390625, -0.09671783447265625, -0.08648681640625, -0.07625579833984375, -0.0660247802734375, -0.05579376220703125, -0.045562744140625, -0.03533172607421875, -0.0251007080078125, -0.01486968994140625, -0.004638671875, 0.00559234619140625, 0.0158233642578125, 0.02605438232421875, 0.036285400390625, 0.04651641845703125, 0.0567474365234375, 0.06697845458984375, 0.07720947265625, 0.08744049072265625, 0.0976715087890625, 0.10790252685546875, 0.118133544921875, 0.12836456298828125, 0.1385955810546875, 0.14882659912109375, 0.1590576171875, 0.16928863525390625, 0.1795196533203125, 0.18975067138671875, 0.199981689453125, 0.21021270751953125, 0.2204437255859375, 0.23067474365234375, 0.24090576171875, 0.25113677978515625, 0.2613677978515625, 0.27159881591796875, 0.281829833984375, 0.29206085205078125, 0.3022918701171875, 0.31252288818359375, 0.32275390625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 13.0, 9.0, 8.0, 13.0, 18.0, 21.0, 47.0, 53.0, 74.0, 81.0, 107.0, 175.0, 217.0, 350.0, 492.0, 568.0, 515.0, 367.0, 247.0, 173.0, 105.0, 94.0, 71.0, 63.0, 36.0, 29.0, 24.0, 21.0, 20.0, 12.0, 5.0, 8.0, 8.0, 4.0, 4.0, 6.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4225349426269531, -0.40781402587890625, -0.3930931091308594, -0.3783721923828125, -0.3636512756347656, -0.34893035888671875, -0.3342094421386719, -0.319488525390625, -0.3047676086425781, -0.29004669189453125, -0.2753257751464844, -0.2606048583984375, -0.24588394165039062, -0.23116302490234375, -0.21644210815429688, -0.20172119140625, -0.18700027465820312, -0.17227935791015625, -0.15755844116210938, -0.1428375244140625, -0.12811660766601562, -0.11339569091796875, -0.09867477416992188, -0.083953857421875, -0.06923294067382812, -0.05451202392578125, -0.039791107177734375, -0.0250701904296875, -0.010349273681640625, 0.00437164306640625, 0.019092559814453125, 0.0338134765625, 0.048534393310546875, 0.06325531005859375, 0.07797622680664062, 0.0926971435546875, 0.10741806030273438, 0.12213897705078125, 0.13685989379882812, 0.151580810546875, 0.16630172729492188, 0.18102264404296875, 0.19574356079101562, 0.2104644775390625, 0.22518539428710938, 0.23990631103515625, 0.2546272277832031, 0.26934814453125, 0.2840690612792969, 0.29878997802734375, 0.3135108947753906, 0.3282318115234375, 0.3429527282714844, 0.35767364501953125, 0.3723945617675781, 0.387115478515625, 0.4018363952636719, 0.41655731201171875, 0.4312782287597656, 0.4459991455078125, 0.4607200622558594, 0.47544097900390625, 0.4901618957519531, 0.5048828125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 17.0, 24.0, 51.0, 61.0, 96.0, 142.0, 142.0, 158.0, 134.0, 82.0, 37.0, 21.0, 17.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5983855724334717, -2.477837324142456, -2.3572890758514404, -2.236740827560425, -2.11619234085083, -1.995644211769104, -1.8750958442687988, -1.7545475959777832, -1.6339993476867676, -1.513451099395752, -1.3929028511047363, -1.2723544836044312, -1.1518062353134155, -1.0312579870224, -0.9107096791267395, -0.7901613712310791, -0.6696131229400635, -0.5490648746490479, -0.42851656675338745, -0.30796828866004944, -0.18742001056671143, -0.0668717622756958, 0.0536765456199646, 0.174224853515625, 0.2947731018066406, 0.41532137989997864, 0.5358696579933167, 0.656417965888977, 0.7769662141799927, 0.8975144624710083, 1.0180628299713135, 1.138611078262329, 1.2591590881347656, 1.3797073364257812, 1.5002555847167969, 1.620803952217102, 1.7413522005081177, 1.8619004487991333, 1.9824488162994385, 2.102997064590454, 2.2235453128814697, 2.3440935611724854, 2.464641809463501, 2.5851900577545166, 2.7057385444641113, 2.826286792755127, 2.9468350410461426, 3.067383289337158, 3.187931537628174, 3.3084797859191895, 3.429028034210205, 3.5495762825012207, 3.6701245307922363, 3.790672779083252, 3.9112212657928467, 4.031769752502441, 4.152318000793457, 4.272866249084473, 4.393414497375488, 4.513962745666504, 4.6345109939575195, 4.755059242248535, 4.875607490539551, 4.996155738830566, 5.116703987121582]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 3.0, 8.0, 3.0, 6.0, 6.0, 6.0, 12.0, 18.0, 32.0, 14.0, 17.0, 28.0, 20.0, 28.0, 22.0, 30.0, 34.0, 43.0, 46.0, 33.0, 41.0, 42.0, 41.0, 45.0, 21.0, 39.0, 40.0, 36.0, 36.0, 24.0, 36.0, 28.0, 25.0, 19.0, 16.0, 23.0, 10.0, 12.0, 12.0, 9.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6624364852905273, -1.6146938800811768, -1.5669512748718262, -1.5192086696624756, -1.4714659452438354, -1.4237233400344849, -1.3759807348251343, -1.3282381296157837, -1.280495524406433, -1.2327529191970825, -1.185010313987732, -1.1372675895690918, -1.0895249843597412, -1.0417823791503906, -0.99403977394104, -0.9462971687316895, -0.8985545039176941, -0.8508118987083435, -0.8030692338943481, -0.7553266286849976, -0.707584023475647, -0.6598414182662964, -0.612098753452301, -0.5643561482429504, -0.5166134834289551, -0.4688708484172821, -0.4211282432079315, -0.37338560819625854, -0.32564300298690796, -0.277900367975235, -0.230157732963562, -0.18241512775421143, -0.13467252254486084, -0.08692990243434906, -0.03918727487325668, 0.008555352687835693, 0.05629797279834747, 0.10404059290885925, 0.15178322792053223, 0.1995258331298828, 0.2472684681415558, 0.29501110315322876, 0.34275370836257935, 0.3904963433742523, 0.4382389783859253, 0.4859815835952759, 0.5337241888046265, 0.581466794013977, 0.6292094588279724, 0.676952064037323, 0.7246947288513184, 0.772437334060669, 0.8201799392700195, 0.8679225444793701, 0.9156652092933655, 0.9634078145027161, 1.0111504793167114, 1.058893084526062, 1.1066356897354126, 1.1543784141540527, 1.2021210193634033, 1.249863624572754, 1.2976062297821045, 1.345348834991455, 1.3930914402008057]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 6.0, 4.0, 4.0, 6.0, 11.0, 6.0, 7.0, 26.0, 28.0, 46.0, 88.0, 141.0, 193.0, 315.0, 542.0, 798.0, 1369.0, 2210.0, 3514.0, 5828.0, 9698.0, 17448.0, 34884.0, 81608.0, 210782.0, 339709.0, 192245.0, 75006.0, 32280.0, 16325.0, 9183.0, 5444.0, 3401.0, 2099.0, 1192.0, 793.0, 502.0, 308.0, 187.0, 99.0, 75.0, 44.0, 35.0, 24.0, 18.0, 4.0, 8.0, 6.0, 4.0, 7.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.33544921875, -0.32511138916015625, -0.3147735595703125, -0.30443572998046875, -0.294097900390625, -0.28376007080078125, -0.2734222412109375, -0.26308441162109375, -0.25274658203125, -0.24240875244140625, -0.2320709228515625, -0.22173309326171875, -0.211395263671875, -0.20105743408203125, -0.1907196044921875, -0.18038177490234375, -0.1700439453125, -0.15970611572265625, -0.1493682861328125, -0.13903045654296875, -0.128692626953125, -0.11835479736328125, -0.1080169677734375, -0.09767913818359375, -0.08734130859375, -0.07700347900390625, -0.0666656494140625, -0.05632781982421875, -0.045989990234375, -0.03565216064453125, -0.0253143310546875, -0.01497650146484375, -0.004638671875, 0.00569915771484375, 0.0160369873046875, 0.02637481689453125, 0.036712646484375, 0.04705047607421875, 0.0573883056640625, 0.06772613525390625, 0.07806396484375, 0.08840179443359375, 0.0987396240234375, 0.10907745361328125, 0.119415283203125, 0.12975311279296875, 0.1400909423828125, 0.15042877197265625, 0.1607666015625, 0.17110443115234375, 0.1814422607421875, 0.19178009033203125, 0.202117919921875, 0.21245574951171875, 0.2227935791015625, 0.23313140869140625, 0.24346923828125, 0.25380706787109375, 0.2641448974609375, 0.27448272705078125, 0.284820556640625, 0.29515838623046875, 0.3054962158203125, 0.31583404541015625, 0.326171875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 6.0, 10.0, 4.0, 13.0, 10.0, 23.0, 14.0, 8.0, 21.0, 18.0, 25.0, 29.0, 35.0, 40.0, 32.0, 30.0, 29.0, 32.0, 39.0, 37.0, 41.0, 38.0, 34.0, 34.0, 45.0, 34.0, 33.0, 39.0, 25.0, 30.0, 27.0, 25.0, 14.0, 15.0, 20.0, 14.0, 8.0, 10.0, 6.0, 6.0, 7.0, 9.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.22412109375, -0.2174396514892578, -0.21075820922851562, -0.20407676696777344, -0.19739532470703125, -0.19071388244628906, -0.18403244018554688, -0.1773509979248047, -0.1706695556640625, -0.1639881134033203, -0.15730667114257812, -0.15062522888183594, -0.14394378662109375, -0.13726234436035156, -0.13058090209960938, -0.12389945983886719, -0.117218017578125, -0.11053657531738281, -0.10385513305664062, -0.09717369079589844, -0.09049224853515625, -0.08381080627441406, -0.07712936401367188, -0.07044792175292969, -0.0637664794921875, -0.05708503723144531, -0.050403594970703125, -0.04372215270996094, -0.03704071044921875, -0.030359268188476562, -0.023677825927734375, -0.016996383666992188, -0.01031494140625, -0.0036334991455078125, 0.003047943115234375, 0.009729385375976562, 0.01641082763671875, 0.023092269897460938, 0.029773712158203125, 0.03645515441894531, 0.0431365966796875, 0.04981803894042969, 0.056499481201171875, 0.06318092346191406, 0.06986236572265625, 0.07654380798339844, 0.08322525024414062, 0.08990669250488281, 0.096588134765625, 0.10326957702636719, 0.10995101928710938, 0.11663246154785156, 0.12331390380859375, 0.12999534606933594, 0.13667678833007812, 0.1433582305908203, 0.1500396728515625, 0.1567211151123047, 0.16340255737304688, 0.17008399963378906, 0.17676544189453125, 0.18344688415527344, 0.19012832641601562, 0.1968097686767578, 0.2034912109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 6.0, 4.0, 4.0, 13.0, 15.0, 19.0, 20.0, 29.0, 38.0, 49.0, 90.0, 146.0, 258.0, 509.0, 1238.0, 3026.0, 8416.0, 25099.0, 96988.0, 418537.0, 375769.0, 83223.0, 22448.0, 7450.0, 2882.0, 1140.0, 505.0, 248.0, 144.0, 71.0, 56.0, 36.0, 22.0, 14.0, 9.0, 9.0, 8.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.61767578125, -0.5989303588867188, -0.5801849365234375, -0.5614395141601562, -0.542694091796875, -0.5239486694335938, -0.5052032470703125, -0.48645782470703125, -0.46771240234375, -0.44896697998046875, -0.4302215576171875, -0.41147613525390625, -0.392730712890625, -0.37398529052734375, -0.3552398681640625, -0.33649444580078125, -0.3177490234375, -0.29900360107421875, -0.2802581787109375, -0.26151275634765625, -0.242767333984375, -0.22402191162109375, -0.2052764892578125, -0.18653106689453125, -0.16778564453125, -0.14904022216796875, -0.1302947998046875, -0.11154937744140625, -0.092803955078125, -0.07405853271484375, -0.0553131103515625, -0.03656768798828125, -0.017822265625, 0.00092315673828125, 0.0196685791015625, 0.03841400146484375, 0.057159423828125, 0.07590484619140625, 0.0946502685546875, 0.11339569091796875, 0.13214111328125, 0.15088653564453125, 0.1696319580078125, 0.18837738037109375, 0.207122802734375, 0.22586822509765625, 0.2446136474609375, 0.26335906982421875, 0.2821044921875, 0.30084991455078125, 0.3195953369140625, 0.33834075927734375, 0.357086181640625, 0.37583160400390625, 0.3945770263671875, 0.41332244873046875, 0.43206787109375, 0.45081329345703125, 0.4695587158203125, 0.48830413818359375, 0.507049560546875, 0.5257949829101562, 0.5445404052734375, 0.5632858276367188, 0.58203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 7.0, 10.0, 11.0, 12.0, 19.0, 25.0, 21.0, 21.0, 33.0, 34.0, 29.0, 31.0, 28.0, 38.0, 40.0, 45.0, 36.0, 41.0, 41.0, 38.0, 52.0, 42.0, 36.0, 27.0, 32.0, 29.0, 29.0, 27.0, 26.0, 26.0, 21.0, 16.0, 16.0, 12.0, 9.0, 4.0, 8.0, 5.0, 8.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.673828125, -0.6527786254882812, -0.6317291259765625, -0.6106796264648438, -0.589630126953125, -0.5685806274414062, -0.5475311279296875, -0.5264816284179688, -0.50543212890625, -0.48438262939453125, -0.4633331298828125, -0.44228363037109375, -0.421234130859375, -0.40018463134765625, -0.3791351318359375, -0.35808563232421875, -0.3370361328125, -0.31598663330078125, -0.2949371337890625, -0.27388763427734375, -0.252838134765625, -0.23178863525390625, -0.2107391357421875, -0.18968963623046875, -0.16864013671875, -0.14759063720703125, -0.1265411376953125, -0.10549163818359375, -0.084442138671875, -0.06339263916015625, -0.0423431396484375, -0.02129364013671875, -0.000244140625, 0.02080535888671875, 0.0418548583984375, 0.06290435791015625, 0.083953857421875, 0.10500335693359375, 0.1260528564453125, 0.14710235595703125, 0.16815185546875, 0.18920135498046875, 0.2102508544921875, 0.23130035400390625, 0.252349853515625, 0.27339935302734375, 0.2944488525390625, 0.31549835205078125, 0.3365478515625, 0.35759735107421875, 0.3786468505859375, 0.39969635009765625, 0.420745849609375, 0.44179534912109375, 0.4628448486328125, 0.48389434814453125, 0.50494384765625, 0.5259933471679688, 0.5470428466796875, 0.5680923461914062, 0.589141845703125, 0.6101913452148438, 0.6312408447265625, 0.6522903442382812, 0.67333984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 6.0, 12.0, 15.0, 26.0, 24.0, 26.0, 66.0, 86.0, 155.0, 256.0, 420.0, 755.0, 1364.0, 2420.0, 4685.0, 8954.0, 17360.0, 35296.0, 77256.0, 189204.0, 332982.0, 211852.0, 86911.0, 38661.0, 18838.0, 9755.0, 5154.0, 2615.0, 1483.0, 746.0, 441.0, 244.0, 154.0, 94.0, 90.0, 38.0, 25.0, 24.0, 11.0, 17.0, 9.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1531982421875, -0.1486339569091797, -0.14406967163085938, -0.13950538635253906, -0.13494110107421875, -0.13037681579589844, -0.12581253051757812, -0.12124824523925781, -0.1166839599609375, -0.11211967468261719, -0.10755538940429688, -0.10299110412597656, -0.09842681884765625, -0.09386253356933594, -0.08929824829101562, -0.08473396301269531, -0.080169677734375, -0.07560539245605469, -0.07104110717773438, -0.06647682189941406, -0.06191253662109375, -0.05734825134277344, -0.052783966064453125, -0.04821968078613281, -0.0436553955078125, -0.03909111022949219, -0.034526824951171875, -0.029962539672851562, -0.02539825439453125, -0.020833969116210938, -0.016269683837890625, -0.011705398559570312, -0.00714111328125, -0.0025768280029296875, 0.001987457275390625, 0.0065517425537109375, 0.01111602783203125, 0.015680313110351562, 0.020244598388671875, 0.024808883666992188, 0.0293731689453125, 0.03393745422363281, 0.038501739501953125, 0.04306602478027344, 0.04763031005859375, 0.05219459533691406, 0.056758880615234375, 0.06132316589355469, 0.065887451171875, 0.07045173645019531, 0.07501602172851562, 0.07958030700683594, 0.08414459228515625, 0.08870887756347656, 0.09327316284179688, 0.09783744812011719, 0.1024017333984375, 0.10696601867675781, 0.11153030395507812, 0.11609458923339844, 0.12065887451171875, 0.12522315979003906, 0.12978744506835938, 0.1343517303466797, 0.138916015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 9.0, 4.0, 8.0, 15.0, 22.0, 35.0, 36.0, 76.0, 107.0, 129.0, 151.0, 147.0, 88.0, 55.0, 25.0, 24.0, 22.0, 9.0, 10.0, 11.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.175041198730469e-05, -5.98980113863945e-05, -5.8045610785484314e-05, -5.619321018457413e-05, -5.434080958366394e-05, -5.2488408982753754e-05, -5.063600838184357e-05, -4.878360778093338e-05, -4.693120718002319e-05, -4.5078806579113007e-05, -4.322640597820282e-05, -4.137400537729263e-05, -3.9521604776382446e-05, -3.766920417547226e-05, -3.581680357456207e-05, -3.3964402973651886e-05, -3.21120023727417e-05, -3.0259601771831512e-05, -2.8407201170921326e-05, -2.655480057001114e-05, -2.4702399969100952e-05, -2.2849999368190765e-05, -2.099759876728058e-05, -1.9145198166370392e-05, -1.7292797565460205e-05, -1.544039696455002e-05, -1.3587996363639832e-05, -1.1735595762729645e-05, -9.883195161819458e-06, -8.030794560909271e-06, -6.1783939599990845e-06, -4.325993359088898e-06, -2.473592758178711e-06, -6.211921572685242e-07, 1.2312084436416626e-06, 3.0836090445518494e-06, 4.936009645462036e-06, 6.788410246372223e-06, 8.64081084728241e-06, 1.0493211448192596e-05, 1.2345612049102783e-05, 1.419801265001297e-05, 1.6050413250923157e-05, 1.7902813851833344e-05, 1.975521445274353e-05, 2.1607615053653717e-05, 2.3460015654563904e-05, 2.531241625547409e-05, 2.7164816856384277e-05, 2.9017217457294464e-05, 3.086961805820465e-05, 3.272201865911484e-05, 3.4574419260025024e-05, 3.642681986093521e-05, 3.82792204618454e-05, 4.0131621062755585e-05, 4.198402166366577e-05, 4.383642226457596e-05, 4.5688822865486145e-05, 4.754122346639633e-05, 4.939362406730652e-05, 5.1246024668216705e-05, 5.309842526912689e-05, 5.495082587003708e-05, 5.6803226470947266e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 17.0, 21.0, 24.0, 34.0, 58.0, 82.0, 116.0, 184.0, 294.0, 591.0, 989.0, 2095.0, 4625.0, 10606.0, 24878.0, 61074.0, 159617.0, 330501.0, 268442.0, 109193.0, 42758.0, 17909.0, 7507.0, 3406.0, 1573.0, 831.0, 432.0, 266.0, 153.0, 97.0, 64.0, 37.0, 23.0, 19.0, 9.0, 6.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0], "bins": [-0.2047119140625, -0.1992969512939453, -0.19388198852539062, -0.18846702575683594, -0.18305206298828125, -0.17763710021972656, -0.17222213745117188, -0.1668071746826172, -0.1613922119140625, -0.1559772491455078, -0.15056228637695312, -0.14514732360839844, -0.13973236083984375, -0.13431739807128906, -0.12890243530273438, -0.12348747253417969, -0.118072509765625, -0.11265754699707031, -0.10724258422851562, -0.10182762145996094, -0.09641265869140625, -0.09099769592285156, -0.08558273315429688, -0.08016777038574219, -0.0747528076171875, -0.06933784484863281, -0.06392288208007812, -0.05850791931152344, -0.05309295654296875, -0.04767799377441406, -0.042263031005859375, -0.03684806823730469, -0.03143310546875, -0.026018142700195312, -0.020603179931640625, -0.015188217163085938, -0.00977325439453125, -0.0043582916259765625, 0.001056671142578125, 0.0064716339111328125, 0.0118865966796875, 0.017301559448242188, 0.022716522216796875, 0.028131484985351562, 0.03354644775390625, 0.03896141052246094, 0.044376373291015625, 0.04979133605957031, 0.055206298828125, 0.06062126159667969, 0.06603622436523438, 0.07145118713378906, 0.07686614990234375, 0.08228111267089844, 0.08769607543945312, 0.09311103820800781, 0.0985260009765625, 0.10394096374511719, 0.10935592651367188, 0.11477088928222656, 0.12018585205078125, 0.12560081481933594, 0.13101577758789062, 0.1364307403564453, 0.141845703125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 10.0, 10.0, 14.0, 14.0, 17.0, 25.0, 34.0, 35.0, 50.0, 64.0, 81.0, 96.0, 89.0, 78.0, 62.0, 71.0, 44.0, 42.0, 31.0, 19.0, 19.0, 21.0, 16.0, 10.0, 5.0, 12.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2451171875, -0.23901939392089844, -0.23292160034179688, -0.2268238067626953, -0.22072601318359375, -0.2146282196044922, -0.20853042602539062, -0.20243263244628906, -0.1963348388671875, -0.19023704528808594, -0.18413925170898438, -0.1780414581298828, -0.17194366455078125, -0.1658458709716797, -0.15974807739257812, -0.15365028381347656, -0.147552490234375, -0.14145469665527344, -0.13535690307617188, -0.1292591094970703, -0.12316131591796875, -0.11706352233886719, -0.11096572875976562, -0.10486793518066406, -0.0987701416015625, -0.09267234802246094, -0.08657455444335938, -0.08047676086425781, -0.07437896728515625, -0.06828117370605469, -0.062183380126953125, -0.05608558654785156, -0.04998779296875, -0.04388999938964844, -0.037792205810546875, -0.03169441223144531, -0.02559661865234375, -0.019498825073242188, -0.013401031494140625, -0.0073032379150390625, -0.0012054443359375, 0.0048923492431640625, 0.010990142822265625, 0.017087936401367188, 0.02318572998046875, 0.029283523559570312, 0.035381317138671875, 0.04147911071777344, 0.047576904296875, 0.05367469787597656, 0.059772491455078125, 0.06587028503417969, 0.07196807861328125, 0.07806587219238281, 0.08416366577148438, 0.09026145935058594, 0.0963592529296875, 0.10245704650878906, 0.10855484008789062, 0.11465263366699219, 0.12075042724609375, 0.1268482208251953, 0.13294601440429688, 0.13904380798339844, 0.1451416015625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 19.0, 44.0, 100.0, 123.0, 175.0, 176.0, 151.0, 82.0, 51.0, 36.0, 14.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1311469078063965, -2.034599542617798, -1.9380521774291992, -1.8415048122406006, -1.7449575662612915, -1.6484102010726929, -1.5518628358840942, -1.4553155899047852, -1.3587682247161865, -1.262220859527588, -1.1656734943389893, -1.0691261291503906, -0.9725788831710815, -0.8760315179824829, -0.7794841527938843, -0.6829368472099304, -0.586389422416687, -0.48984208703041077, -0.3932947516441345, -0.2967473864555359, -0.20020005106925964, -0.1036527156829834, -0.007105350494384766, 0.08944195508956909, 0.18598932027816772, 0.28253665566444397, 0.3790839910507202, 0.47563135623931885, 0.5721787214279175, 0.6687260270118713, 0.76527339220047, 0.8618206977844238, 0.9583680629730225, 1.054915428161621, 1.1514627933502197, 1.2480101585388184, 1.3445574045181274, 1.441104769706726, 1.5376521348953247, 1.6341993808746338, 1.7307467460632324, 1.827294111251831, 1.9238414764404297, 2.0203888416290283, 2.116936206817627, 2.2134833335876465, 2.310030937194824, 2.4065780639648438, 2.5031256675720215, 2.59967303276062, 2.6962203979492188, 2.7927677631378174, 2.889315128326416, 2.9858622550964355, 3.0824098587036133, 3.178956985473633, 3.2755043506622314, 3.37205171585083, 3.4685990810394287, 3.5651464462280273, 3.661693811416626, 3.7582411766052246, 3.854788303375244, 3.9513356685638428, 4.047883033752441]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 6.0, 9.0, 10.0, 12.0, 14.0, 17.0, 16.0, 19.0, 25.0, 27.0, 21.0, 25.0, 29.0, 35.0, 36.0, 33.0, 33.0, 44.0, 29.0, 44.0, 45.0, 51.0, 50.0, 35.0, 38.0, 35.0, 36.0, 32.0, 21.0, 28.0, 19.0, 19.0, 17.0, 8.0, 16.0, 12.0, 9.0, 9.0, 5.0, 6.0, 7.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6426702737808228, -1.5931708812713623, -1.5436713695526123, -1.4941719770431519, -1.4446724653244019, -1.3951730728149414, -1.3456735610961914, -1.296174168586731, -1.2466747760772705, -1.19717538356781, -1.14767587184906, -1.0981764793395996, -1.0486769676208496, -0.9991775751113892, -0.9496781229972839, -0.9001786708831787, -0.8506791591644287, -0.8011797070503235, -0.7516802549362183, -0.7021808624267578, -0.6526813507080078, -0.6031819581985474, -0.5536825060844421, -0.5041830539703369, -0.4546836018562317, -0.40518414974212646, -0.35568469762802124, -0.3061852753162384, -0.2566858232021332, -0.20718637108802795, -0.15768694877624512, -0.10818749666213989, -0.05868816375732422, -0.009188719093799591, 0.04031072556972504, 0.08981016278266907, 0.1393096148967743, 0.18880906701087952, 0.23830848932266235, 0.2878079414367676, 0.3373073935508728, 0.386806845664978, 0.43630629777908325, 0.4858057200908661, 0.5353051424026489, 0.5848046541213989, 0.6343040466308594, 0.6838034987449646, 0.7333029508590698, 0.782802402973175, 0.8323018550872803, 0.8818012475967407, 0.9313007593154907, 0.9808001518249512, 1.0302996635437012, 1.0797990560531616, 1.129298448562622, 1.1787978410720825, 1.2282973527908325, 1.277796745300293, 1.327296257019043, 1.3767956495285034, 1.4262950420379639, 1.4757945537567139, 1.5252940654754639]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 12.0, 12.0, 23.0, 31.0, 46.0, 55.0, 103.0, 191.0, 320.0, 603.0, 1161.0, 2327.0, 4723.0, 10117.0, 21099.0, 45593.0, 105058.0, 270214.0, 823175.0, 1658288.0, 795633.0, 265838.0, 104592.0, 45483.0, 20632.0, 9793.0, 4519.0, 2182.0, 1075.0, 546.0, 328.0, 163.0, 111.0, 73.0, 41.0, 31.0, 22.0, 12.0, 14.0, 6.0, 5.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.301513671875, -0.29193878173828125, -0.2823638916015625, -0.27278900146484375, -0.263214111328125, -0.25363922119140625, -0.2440643310546875, -0.23448944091796875, -0.22491455078125, -0.21533966064453125, -0.2057647705078125, -0.19618988037109375, -0.186614990234375, -0.17704010009765625, -0.1674652099609375, -0.15789031982421875, -0.1483154296875, -0.13874053955078125, -0.1291656494140625, -0.11959075927734375, -0.110015869140625, -0.10044097900390625, -0.0908660888671875, -0.08129119873046875, -0.07171630859375, -0.06214141845703125, -0.0525665283203125, -0.04299163818359375, -0.033416748046875, -0.02384185791015625, -0.0142669677734375, -0.00469207763671875, 0.0048828125, 0.01445770263671875, 0.0240325927734375, 0.03360748291015625, 0.043182373046875, 0.05275726318359375, 0.0623321533203125, 0.07190704345703125, 0.08148193359375, 0.09105682373046875, 0.1006317138671875, 0.11020660400390625, 0.119781494140625, 0.12935638427734375, 0.1389312744140625, 0.14850616455078125, 0.1580810546875, 0.16765594482421875, 0.1772308349609375, 0.18680572509765625, 0.196380615234375, 0.20595550537109375, 0.2155303955078125, 0.22510528564453125, 0.23468017578125, 0.24425506591796875, 0.2538299560546875, 0.26340484619140625, 0.272979736328125, 0.28255462646484375, 0.2921295166015625, 0.30170440673828125, 0.311279296875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 2.0, 8.0, 9.0, 10.0, 9.0, 14.0, 13.0, 16.0, 16.0, 28.0, 27.0, 21.0, 21.0, 26.0, 40.0, 44.0, 30.0, 47.0, 50.0, 29.0, 52.0, 33.0, 45.0, 33.0, 24.0, 35.0, 50.0, 37.0, 32.0, 28.0, 27.0, 25.0, 15.0, 14.0, 23.0, 11.0, 11.0, 5.0, 12.0, 6.0, 5.0, 3.0, 8.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2265625, -0.21941757202148438, -0.21227264404296875, -0.20512771606445312, -0.1979827880859375, -0.19083786010742188, -0.18369293212890625, -0.17654800415039062, -0.169403076171875, -0.16225814819335938, -0.15511322021484375, -0.14796829223632812, -0.1408233642578125, -0.13367843627929688, -0.12653350830078125, -0.11938858032226562, -0.11224365234375, -0.10509872436523438, -0.09795379638671875, -0.09080886840820312, -0.0836639404296875, -0.07651901245117188, -0.06937408447265625, -0.062229156494140625, -0.055084228515625, -0.047939300537109375, -0.04079437255859375, -0.033649444580078125, -0.0265045166015625, -0.019359588623046875, -0.01221466064453125, -0.005069732666015625, 0.0020751953125, 0.009220123291015625, 0.01636505126953125, 0.023509979248046875, 0.0306549072265625, 0.037799835205078125, 0.04494476318359375, 0.052089691162109375, 0.059234619140625, 0.06637954711914062, 0.07352447509765625, 0.08066940307617188, 0.0878143310546875, 0.09495925903320312, 0.10210418701171875, 0.10924911499023438, 0.11639404296875, 0.12353897094726562, 0.13068389892578125, 0.13782882690429688, 0.1449737548828125, 0.15211868286132812, 0.15926361083984375, 0.16640853881835938, 0.173553466796875, 0.18069839477539062, 0.18784332275390625, 0.19498825073242188, 0.2021331787109375, 0.20927810668945312, 0.21642303466796875, 0.22356796264648438, 0.230712890625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 12.0, 13.0, 9.0, 24.0, 33.0, 57.0, 83.0, 124.0, 210.0, 386.0, 667.0, 1336.0, 2629.0, 5578.0, 12598.0, 29499.0, 72185.0, 191539.0, 613407.0, 1966622.0, 887494.0, 251030.0, 92150.0, 37151.0, 15932.0, 6849.0, 3253.0, 1523.0, 765.0, 421.0, 233.0, 180.0, 104.0, 61.0, 39.0, 21.0, 14.0, 21.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399658203125, -0.3874092102050781, -0.37516021728515625, -0.3629112243652344, -0.3506622314453125, -0.3384132385253906, -0.32616424560546875, -0.3139152526855469, -0.301666259765625, -0.2894172668457031, -0.27716827392578125, -0.2649192810058594, -0.2526702880859375, -0.24042129516601562, -0.22817230224609375, -0.21592330932617188, -0.20367431640625, -0.19142532348632812, -0.17917633056640625, -0.16692733764648438, -0.1546783447265625, -0.14242935180664062, -0.13018035888671875, -0.11793136596679688, -0.105682373046875, -0.09343338012695312, -0.08118438720703125, -0.06893539428710938, -0.0566864013671875, -0.044437408447265625, -0.03218841552734375, -0.019939422607421875, -0.0076904296875, 0.004558563232421875, 0.01680755615234375, 0.029056549072265625, 0.0413055419921875, 0.053554534912109375, 0.06580352783203125, 0.07805252075195312, 0.090301513671875, 0.10255050659179688, 0.11479949951171875, 0.12704849243164062, 0.1392974853515625, 0.15154647827148438, 0.16379547119140625, 0.17604446411132812, 0.18829345703125, 0.20054244995117188, 0.21279144287109375, 0.22504043579101562, 0.2372894287109375, 0.24953842163085938, 0.26178741455078125, 0.2740364074707031, 0.286285400390625, 0.2985343933105469, 0.31078338623046875, 0.3230323791503906, 0.3352813720703125, 0.3475303649902344, 0.35977935791015625, 0.3720283508300781, 0.38427734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 7.0, 11.0, 11.0, 16.0, 22.0, 26.0, 39.0, 39.0, 51.0, 84.0, 124.0, 152.0, 209.0, 329.0, 456.0, 596.0, 542.0, 365.0, 248.0, 203.0, 131.0, 96.0, 57.0, 63.0, 54.0, 34.0, 28.0, 22.0, 18.0, 9.0, 8.0, 6.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.467041015625, -0.4507789611816406, -0.43451690673828125, -0.4182548522949219, -0.4019927978515625, -0.3857307434082031, -0.36946868896484375, -0.3532066345214844, -0.336944580078125, -0.3206825256347656, -0.30442047119140625, -0.2881584167480469, -0.2718963623046875, -0.2556343078613281, -0.23937225341796875, -0.22311019897460938, -0.20684814453125, -0.19058609008789062, -0.17432403564453125, -0.15806198120117188, -0.1417999267578125, -0.12553787231445312, -0.10927581787109375, -0.09301376342773438, -0.076751708984375, -0.060489654541015625, -0.04422760009765625, -0.027965545654296875, -0.0117034912109375, 0.004558563232421875, 0.02082061767578125, 0.037082672119140625, 0.0533447265625, 0.06960678100585938, 0.08586883544921875, 0.10213088989257812, 0.1183929443359375, 0.13465499877929688, 0.15091705322265625, 0.16717910766601562, 0.183441162109375, 0.19970321655273438, 0.21596527099609375, 0.23222732543945312, 0.2484893798828125, 0.2647514343261719, 0.28101348876953125, 0.2972755432128906, 0.31353759765625, 0.3297996520996094, 0.34606170654296875, 0.3623237609863281, 0.3785858154296875, 0.3948478698730469, 0.41110992431640625, 0.4273719787597656, 0.443634033203125, 0.4598960876464844, 0.47615814208984375, 0.4924201965332031, 0.5086822509765625, 0.5249443054199219, 0.5412063598632812, 0.5574684143066406, 0.57373046875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 7.0, 10.0, 19.0, 16.0, 22.0, 33.0, 41.0, 50.0, 70.0, 85.0, 71.0, 95.0, 90.0, 90.0, 72.0, 53.0, 47.0, 42.0, 25.0, 15.0, 16.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7945706844329834, -1.7246588468551636, -1.6547470092773438, -1.584835171699524, -1.514923334121704, -1.4450114965438843, -1.3750996589660645, -1.3051879405975342, -1.2352759838104248, -1.165364146232605, -1.0954523086547852, -1.0255404710769653, -0.9556286334991455, -0.8857167959213257, -0.8158050179481506, -0.7458931803703308, -0.6759814023971558, -0.6060695648193359, -0.5361577272415161, -0.4662459194660187, -0.39633408188819885, -0.32642224431037903, -0.2565104365348816, -0.18659859895706177, -0.11668676137924194, -0.046774931252002716, 0.02313689887523651, 0.09304872155189514, 0.16296055912971497, 0.2328723967075348, 0.3027842044830322, 0.37269604206085205, 0.4426078796386719, 0.5125197172164917, 0.5824315547943115, 0.6523433923721313, 0.7222552299499512, 0.792167067527771, 0.862078845500946, 0.9319906830787659, 1.0019025802612305, 1.0718144178390503, 1.1417262554168701, 1.21163809299469, 1.2815499305725098, 1.3514617681503296, 1.4213736057281494, 1.4912853240966797, 1.5611971616744995, 1.6311089992523193, 1.7010208368301392, 1.770932674407959, 1.8408445119857788, 1.9107563495635986, 1.980668067932129, 2.0505800247192383, 2.1204917430877686, 2.190403461456299, 2.260315418243408, 2.3302271366119385, 2.400139093399048, 2.470050811767578, 2.5399627685546875, 2.6098744869232178, 2.679786443710327]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 8.0, 7.0, 8.0, 4.0, 9.0, 8.0, 11.0, 10.0, 20.0, 12.0, 17.0, 23.0, 21.0, 23.0, 28.0, 25.0, 34.0, 27.0, 39.0, 34.0, 31.0, 35.0, 38.0, 42.0, 34.0, 39.0, 33.0, 42.0, 39.0, 31.0, 20.0, 22.0, 32.0, 25.0, 20.0, 13.0, 9.0, 25.0, 9.0, 14.0, 17.0, 18.0, 7.0, 6.0, 9.0, 5.0, 3.0, 2.0, 6.0, 1.0, 3.0, 5.0, 1.0, 2.0], "bins": [-1.3539042472839355, -1.3137092590332031, -1.2735143899917603, -1.2333194017410278, -1.193124532699585, -1.1529295444488525, -1.1127345561981201, -1.0725395679473877, -1.0323446989059448, -0.9921497702598572, -0.9519548416137695, -0.9117598533630371, -0.8715649247169495, -0.8313699960708618, -0.7911750078201294, -0.7509800791740417, -0.7107851505279541, -0.6705902218818665, -0.6303952932357788, -0.5902003049850464, -0.5500053763389587, -0.5098104476928711, -0.46961548924446106, -0.429420530796051, -0.3892256021499634, -0.34903067350387573, -0.3088357150554657, -0.26864075660705566, -0.22844582796096802, -0.18825088441371918, -0.14805594086647034, -0.1078609824180603, -0.06766605377197266, -0.027471110224723816, 0.012723833322525024, 0.052918776869773865, 0.0931137204170227, 0.13330866396427155, 0.17350360751152039, 0.21369856595993042, 0.25389349460601807, 0.2940884232521057, 0.33428338170051575, 0.3744783401489258, 0.4146732687950134, 0.4548681974411011, 0.4950631558895111, 0.5352581143379211, 0.5754530429840088, 0.6156479716300964, 0.6558429002761841, 0.6960378885269165, 0.7362328171730042, 0.7764277458190918, 0.8166227340698242, 0.8568176627159119, 0.8970125913619995, 0.9372075200080872, 0.9774024486541748, 1.0175974369049072, 1.0577924251556396, 1.0979872941970825, 1.138182282447815, 1.1783771514892578, 1.2185721397399902]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [5.0, 5.0, 7.0, 6.0, 5.0, 13.0, 12.0, 15.0, 34.0, 38.0, 60.0, 89.0, 140.0, 173.0, 333.0, 404.0, 584.0, 857.0, 1193.0, 1655.0, 2278.0, 3185.0, 4272.0, 6113.0, 8755.0, 12649.0, 19994.0, 36779.0, 84447.0, 223600.0, 326760.0, 165879.0, 63172.0, 29766.0, 16922.0, 11266.0, 7802.0, 5437.0, 4049.0, 2896.0, 2029.0, 1441.0, 1021.0, 740.0, 499.0, 371.0, 249.0, 188.0, 110.0, 86.0, 63.0, 39.0, 27.0, 24.0, 11.0, 7.0, 8.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.310302734375, -0.3000755310058594, -0.28984832763671875, -0.2796211242675781, -0.2693939208984375, -0.2591667175292969, -0.24893951416015625, -0.23871231079101562, -0.228485107421875, -0.21825790405273438, -0.20803070068359375, -0.19780349731445312, -0.1875762939453125, -0.17734909057617188, -0.16712188720703125, -0.15689468383789062, -0.14666748046875, -0.13644027709960938, -0.12621307373046875, -0.11598587036132812, -0.1057586669921875, -0.09553146362304688, -0.08530426025390625, -0.07507705688476562, -0.064849853515625, -0.054622650146484375, -0.04439544677734375, -0.034168243408203125, -0.0239410400390625, -0.013713836669921875, -0.00348663330078125, 0.006740570068359375, 0.0169677734375, 0.027194976806640625, 0.03742218017578125, 0.047649383544921875, 0.0578765869140625, 0.06810379028320312, 0.07833099365234375, 0.08855819702148438, 0.098785400390625, 0.10901260375976562, 0.11923980712890625, 0.12946701049804688, 0.1396942138671875, 0.14992141723632812, 0.16014862060546875, 0.17037582397460938, 0.18060302734375, 0.19083023071289062, 0.20105743408203125, 0.21128463745117188, 0.2215118408203125, 0.23173904418945312, 0.24196624755859375, 0.2521934509277344, 0.262420654296875, 0.2726478576660156, 0.28287506103515625, 0.2931022644042969, 0.3033294677734375, 0.3135566711425781, 0.32378387451171875, 0.3340110778808594, 0.34423828125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 7.0, 8.0, 10.0, 18.0, 19.0, 19.0, 23.0, 31.0, 49.0, 30.0, 40.0, 38.0, 52.0, 52.0, 55.0, 64.0, 40.0, 44.0, 44.0, 41.0, 38.0, 38.0, 45.0, 29.0, 32.0, 27.0, 17.0, 15.0, 11.0, 13.0, 8.0, 8.0, 5.0, 5.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.314453125, -0.30562591552734375, -0.2967987060546875, -0.28797149658203125, -0.279144287109375, -0.27031707763671875, -0.2614898681640625, -0.25266265869140625, -0.24383544921875, -0.23500823974609375, -0.2261810302734375, -0.21735382080078125, -0.208526611328125, -0.19969940185546875, -0.1908721923828125, -0.18204498291015625, -0.1732177734375, -0.16439056396484375, -0.1555633544921875, -0.14673614501953125, -0.137908935546875, -0.12908172607421875, -0.1202545166015625, -0.11142730712890625, -0.10260009765625, -0.09377288818359375, -0.0849456787109375, -0.07611846923828125, -0.067291259765625, -0.05846405029296875, -0.0496368408203125, -0.04080963134765625, -0.031982421875, -0.02315521240234375, -0.0143280029296875, -0.00550079345703125, 0.003326416015625, 0.01215362548828125, 0.0209808349609375, 0.02980804443359375, 0.03863525390625, 0.04746246337890625, 0.0562896728515625, 0.06511688232421875, 0.073944091796875, 0.08277130126953125, 0.0915985107421875, 0.10042572021484375, 0.1092529296875, 0.11808013916015625, 0.1269073486328125, 0.13573455810546875, 0.144561767578125, 0.15338897705078125, 0.1622161865234375, 0.17104339599609375, 0.17987060546875, 0.18869781494140625, 0.1975250244140625, 0.20635223388671875, 0.215179443359375, 0.22400665283203125, 0.2328338623046875, 0.24166107177734375, 0.25048828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 11.0, 8.0, 13.0, 10.0, 22.0, 47.0, 57.0, 80.0, 105.0, 202.0, 348.0, 756.0, 1883.0, 5592.0, 17227.0, 58934.0, 374619.0, 484684.0, 72684.0, 20806.0, 6401.0, 2255.0, 845.0, 384.0, 192.0, 155.0, 79.0, 52.0, 43.0, 21.0, 10.0, 10.0, 11.0, 5.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84326171875, -0.8169708251953125, -0.790679931640625, -0.7643890380859375, -0.73809814453125, -0.7118072509765625, -0.685516357421875, -0.6592254638671875, -0.6329345703125, -0.6066436767578125, -0.580352783203125, -0.5540618896484375, -0.52777099609375, -0.5014801025390625, -0.475189208984375, -0.4488983154296875, -0.422607421875, -0.3963165283203125, -0.370025634765625, -0.3437347412109375, -0.31744384765625, -0.2911529541015625, -0.264862060546875, -0.2385711669921875, -0.2122802734375, -0.1859893798828125, -0.159698486328125, -0.1334075927734375, -0.10711669921875, -0.0808258056640625, -0.054534912109375, -0.0282440185546875, -0.001953125, 0.0243377685546875, 0.050628662109375, 0.0769195556640625, 0.10321044921875, 0.1295013427734375, 0.155792236328125, 0.1820831298828125, 0.2083740234375, 0.2346649169921875, 0.260955810546875, 0.2872467041015625, 0.31353759765625, 0.3398284912109375, 0.366119384765625, 0.3924102783203125, 0.418701171875, 0.4449920654296875, 0.471282958984375, 0.4975738525390625, 0.52386474609375, 0.5501556396484375, 0.576446533203125, 0.6027374267578125, 0.6290283203125, 0.6553192138671875, 0.681610107421875, 0.7079010009765625, 0.73419189453125, 0.7604827880859375, 0.786773681640625, 0.8130645751953125, 0.83935546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 2.0, 3.0, 11.0, 6.0, 4.0, 13.0, 11.0, 12.0, 14.0, 11.0, 19.0, 26.0, 24.0, 27.0, 32.0, 35.0, 43.0, 40.0, 41.0, 45.0, 44.0, 37.0, 36.0, 43.0, 35.0, 37.0, 37.0, 38.0, 34.0, 41.0, 24.0, 23.0, 15.0, 23.0, 23.0, 15.0, 15.0, 12.0, 7.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.6171875, -0.5970382690429688, -0.5768890380859375, -0.5567398071289062, -0.536590576171875, -0.5164413452148438, -0.4962921142578125, -0.47614288330078125, -0.45599365234375, -0.43584442138671875, -0.4156951904296875, -0.39554595947265625, -0.375396728515625, -0.35524749755859375, -0.3350982666015625, -0.31494903564453125, -0.2947998046875, -0.27465057373046875, -0.2545013427734375, -0.23435211181640625, -0.214202880859375, -0.19405364990234375, -0.1739044189453125, -0.15375518798828125, -0.13360595703125, -0.11345672607421875, -0.0933074951171875, -0.07315826416015625, -0.053009033203125, -0.03285980224609375, -0.0127105712890625, 0.00743865966796875, 0.027587890625, 0.04773712158203125, 0.0678863525390625, 0.08803558349609375, 0.108184814453125, 0.12833404541015625, 0.1484832763671875, 0.16863250732421875, 0.18878173828125, 0.20893096923828125, 0.2290802001953125, 0.24922943115234375, 0.269378662109375, 0.28952789306640625, 0.3096771240234375, 0.32982635498046875, 0.3499755859375, 0.37012481689453125, 0.3902740478515625, 0.41042327880859375, 0.430572509765625, 0.45072174072265625, 0.4708709716796875, 0.49102020263671875, 0.51116943359375, 0.5313186645507812, 0.5514678955078125, 0.5716171264648438, 0.591766357421875, 0.6119155883789062, 0.6320648193359375, 0.6522140502929688, 0.67236328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 9.0, 10.0, 20.0, 28.0, 63.0, 117.0, 252.0, 550.0, 1398.0, 3355.0, 8247.0, 22126.0, 96287.0, 578931.0, 272588.0, 42205.0, 13402.0, 5209.0, 2132.0, 959.0, 350.0, 153.0, 67.0, 46.0, 22.0, 12.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.308349609375, -0.2989349365234375, -0.289520263671875, -0.2801055908203125, -0.27069091796875, -0.2612762451171875, -0.251861572265625, -0.2424468994140625, -0.2330322265625, -0.2236175537109375, -0.214202880859375, -0.2047882080078125, -0.19537353515625, -0.1859588623046875, -0.176544189453125, -0.1671295166015625, -0.15771484375, -0.1483001708984375, -0.138885498046875, -0.1294708251953125, -0.12005615234375, -0.1106414794921875, -0.101226806640625, -0.0918121337890625, -0.0823974609375, -0.0729827880859375, -0.063568115234375, -0.0541534423828125, -0.04473876953125, -0.0353240966796875, -0.025909423828125, -0.0164947509765625, -0.007080078125, 0.0023345947265625, 0.011749267578125, 0.0211639404296875, 0.03057861328125, 0.0399932861328125, 0.049407958984375, 0.0588226318359375, 0.0682373046875, 0.0776519775390625, 0.087066650390625, 0.0964813232421875, 0.10589599609375, 0.1153106689453125, 0.124725341796875, 0.1341400146484375, 0.1435546875, 0.1529693603515625, 0.162384033203125, 0.1717987060546875, 0.18121337890625, 0.1906280517578125, 0.200042724609375, 0.2094573974609375, 0.2188720703125, 0.2282867431640625, 0.237701416015625, 0.2471160888671875, 0.25653076171875, 0.2659454345703125, 0.275360107421875, 0.2847747802734375, 0.294189453125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 5.0, 6.0, 9.0, 6.0, 14.0, 16.0, 22.0, 40.0, 62.0, 122.0, 177.0, 160.0, 137.0, 75.0, 36.0, 26.0, 15.0, 15.0, 12.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.127357482910156e-05, -5.9091486036777496e-05, -5.690939724445343e-05, -5.4727308452129364e-05, -5.25452196598053e-05, -5.036313086748123e-05, -4.8181042075157166e-05, -4.59989532828331e-05, -4.381686449050903e-05, -4.163477569818497e-05, -3.94526869058609e-05, -3.7270598113536835e-05, -3.508850932121277e-05, -3.29064205288887e-05, -3.0724331736564636e-05, -2.854224294424057e-05, -2.6360154151916504e-05, -2.4178065359592438e-05, -2.199597656726837e-05, -1.9813887774944305e-05, -1.763179898262024e-05, -1.5449710190296173e-05, -1.3267621397972107e-05, -1.108553260564804e-05, -8.903443813323975e-06, -6.7213550209999084e-06, -4.539266228675842e-06, -2.357177436351776e-06, -1.7508864402770996e-07, 2.007000148296356e-06, 4.189088940620422e-06, 6.3711777329444885e-06, 8.553266525268555e-06, 1.0735355317592621e-05, 1.2917444109916687e-05, 1.5099532902240753e-05, 1.728162169456482e-05, 1.9463710486888885e-05, 2.164579927921295e-05, 2.3827888071537018e-05, 2.6009976863861084e-05, 2.819206565618515e-05, 3.0374154448509216e-05, 3.255624324083328e-05, 3.473833203315735e-05, 3.6920420825481415e-05, 3.910250961780548e-05, 4.128459841012955e-05, 4.346668720245361e-05, 4.564877599477768e-05, 4.7830864787101746e-05, 5.001295357942581e-05, 5.219504237174988e-05, 5.4377131164073944e-05, 5.655921995639801e-05, 5.8741308748722076e-05, 6.092339754104614e-05, 6.310548633337021e-05, 6.528757512569427e-05, 6.746966391801834e-05, 6.965175271034241e-05, 7.183384150266647e-05, 7.401593029499054e-05, 7.61980190873146e-05, 7.838010787963867e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 10.0, 7.0, 13.0, 13.0, 39.0, 37.0, 58.0, 111.0, 165.0, 314.0, 646.0, 1369.0, 2924.0, 6300.0, 14927.0, 44213.0, 187877.0, 481494.0, 224555.0, 53320.0, 17008.0, 7056.0, 3128.0, 1409.0, 694.0, 343.0, 190.0, 88.0, 70.0, 55.0, 35.0, 26.0, 13.0, 11.0, 10.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1707763671875, -0.16382408142089844, -0.15687179565429688, -0.1499195098876953, -0.14296722412109375, -0.1360149383544922, -0.12906265258789062, -0.12211036682128906, -0.1151580810546875, -0.10820579528808594, -0.10125350952148438, -0.09430122375488281, -0.08734893798828125, -0.08039665222167969, -0.07344436645507812, -0.06649208068847656, -0.059539794921875, -0.05258750915527344, -0.045635223388671875, -0.03868293762207031, -0.03173065185546875, -0.024778366088867188, -0.017826080322265625, -0.010873794555664062, -0.0039215087890625, 0.0030307769775390625, 0.009983062744140625, 0.016935348510742188, 0.02388763427734375, 0.030839920043945312, 0.037792205810546875, 0.04474449157714844, 0.05169677734375, 0.05864906311035156, 0.06560134887695312, 0.07255363464355469, 0.07950592041015625, 0.08645820617675781, 0.09341049194335938, 0.10036277770996094, 0.1073150634765625, 0.11426734924316406, 0.12121963500976562, 0.1281719207763672, 0.13512420654296875, 0.1420764923095703, 0.14902877807617188, 0.15598106384277344, 0.162933349609375, 0.16988563537597656, 0.17683792114257812, 0.1837902069091797, 0.19074249267578125, 0.1976947784423828, 0.20464706420898438, 0.21159934997558594, 0.2185516357421875, 0.22550392150878906, 0.23245620727539062, 0.2394084930419922, 0.24636077880859375, 0.2533130645751953, 0.2602653503417969, 0.26721763610839844, 0.274169921875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 2.0, 6.0, 3.0, 8.0, 8.0, 12.0, 8.0, 23.0, 21.0, 25.0, 49.0, 48.0, 64.0, 85.0, 95.0, 96.0, 76.0, 73.0, 67.0, 57.0, 40.0, 31.0, 21.0, 20.0, 12.0, 8.0, 10.0, 7.0, 7.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.207275390625, -0.20123291015625, -0.1951904296875, -0.18914794921875, -0.18310546875, -0.17706298828125, -0.1710205078125, -0.16497802734375, -0.158935546875, -0.15289306640625, -0.1468505859375, -0.14080810546875, -0.134765625, -0.12872314453125, -0.1226806640625, -0.11663818359375, -0.110595703125, -0.10455322265625, -0.0985107421875, -0.09246826171875, -0.08642578125, -0.08038330078125, -0.0743408203125, -0.06829833984375, -0.062255859375, -0.05621337890625, -0.0501708984375, -0.04412841796875, -0.0380859375, -0.03204345703125, -0.0260009765625, -0.01995849609375, -0.013916015625, -0.00787353515625, -0.0018310546875, 0.00421142578125, 0.01025390625, 0.01629638671875, 0.0223388671875, 0.02838134765625, 0.034423828125, 0.04046630859375, 0.0465087890625, 0.05255126953125, 0.05859375, 0.06463623046875, 0.0706787109375, 0.07672119140625, 0.082763671875, 0.08880615234375, 0.0948486328125, 0.10089111328125, 0.10693359375, 0.11297607421875, 0.1190185546875, 0.12506103515625, 0.131103515625, 0.13714599609375, 0.1431884765625, 0.14923095703125, 0.1552734375, 0.16131591796875, 0.1673583984375, 0.17340087890625, 0.179443359375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 24.0, 41.0, 85.0, 163.0, 205.0, 181.0, 147.0, 87.0, 33.0, 12.0, 7.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.264548301696777, -4.139028549194336, -4.0135087966918945, -3.887989044189453, -3.7624692916870117, -3.6369495391845703, -3.511430025100708, -3.3859102725982666, -3.260390520095825, -3.134870767593384, -3.0093510150909424, -2.883831262588501, -2.7583117485046387, -2.6327919960021973, -2.507272243499756, -2.3817524909973145, -2.256232738494873, -2.1307129859924316, -2.0051932334899902, -1.8796736001968384, -1.754153847694397, -1.6286340951919556, -1.5031144618988037, -1.3775947093963623, -1.252074956893921, -1.1265552043914795, -1.001035451889038, -0.8755158185958862, -0.7499960660934448, -0.6244763135910034, -0.4989566206932068, -0.37343692779541016, -0.24791717529296875, -0.12239745259284973, 0.003122270107269287, 0.1286419928073883, 0.2541617155075073, 0.37968146800994873, 0.5052011609077454, 0.630720853805542, 0.7562406063079834, 0.8817603588104248, 1.0072801113128662, 1.132799744606018, 1.2583194971084595, 1.3838392496109009, 1.5093588829040527, 1.6348786354064941, 1.7603983879089355, 1.885918140411377, 2.0114378929138184, 2.1369576454162598, 2.262477397918701, 2.3879971504211426, 2.513516664505005, 2.6390364170074463, 2.7645561695098877, 2.890075922012329, 3.0155956745147705, 3.141115427017212, 3.266634941101074, 3.3921546936035156, 3.517674446105957, 3.6431941986083984, 3.76871395111084]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 5.0, 12.0, 14.0, 6.0, 14.0, 19.0, 14.0, 20.0, 22.0, 27.0, 15.0, 23.0, 25.0, 27.0, 29.0, 49.0, 42.0, 36.0, 41.0, 33.0, 45.0, 42.0, 38.0, 43.0, 36.0, 36.0, 40.0, 31.0, 39.0, 18.0, 25.0, 23.0, 11.0, 16.0, 9.0, 12.0, 14.0, 7.0, 6.0, 8.0, 13.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4789416790008545, -1.428098201751709, -1.377254843711853, -1.3264113664627075, -1.275567889213562, -1.224724531173706, -1.1738810539245605, -1.123037576675415, -1.0721940994262695, -1.021350622177124, -0.9705072045326233, -0.9196637868881226, -0.868820309638977, -0.8179768919944763, -0.7671334743499756, -0.7162899971008301, -0.6654465794563293, -0.6146031618118286, -0.5637596845626831, -0.5129162669181824, -0.46207278966903687, -0.41122937202453613, -0.360385924577713, -0.3095424771308899, -0.2586990296840668, -0.20785558223724365, -0.15701213479042053, -0.1061687022447586, -0.055325254797935486, -0.00448182225227356, 0.04636162519454956, 0.09720507264137268, 0.1480485200881958, 0.19889196753501892, 0.24973541498184204, 0.3005788326263428, 0.3514223098754883, 0.402265727519989, 0.45310917496681213, 0.5039526224136353, 0.5547960996627808, 0.6056395173072815, 0.656482994556427, 0.7073264122009277, 0.7581698894500732, 0.809013307094574, 0.8598567247390747, 0.9107002019882202, 0.961543619632721, 1.0123870372772217, 1.0632305145263672, 1.1140739917755127, 1.1649173498153687, 1.2157608270645142, 1.2666043043136597, 1.3174476623535156, 1.3682911396026611, 1.4191346168518066, 1.4699779748916626, 1.520821452140808, 1.5716649293899536, 1.6225082874298096, 1.673351764678955, 1.7241952419281006, 1.775038719177246]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 12.0, 20.0, 23.0, 32.0, 48.0, 63.0, 120.0, 205.0, 357.0, 641.0, 1166.0, 2440.0, 4950.0, 10359.0, 22570.0, 51745.0, 139050.0, 472580.0, 1533990.0, 1368341.0, 384135.0, 116155.0, 45906.0, 20193.0, 9701.0, 4658.0, 2323.0, 1158.0, 575.0, 295.0, 186.0, 84.0, 54.0, 48.0, 25.0, 11.0, 18.0, 12.0, 12.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.378173828125, -0.36734771728515625, -0.3565216064453125, -0.34569549560546875, -0.334869384765625, -0.32404327392578125, -0.3132171630859375, -0.30239105224609375, -0.29156494140625, -0.28073883056640625, -0.2699127197265625, -0.25908660888671875, -0.248260498046875, -0.23743438720703125, -0.2266082763671875, -0.21578216552734375, -0.2049560546875, -0.19412994384765625, -0.1833038330078125, -0.17247772216796875, -0.161651611328125, -0.15082550048828125, -0.1399993896484375, -0.12917327880859375, -0.11834716796875, -0.10752105712890625, -0.0966949462890625, -0.08586883544921875, -0.075042724609375, -0.06421661376953125, -0.0533905029296875, -0.04256439208984375, -0.03173828125, -0.02091217041015625, -0.0100860595703125, 0.00074005126953125, 0.011566162109375, 0.02239227294921875, 0.0332183837890625, 0.04404449462890625, 0.05487060546875, 0.06569671630859375, 0.0765228271484375, 0.08734893798828125, 0.098175048828125, 0.10900115966796875, 0.1198272705078125, 0.13065338134765625, 0.1414794921875, 0.15230560302734375, 0.1631317138671875, 0.17395782470703125, 0.184783935546875, 0.19561004638671875, 0.2064361572265625, 0.21726226806640625, 0.22808837890625, 0.23891448974609375, 0.2497406005859375, 0.26056671142578125, 0.271392822265625, 0.28221893310546875, 0.2930450439453125, 0.30387115478515625, 0.314697265625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 4.0, 11.0, 8.0, 14.0, 17.0, 17.0, 15.0, 21.0, 20.0, 42.0, 24.0, 31.0, 34.0, 41.0, 34.0, 42.0, 41.0, 45.0, 41.0, 38.0, 46.0, 31.0, 45.0, 34.0, 44.0, 31.0, 26.0, 30.0, 17.0, 21.0, 17.0, 18.0, 20.0, 14.0, 12.0, 12.0, 11.0, 10.0, 3.0, 2.0, 6.0, 6.0, 2.0, 0.0, 4.0], "bins": [-0.305908203125, -0.2978096008300781, -0.28971099853515625, -0.2816123962402344, -0.2735137939453125, -0.2654151916503906, -0.25731658935546875, -0.24921798706054688, -0.241119384765625, -0.23302078247070312, -0.22492218017578125, -0.21682357788085938, -0.2087249755859375, -0.20062637329101562, -0.19252777099609375, -0.18442916870117188, -0.17633056640625, -0.16823196411132812, -0.16013336181640625, -0.15203475952148438, -0.1439361572265625, -0.13583755493164062, -0.12773895263671875, -0.11964035034179688, -0.111541748046875, -0.10344314575195312, -0.09534454345703125, -0.08724594116210938, -0.0791473388671875, -0.07104873657226562, -0.06295013427734375, -0.054851531982421875, -0.0467529296875, -0.038654327392578125, -0.03055572509765625, -0.022457122802734375, -0.0143585205078125, -0.006259918212890625, 0.00183868408203125, 0.009937286376953125, 0.018035888671875, 0.026134490966796875, 0.03423309326171875, 0.042331695556640625, 0.0504302978515625, 0.058528900146484375, 0.06662750244140625, 0.07472610473632812, 0.08282470703125, 0.09092330932617188, 0.09902191162109375, 0.10712051391601562, 0.1152191162109375, 0.12331771850585938, 0.13141632080078125, 0.13951492309570312, 0.147613525390625, 0.15571212768554688, 0.16381072998046875, 0.17190933227539062, 0.1800079345703125, 0.18810653686523438, 0.19620513916015625, 0.20430374145507812, 0.21240234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 8.0, 6.0, 6.0, 15.0, 15.0, 21.0, 30.0, 41.0, 38.0, 68.0, 99.0, 149.0, 238.0, 408.0, 635.0, 1158.0, 2177.0, 4633.0, 9783.0, 22040.0, 52063.0, 132597.0, 413916.0, 1740538.0, 1318069.0, 311333.0, 106209.0, 42974.0, 18230.0, 8166.0, 3933.0, 1933.0, 1059.0, 598.0, 363.0, 229.0, 161.0, 105.0, 72.0, 51.0, 28.0, 27.0, 16.0, 15.0, 7.0, 10.0, 2.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4072265625, -0.39484405517578125, -0.3824615478515625, -0.37007904052734375, -0.357696533203125, -0.34531402587890625, -0.3329315185546875, -0.32054901123046875, -0.30816650390625, -0.29578399658203125, -0.2834014892578125, -0.27101898193359375, -0.258636474609375, -0.24625396728515625, -0.2338714599609375, -0.22148895263671875, -0.2091064453125, -0.19672393798828125, -0.1843414306640625, -0.17195892333984375, -0.159576416015625, -0.14719390869140625, -0.1348114013671875, -0.12242889404296875, -0.11004638671875, -0.09766387939453125, -0.0852813720703125, -0.07289886474609375, -0.060516357421875, -0.04813385009765625, -0.0357513427734375, -0.02336883544921875, -0.010986328125, 0.00139617919921875, 0.0137786865234375, 0.02616119384765625, 0.038543701171875, 0.05092620849609375, 0.0633087158203125, 0.07569122314453125, 0.08807373046875, 0.10045623779296875, 0.1128387451171875, 0.12522125244140625, 0.137603759765625, 0.14998626708984375, 0.1623687744140625, 0.17475128173828125, 0.1871337890625, 0.19951629638671875, 0.2118988037109375, 0.22428131103515625, 0.236663818359375, 0.24904632568359375, 0.2614288330078125, 0.27381134033203125, 0.28619384765625, 0.29857635498046875, 0.3109588623046875, 0.32334136962890625, 0.335723876953125, 0.34810638427734375, 0.3604888916015625, 0.37287139892578125, 0.38525390625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 6.0, 8.0, 26.0, 18.0, 31.0, 34.0, 57.0, 82.0, 105.0, 151.0, 250.0, 394.0, 593.0, 636.0, 573.0, 345.0, 218.0, 143.0, 113.0, 68.0, 69.0, 46.0, 26.0, 20.0, 16.0, 11.0, 4.0, 7.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6142578125, -0.595306396484375, -0.57635498046875, -0.557403564453125, -0.5384521484375, -0.519500732421875, -0.50054931640625, -0.481597900390625, -0.462646484375, -0.443695068359375, -0.42474365234375, -0.405792236328125, -0.3868408203125, -0.367889404296875, -0.34893798828125, -0.329986572265625, -0.31103515625, -0.292083740234375, -0.27313232421875, -0.254180908203125, -0.2352294921875, -0.216278076171875, -0.19732666015625, -0.178375244140625, -0.159423828125, -0.140472412109375, -0.12152099609375, -0.102569580078125, -0.0836181640625, -0.064666748046875, -0.04571533203125, -0.026763916015625, -0.0078125, 0.011138916015625, 0.03009033203125, 0.049041748046875, 0.0679931640625, 0.086944580078125, 0.10589599609375, 0.124847412109375, 0.143798828125, 0.162750244140625, 0.18170166015625, 0.200653076171875, 0.2196044921875, 0.238555908203125, 0.25750732421875, 0.276458740234375, 0.29541015625, 0.314361572265625, 0.33331298828125, 0.352264404296875, 0.3712158203125, 0.390167236328125, 0.40911865234375, 0.428070068359375, 0.447021484375, 0.465972900390625, 0.48492431640625, 0.503875732421875, 0.5228271484375, 0.541778564453125, 0.56072998046875, 0.579681396484375, 0.5986328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 8.0, 23.0, 36.0, 67.0, 67.0, 113.0, 151.0, 131.0, 163.0, 92.0, 68.0, 35.0, 16.0, 11.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.871828079223633, -3.752101182937622, -3.6323742866516113, -3.5126476287841797, -3.392920732498169, -3.273193836212158, -3.1534669399261475, -3.0337400436401367, -2.914013147354126, -2.7942862510681152, -2.6745593547821045, -2.5548324584960938, -2.435105800628662, -2.3153789043426514, -2.1956520080566406, -2.07592511177063, -1.9561983346939087, -1.836471438407898, -1.7167446613311768, -1.597017765045166, -1.4772908687591553, -1.3575639724731445, -1.2378371953964233, -1.1181102991104126, -0.9983834624290466, -0.8786566257476807, -0.7589297294616699, -0.639202892780304, -0.519476056098938, -0.39974915981292725, -0.2800223231315613, -0.16029542684555054, -0.04056859016418457, 0.07915826886892319, 0.19888512790203094, 0.3186119794845581, 0.43833884596824646, 0.5580657124519348, 0.6777925491333008, 0.7975194454193115, 0.9172462821006775, 1.0369731187820435, 1.1567000150680542, 1.2764267921447754, 1.3961536884307861, 1.5158805847167969, 1.6356074810028076, 1.7553343772888184, 1.8750611543655396, 1.9947880506515503, 2.1145148277282715, 2.2342417240142822, 2.353968620300293, 2.4736955165863037, 2.5934224128723145, 2.713149070739746, 2.832875967025757, 2.9526028633117676, 3.0723297595977783, 3.192056655883789, 3.3117833137512207, 3.4315102100372314, 3.551237106323242, 3.670964002609253, 3.7906908988952637]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 2.0, 6.0, 13.0, 11.0, 16.0, 14.0, 18.0, 24.0, 21.0, 26.0, 12.0, 32.0, 35.0, 39.0, 38.0, 16.0, 38.0, 33.0, 28.0, 40.0, 36.0, 46.0, 35.0, 50.0, 37.0, 26.0, 37.0, 35.0, 29.0, 28.0, 24.0, 23.0, 14.0, 17.0, 22.0, 15.0, 9.0, 10.0, 5.0, 8.0, 12.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5893858671188354, -1.5412522554397583, -1.4931187629699707, -1.4449851512908936, -1.396851658821106, -1.3487180471420288, -1.3005845546722412, -1.252450942993164, -1.204317331314087, -1.1561837196350098, -1.1080502271652222, -1.059916615486145, -1.0117831230163574, -0.9636495113372803, -0.9155159592628479, -0.8673824071884155, -0.8192489147186279, -0.7711153626441956, -0.7229818105697632, -0.674848198890686, -0.6267147064208984, -0.5785810947418213, -0.5304475426673889, -0.48231399059295654, -0.43418043851852417, -0.3860468864440918, -0.3379133343696594, -0.28977975249290466, -0.2416462004184723, -0.19351264834403992, -0.14537906646728516, -0.09724551439285278, -0.04911184310913086, -0.0009782835841178894, 0.04715527594089508, 0.09528884291648865, 0.14342239499092102, 0.1915559470653534, 0.23968952894210815, 0.2878230810165405, 0.3359566330909729, 0.3840901851654053, 0.43222373723983765, 0.4803573191165924, 0.5284909009933472, 0.5766243934631348, 0.6247580051422119, 0.6728915572166443, 0.7210251092910767, 0.769158661365509, 0.8172922134399414, 0.8654258251190186, 0.9135593175888062, 0.9616929292678833, 1.009826421737671, 1.057960033416748, 1.1060936450958252, 1.1542272567749023, 1.20236074924469, 1.250494360923767, 1.2986278533935547, 1.3467614650726318, 1.394895076751709, 1.4430285692214966, 1.4911620616912842]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 16.0, 15.0, 18.0, 39.0, 105.0, 221.0, 479.0, 1238.0, 2791.0, 6962.0, 15666.0, 35571.0, 125298.0, 534656.0, 237812.0, 51010.0, 20628.0, 9166.0, 3964.0, 1619.0, 660.0, 303.0, 141.0, 84.0, 31.0, 28.0, 10.0, 7.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.89892578125, -0.8773574829101562, -0.8557891845703125, -0.8342208862304688, -0.812652587890625, -0.7910842895507812, -0.7695159912109375, -0.7479476928710938, -0.72637939453125, -0.7048110961914062, -0.6832427978515625, -0.6616744995117188, -0.640106201171875, -0.6185379028320312, -0.5969696044921875, -0.5754013061523438, -0.5538330078125, -0.5322647094726562, -0.5106964111328125, -0.48912811279296875, -0.467559814453125, -0.44599151611328125, -0.4244232177734375, -0.40285491943359375, -0.38128662109375, -0.35971832275390625, -0.3381500244140625, -0.31658172607421875, -0.295013427734375, -0.27344512939453125, -0.2518768310546875, -0.23030853271484375, -0.208740234375, -0.18717193603515625, -0.1656036376953125, -0.14403533935546875, -0.122467041015625, -0.10089874267578125, -0.0793304443359375, -0.05776214599609375, -0.03619384765625, -0.01462554931640625, 0.0069427490234375, 0.02851104736328125, 0.050079345703125, 0.07164764404296875, 0.0932159423828125, 0.11478424072265625, 0.1363525390625, 0.15792083740234375, 0.1794891357421875, 0.20105743408203125, 0.222625732421875, 0.24419403076171875, 0.2657623291015625, 0.28733062744140625, 0.30889892578125, 0.33046722412109375, 0.3520355224609375, 0.37360382080078125, 0.395172119140625, 0.41674041748046875, 0.4383087158203125, 0.45987701416015625, 0.4814453125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 11.0, 6.0, 13.0, 10.0, 13.0, 14.0, 15.0, 24.0, 11.0, 22.0, 36.0, 32.0, 38.0, 47.0, 37.0, 37.0, 53.0, 48.0, 44.0, 37.0, 42.0, 35.0, 40.0, 42.0, 32.0, 24.0, 36.0, 35.0, 32.0, 26.0, 18.0, 10.0, 17.0, 9.0, 11.0, 10.0, 9.0, 3.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.29150390625, -0.28334808349609375, -0.2751922607421875, -0.26703643798828125, -0.258880615234375, -0.25072479248046875, -0.2425689697265625, -0.23441314697265625, -0.22625732421875, -0.21810150146484375, -0.2099456787109375, -0.20178985595703125, -0.193634033203125, -0.18547821044921875, -0.1773223876953125, -0.16916656494140625, -0.1610107421875, -0.15285491943359375, -0.1446990966796875, -0.13654327392578125, -0.128387451171875, -0.12023162841796875, -0.1120758056640625, -0.10391998291015625, -0.09576416015625, -0.08760833740234375, -0.0794525146484375, -0.07129669189453125, -0.063140869140625, -0.05498504638671875, -0.0468292236328125, -0.03867340087890625, -0.030517578125, -0.02236175537109375, -0.0142059326171875, -0.00605010986328125, 0.002105712890625, 0.01026153564453125, 0.0184173583984375, 0.02657318115234375, 0.03472900390625, 0.04288482666015625, 0.0510406494140625, 0.05919647216796875, 0.067352294921875, 0.07550811767578125, 0.0836639404296875, 0.09181976318359375, 0.0999755859375, 0.10813140869140625, 0.1162872314453125, 0.12444305419921875, 0.132598876953125, 0.14075469970703125, 0.1489105224609375, 0.15706634521484375, 0.16522216796875, 0.17337799072265625, 0.1815338134765625, 0.18968963623046875, 0.197845458984375, 0.20600128173828125, 0.2141571044921875, 0.22231292724609375, 0.23046875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 10.0, 6.0, 12.0, 11.0, 13.0, 29.0, 49.0, 77.0, 131.0, 213.0, 407.0, 863.0, 2200.0, 7014.0, 26615.0, 142959.0, 714812.0, 119591.0, 23499.0, 6192.0, 2004.0, 856.0, 394.0, 221.0, 127.0, 88.0, 52.0, 43.0, 22.0, 11.0, 9.0, 11.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2294921875, -1.195770263671875, -1.16204833984375, -1.128326416015625, -1.0946044921875, -1.060882568359375, -1.02716064453125, -0.993438720703125, -0.959716796875, -0.925994873046875, -0.89227294921875, -0.858551025390625, -0.8248291015625, -0.791107177734375, -0.75738525390625, -0.723663330078125, -0.68994140625, -0.656219482421875, -0.62249755859375, -0.588775634765625, -0.5550537109375, -0.521331787109375, -0.48760986328125, -0.453887939453125, -0.420166015625, -0.386444091796875, -0.35272216796875, -0.319000244140625, -0.2852783203125, -0.251556396484375, -0.21783447265625, -0.184112548828125, -0.150390625, -0.116668701171875, -0.08294677734375, -0.049224853515625, -0.0155029296875, 0.018218994140625, 0.05194091796875, 0.085662841796875, 0.119384765625, 0.153106689453125, 0.18682861328125, 0.220550537109375, 0.2542724609375, 0.287994384765625, 0.32171630859375, 0.355438232421875, 0.38916015625, 0.422882080078125, 0.45660400390625, 0.490325927734375, 0.5240478515625, 0.557769775390625, 0.59149169921875, 0.625213623046875, 0.658935546875, 0.692657470703125, 0.72637939453125, 0.760101318359375, 0.7938232421875, 0.827545166015625, 0.86126708984375, 0.894989013671875, 0.9287109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 6.0, 7.0, 7.0, 13.0, 11.0, 10.0, 16.0, 15.0, 19.0, 14.0, 35.0, 36.0, 21.0, 38.0, 45.0, 45.0, 45.0, 49.0, 47.0, 40.0, 53.0, 50.0, 43.0, 49.0, 42.0, 25.0, 35.0, 29.0, 29.0, 17.0, 22.0, 11.0, 14.0, 13.0, 8.0, 8.0, 12.0, 8.0, 4.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.84521484375, -0.818939208984375, -0.79266357421875, -0.766387939453125, -0.7401123046875, -0.713836669921875, -0.68756103515625, -0.661285400390625, -0.635009765625, -0.608734130859375, -0.58245849609375, -0.556182861328125, -0.5299072265625, -0.503631591796875, -0.47735595703125, -0.451080322265625, -0.4248046875, -0.398529052734375, -0.37225341796875, -0.345977783203125, -0.3197021484375, -0.293426513671875, -0.26715087890625, -0.240875244140625, -0.214599609375, -0.188323974609375, -0.16204833984375, -0.135772705078125, -0.1094970703125, -0.083221435546875, -0.05694580078125, -0.030670166015625, -0.00439453125, 0.021881103515625, 0.04815673828125, 0.074432373046875, 0.1007080078125, 0.126983642578125, 0.15325927734375, 0.179534912109375, 0.205810546875, 0.232086181640625, 0.25836181640625, 0.284637451171875, 0.3109130859375, 0.337188720703125, 0.36346435546875, 0.389739990234375, 0.416015625, 0.442291259765625, 0.46856689453125, 0.494842529296875, 0.5211181640625, 0.547393798828125, 0.57366943359375, 0.599945068359375, 0.626220703125, 0.652496337890625, 0.67877197265625, 0.705047607421875, 0.7313232421875, 0.757598876953125, 0.78387451171875, 0.810150146484375, 0.83642578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 8.0, 8.0, 19.0, 32.0, 58.0, 68.0, 111.0, 215.0, 380.0, 805.0, 1636.0, 3607.0, 7840.0, 18119.0, 46695.0, 179134.0, 555360.0, 159552.0, 43863.0, 17196.0, 7361.0, 3283.0, 1566.0, 731.0, 363.0, 199.0, 124.0, 70.0, 46.0, 34.0, 18.0, 13.0, 9.0, 6.0, 4.0, 5.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2459716796875, -0.2378978729248047, -0.22982406616210938, -0.22175025939941406, -0.21367645263671875, -0.20560264587402344, -0.19752883911132812, -0.1894550323486328, -0.1813812255859375, -0.1733074188232422, -0.16523361206054688, -0.15715980529785156, -0.14908599853515625, -0.14101219177246094, -0.13293838500976562, -0.12486457824707031, -0.116790771484375, -0.10871696472167969, -0.10064315795898438, -0.09256935119628906, -0.08449554443359375, -0.07642173767089844, -0.06834793090820312, -0.06027412414550781, -0.0522003173828125, -0.04412651062011719, -0.036052703857421875, -0.027978897094726562, -0.01990509033203125, -0.011831283569335938, -0.003757476806640625, 0.0043163299560546875, 0.01239013671875, 0.020463943481445312, 0.028537750244140625, 0.03661155700683594, 0.04468536376953125, 0.05275917053222656, 0.060832977294921875, 0.06890678405761719, 0.0769805908203125, 0.08505439758300781, 0.09312820434570312, 0.10120201110839844, 0.10927581787109375, 0.11734962463378906, 0.12542343139648438, 0.1334972381591797, 0.141571044921875, 0.1496448516845703, 0.15771865844726562, 0.16579246520996094, 0.17386627197265625, 0.18194007873535156, 0.19001388549804688, 0.1980876922607422, 0.2061614990234375, 0.2142353057861328, 0.22230911254882812, 0.23038291931152344, 0.23845672607421875, 0.24653053283691406, 0.2546043395996094, 0.2626781463623047, 0.270751953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 4.0, 4.0, 2.0, 7.0, 7.0, 7.0, 5.0, 10.0, 14.0, 21.0, 30.0, 22.0, 53.0, 107.0, 144.0, 162.0, 124.0, 71.0, 52.0, 33.0, 25.0, 14.0, 11.0, 9.0, 9.0, 5.0, 2.0, 7.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.604194641113281e-05, -6.392784416675568e-05, -6.181374192237854e-05, -5.9699639678001404e-05, -5.758553743362427e-05, -5.547143518924713e-05, -5.3357332944869995e-05, -5.124323070049286e-05, -4.912912845611572e-05, -4.7015026211738586e-05, -4.490092396736145e-05, -4.2786821722984314e-05, -4.067271947860718e-05, -3.855861723423004e-05, -3.6444514989852905e-05, -3.433041274547577e-05, -3.221631050109863e-05, -3.0102208256721497e-05, -2.798810601234436e-05, -2.5874003767967224e-05, -2.3759901523590088e-05, -2.164579927921295e-05, -1.9531697034835815e-05, -1.741759479045868e-05, -1.5303492546081543e-05, -1.3189390301704407e-05, -1.107528805732727e-05, -8.961185812950134e-06, -6.847083568572998e-06, -4.732981324195862e-06, -2.6188790798187256e-06, -5.047768354415894e-07, 1.6093254089355469e-06, 3.723427653312683e-06, 5.837529897689819e-06, 7.951632142066956e-06, 1.0065734386444092e-05, 1.2179836630821228e-05, 1.4293938875198364e-05, 1.64080411195755e-05, 1.8522143363952637e-05, 2.0636245608329773e-05, 2.275034785270691e-05, 2.4864450097084045e-05, 2.697855234146118e-05, 2.9092654585838318e-05, 3.1206756830215454e-05, 3.332085907459259e-05, 3.5434961318969727e-05, 3.754906356334686e-05, 3.9663165807724e-05, 4.1777268052101135e-05, 4.389137029647827e-05, 4.600547254085541e-05, 4.8119574785232544e-05, 5.023367702960968e-05, 5.2347779273986816e-05, 5.446188151836395e-05, 5.657598376274109e-05, 5.8690086007118225e-05, 6.080418825149536e-05, 6.29182904958725e-05, 6.503239274024963e-05, 6.714649498462677e-05, 6.92605972290039e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 0.0, 3.0, 2.0, 6.0, 7.0, 15.0, 12.0, 19.0, 35.0, 41.0, 68.0, 102.0, 176.0, 253.0, 473.0, 819.0, 1726.0, 3966.0, 10024.0, 26977.0, 82620.0, 353066.0, 418598.0, 98339.0, 31178.0, 11323.0, 4486.0, 1941.0, 931.0, 478.0, 318.0, 202.0, 110.0, 74.0, 70.0, 32.0, 23.0, 13.0, 6.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.244873046875, -0.23699188232421875, -0.2291107177734375, -0.22122955322265625, -0.213348388671875, -0.20546722412109375, -0.1975860595703125, -0.18970489501953125, -0.18182373046875, -0.17394256591796875, -0.1660614013671875, -0.15818023681640625, -0.150299072265625, -0.14241790771484375, -0.1345367431640625, -0.12665557861328125, -0.1187744140625, -0.11089324951171875, -0.1030120849609375, -0.09513092041015625, -0.087249755859375, -0.07936859130859375, -0.0714874267578125, -0.06360626220703125, -0.05572509765625, -0.04784393310546875, -0.0399627685546875, -0.03208160400390625, -0.024200439453125, -0.01631927490234375, -0.0084381103515625, -0.00055694580078125, 0.00732421875, 0.01520538330078125, 0.0230865478515625, 0.03096771240234375, 0.038848876953125, 0.04673004150390625, 0.0546112060546875, 0.06249237060546875, 0.07037353515625, 0.07825469970703125, 0.0861358642578125, 0.09401702880859375, 0.101898193359375, 0.10977935791015625, 0.1176605224609375, 0.12554168701171875, 0.1334228515625, 0.14130401611328125, 0.1491851806640625, 0.15706634521484375, 0.164947509765625, 0.17282867431640625, 0.1807098388671875, 0.18859100341796875, 0.19647216796875, 0.20435333251953125, 0.2122344970703125, 0.22011566162109375, 0.227996826171875, 0.23587799072265625, 0.2437591552734375, 0.25164031982421875, 0.259521484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 5.0, 3.0, 1.0, 8.0, 9.0, 8.0, 11.0, 7.0, 17.0, 24.0, 26.0, 41.0, 46.0, 75.0, 82.0, 98.0, 119.0, 98.0, 80.0, 51.0, 49.0, 29.0, 23.0, 13.0, 10.0, 12.0, 11.0, 10.0, 7.0, 4.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1866455078125, -0.1789073944091797, -0.17116928100585938, -0.16343116760253906, -0.15569305419921875, -0.14795494079589844, -0.14021682739257812, -0.1324787139892578, -0.1247406005859375, -0.11700248718261719, -0.10926437377929688, -0.10152626037597656, -0.09378814697265625, -0.08605003356933594, -0.07831192016601562, -0.07057380676269531, -0.062835693359375, -0.05509757995605469, -0.047359466552734375, -0.03962135314941406, -0.03188323974609375, -0.024145126342773438, -0.016407012939453125, -0.008668899536132812, -0.0009307861328125, 0.0068073272705078125, 0.014545440673828125, 0.022283554077148438, 0.03002166748046875, 0.03775978088378906, 0.045497894287109375, 0.05323600769042969, 0.06097412109375, 0.06871223449707031, 0.07645034790039062, 0.08418846130371094, 0.09192657470703125, 0.09966468811035156, 0.10740280151367188, 0.11514091491699219, 0.1228790283203125, 0.1306171417236328, 0.13835525512695312, 0.14609336853027344, 0.15383148193359375, 0.16156959533691406, 0.16930770874023438, 0.1770458221435547, 0.184783935546875, 0.1925220489501953, 0.20026016235351562, 0.20799827575683594, 0.21573638916015625, 0.22347450256347656, 0.23121261596679688, 0.2389507293701172, 0.2466888427734375, 0.2544269561767578, 0.2621650695800781, 0.26990318298339844, 0.27764129638671875, 0.28537940979003906, 0.2931175231933594, 0.3008556365966797, 0.30859375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 24.0, 38.0, 132.0, 189.0, 230.0, 186.0, 103.0, 53.0, 14.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.537570953369141, -5.381424427032471, -5.225278377532959, -5.069131851196289, -4.912985801696777, -4.756839275360107, -4.600693225860596, -4.444546699523926, -4.288400650024414, -4.132254123687744, -3.9761080741882324, -3.8199617862701416, -3.663815498352051, -3.50766921043396, -3.351522922515869, -3.195376396179199, -3.0392301082611084, -2.8830838203430176, -2.7269375324249268, -2.570791244506836, -2.414644956588745, -2.2584986686706543, -2.1023521423339844, -1.946205973625183, -1.7900596857070923, -1.6339133977890015, -1.4777671098709106, -1.3216207027435303, -1.1654744148254395, -1.0093281269073486, -0.8531818389892578, -0.697035551071167, -0.5408892631530762, -0.38474297523498535, -0.22859665751457214, -0.07245033979415894, 0.08369594812393188, 0.2398422360420227, 0.3959885835647583, 0.5521348714828491, 0.7082811594009399, 0.8644274473190308, 1.0205737352371216, 1.176720142364502, 1.3328664302825928, 1.4890127182006836, 1.6451590061187744, 1.8013052940368652, 1.957451581954956, 2.113597869873047, 2.2697441577911377, 2.4258904457092285, 2.5820367336273193, 2.73818302154541, 2.89432954788208, 3.050475597381592, 3.2066221237182617, 3.3627684116363525, 3.5189146995544434, 3.675060987472534, 3.831207275390625, 3.987353563308716, 4.143499851226807, 4.299646377563477, 4.455792427062988]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 6.0, 7.0, 7.0, 12.0, 20.0, 18.0, 19.0, 27.0, 16.0, 21.0, 27.0, 28.0, 54.0, 29.0, 42.0, 40.0, 44.0, 35.0, 39.0, 38.0, 41.0, 41.0, 36.0, 40.0, 30.0, 32.0, 29.0, 32.0, 33.0, 18.0, 22.0, 20.0, 20.0, 13.0, 12.0, 8.0, 2.0, 10.0, 6.0, 3.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5388506650924683, -1.4822354316711426, -1.4256203174591064, -1.3690050840377808, -1.312389850616455, -1.255774736404419, -1.1991595029830933, -1.1425442695617676, -1.0859291553497314, -1.0293139219284058, -0.9726987481117249, -0.916083574295044, -0.8594683408737183, -0.8028531670570374, -0.7462379932403564, -0.6896227598190308, -0.6330075263977051, -0.5763923525810242, -0.5197771191596985, -0.4631619453430176, -0.4065467417240143, -0.349931538105011, -0.2933163642883301, -0.23670116066932678, -0.1800859570503235, -0.12347076088190079, -0.06685556471347809, -0.010240375995635986, 0.04637482762336731, 0.1029900312423706, 0.1596052050590515, 0.2162204086780548, 0.27283573150634766, 0.32945093512535095, 0.38606613874435425, 0.44268131256103516, 0.49929651618003845, 0.5559117197990417, 0.6125268936157227, 0.6691421270370483, 0.7257573008537292, 0.7823724746704102, 0.8389877080917358, 0.8956028819084167, 0.9522180557250977, 1.0088332891464233, 1.065448522567749, 1.1220636367797852, 1.1786788702011108, 1.2352941036224365, 1.2919092178344727, 1.3485244512557983, 1.405139684677124, 1.4617547988891602, 1.5183700323104858, 1.5749852657318115, 1.6316003799438477, 1.6882156133651733, 1.7448307275772095, 1.8014459609985352, 1.8580611944198608, 1.9146764278411865, 1.9712915420532227, 2.027906656265259, 2.084522008895874]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 7.0, 12.0, 16.0, 20.0, 28.0, 44.0, 81.0, 113.0, 178.0, 327.0, 546.0, 906.0, 1558.0, 2733.0, 4722.0, 8590.0, 16061.0, 29598.0, 59428.0, 131670.0, 321897.0, 736628.0, 1182341.0, 922017.0, 432536.0, 182520.0, 78986.0, 37573.0, 19375.0, 10481.0, 5808.0, 3250.0, 1819.0, 1040.0, 549.0, 305.0, 201.0, 111.0, 77.0, 46.0, 25.0, 14.0, 16.0, 9.0, 9.0, 3.0, 1.0, 3.0, 4.0, 1.0], "bins": [-0.281005859375, -0.2733421325683594, -0.26567840576171875, -0.2580146789550781, -0.2503509521484375, -0.24268722534179688, -0.23502349853515625, -0.22735977172851562, -0.219696044921875, -0.21203231811523438, -0.20436859130859375, -0.19670486450195312, -0.1890411376953125, -0.18137741088867188, -0.17371368408203125, -0.16604995727539062, -0.15838623046875, -0.15072250366210938, -0.14305877685546875, -0.13539505004882812, -0.1277313232421875, -0.12006759643554688, -0.11240386962890625, -0.10474014282226562, -0.097076416015625, -0.08941268920898438, -0.08174896240234375, -0.07408523559570312, -0.0664215087890625, -0.058757781982421875, -0.05109405517578125, -0.043430328369140625, -0.0357666015625, -0.028102874755859375, -0.02043914794921875, -0.012775421142578125, -0.0051116943359375, 0.002552032470703125, 0.01021575927734375, 0.017879486083984375, 0.025543212890625, 0.033206939697265625, 0.04087066650390625, 0.048534393310546875, 0.0561981201171875, 0.06386184692382812, 0.07152557373046875, 0.07918930053710938, 0.08685302734375, 0.09451675415039062, 0.10218048095703125, 0.10984420776367188, 0.1175079345703125, 0.12517166137695312, 0.13283538818359375, 0.14049911499023438, 0.148162841796875, 0.15582656860351562, 0.16349029541015625, 0.17115402221679688, 0.1788177490234375, 0.18648147583007812, 0.19414520263671875, 0.20180892944335938, 0.20947265625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 6.0, 6.0, 8.0, 10.0, 8.0, 8.0, 12.0, 17.0, 14.0, 19.0, 20.0, 20.0, 27.0, 35.0, 36.0, 37.0, 31.0, 40.0, 52.0, 44.0, 28.0, 41.0, 54.0, 35.0, 37.0, 28.0, 28.0, 24.0, 32.0, 36.0, 22.0, 30.0, 22.0, 24.0, 17.0, 16.0, 14.0, 9.0, 7.0, 7.0, 10.0, 5.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2347412109375, -0.2267131805419922, -0.21868515014648438, -0.21065711975097656, -0.20262908935546875, -0.19460105895996094, -0.18657302856445312, -0.1785449981689453, -0.1705169677734375, -0.1624889373779297, -0.15446090698242188, -0.14643287658691406, -0.13840484619140625, -0.13037681579589844, -0.12234878540039062, -0.11432075500488281, -0.106292724609375, -0.09826469421386719, -0.09023666381835938, -0.08220863342285156, -0.07418060302734375, -0.06615257263183594, -0.058124542236328125, -0.05009651184082031, -0.0420684814453125, -0.03404045104980469, -0.026012420654296875, -0.017984390258789062, -0.00995635986328125, -0.0019283294677734375, 0.006099700927734375, 0.014127731323242188, 0.02215576171875, 0.030183792114257812, 0.038211822509765625, 0.04623985290527344, 0.05426788330078125, 0.06229591369628906, 0.07032394409179688, 0.07835197448730469, 0.0863800048828125, 0.09440803527832031, 0.10243606567382812, 0.11046409606933594, 0.11849212646484375, 0.12652015686035156, 0.13454818725585938, 0.1425762176513672, 0.150604248046875, 0.1586322784423828, 0.16666030883789062, 0.17468833923339844, 0.18271636962890625, 0.19074440002441406, 0.19877243041992188, 0.2068004608154297, 0.2148284912109375, 0.2228565216064453, 0.23088455200195312, 0.23891258239746094, 0.24694061279296875, 0.25496864318847656, 0.2629966735839844, 0.2710247039794922, 0.279052734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 1.0, 4.0, 9.0, 14.0, 21.0, 29.0, 45.0, 66.0, 102.0, 157.0, 283.0, 505.0, 877.0, 1775.0, 3912.0, 9921.0, 27868.0, 82291.0, 276525.0, 1303155.0, 1889642.0, 419073.0, 116491.0, 38371.0, 13353.0, 5175.0, 2149.0, 1065.0, 523.0, 321.0, 195.0, 116.0, 79.0, 58.0, 44.0, 27.0, 11.0, 8.0, 9.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.55517578125, -0.5398178100585938, -0.5244598388671875, -0.5091018676757812, -0.493743896484375, -0.47838592529296875, -0.4630279541015625, -0.44766998291015625, -0.43231201171875, -0.41695404052734375, -0.4015960693359375, -0.38623809814453125, -0.370880126953125, -0.35552215576171875, -0.3401641845703125, -0.32480621337890625, -0.3094482421875, -0.29409027099609375, -0.2787322998046875, -0.26337432861328125, -0.248016357421875, -0.23265838623046875, -0.2173004150390625, -0.20194244384765625, -0.18658447265625, -0.17122650146484375, -0.1558685302734375, -0.14051055908203125, -0.125152587890625, -0.10979461669921875, -0.0944366455078125, -0.07907867431640625, -0.063720703125, -0.04836273193359375, -0.0330047607421875, -0.01764678955078125, -0.002288818359375, 0.01306915283203125, 0.0284271240234375, 0.04378509521484375, 0.05914306640625, 0.07450103759765625, 0.0898590087890625, 0.10521697998046875, 0.120574951171875, 0.13593292236328125, 0.1512908935546875, 0.16664886474609375, 0.1820068359375, 0.19736480712890625, 0.2127227783203125, 0.22808074951171875, 0.243438720703125, 0.25879669189453125, 0.2741546630859375, 0.28951263427734375, 0.30487060546875, 0.32022857666015625, 0.3355865478515625, 0.35094451904296875, 0.366302490234375, 0.38166046142578125, 0.3970184326171875, 0.41237640380859375, 0.427734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 1.0, 0.0, 3.0, 8.0, 7.0, 4.0, 11.0, 13.0, 20.0, 15.0, 39.0, 33.0, 51.0, 67.0, 88.0, 119.0, 156.0, 214.0, 320.0, 418.0, 451.0, 474.0, 403.0, 288.0, 223.0, 148.0, 113.0, 69.0, 64.0, 58.0, 52.0, 36.0, 31.0, 18.0, 20.0, 11.0, 9.0, 6.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4546546936035156, -0.43787384033203125, -0.4210929870605469, -0.4043121337890625, -0.3875312805175781, -0.37075042724609375, -0.3539695739746094, -0.337188720703125, -0.3204078674316406, -0.30362701416015625, -0.2868461608886719, -0.2700653076171875, -0.2532844543457031, -0.23650360107421875, -0.21972274780273438, -0.20294189453125, -0.18616104125976562, -0.16938018798828125, -0.15259933471679688, -0.1358184814453125, -0.11903762817382812, -0.10225677490234375, -0.08547592163085938, -0.068695068359375, -0.051914215087890625, -0.03513336181640625, -0.018352508544921875, -0.0015716552734375, 0.015209197998046875, 0.03199005126953125, 0.048770904541015625, 0.0655517578125, 0.08233261108398438, 0.09911346435546875, 0.11589431762695312, 0.1326751708984375, 0.14945602416992188, 0.16623687744140625, 0.18301773071289062, 0.199798583984375, 0.21657943725585938, 0.23336029052734375, 0.2501411437988281, 0.2669219970703125, 0.2837028503417969, 0.30048370361328125, 0.3172645568847656, 0.33404541015625, 0.3508262634277344, 0.36760711669921875, 0.3843879699707031, 0.4011688232421875, 0.4179496765136719, 0.43473052978515625, 0.4515113830566406, 0.468292236328125, 0.4850730895996094, 0.5018539428710938, 0.5186347961425781, 0.5354156494140625, 0.5521965026855469, 0.5689773559570312, 0.5857582092285156, 0.6025390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 9.0, 30.0, 74.0, 131.0, 163.0, 198.0, 176.0, 114.0, 44.0, 23.0, 11.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0295021533966064, -2.8640270233154297, -2.698552131652832, -2.5330770015716553, -2.3676018714904785, -2.2021267414093018, -2.036651611328125, -1.8711767196655273, -1.7057015895843506, -1.5402264595031738, -1.3747514486312866, -1.2092764377593994, -1.0438013076782227, -0.8783262372016907, -0.7128511667251587, -0.5473761558532715, -0.3819010257720947, -0.21642595529556274, -0.05095088481903076, 0.11452418565750122, 0.2799992561340332, 0.4454743266105652, 0.6109493970870972, 0.7764244079589844, 0.9418995380401611, 1.107374668121338, 1.272849678993225, 1.4383246898651123, 1.603799819946289, 1.7692749500274658, 1.934749960899353, 2.1002249717712402, 2.265699863433838, 2.4311749935150146, 2.5966501235961914, 2.762125015258789, 2.927600145339966, 3.0930752754211426, 3.2585501670837402, 3.424025297164917, 3.5895004272460938, 3.7549755573272705, 3.9204506874084473, 4.085925579071045, 4.251400947570801, 4.416875839233398, 4.582350730895996, 4.747825622558594, 4.91330099105835, 5.078775882720947, 5.244251251220703, 5.409726142883301, 5.575201034545898, 5.740676403045654, 5.906151294708252, 6.071626663208008, 6.2371015548706055, 6.402576446533203, 6.568051815032959, 6.733526706695557, 6.8990020751953125, 7.06447696685791, 7.229951858520508, 7.3954267501831055, 7.560902118682861]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 3.0, 8.0, 5.0, 10.0, 21.0, 14.0, 12.0, 10.0, 21.0, 16.0, 21.0, 25.0, 33.0, 34.0, 29.0, 32.0, 28.0, 39.0, 32.0, 40.0, 42.0, 46.0, 34.0, 40.0, 38.0, 32.0, 45.0, 26.0, 22.0, 26.0, 25.0, 24.0, 17.0, 17.0, 11.0, 10.0, 16.0, 12.0, 10.0, 9.0, 18.0, 11.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6110713481903076, -1.5594319105148315, -1.5077924728393555, -1.4561530351638794, -1.4045135974884033, -1.3528741598129272, -1.3012347221374512, -1.2495954036712646, -1.197955846786499, -1.146316409111023, -1.0946769714355469, -1.0430375337600708, -0.9913980960845947, -0.9397586584091187, -0.8881192803382874, -0.8364798426628113, -0.78484046459198, -0.7332010269165039, -0.6815615892410278, -0.6299221515655518, -0.5782827138900757, -0.5266432762145996, -0.4750038981437683, -0.42336446046829224, -0.37172502279281616, -0.3200855851173401, -0.268446147441864, -0.21680673956871033, -0.16516730189323425, -0.11352786421775818, -0.06188845634460449, -0.010249018669128418, 0.041390299797058105, 0.09302973002195358, 0.14466916024684906, 0.19630858302116394, 0.24794802069664001, 0.2995874583721161, 0.3512268662452698, 0.40286630392074585, 0.4545057415962219, 0.506145179271698, 0.5577846169471741, 0.6094239950180054, 0.6610634326934814, 0.7127028703689575, 0.7643423080444336, 0.8159817457199097, 0.8676211833953857, 0.9192606210708618, 0.9709000587463379, 1.022539496421814, 1.07417893409729, 1.1258183717727661, 1.1774578094482422, 1.2290971279144287, 1.2807366847991943, 1.3323761224746704, 1.3840155601501465, 1.4356549978256226, 1.4872944355010986, 1.5389338731765747, 1.5905733108520508, 1.6422126293182373, 1.6938520669937134]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 0.0, 4.0, 7.0, 8.0, 6.0, 18.0, 10.0, 21.0, 48.0, 58.0, 86.0, 143.0, 223.0, 349.0, 592.0, 1077.0, 1928.0, 3418.0, 6447.0, 11062.0, 19964.0, 35873.0, 75183.0, 183643.0, 324494.0, 209768.0, 84988.0, 39988.0, 21505.0, 12227.0, 6914.0, 3693.0, 2041.0, 1114.0, 645.0, 377.0, 205.0, 139.0, 106.0, 57.0, 47.0, 29.0, 16.0, 13.0, 14.0, 1.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34326171875, -0.3312492370605469, -0.31923675537109375, -0.3072242736816406, -0.2952117919921875, -0.2831993103027344, -0.27118682861328125, -0.2591743469238281, -0.247161865234375, -0.23514938354492188, -0.22313690185546875, -0.21112442016601562, -0.1991119384765625, -0.18709945678710938, -0.17508697509765625, -0.16307449340820312, -0.15106201171875, -0.13904953002929688, -0.12703704833984375, -0.11502456665039062, -0.1030120849609375, -0.09099960327148438, -0.07898712158203125, -0.06697463989257812, -0.054962158203125, -0.042949676513671875, -0.03093719482421875, -0.018924713134765625, -0.0069122314453125, 0.005100250244140625, 0.01711273193359375, 0.029125213623046875, 0.0411376953125, 0.053150177001953125, 0.06516265869140625, 0.07717514038085938, 0.0891876220703125, 0.10120010375976562, 0.11321258544921875, 0.12522506713867188, 0.137237548828125, 0.14925003051757812, 0.16126251220703125, 0.17327499389648438, 0.1852874755859375, 0.19729995727539062, 0.20931243896484375, 0.22132492065429688, 0.23333740234375, 0.24534988403320312, 0.25736236572265625, 0.2693748474121094, 0.2813873291015625, 0.2933998107910156, 0.30541229248046875, 0.3174247741699219, 0.329437255859375, 0.3414497375488281, 0.35346221923828125, 0.3654747009277344, 0.3774871826171875, 0.3894996643066406, 0.40151214599609375, 0.4135246276855469, 0.425537109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 3.0, 6.0, 6.0, 8.0, 11.0, 6.0, 13.0, 18.0, 13.0, 13.0, 21.0, 23.0, 31.0, 21.0, 25.0, 35.0, 26.0, 39.0, 44.0, 36.0, 35.0, 45.0, 40.0, 39.0, 39.0, 30.0, 42.0, 34.0, 35.0, 41.0, 29.0, 24.0, 21.0, 25.0, 28.0, 21.0, 14.0, 10.0, 8.0, 14.0, 9.0, 7.0, 7.0, 3.0, 5.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.224609375, -0.2169036865234375, -0.209197998046875, -0.2014923095703125, -0.19378662109375, -0.1860809326171875, -0.178375244140625, -0.1706695556640625, -0.1629638671875, -0.1552581787109375, -0.147552490234375, -0.1398468017578125, -0.13214111328125, -0.1244354248046875, -0.116729736328125, -0.1090240478515625, -0.101318359375, -0.0936126708984375, -0.085906982421875, -0.0782012939453125, -0.07049560546875, -0.0627899169921875, -0.055084228515625, -0.0473785400390625, -0.0396728515625, -0.0319671630859375, -0.024261474609375, -0.0165557861328125, -0.00885009765625, -0.0011444091796875, 0.006561279296875, 0.0142669677734375, 0.02197265625, 0.0296783447265625, 0.037384033203125, 0.0450897216796875, 0.05279541015625, 0.0605010986328125, 0.068206787109375, 0.0759124755859375, 0.0836181640625, 0.0913238525390625, 0.099029541015625, 0.1067352294921875, 0.11444091796875, 0.1221466064453125, 0.129852294921875, 0.1375579833984375, 0.145263671875, 0.1529693603515625, 0.160675048828125, 0.1683807373046875, 0.17608642578125, 0.1837921142578125, 0.191497802734375, 0.1992034912109375, 0.2069091796875, 0.2146148681640625, 0.222320556640625, 0.2300262451171875, 0.23773193359375, 0.2454376220703125, 0.253143310546875, 0.2608489990234375, 0.2685546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 10.0, 8.0, 13.0, 20.0, 24.0, 35.0, 66.0, 93.0, 130.0, 211.0, 337.0, 620.0, 1176.0, 3064.0, 8602.0, 27214.0, 96886.0, 447677.0, 353052.0, 75235.0, 21748.0, 7237.0, 2526.0, 1105.0, 597.0, 319.0, 200.0, 112.0, 82.0, 49.0, 39.0, 16.0, 14.0, 10.0, 9.0, 5.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63037109375, -0.6050643920898438, -0.5797576904296875, -0.5544509887695312, -0.529144287109375, -0.5038375854492188, -0.4785308837890625, -0.45322418212890625, -0.42791748046875, -0.40261077880859375, -0.3773040771484375, -0.35199737548828125, -0.326690673828125, -0.30138397216796875, -0.2760772705078125, -0.25077056884765625, -0.2254638671875, -0.20015716552734375, -0.1748504638671875, -0.14954376220703125, -0.124237060546875, -0.09893035888671875, -0.0736236572265625, -0.04831695556640625, -0.02301025390625, 0.00229644775390625, 0.0276031494140625, 0.05290985107421875, 0.078216552734375, 0.10352325439453125, 0.1288299560546875, 0.15413665771484375, 0.179443359375, 0.20475006103515625, 0.2300567626953125, 0.25536346435546875, 0.280670166015625, 0.30597686767578125, 0.3312835693359375, 0.35659027099609375, 0.38189697265625, 0.40720367431640625, 0.4325103759765625, 0.45781707763671875, 0.483123779296875, 0.5084304809570312, 0.5337371826171875, 0.5590438842773438, 0.5843505859375, 0.6096572875976562, 0.6349639892578125, 0.6602706909179688, 0.685577392578125, 0.7108840942382812, 0.7361907958984375, 0.7614974975585938, 0.78680419921875, 0.8121109008789062, 0.8374176025390625, 0.8627243041992188, 0.888031005859375, 0.9133377075195312, 0.9386444091796875, 0.9639511108398438, 0.9892578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 6.0, 8.0, 3.0, 3.0, 7.0, 15.0, 5.0, 8.0, 13.0, 21.0, 23.0, 36.0, 29.0, 25.0, 29.0, 26.0, 40.0, 49.0, 49.0, 36.0, 50.0, 56.0, 45.0, 30.0, 39.0, 32.0, 28.0, 45.0, 34.0, 42.0, 26.0, 19.0, 24.0, 17.0, 12.0, 14.0, 15.0, 12.0, 4.0, 8.0, 4.0, 4.0, 2.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.87890625, -0.8538818359375, -0.828857421875, -0.8038330078125, -0.77880859375, -0.7537841796875, -0.728759765625, -0.7037353515625, -0.6787109375, -0.6536865234375, -0.628662109375, -0.6036376953125, -0.57861328125, -0.5535888671875, -0.528564453125, -0.5035400390625, -0.478515625, -0.4534912109375, -0.428466796875, -0.4034423828125, -0.37841796875, -0.3533935546875, -0.328369140625, -0.3033447265625, -0.2783203125, -0.2532958984375, -0.228271484375, -0.2032470703125, -0.17822265625, -0.1531982421875, -0.128173828125, -0.1031494140625, -0.078125, -0.0531005859375, -0.028076171875, -0.0030517578125, 0.02197265625, 0.0469970703125, 0.072021484375, 0.0970458984375, 0.1220703125, 0.1470947265625, 0.172119140625, 0.1971435546875, 0.22216796875, 0.2471923828125, 0.272216796875, 0.2972412109375, 0.322265625, 0.3472900390625, 0.372314453125, 0.3973388671875, 0.42236328125, 0.4473876953125, 0.472412109375, 0.4974365234375, 0.5224609375, 0.5474853515625, 0.572509765625, 0.5975341796875, 0.62255859375, 0.6475830078125, 0.672607421875, 0.6976318359375, 0.72265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 6.0, 7.0, 25.0, 38.0, 40.0, 75.0, 127.0, 164.0, 249.0, 453.0, 768.0, 1452.0, 2654.0, 4900.0, 9494.0, 19177.0, 44054.0, 118558.0, 315669.0, 322440.0, 122402.0, 45191.0, 19709.0, 9678.0, 4881.0, 2756.0, 1478.0, 834.0, 489.0, 287.0, 165.0, 101.0, 76.0, 45.0, 33.0, 15.0, 13.0, 14.0, 5.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1845703125, -0.17897987365722656, -0.17338943481445312, -0.1677989959716797, -0.16220855712890625, -0.1566181182861328, -0.15102767944335938, -0.14543724060058594, -0.1398468017578125, -0.13425636291503906, -0.12866592407226562, -0.12307548522949219, -0.11748504638671875, -0.11189460754394531, -0.10630416870117188, -0.10071372985839844, -0.095123291015625, -0.08953285217285156, -0.08394241333007812, -0.07835197448730469, -0.07276153564453125, -0.06717109680175781, -0.061580657958984375, -0.05599021911621094, -0.0503997802734375, -0.04480934143066406, -0.039218902587890625, -0.03362846374511719, -0.02803802490234375, -0.022447586059570312, -0.016857147216796875, -0.011266708374023438, -0.00567626953125, -8.58306884765625e-05, 0.005504608154296875, 0.011095046997070312, 0.01668548583984375, 0.022275924682617188, 0.027866363525390625, 0.03345680236816406, 0.0390472412109375, 0.04463768005371094, 0.050228118896484375, 0.05581855773925781, 0.06140899658203125, 0.06699943542480469, 0.07258987426757812, 0.07818031311035156, 0.083770751953125, 0.08936119079589844, 0.09495162963867188, 0.10054206848144531, 0.10613250732421875, 0.11172294616699219, 0.11731338500976562, 0.12290382385253906, 0.1284942626953125, 0.13408470153808594, 0.13967514038085938, 0.1452655792236328, 0.15085601806640625, 0.1564464569091797, 0.16203689575195312, 0.16762733459472656, 0.1732177734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 7.0, 11.0, 10.0, 13.0, 16.0, 29.0, 27.0, 39.0, 54.0, 87.0, 127.0, 160.0, 136.0, 78.0, 60.0, 35.0, 17.0, 19.0, 16.0, 10.0, 9.0, 10.0, 6.0, 5.0, 5.0, 8.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.900331497192383e-05, -9.66126099228859e-05, -9.422190487384796e-05, -9.183119982481003e-05, -8.94404947757721e-05, -8.704978972673416e-05, -8.465908467769623e-05, -8.22683796286583e-05, -7.987767457962036e-05, -7.748696953058243e-05, -7.50962644815445e-05, -7.270555943250656e-05, -7.031485438346863e-05, -6.79241493344307e-05, -6.553344428539276e-05, -6.314273923635483e-05, -6.0752034187316895e-05, -5.836132913827896e-05, -5.597062408924103e-05, -5.3579919040203094e-05, -5.118921399116516e-05, -4.879850894212723e-05, -4.6407803893089294e-05, -4.401709884405136e-05, -4.162639379501343e-05, -3.9235688745975494e-05, -3.684498369693756e-05, -3.445427864789963e-05, -3.2063573598861694e-05, -2.967286854982376e-05, -2.7282163500785828e-05, -2.4891458451747894e-05, -2.250075340270996e-05, -2.0110048353672028e-05, -1.7719343304634094e-05, -1.532863825559616e-05, -1.2937933206558228e-05, -1.0547228157520294e-05, -8.15652310848236e-06, -5.7658180594444275e-06, -3.375113010406494e-06, -9.844079613685608e-07, 1.4062970876693726e-06, 3.797002136707306e-06, 6.187707185745239e-06, 8.578412234783173e-06, 1.0969117283821106e-05, 1.335982233285904e-05, 1.5750527381896973e-05, 1.8141232430934906e-05, 2.053193747997284e-05, 2.2922642529010773e-05, 2.5313347578048706e-05, 2.770405262708664e-05, 3.0094757676124573e-05, 3.2485462725162506e-05, 3.487616777420044e-05, 3.726687282323837e-05, 3.9657577872276306e-05, 4.204828292131424e-05, 4.443898797035217e-05, 4.6829693019390106e-05, 4.922039806842804e-05, 5.161110311746597e-05, 5.4001808166503906e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 4.0, 10.0, 23.0, 25.0, 34.0, 42.0, 53.0, 79.0, 116.0, 162.0, 261.0, 445.0, 833.0, 1518.0, 2993.0, 6322.0, 13882.0, 34152.0, 95058.0, 253053.0, 353626.0, 178279.0, 63362.0, 23961.0, 10389.0, 4641.0, 2326.0, 1173.0, 626.0, 407.0, 199.0, 137.0, 100.0, 66.0, 47.0, 38.0, 18.0, 24.0, 16.0, 17.0, 11.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.17333984375, -0.16797447204589844, -0.16260910034179688, -0.1572437286376953, -0.15187835693359375, -0.1465129852294922, -0.14114761352539062, -0.13578224182128906, -0.1304168701171875, -0.12505149841308594, -0.11968612670898438, -0.11432075500488281, -0.10895538330078125, -0.10359001159667969, -0.09822463989257812, -0.09285926818847656, -0.087493896484375, -0.08212852478027344, -0.07676315307617188, -0.07139778137207031, -0.06603240966796875, -0.06066703796386719, -0.055301666259765625, -0.04993629455566406, -0.0445709228515625, -0.03920555114746094, -0.033840179443359375, -0.028474807739257812, -0.02310943603515625, -0.017744064331054688, -0.012378692626953125, -0.0070133209228515625, -0.00164794921875, 0.0037174224853515625, 0.009082794189453125, 0.014448165893554688, 0.01981353759765625, 0.025178909301757812, 0.030544281005859375, 0.03590965270996094, 0.0412750244140625, 0.04664039611816406, 0.052005767822265625, 0.05737113952636719, 0.06273651123046875, 0.06810188293457031, 0.07346725463867188, 0.07883262634277344, 0.084197998046875, 0.08956336975097656, 0.09492874145507812, 0.10029411315917969, 0.10565948486328125, 0.11102485656738281, 0.11639022827148438, 0.12175559997558594, 0.1271209716796875, 0.13248634338378906, 0.13785171508789062, 0.1432170867919922, 0.14858245849609375, 0.1539478302001953, 0.15931320190429688, 0.16467857360839844, 0.1700439453125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 3.0, 10.0, 12.0, 9.0, 24.0, 28.0, 30.0, 41.0, 32.0, 49.0, 54.0, 74.0, 78.0, 84.0, 70.0, 65.0, 64.0, 44.0, 57.0, 39.0, 36.0, 18.0, 18.0, 13.0, 5.0, 6.0, 5.0, 4.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23681640625, -0.22997093200683594, -0.22312545776367188, -0.2162799835205078, -0.20943450927734375, -0.2025890350341797, -0.19574356079101562, -0.18889808654785156, -0.1820526123046875, -0.17520713806152344, -0.16836166381835938, -0.1615161895751953, -0.15467071533203125, -0.1478252410888672, -0.14097976684570312, -0.13413429260253906, -0.127288818359375, -0.12044334411621094, -0.11359786987304688, -0.10675239562988281, -0.09990692138671875, -0.09306144714355469, -0.08621597290039062, -0.07937049865722656, -0.0725250244140625, -0.06567955017089844, -0.058834075927734375, -0.05198860168457031, -0.04514312744140625, -0.03829765319824219, -0.031452178955078125, -0.024606704711914062, -0.01776123046875, -0.010915756225585938, -0.004070281982421875, 0.0027751922607421875, 0.00962066650390625, 0.016466140747070312, 0.023311614990234375, 0.030157089233398438, 0.0370025634765625, 0.04384803771972656, 0.050693511962890625, 0.05753898620605469, 0.06438446044921875, 0.07122993469238281, 0.07807540893554688, 0.08492088317871094, 0.091766357421875, 0.09861183166503906, 0.10545730590820312, 0.11230278015136719, 0.11914825439453125, 0.1259937286376953, 0.13283920288085938, 0.13968467712402344, 0.1465301513671875, 0.15337562561035156, 0.16022109985351562, 0.1670665740966797, 0.17391204833984375, 0.1807575225830078, 0.18760299682617188, 0.19444847106933594, 0.2012939453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 17.0, 29.0, 96.0, 180.0, 220.0, 202.0, 147.0, 64.0, 22.0, 9.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.009251117706299, -4.861154556274414, -4.713057994842529, -4.5649614334106445, -4.416865348815918, -4.268768787384033, -4.120672225952148, -3.9725756645202637, -3.824479103088379, -3.676382541656494, -3.5282859802246094, -3.3801896572113037, -3.232093095779419, -3.083996534347534, -2.9359002113342285, -2.7878036499023438, -2.639707088470459, -2.491610527038574, -2.3435139656066895, -2.195417642593384, -2.047321081161499, -1.8992245197296143, -1.751128077507019, -1.6030316352844238, -1.454935073852539, -1.3068385124206543, -1.158742070198059, -1.0106456279754639, -0.8625490665435791, -0.7144525647163391, -0.5663560628890991, -0.4182596206665039, -0.27016353607177734, -0.12206703424453735, 0.026029467582702637, 0.17412596940994263, 0.3222224712371826, 0.4703189730644226, 0.6184154748916626, 0.7665119171142578, 0.9146084785461426, 1.0627050399780273, 1.2108014822006226, 1.3588979244232178, 1.5069944858551025, 1.6550910472869873, 1.8031874895095825, 1.9512839317321777, 2.0993804931640625, 2.2474770545959473, 2.395573616027832, 2.5436699390411377, 2.6917665004730225, 2.8398630619049072, 2.987959384918213, 3.1360559463500977, 3.2841525077819824, 3.432249069213867, 3.580345630645752, 3.7284419536590576, 3.8765385150909424, 4.024634838104248, 4.172731399536133, 4.320827960968018, 4.468924522399902]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 4.0, 10.0, 3.0, 12.0, 8.0, 17.0, 19.0, 24.0, 19.0, 21.0, 30.0, 27.0, 30.0, 25.0, 34.0, 29.0, 43.0, 38.0, 55.0, 39.0, 26.0, 56.0, 51.0, 34.0, 49.0, 44.0, 38.0, 27.0, 29.0, 21.0, 17.0, 24.0, 13.0, 17.0, 11.0, 7.0, 6.0, 14.0, 7.0, 5.0, 3.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8780732154846191, -1.820070743560791, -1.762068271636963, -1.7040657997131348, -1.6460633277893066, -1.5880608558654785, -1.5300583839416504, -1.4720559120178223, -1.4140534400939941, -1.356050968170166, -1.298048496246338, -1.2400460243225098, -1.1820435523986816, -1.1240410804748535, -1.0660386085510254, -1.0080361366271973, -0.9500337243080139, -0.8920312523841858, -0.8340287804603577, -0.7760263085365295, -0.7180238366127014, -0.6600214242935181, -0.6020189523696899, -0.5440164804458618, -0.4860139787197113, -0.4280115067958832, -0.37000903487205505, -0.3120065927505493, -0.2540041208267212, -0.19600164890289307, -0.13799917697906494, -0.07999670505523682, -0.02199423313140869, 0.036008235067129135, 0.09401070326566696, 0.1520131677389145, 0.21001563966274261, 0.26801809668540955, 0.32602056860923767, 0.3840230405330658, 0.4420255124568939, 0.5000279545783997, 0.5580304265022278, 0.6160328984260559, 0.674035370349884, 0.7320378422737122, 0.7900403141975403, 0.8480427861213684, 0.9060452580451965, 0.9640477299690247, 1.022050142288208, 1.0800526142120361, 1.1380550861358643, 1.1960575580596924, 1.2540600299835205, 1.3120625019073486, 1.3700649738311768, 1.4280674457550049, 1.486069917678833, 1.5440723896026611, 1.6020748615264893, 1.6600773334503174, 1.7180798053741455, 1.7760822772979736, 1.8340847492218018]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 10.0, 7.0, 10.0, 13.0, 17.0, 22.0, 31.0, 45.0, 52.0, 100.0, 184.0, 393.0, 879.0, 2265.0, 5808.0, 15325.0, 42805.0, 137936.0, 561904.0, 1693543.0, 1269216.0, 329915.0, 87188.0, 29235.0, 10619.0, 3875.0, 1527.0, 630.0, 300.0, 143.0, 100.0, 36.0, 36.0, 33.0, 24.0, 7.0, 12.0, 9.0, 8.0, 1.0, 8.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.37841796875, -0.36652374267578125, -0.3546295166015625, -0.34273529052734375, -0.330841064453125, -0.31894683837890625, -0.3070526123046875, -0.29515838623046875, -0.28326416015625, -0.27136993408203125, -0.2594757080078125, -0.24758148193359375, -0.235687255859375, -0.22379302978515625, -0.2118988037109375, -0.20000457763671875, -0.1881103515625, -0.17621612548828125, -0.1643218994140625, -0.15242767333984375, -0.140533447265625, -0.12863922119140625, -0.1167449951171875, -0.10485076904296875, -0.09295654296875, -0.08106231689453125, -0.0691680908203125, -0.05727386474609375, -0.045379638671875, -0.03348541259765625, -0.0215911865234375, -0.00969696044921875, 0.002197265625, 0.01409149169921875, 0.0259857177734375, 0.03787994384765625, 0.049774169921875, 0.06166839599609375, 0.0735626220703125, 0.08545684814453125, 0.09735107421875, 0.10924530029296875, 0.1211395263671875, 0.13303375244140625, 0.144927978515625, 0.15682220458984375, 0.1687164306640625, 0.18061065673828125, 0.1925048828125, 0.20439910888671875, 0.2162933349609375, 0.22818756103515625, 0.240081787109375, 0.25197601318359375, 0.2638702392578125, 0.27576446533203125, 0.28765869140625, 0.29955291748046875, 0.3114471435546875, 0.32334136962890625, 0.335235595703125, 0.34712982177734375, 0.3590240478515625, 0.37091827392578125, 0.3828125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 1.0, 5.0, 2.0, 7.0, 9.0, 5.0, 9.0, 11.0, 9.0, 13.0, 16.0, 20.0, 17.0, 24.0, 22.0, 19.0, 29.0, 38.0, 39.0, 35.0, 35.0, 39.0, 29.0, 45.0, 42.0, 39.0, 35.0, 39.0, 38.0, 35.0, 31.0, 31.0, 24.0, 20.0, 28.0, 21.0, 19.0, 21.0, 13.0, 14.0, 18.0, 16.0, 2.0, 8.0, 6.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2186279296875, -0.211456298828125, -0.20428466796875, -0.197113037109375, -0.18994140625, -0.182769775390625, -0.17559814453125, -0.168426513671875, -0.1612548828125, -0.154083251953125, -0.14691162109375, -0.139739990234375, -0.132568359375, -0.125396728515625, -0.11822509765625, -0.111053466796875, -0.1038818359375, -0.096710205078125, -0.08953857421875, -0.082366943359375, -0.0751953125, -0.068023681640625, -0.06085205078125, -0.053680419921875, -0.0465087890625, -0.039337158203125, -0.03216552734375, -0.024993896484375, -0.017822265625, -0.010650634765625, -0.00347900390625, 0.003692626953125, 0.0108642578125, 0.018035888671875, 0.02520751953125, 0.032379150390625, 0.03955078125, 0.046722412109375, 0.05389404296875, 0.061065673828125, 0.0682373046875, 0.075408935546875, 0.08258056640625, 0.089752197265625, 0.096923828125, 0.104095458984375, 0.11126708984375, 0.118438720703125, 0.1256103515625, 0.132781982421875, 0.13995361328125, 0.147125244140625, 0.154296875, 0.161468505859375, 0.16864013671875, 0.175811767578125, 0.1829833984375, 0.190155029296875, 0.19732666015625, 0.204498291015625, 0.211669921875, 0.218841552734375, 0.22601318359375, 0.233184814453125, 0.2403564453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 9.0, 18.0, 22.0, 54.0, 58.0, 121.0, 199.0, 378.0, 662.0, 1335.0, 2962.0, 7414.0, 23105.0, 85013.0, 398170.0, 2389776.0, 1052696.0, 169273.0, 42078.0, 12422.0, 4410.0, 1929.0, 957.0, 503.0, 278.0, 137.0, 89.0, 68.0, 41.0, 27.0, 20.0, 7.0, 13.0, 10.0, 5.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5774078369140625, -0.558624267578125, -0.5398406982421875, -0.52105712890625, -0.5022735595703125, -0.483489990234375, -0.4647064208984375, -0.4459228515625, -0.4271392822265625, -0.408355712890625, -0.3895721435546875, -0.37078857421875, -0.3520050048828125, -0.333221435546875, -0.3144378662109375, -0.295654296875, -0.2768707275390625, -0.258087158203125, -0.2393035888671875, -0.22052001953125, -0.2017364501953125, -0.182952880859375, -0.1641693115234375, -0.1453857421875, -0.1266021728515625, -0.107818603515625, -0.0890350341796875, -0.07025146484375, -0.0514678955078125, -0.032684326171875, -0.0139007568359375, 0.0048828125, 0.0236663818359375, 0.042449951171875, 0.0612335205078125, 0.08001708984375, 0.0988006591796875, 0.117584228515625, 0.1363677978515625, 0.1551513671875, 0.1739349365234375, 0.192718505859375, 0.2115020751953125, 0.23028564453125, 0.2490692138671875, 0.267852783203125, 0.2866363525390625, 0.305419921875, 0.3242034912109375, 0.342987060546875, 0.3617706298828125, 0.38055419921875, 0.3993377685546875, 0.418121337890625, 0.4369049072265625, 0.4556884765625, 0.4744720458984375, 0.493255615234375, 0.5120391845703125, 0.53082275390625, 0.5496063232421875, 0.568389892578125, 0.5871734619140625, 0.60595703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 14.0, 3.0, 14.0, 13.0, 18.0, 22.0, 32.0, 54.0, 57.0, 66.0, 92.0, 143.0, 211.0, 291.0, 420.0, 528.0, 546.0, 450.0, 309.0, 223.0, 133.0, 101.0, 68.0, 59.0, 60.0, 28.0, 29.0, 20.0, 14.0, 10.0, 13.0, 3.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4765625, -0.459564208984375, -0.44256591796875, -0.425567626953125, -0.4085693359375, -0.391571044921875, -0.37457275390625, -0.357574462890625, -0.340576171875, -0.323577880859375, -0.30657958984375, -0.289581298828125, -0.2725830078125, -0.255584716796875, -0.23858642578125, -0.221588134765625, -0.20458984375, -0.187591552734375, -0.17059326171875, -0.153594970703125, -0.1365966796875, -0.119598388671875, -0.10260009765625, -0.085601806640625, -0.068603515625, -0.051605224609375, -0.03460693359375, -0.017608642578125, -0.0006103515625, 0.016387939453125, 0.03338623046875, 0.050384521484375, 0.0673828125, 0.084381103515625, 0.10137939453125, 0.118377685546875, 0.1353759765625, 0.152374267578125, 0.16937255859375, 0.186370849609375, 0.203369140625, 0.220367431640625, 0.23736572265625, 0.254364013671875, 0.2713623046875, 0.288360595703125, 0.30535888671875, 0.322357177734375, 0.33935546875, 0.356353759765625, 0.37335205078125, 0.390350341796875, 0.4073486328125, 0.424346923828125, 0.44134521484375, 0.458343505859375, 0.475341796875, 0.492340087890625, 0.50933837890625, 0.526336669921875, 0.5433349609375, 0.560333251953125, 0.57733154296875, 0.594329833984375, 0.611328125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 18.0, 25.0, 51.0, 91.0, 154.0, 173.0, 188.0, 145.0, 83.0, 33.0, 17.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9025442600250244, -2.7388224601745605, -2.5751004219055176, -2.4113783836364746, -2.2476565837860107, -2.083934783935547, -1.920212745666504, -1.7564908266067505, -1.592768907546997, -1.4290469884872437, -1.2653250694274902, -1.1016031503677368, -0.9378812313079834, -0.77415931224823, -0.6104373931884766, -0.44671547412872314, -0.2829935550689697, -0.11927163600921631, 0.04445028305053711, 0.20817220211029053, 0.37189412117004395, 0.5356160402297974, 0.6993379592895508, 0.8630598783493042, 1.0267817974090576, 1.190503716468811, 1.3542256355285645, 1.5179475545883179, 1.6816694736480713, 1.8453913927078247, 2.009113311767578, 2.172835350036621, 2.336557388305664, 2.500279426574707, 2.664001226425171, 2.8277230262756348, 2.9914450645446777, 3.1551671028137207, 3.3188889026641846, 3.4826107025146484, 3.6463327407836914, 3.8100547790527344, 3.9737765789031982, 4.137498378753662, 4.301220417022705, 4.464942455291748, 4.628664016723633, 4.792386054992676, 4.956108093261719, 5.119830131530762, 5.283552169799805, 5.4472737312316895, 5.610995769500732, 5.774717807769775, 5.93843936920166, 6.102161407470703, 6.265883445739746, 6.429605484008789, 6.593327522277832, 6.757049083709717, 6.92077112197876, 7.084493160247803, 7.2482147216796875, 7.4119367599487305, 7.575658798217773]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 6.0, 5.0, 10.0, 14.0, 18.0, 20.0, 29.0, 29.0, 45.0, 38.0, 42.0, 57.0, 31.0, 43.0, 47.0, 50.0, 45.0, 58.0, 48.0, 59.0, 33.0, 35.0, 34.0, 35.0, 35.0, 17.0, 18.0, 16.0, 16.0, 11.0, 10.0, 10.0, 2.0, 3.0, 4.0, 7.0, 5.0, 0.0, 3.0, 2.0, 3.0, 1.0], "bins": [-2.575913429260254, -2.5085458755493164, -2.441178321838379, -2.3738107681274414, -2.306443214416504, -2.2390758991241455, -2.171708345413208, -2.1043407917022705, -2.036973237991333, -1.9696056842803955, -1.902238130569458, -1.83487069606781, -1.7675031423568726, -1.700135588645935, -1.632768154144287, -1.5654006004333496, -1.498033046722412, -1.4306654930114746, -1.363297939300537, -1.2959305047988892, -1.2285629510879517, -1.1611953973770142, -1.0938279628753662, -1.0264604091644287, -0.9590928554534912, -0.8917253017425537, -0.824357807636261, -0.7569903135299683, -0.6896227598190308, -0.6222552061080933, -0.5548877120018005, -0.4875201880931854, -0.4201526641845703, -0.3527851402759552, -0.2854176163673401, -0.21805009245872498, -0.15068256855010986, -0.08331504464149475, -0.01594752073287964, 0.051420003175735474, 0.11878752708435059, 0.1861550509929657, 0.2535225749015808, 0.3208900988101959, 0.38825762271881104, 0.45562514662742615, 0.5229926705360413, 0.590360164642334, 0.6577277183532715, 0.725095272064209, 0.7924627661705017, 0.8598302602767944, 0.9271978139877319, 0.9945653676986694, 1.0619328022003174, 1.1293003559112549, 1.1966679096221924, 1.2640354633331299, 1.3314030170440674, 1.3987704515457153, 1.4661380052566528, 1.5335055589675903, 1.6008729934692383, 1.6682405471801758, 1.7356081008911133]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 12.0, 13.0, 18.0, 30.0, 39.0, 66.0, 91.0, 164.0, 323.0, 570.0, 1118.0, 2231.0, 4623.0, 10036.0, 23311.0, 56035.0, 129886.0, 233217.0, 265266.0, 175900.0, 83218.0, 34849.0, 14583.0, 6671.0, 3031.0, 1520.0, 779.0, 398.0, 208.0, 140.0, 76.0, 36.0, 41.0, 20.0, 17.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.328369140625, -0.3187751770019531, -0.30918121337890625, -0.2995872497558594, -0.2899932861328125, -0.2803993225097656, -0.27080535888671875, -0.2612113952636719, -0.251617431640625, -0.24202346801757812, -0.23242950439453125, -0.22283554077148438, -0.2132415771484375, -0.20364761352539062, -0.19405364990234375, -0.18445968627929688, -0.17486572265625, -0.16527175903320312, -0.15567779541015625, -0.14608383178710938, -0.1364898681640625, -0.12689590454101562, -0.11730194091796875, -0.10770797729492188, -0.098114013671875, -0.08852005004882812, -0.07892608642578125, -0.06933212280273438, -0.0597381591796875, -0.050144195556640625, -0.04055023193359375, -0.030956268310546875, -0.0213623046875, -0.011768341064453125, -0.00217437744140625, 0.007419586181640625, 0.0170135498046875, 0.026607513427734375, 0.03620147705078125, 0.045795440673828125, 0.055389404296875, 0.06498336791992188, 0.07457733154296875, 0.08417129516601562, 0.0937652587890625, 0.10335922241210938, 0.11295318603515625, 0.12254714965820312, 0.13214111328125, 0.14173507690429688, 0.15132904052734375, 0.16092300415039062, 0.1705169677734375, 0.18011093139648438, 0.18970489501953125, 0.19929885864257812, 0.208892822265625, 0.21848678588867188, 0.22808074951171875, 0.23767471313476562, 0.2472686767578125, 0.2568626403808594, 0.26645660400390625, 0.2760505676269531, 0.28564453125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 7.0, 12.0, 7.0, 11.0, 6.0, 8.0, 18.0, 23.0, 14.0, 29.0, 31.0, 29.0, 29.0, 30.0, 39.0, 31.0, 32.0, 50.0, 38.0, 28.0, 29.0, 37.0, 44.0, 35.0, 34.0, 40.0, 31.0, 25.0, 31.0, 33.0, 29.0, 21.0, 17.0, 15.0, 25.0, 19.0, 11.0, 9.0, 11.0, 5.0, 5.0, 8.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1976318359375, -0.19067001342773438, -0.18370819091796875, -0.17674636840820312, -0.1697845458984375, -0.16282272338867188, -0.15586090087890625, -0.14889907836914062, -0.141937255859375, -0.13497543334960938, -0.12801361083984375, -0.12105178833007812, -0.1140899658203125, -0.10712814331054688, -0.10016632080078125, -0.09320449829101562, -0.08624267578125, -0.07928085327148438, -0.07231903076171875, -0.06535720825195312, -0.0583953857421875, -0.051433563232421875, -0.04447174072265625, -0.037509918212890625, -0.030548095703125, -0.023586273193359375, -0.01662445068359375, -0.009662628173828125, -0.0027008056640625, 0.004261016845703125, 0.01122283935546875, 0.018184661865234375, 0.025146484375, 0.032108306884765625, 0.03907012939453125, 0.046031951904296875, 0.0529937744140625, 0.059955596923828125, 0.06691741943359375, 0.07387924194335938, 0.080841064453125, 0.08780288696289062, 0.09476470947265625, 0.10172653198242188, 0.1086883544921875, 0.11565017700195312, 0.12261199951171875, 0.12957382202148438, 0.13653564453125, 0.14349746704101562, 0.15045928955078125, 0.15742111206054688, 0.1643829345703125, 0.17134475708007812, 0.17830657958984375, 0.18526840209960938, 0.192230224609375, 0.19919204711914062, 0.20615386962890625, 0.21311569213867188, 0.2200775146484375, 0.22703933715820312, 0.23400115966796875, 0.24096298217773438, 0.2479248046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 8.0, 18.0, 21.0, 23.0, 43.0, 62.0, 78.0, 125.0, 219.0, 408.0, 787.0, 1723.0, 3919.0, 9232.0, 23914.0, 69961.0, 196517.0, 348962.0, 245736.0, 93648.0, 32215.0, 11884.0, 4796.0, 2054.0, 964.0, 508.0, 254.0, 149.0, 88.0, 66.0, 43.0, 27.0, 22.0, 11.0, 15.0, 11.0, 4.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.44287109375, -0.430084228515625, -0.41729736328125, -0.404510498046875, -0.3917236328125, -0.378936767578125, -0.36614990234375, -0.353363037109375, -0.340576171875, -0.327789306640625, -0.31500244140625, -0.302215576171875, -0.2894287109375, -0.276641845703125, -0.26385498046875, -0.251068115234375, -0.23828125, -0.225494384765625, -0.21270751953125, -0.199920654296875, -0.1871337890625, -0.174346923828125, -0.16156005859375, -0.148773193359375, -0.135986328125, -0.123199462890625, -0.11041259765625, -0.097625732421875, -0.0848388671875, -0.072052001953125, -0.05926513671875, -0.046478271484375, -0.03369140625, -0.020904541015625, -0.00811767578125, 0.004669189453125, 0.0174560546875, 0.030242919921875, 0.04302978515625, 0.055816650390625, 0.068603515625, 0.081390380859375, 0.09417724609375, 0.106964111328125, 0.1197509765625, 0.132537841796875, 0.14532470703125, 0.158111572265625, 0.1708984375, 0.183685302734375, 0.19647216796875, 0.209259033203125, 0.2220458984375, 0.234832763671875, 0.24761962890625, 0.260406494140625, 0.273193359375, 0.285980224609375, 0.29876708984375, 0.311553955078125, 0.3243408203125, 0.337127685546875, 0.34991455078125, 0.362701416015625, 0.37548828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 5.0, 7.0, 3.0, 8.0, 9.0, 17.0, 19.0, 17.0, 24.0, 25.0, 24.0, 26.0, 29.0, 34.0, 34.0, 34.0, 35.0, 30.0, 32.0, 46.0, 54.0, 35.0, 31.0, 37.0, 39.0, 32.0, 31.0, 30.0, 36.0, 22.0, 29.0, 20.0, 21.0, 16.0, 19.0, 14.0, 16.0, 7.0, 3.0, 12.0, 4.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.6552734375, -0.6363677978515625, -0.617462158203125, -0.5985565185546875, -0.57965087890625, -0.5607452392578125, -0.541839599609375, -0.5229339599609375, -0.5040283203125, -0.4851226806640625, -0.466217041015625, -0.4473114013671875, -0.42840576171875, -0.4095001220703125, -0.390594482421875, -0.3716888427734375, -0.352783203125, -0.3338775634765625, -0.314971923828125, -0.2960662841796875, -0.27716064453125, -0.2582550048828125, -0.239349365234375, -0.2204437255859375, -0.2015380859375, -0.1826324462890625, -0.163726806640625, -0.1448211669921875, -0.12591552734375, -0.1070098876953125, -0.088104248046875, -0.0691986083984375, -0.05029296875, -0.0313873291015625, -0.012481689453125, 0.0064239501953125, 0.02532958984375, 0.0442352294921875, 0.063140869140625, 0.0820465087890625, 0.1009521484375, 0.1198577880859375, 0.138763427734375, 0.1576690673828125, 0.17657470703125, 0.1954803466796875, 0.214385986328125, 0.2332916259765625, 0.252197265625, 0.2711029052734375, 0.290008544921875, 0.3089141845703125, 0.32781982421875, 0.3467254638671875, 0.365631103515625, 0.3845367431640625, 0.4034423828125, 0.4223480224609375, 0.441253662109375, 0.4601593017578125, 0.47906494140625, 0.4979705810546875, 0.516876220703125, 0.5357818603515625, 0.5546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 5.0, 3.0, 11.0, 8.0, 17.0, 28.0, 29.0, 56.0, 78.0, 155.0, 217.0, 387.0, 734.0, 1417.0, 3037.0, 6742.0, 15578.0, 38777.0, 98407.0, 232189.0, 322014.0, 194739.0, 78806.0, 31234.0, 12981.0, 5645.0, 2562.0, 1246.0, 604.0, 327.0, 201.0, 96.0, 68.0, 49.0, 36.0, 12.0, 17.0, 9.0, 10.0, 8.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1580810546875, -0.1528778076171875, -0.147674560546875, -0.1424713134765625, -0.13726806640625, -0.1320648193359375, -0.126861572265625, -0.1216583251953125, -0.116455078125, -0.1112518310546875, -0.106048583984375, -0.1008453369140625, -0.09564208984375, -0.0904388427734375, -0.085235595703125, -0.0800323486328125, -0.0748291015625, -0.0696258544921875, -0.064422607421875, -0.0592193603515625, -0.05401611328125, -0.0488128662109375, -0.043609619140625, -0.0384063720703125, -0.033203125, -0.0279998779296875, -0.022796630859375, -0.0175933837890625, -0.01239013671875, -0.0071868896484375, -0.001983642578125, 0.0032196044921875, 0.0084228515625, 0.0136260986328125, 0.018829345703125, 0.0240325927734375, 0.02923583984375, 0.0344390869140625, 0.039642333984375, 0.0448455810546875, 0.050048828125, 0.0552520751953125, 0.060455322265625, 0.0656585693359375, 0.07086181640625, 0.0760650634765625, 0.081268310546875, 0.0864715576171875, 0.0916748046875, 0.0968780517578125, 0.102081298828125, 0.1072845458984375, 0.11248779296875, 0.1176910400390625, 0.122894287109375, 0.1280975341796875, 0.13330078125, 0.1385040283203125, 0.143707275390625, 0.1489105224609375, 0.15411376953125, 0.1593170166015625, 0.164520263671875, 0.1697235107421875, 0.1749267578125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 7.0, 3.0, 10.0, 17.0, 12.0, 26.0, 27.0, 34.0, 27.0, 53.0, 57.0, 54.0, 76.0, 83.0, 91.0, 65.0, 66.0, 44.0, 46.0, 44.0, 29.0, 28.0, 15.0, 19.0, 12.0, 9.0, 8.0, 6.0, 3.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.07099723815918e-05, -3.935955464839935e-05, -3.800913691520691e-05, -3.6658719182014465e-05, -3.530830144882202e-05, -3.395788371562958e-05, -3.2607465982437134e-05, -3.125704824924469e-05, -2.9906630516052246e-05, -2.8556212782859802e-05, -2.720579504966736e-05, -2.5855377316474915e-05, -2.450495958328247e-05, -2.3154541850090027e-05, -2.1804124116897583e-05, -2.045370638370514e-05, -1.9103288650512695e-05, -1.775287091732025e-05, -1.6402453184127808e-05, -1.5052035450935364e-05, -1.370161771774292e-05, -1.2351199984550476e-05, -1.1000782251358032e-05, -9.650364518165588e-06, -8.299946784973145e-06, -6.949529051780701e-06, -5.599111318588257e-06, -4.248693585395813e-06, -2.898275852203369e-06, -1.5478581190109253e-06, -1.9744038581848145e-07, 1.1529773473739624e-06, 2.5033950805664062e-06, 3.85381281375885e-06, 5.204230546951294e-06, 6.554648280143738e-06, 7.905066013336182e-06, 9.255483746528625e-06, 1.060590147972107e-05, 1.1956319212913513e-05, 1.3306736946105957e-05, 1.4657154679298401e-05, 1.6007572412490845e-05, 1.735799014568329e-05, 1.8708407878875732e-05, 2.0058825612068176e-05, 2.140924334526062e-05, 2.2759661078453064e-05, 2.4110078811645508e-05, 2.546049654483795e-05, 2.6810914278030396e-05, 2.816133201122284e-05, 2.9511749744415283e-05, 3.086216747760773e-05, 3.221258521080017e-05, 3.3563002943992615e-05, 3.491342067718506e-05, 3.62638384103775e-05, 3.7614256143569946e-05, 3.896467387676239e-05, 4.0315091609954834e-05, 4.166550934314728e-05, 4.301592707633972e-05, 4.4366344809532166e-05, 4.571676254272461e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 8.0, 9.0, 16.0, 17.0, 37.0, 55.0, 98.0, 177.0, 233.0, 471.0, 883.0, 1594.0, 3696.0, 8788.0, 21493.0, 54856.0, 135787.0, 272025.0, 288124.0, 154521.0, 62881.0, 24512.0, 10089.0, 4110.0, 1844.0, 934.0, 535.0, 280.0, 155.0, 93.0, 77.0, 53.0, 29.0, 16.0, 21.0, 7.0, 10.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.183837890625, -0.17859649658203125, -0.1733551025390625, -0.16811370849609375, -0.162872314453125, -0.15763092041015625, -0.1523895263671875, -0.14714813232421875, -0.14190673828125, -0.13666534423828125, -0.1314239501953125, -0.12618255615234375, -0.120941162109375, -0.11569976806640625, -0.1104583740234375, -0.10521697998046875, -0.0999755859375, -0.09473419189453125, -0.0894927978515625, -0.08425140380859375, -0.079010009765625, -0.07376861572265625, -0.0685272216796875, -0.06328582763671875, -0.05804443359375, -0.05280303955078125, -0.0475616455078125, -0.04232025146484375, -0.037078857421875, -0.03183746337890625, -0.0265960693359375, -0.02135467529296875, -0.01611328125, -0.01087188720703125, -0.0056304931640625, -0.00038909912109375, 0.004852294921875, 0.01009368896484375, 0.0153350830078125, 0.02057647705078125, 0.02581787109375, 0.03105926513671875, 0.0363006591796875, 0.04154205322265625, 0.046783447265625, 0.05202484130859375, 0.0572662353515625, 0.06250762939453125, 0.0677490234375, 0.07299041748046875, 0.0782318115234375, 0.08347320556640625, 0.088714599609375, 0.09395599365234375, 0.0991973876953125, 0.10443878173828125, 0.10968017578125, 0.11492156982421875, 0.1201629638671875, 0.12540435791015625, 0.130645751953125, 0.13588714599609375, 0.1411285400390625, 0.14636993408203125, 0.151611328125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 5.0, 4.0, 4.0, 7.0, 9.0, 6.0, 12.0, 16.0, 12.0, 20.0, 17.0, 39.0, 38.0, 35.0, 45.0, 58.0, 44.0, 62.0, 70.0, 67.0, 48.0, 52.0, 56.0, 49.0, 32.0, 32.0, 27.0, 21.0, 17.0, 24.0, 16.0, 6.0, 6.0, 5.0, 3.0, 5.0, 6.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.147705078125, -0.1431713104248047, -0.13863754272460938, -0.13410377502441406, -0.12957000732421875, -0.12503623962402344, -0.12050247192382812, -0.11596870422363281, -0.1114349365234375, -0.10690116882324219, -0.10236740112304688, -0.09783363342285156, -0.09329986572265625, -0.08876609802246094, -0.08423233032226562, -0.07969856262207031, -0.075164794921875, -0.07063102722167969, -0.06609725952148438, -0.06156349182128906, -0.05702972412109375, -0.05249595642089844, -0.047962188720703125, -0.04342842102050781, -0.0388946533203125, -0.03436088562011719, -0.029827117919921875, -0.025293350219726562, -0.02075958251953125, -0.016225814819335938, -0.011692047119140625, -0.0071582794189453125, -0.00262451171875, 0.0019092559814453125, 0.006443023681640625, 0.010976791381835938, 0.01551055908203125, 0.020044326782226562, 0.024578094482421875, 0.029111862182617188, 0.0336456298828125, 0.03817939758300781, 0.042713165283203125, 0.04724693298339844, 0.05178070068359375, 0.05631446838378906, 0.060848236083984375, 0.06538200378417969, 0.069915771484375, 0.07444953918457031, 0.07898330688476562, 0.08351707458496094, 0.08805084228515625, 0.09258460998535156, 0.09711837768554688, 0.10165214538574219, 0.1061859130859375, 0.11071968078613281, 0.11525344848632812, 0.11978721618652344, 0.12432098388671875, 0.12885475158691406, 0.13338851928710938, 0.1379222869873047, 0.1424560546875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 13.0, 31.0, 133.0, 303.0, 325.0, 136.0, 49.0, 13.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.125173568725586, -2.9417195320129395, -2.758265256881714, -2.5748112201690674, -2.391356945037842, -2.2079029083251953, -2.024448871612549, -1.8409947156906128, -1.6575405597686768, -1.4740864038467407, -1.2906322479248047, -1.1071782112121582, -0.9237240552902222, -0.7402698993682861, -0.5568158626556396, -0.3733617067337036, -0.18990755081176758, -0.006453424692153931, 0.17700070142745972, 0.360454797744751, 0.543908953666687, 0.727363109588623, 0.9108171463012695, 1.0942713022232056, 1.2777254581451416, 1.4611796140670776, 1.6446337699890137, 1.8280878067016602, 2.0115418434143066, 2.1949961185455322, 2.3784501552581787, 2.5619044303894043, 2.745358467102051, 2.9288125038146973, 3.112266778945923, 3.2957208156585693, 3.479175090789795, 3.6626291275024414, 3.846083164215088, 4.029537200927734, 4.212991714477539, 4.3964457511901855, 4.579899787902832, 4.763354301452637, 4.946808338165283, 5.13026237487793, 5.313716411590576, 5.497170448303223, 5.680624485015869, 5.864078521728516, 6.047532558441162, 6.230986595153809, 6.414441108703613, 6.59789514541626, 6.781349182128906, 6.964803218841553, 7.148257255554199, 7.331711292266846, 7.515165328979492, 7.698619842529297, 7.882073879241943, 8.06552791595459, 8.248981475830078, 8.432435989379883, 8.615890502929688]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 9.0, 10.0, 15.0, 6.0, 16.0, 21.0, 27.0, 22.0, 34.0, 26.0, 26.0, 32.0, 35.0, 37.0, 31.0, 38.0, 41.0, 46.0, 28.0, 49.0, 42.0, 48.0, 41.0, 39.0, 34.0, 31.0, 27.0, 24.0, 27.0, 31.0, 12.0, 19.0, 13.0, 12.0, 7.0, 12.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.80169677734375, -1.7469565868377686, -1.6922165155410767, -1.6374764442443848, -1.5827362537384033, -1.5279960632324219, -1.47325599193573, -1.418515920639038, -1.3637757301330566, -1.3090355396270752, -1.2542954683303833, -1.1995553970336914, -1.14481520652771, -1.0900750160217285, -1.0353349447250366, -0.9805948138237, -0.9258546829223633, -0.8711145520210266, -0.8163744211196899, -0.7616342902183533, -0.7068941593170166, -0.6521540284156799, -0.5974138975143433, -0.5426737666130066, -0.4879336357116699, -0.43319350481033325, -0.3784533739089966, -0.3237132430076599, -0.26897311210632324, -0.21423298120498657, -0.1594928503036499, -0.10475271940231323, -0.05001258850097656, 0.004727542400360107, 0.05946767330169678, 0.11420780420303345, 0.16894793510437012, 0.2236880660057068, 0.27842819690704346, 0.3331683278083801, 0.3879084587097168, 0.44264858961105347, 0.49738872051239014, 0.5521288514137268, 0.6068689823150635, 0.6616091132164001, 0.7163492441177368, 0.7710893750190735, 0.8258295059204102, 0.8805696368217468, 0.9353097677230835, 0.9900498986244202, 1.0447900295257568, 1.0995302200317383, 1.1542702913284302, 1.209010362625122, 1.2637505531311035, 1.318490743637085, 1.3732308149337769, 1.4279708862304688, 1.4827110767364502, 1.5374512672424316, 1.5921913385391235, 1.6469314098358154, 1.7016716003417969]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 7.0, 3.0, 5.0, 10.0, 11.0, 24.0, 17.0, 38.0, 36.0, 48.0, 89.0, 117.0, 184.0, 395.0, 846.0, 2288.0, 7613.0, 33460.0, 194052.0, 1238050.0, 2105048.0, 511361.0, 78762.0, 15502.0, 3909.0, 1239.0, 516.0, 241.0, 126.0, 81.0, 48.0, 50.0, 23.0, 22.0, 10.0, 12.0, 9.0, 8.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49365234375, -0.4792366027832031, -0.46482086181640625, -0.4504051208496094, -0.4359893798828125, -0.4215736389160156, -0.40715789794921875, -0.3927421569824219, -0.378326416015625, -0.3639106750488281, -0.34949493408203125, -0.3350791931152344, -0.3206634521484375, -0.3062477111816406, -0.29183197021484375, -0.2774162292480469, -0.26300048828125, -0.24858474731445312, -0.23416900634765625, -0.21975326538085938, -0.2053375244140625, -0.19092178344726562, -0.17650604248046875, -0.16209030151367188, -0.147674560546875, -0.13325881958007812, -0.11884307861328125, -0.10442733764648438, -0.0900115966796875, -0.07559585571289062, -0.06118011474609375, -0.046764373779296875, -0.0323486328125, -0.017932891845703125, -0.00351715087890625, 0.010898590087890625, 0.0253143310546875, 0.039730072021484375, 0.05414581298828125, 0.06856155395507812, 0.082977294921875, 0.09739303588867188, 0.11180877685546875, 0.12622451782226562, 0.1406402587890625, 0.15505599975585938, 0.16947174072265625, 0.18388748168945312, 0.19830322265625, 0.21271896362304688, 0.22713470458984375, 0.24155044555664062, 0.2559661865234375, 0.2703819274902344, 0.28479766845703125, 0.2992134094238281, 0.313629150390625, 0.3280448913574219, 0.34246063232421875, 0.3568763732910156, 0.3712921142578125, 0.3857078552246094, 0.40012359619140625, 0.4145393371582031, 0.428955078125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 4.0, 5.0, 7.0, 10.0, 13.0, 7.0, 22.0, 17.0, 19.0, 18.0, 23.0, 29.0, 31.0, 28.0, 30.0, 35.0, 43.0, 34.0, 67.0, 44.0, 47.0, 42.0, 37.0, 43.0, 42.0, 34.0, 39.0, 43.0, 23.0, 27.0, 28.0, 26.0, 19.0, 14.0, 7.0, 10.0, 6.0, 7.0, 4.0, 1.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27685546875, -0.26827239990234375, -0.2596893310546875, -0.25110626220703125, -0.242523193359375, -0.23394012451171875, -0.2253570556640625, -0.21677398681640625, -0.20819091796875, -0.19960784912109375, -0.1910247802734375, -0.18244171142578125, -0.173858642578125, -0.16527557373046875, -0.1566925048828125, -0.14810943603515625, -0.1395263671875, -0.13094329833984375, -0.1223602294921875, -0.11377716064453125, -0.105194091796875, -0.09661102294921875, -0.0880279541015625, -0.07944488525390625, -0.07086181640625, -0.06227874755859375, -0.0536956787109375, -0.04511260986328125, -0.036529541015625, -0.02794647216796875, -0.0193634033203125, -0.01078033447265625, -0.002197265625, 0.00638580322265625, 0.0149688720703125, 0.02355194091796875, 0.032135009765625, 0.04071807861328125, 0.0493011474609375, 0.05788421630859375, 0.06646728515625, 0.07505035400390625, 0.0836334228515625, 0.09221649169921875, 0.100799560546875, 0.10938262939453125, 0.1179656982421875, 0.12654876708984375, 0.1351318359375, 0.14371490478515625, 0.1522979736328125, 0.16088104248046875, 0.169464111328125, 0.17804718017578125, 0.1866302490234375, 0.19521331787109375, 0.20379638671875, 0.21237945556640625, 0.2209625244140625, 0.22954559326171875, 0.238128662109375, 0.24671173095703125, 0.2552947998046875, 0.26387786865234375, 0.2724609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 11.0, 7.0, 12.0, 24.0, 42.0, 47.0, 78.0, 118.0, 179.0, 302.0, 569.0, 1021.0, 2117.0, 5606.0, 16735.0, 60251.0, 294149.0, 2053007.0, 1487028.0, 205467.0, 45712.0, 13099.0, 4692.0, 1893.0, 907.0, 492.0, 280.0, 148.0, 88.0, 58.0, 44.0, 37.0, 15.0, 11.0, 9.0, 8.0, 1.0, 2.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.497314453125, -0.4817237854003906, -0.46613311767578125, -0.4505424499511719, -0.4349517822265625, -0.4193611145019531, -0.40377044677734375, -0.3881797790527344, -0.372589111328125, -0.3569984436035156, -0.34140777587890625, -0.3258171081542969, -0.3102264404296875, -0.2946357727050781, -0.27904510498046875, -0.2634544372558594, -0.24786376953125, -0.23227310180664062, -0.21668243408203125, -0.20109176635742188, -0.1855010986328125, -0.16991043090820312, -0.15431976318359375, -0.13872909545898438, -0.123138427734375, -0.10754776000976562, -0.09195709228515625, -0.07636642456054688, -0.0607757568359375, -0.045185089111328125, -0.02959442138671875, -0.014003753662109375, 0.0015869140625, 0.017177581787109375, 0.03276824951171875, 0.048358917236328125, 0.0639495849609375, 0.07954025268554688, 0.09513092041015625, 0.11072158813476562, 0.126312255859375, 0.14190292358398438, 0.15749359130859375, 0.17308425903320312, 0.1886749267578125, 0.20426559448242188, 0.21985626220703125, 0.23544692993164062, 0.25103759765625, 0.2666282653808594, 0.28221893310546875, 0.2978096008300781, 0.3134002685546875, 0.3289909362792969, 0.34458160400390625, 0.3601722717285156, 0.375762939453125, 0.3913536071777344, 0.40694427490234375, 0.4225349426269531, 0.4381256103515625, 0.4537162780761719, 0.46930694580078125, 0.4848976135253906, 0.50048828125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 8.0, 26.0, 29.0, 43.0, 60.0, 95.0, 138.0, 213.0, 388.0, 531.0, 672.0, 652.0, 428.0, 291.0, 158.0, 98.0, 63.0, 32.0, 35.0, 23.0, 15.0, 15.0, 13.0, 8.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.56787109375, -0.5504684448242188, -0.5330657958984375, -0.5156631469726562, -0.498260498046875, -0.48085784912109375, -0.4634552001953125, -0.44605255126953125, -0.42864990234375, -0.41124725341796875, -0.3938446044921875, -0.37644195556640625, -0.359039306640625, -0.34163665771484375, -0.3242340087890625, -0.30683135986328125, -0.2894287109375, -0.27202606201171875, -0.2546234130859375, -0.23722076416015625, -0.219818115234375, -0.20241546630859375, -0.1850128173828125, -0.16761016845703125, -0.15020751953125, -0.13280487060546875, -0.1154022216796875, -0.09799957275390625, -0.080596923828125, -0.06319427490234375, -0.0457916259765625, -0.02838897705078125, -0.010986328125, 0.00641632080078125, 0.0238189697265625, 0.04122161865234375, 0.058624267578125, 0.07602691650390625, 0.0934295654296875, 0.11083221435546875, 0.12823486328125, 0.14563751220703125, 0.1630401611328125, 0.18044281005859375, 0.197845458984375, 0.21524810791015625, 0.2326507568359375, 0.25005340576171875, 0.2674560546875, 0.28485870361328125, 0.3022613525390625, 0.31966400146484375, 0.337066650390625, 0.35446929931640625, 0.3718719482421875, 0.38927459716796875, 0.40667724609375, 0.42407989501953125, 0.4414825439453125, 0.45888519287109375, 0.476287841796875, 0.49369049072265625, 0.5110931396484375, 0.5284957885742188, 0.5458984375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 4.0, 7.0, 13.0, 30.0, 57.0, 85.0, 146.0, 129.0, 158.0, 152.0, 90.0, 57.0, 34.0, 16.0, 9.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4671103954315186, -3.3625025749206543, -3.257894992828369, -3.153287172317505, -3.0486793518066406, -2.9440717697143555, -2.839463949203491, -2.734856128692627, -2.630248546600342, -2.5256407260894775, -2.4210331439971924, -2.316425323486328, -2.211817502975464, -2.1072096824645996, -2.0026021003723145, -1.8979942798614502, -1.793386459350586, -1.6887787580490112, -1.584170937538147, -1.4795632362365723, -1.374955415725708, -1.2703477144241333, -1.1657400131225586, -1.0611321926116943, -0.9565244913101196, -0.8519167304039001, -0.7473089694976807, -0.642701268196106, -0.5380935072898865, -0.433485746383667, -0.3288780450820923, -0.2242702841758728, -0.11966228485107422, -0.01505453884601593, 0.08955320715904236, 0.19416093826293945, 0.29876869916915894, 0.4033764600753784, 0.5079841613769531, 0.6125919222831726, 0.7171996831893921, 0.8218074440956116, 0.926415205001831, 1.0310229063034058, 1.1356306076049805, 1.2402384281158447, 1.3448461294174194, 1.4494538307189941, 1.5540616512298584, 1.658669352531433, 1.7632771730422974, 1.867884874343872, 1.9724926948547363, 2.0771002769470215, 2.1817080974578857, 2.28631591796875, 2.390923500061035, 2.4955313205718994, 2.6001389026641846, 2.704746723175049, 2.809354543685913, 2.9139623641967773, 3.0185699462890625, 3.1231777667999268, 3.227785587310791]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 5.0, 6.0, 8.0, 6.0, 10.0, 17.0, 15.0, 21.0, 24.0, 24.0, 32.0, 26.0, 23.0, 29.0, 43.0, 41.0, 37.0, 43.0, 38.0, 46.0, 37.0, 43.0, 27.0, 40.0, 42.0, 26.0, 29.0, 33.0, 30.0, 29.0, 28.0, 30.0, 15.0, 19.0, 14.0, 12.0, 7.0, 11.0, 6.0, 3.0, 5.0, 5.0, 2.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.4681293964385986, -1.4269018173217773, -1.3856743574142456, -1.3444467782974243, -1.3032193183898926, -1.2619917392730713, -1.2207642793655396, -1.1795367002487183, -1.1383092403411865, -1.0970816612243652, -1.0558542013168335, -1.0146266222000122, -0.9733991622924805, -0.9321715831756592, -0.8909440636634827, -0.8497165441513062, -0.8084889650344849, -0.7672614455223083, -0.7260339260101318, -0.6848064064979553, -0.6435788869857788, -0.6023513078689575, -0.561123788356781, -0.5198962688446045, -0.478668749332428, -0.43744122982025146, -0.39621371030807495, -0.35498616099357605, -0.31375864148139954, -0.272531121969223, -0.23130358755588531, -0.1900760531425476, -0.1488485336303711, -0.10762100666761398, -0.06639347970485687, -0.025165952742099762, 0.01606157422065735, 0.05728909373283386, 0.09851662814617157, 0.13974416255950928, 0.1809716820716858, 0.2221992015838623, 0.2634267210960388, 0.3046542704105377, 0.34588178992271423, 0.38710930943489075, 0.42833685874938965, 0.46956437826156616, 0.5107918977737427, 0.5520194172859192, 0.5932469367980957, 0.6344744563102722, 0.6757019758224487, 0.71692955493927, 0.7581570744514465, 0.799384593963623, 0.8406121134757996, 0.8818396329879761, 0.9230671525001526, 0.9642946720123291, 1.0055222511291504, 1.0467497110366821, 1.0879772901535034, 1.1292047500610352, 1.1704323291778564]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 12.0, 16.0, 27.0, 25.0, 31.0, 48.0, 64.0, 117.0, 170.0, 270.0, 445.0, 712.0, 1135.0, 2105.0, 3597.0, 6349.0, 11993.0, 24709.0, 58479.0, 145657.0, 284903.0, 272446.0, 133199.0, 53508.0, 22964.0, 11125.0, 6155.0, 3426.0, 1918.0, 1114.0, 644.0, 401.0, 256.0, 151.0, 102.0, 67.0, 56.0, 26.0, 32.0, 25.0, 19.0, 12.0, 4.0, 7.0, 6.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.38671875, -0.3759613037109375, -0.365203857421875, -0.3544464111328125, -0.34368896484375, -0.3329315185546875, -0.322174072265625, -0.3114166259765625, -0.3006591796875, -0.2899017333984375, -0.279144287109375, -0.2683868408203125, -0.25762939453125, -0.2468719482421875, -0.236114501953125, -0.2253570556640625, -0.214599609375, -0.2038421630859375, -0.193084716796875, -0.1823272705078125, -0.17156982421875, -0.1608123779296875, -0.150054931640625, -0.1392974853515625, -0.1285400390625, -0.1177825927734375, -0.107025146484375, -0.0962677001953125, -0.08551025390625, -0.0747528076171875, -0.063995361328125, -0.0532379150390625, -0.04248046875, -0.0317230224609375, -0.020965576171875, -0.0102081298828125, 0.00054931640625, 0.0113067626953125, 0.022064208984375, 0.0328216552734375, 0.0435791015625, 0.0543365478515625, 0.065093994140625, 0.0758514404296875, 0.08660888671875, 0.0973663330078125, 0.108123779296875, 0.1188812255859375, 0.129638671875, 0.1403961181640625, 0.151153564453125, 0.1619110107421875, 0.17266845703125, 0.1834259033203125, 0.194183349609375, 0.2049407958984375, 0.2156982421875, 0.2264556884765625, 0.237213134765625, 0.2479705810546875, 0.25872802734375, 0.2694854736328125, 0.280242919921875, 0.2910003662109375, 0.3017578125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 7.0, 8.0, 14.0, 19.0, 4.0, 16.0, 17.0, 18.0, 18.0, 22.0, 23.0, 27.0, 29.0, 43.0, 41.0, 30.0, 41.0, 31.0, 47.0, 38.0, 44.0, 56.0, 35.0, 47.0, 36.0, 36.0, 35.0, 27.0, 35.0, 28.0, 24.0, 25.0, 20.0, 14.0, 11.0, 7.0, 11.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.281982421875, -0.2738456726074219, -0.26570892333984375, -0.2575721740722656, -0.2494354248046875, -0.24129867553710938, -0.23316192626953125, -0.22502517700195312, -0.216888427734375, -0.20875167846679688, -0.20061492919921875, -0.19247817993164062, -0.1843414306640625, -0.17620468139648438, -0.16806793212890625, -0.15993118286132812, -0.15179443359375, -0.14365768432617188, -0.13552093505859375, -0.12738418579101562, -0.1192474365234375, -0.11111068725585938, -0.10297393798828125, -0.09483718872070312, -0.086700439453125, -0.07856369018554688, -0.07042694091796875, -0.062290191650390625, -0.0541534423828125, -0.046016693115234375, -0.03787994384765625, -0.029743194580078125, -0.0216064453125, -0.013469696044921875, -0.00533294677734375, 0.002803802490234375, 0.0109405517578125, 0.019077301025390625, 0.02721405029296875, 0.035350799560546875, 0.043487548828125, 0.051624298095703125, 0.05976104736328125, 0.06789779663085938, 0.0760345458984375, 0.08417129516601562, 0.09230804443359375, 0.10044479370117188, 0.10858154296875, 0.11671829223632812, 0.12485504150390625, 0.13299179077148438, 0.1411285400390625, 0.14926528930664062, 0.15740203857421875, 0.16553878784179688, 0.173675537109375, 0.18181228637695312, 0.18994903564453125, 0.19808578491210938, 0.2062225341796875, 0.21435928344726562, 0.22249603271484375, 0.23063278198242188, 0.23876953125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 2.0, 2.0, 10.0, 10.0, 9.0, 24.0, 26.0, 37.0, 47.0, 62.0, 128.0, 203.0, 348.0, 614.0, 1310.0, 2861.0, 6690.0, 16551.0, 47702.0, 166776.0, 416963.0, 268812.0, 77250.0, 24788.0, 9446.0, 4056.0, 1861.0, 858.0, 436.0, 264.0, 154.0, 81.0, 57.0, 40.0, 23.0, 18.0, 10.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.50732421875, -0.4918098449707031, -0.47629547119140625, -0.4607810974121094, -0.4452667236328125, -0.4297523498535156, -0.41423797607421875, -0.3987236022949219, -0.383209228515625, -0.3676948547363281, -0.35218048095703125, -0.3366661071777344, -0.3211517333984375, -0.3056373596191406, -0.29012298583984375, -0.2746086120605469, -0.25909423828125, -0.24357986450195312, -0.22806549072265625, -0.21255111694335938, -0.1970367431640625, -0.18152236938476562, -0.16600799560546875, -0.15049362182617188, -0.134979248046875, -0.11946487426757812, -0.10395050048828125, -0.08843612670898438, -0.0729217529296875, -0.057407379150390625, -0.04189300537109375, -0.026378631591796875, -0.0108642578125, 0.004650115966796875, 0.02016448974609375, 0.035678863525390625, 0.0511932373046875, 0.06670761108398438, 0.08222198486328125, 0.09773635864257812, 0.113250732421875, 0.12876510620117188, 0.14427947998046875, 0.15979385375976562, 0.1753082275390625, 0.19082260131835938, 0.20633697509765625, 0.22185134887695312, 0.23736572265625, 0.2528800964355469, 0.26839447021484375, 0.2839088439941406, 0.2994232177734375, 0.3149375915527344, 0.33045196533203125, 0.3459663391113281, 0.361480712890625, 0.3769950866699219, 0.39250946044921875, 0.4080238342285156, 0.4235382080078125, 0.4390525817871094, 0.45456695556640625, 0.4700813293457031, 0.485595703125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 8.0, 3.0, 11.0, 9.0, 12.0, 17.0, 20.0, 25.0, 22.0, 14.0, 34.0, 29.0, 37.0, 40.0, 33.0, 44.0, 49.0, 38.0, 37.0, 43.0, 40.0, 41.0, 47.0, 38.0, 31.0, 25.0, 30.0, 35.0, 29.0, 16.0, 26.0, 16.0, 22.0, 11.0, 12.0, 15.0, 8.0, 6.0, 7.0, 7.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.7685546875, -0.7467498779296875, -0.724945068359375, -0.7031402587890625, -0.68133544921875, -0.6595306396484375, -0.637725830078125, -0.6159210205078125, -0.5941162109375, -0.5723114013671875, -0.550506591796875, -0.5287017822265625, -0.50689697265625, -0.4850921630859375, -0.463287353515625, -0.4414825439453125, -0.419677734375, -0.3978729248046875, -0.376068115234375, -0.3542633056640625, -0.33245849609375, -0.3106536865234375, -0.288848876953125, -0.2670440673828125, -0.2452392578125, -0.2234344482421875, -0.201629638671875, -0.1798248291015625, -0.15802001953125, -0.1362152099609375, -0.114410400390625, -0.0926055908203125, -0.07080078125, -0.0489959716796875, -0.027191162109375, -0.0053863525390625, 0.01641845703125, 0.0382232666015625, 0.060028076171875, 0.0818328857421875, 0.1036376953125, 0.1254425048828125, 0.147247314453125, 0.1690521240234375, 0.19085693359375, 0.2126617431640625, 0.234466552734375, 0.2562713623046875, 0.278076171875, 0.2998809814453125, 0.321685791015625, 0.3434906005859375, 0.36529541015625, 0.3871002197265625, 0.408905029296875, 0.4307098388671875, 0.4525146484375, 0.4743194580078125, 0.496124267578125, 0.5179290771484375, 0.53973388671875, 0.5615386962890625, 0.583343505859375, 0.6051483154296875, 0.626953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 12.0, 23.0, 24.0, 50.0, 120.0, 188.0, 406.0, 819.0, 1643.0, 3486.0, 7504.0, 16670.0, 42278.0, 127163.0, 345550.0, 323122.0, 112650.0, 38301.0, 15361.0, 6870.0, 3187.0, 1533.0, 795.0, 388.0, 179.0, 109.0, 56.0, 28.0, 15.0, 13.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.143310546875, -0.13799285888671875, -0.1326751708984375, -0.12735748291015625, -0.122039794921875, -0.11672210693359375, -0.1114044189453125, -0.10608673095703125, -0.10076904296875, -0.09545135498046875, -0.0901336669921875, -0.08481597900390625, -0.079498291015625, -0.07418060302734375, -0.0688629150390625, -0.06354522705078125, -0.0582275390625, -0.05290985107421875, -0.0475921630859375, -0.04227447509765625, -0.036956787109375, -0.03163909912109375, -0.0263214111328125, -0.02100372314453125, -0.01568603515625, -0.01036834716796875, -0.0050506591796875, 0.00026702880859375, 0.005584716796875, 0.01090240478515625, 0.0162200927734375, 0.02153778076171875, 0.02685546875, 0.03217315673828125, 0.0374908447265625, 0.04280853271484375, 0.048126220703125, 0.05344390869140625, 0.0587615966796875, 0.06407928466796875, 0.06939697265625, 0.07471466064453125, 0.0800323486328125, 0.08535003662109375, 0.090667724609375, 0.09598541259765625, 0.1013031005859375, 0.10662078857421875, 0.1119384765625, 0.11725616455078125, 0.1225738525390625, 0.12789154052734375, 0.133209228515625, 0.13852691650390625, 0.1438446044921875, 0.14916229248046875, 0.15447998046875, 0.15979766845703125, 0.1651153564453125, 0.17043304443359375, 0.175750732421875, 0.18106842041015625, 0.1863861083984375, 0.19170379638671875, 0.197021484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 5.0, 6.0, 10.0, 10.0, 11.0, 13.0, 32.0, 34.0, 47.0, 60.0, 91.0, 110.0, 127.0, 92.0, 79.0, 56.0, 43.0, 33.0, 20.0, 16.0, 17.0, 14.0, 13.0, 6.0, 9.0, 6.0, 5.0, 3.0, 3.0, 0.0, 3.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-6.109476089477539e-05, -5.951337516307831e-05, -5.7931989431381226e-05, -5.635060369968414e-05, -5.476921796798706e-05, -5.318783223628998e-05, -5.1606446504592896e-05, -5.002506077289581e-05, -4.844367504119873e-05, -4.686228930950165e-05, -4.5280903577804565e-05, -4.369951784610748e-05, -4.21181321144104e-05, -4.053674638271332e-05, -3.8955360651016235e-05, -3.737397491931915e-05, -3.579258918762207e-05, -3.421120345592499e-05, -3.2629817724227905e-05, -3.104843199253082e-05, -2.946704626083374e-05, -2.7885660529136658e-05, -2.6304274797439575e-05, -2.4722889065742493e-05, -2.314150333404541e-05, -2.1560117602348328e-05, -1.9978731870651245e-05, -1.8397346138954163e-05, -1.681596040725708e-05, -1.5234574675559998e-05, -1.3653188943862915e-05, -1.2071803212165833e-05, -1.049041748046875e-05, -8.909031748771667e-06, -7.327646017074585e-06, -5.7462602853775024e-06, -4.16487455368042e-06, -2.5834888219833374e-06, -1.0021030902862549e-06, 5.792826414108276e-07, 2.16066837310791e-06, 3.7420541048049927e-06, 5.323439836502075e-06, 6.904825568199158e-06, 8.48621129989624e-06, 1.0067597031593323e-05, 1.1648982763290405e-05, 1.3230368494987488e-05, 1.481175422668457e-05, 1.6393139958381653e-05, 1.7974525690078735e-05, 1.9555911421775818e-05, 2.11372971534729e-05, 2.2718682885169983e-05, 2.4300068616867065e-05, 2.5881454348564148e-05, 2.746284008026123e-05, 2.9044225811958313e-05, 3.0625611543655396e-05, 3.220699727535248e-05, 3.378838300704956e-05, 3.536976873874664e-05, 3.6951154470443726e-05, 3.853254020214081e-05, 4.011392593383789e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 3.0, 8.0, 15.0, 15.0, 35.0, 48.0, 75.0, 150.0, 288.0, 683.0, 1916.0, 5530.0, 17513.0, 56996.0, 195989.0, 416114.0, 246387.0, 73542.0, 22216.0, 6996.0, 2455.0, 837.0, 338.0, 166.0, 92.0, 52.0, 27.0, 21.0, 20.0, 8.0, 5.0, 6.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1708984375, -0.16470718383789062, -0.15851593017578125, -0.15232467651367188, -0.1461334228515625, -0.13994216918945312, -0.13375091552734375, -0.12755966186523438, -0.121368408203125, -0.11517715454101562, -0.10898590087890625, -0.10279464721679688, -0.0966033935546875, -0.09041213989257812, -0.08422088623046875, -0.07802963256835938, -0.07183837890625, -0.06564712524414062, -0.05945587158203125, -0.053264617919921875, -0.0470733642578125, -0.040882110595703125, -0.03469085693359375, -0.028499603271484375, -0.022308349609375, -0.016117095947265625, -0.00992584228515625, -0.003734588623046875, 0.0024566650390625, 0.008647918701171875, 0.01483917236328125, 0.021030426025390625, 0.0272216796875, 0.033412933349609375, 0.03960418701171875, 0.045795440673828125, 0.0519866943359375, 0.058177947998046875, 0.06436920166015625, 0.07056045532226562, 0.076751708984375, 0.08294296264648438, 0.08913421630859375, 0.09532546997070312, 0.1015167236328125, 0.10770797729492188, 0.11389923095703125, 0.12009048461914062, 0.12628173828125, 0.13247299194335938, 0.13866424560546875, 0.14485549926757812, 0.1510467529296875, 0.15723800659179688, 0.16342926025390625, 0.16962051391601562, 0.175811767578125, 0.18200302124023438, 0.18819427490234375, 0.19438552856445312, 0.2005767822265625, 0.20676803588867188, 0.21295928955078125, 0.21915054321289062, 0.225341796875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 2.0, 9.0, 8.0, 19.0, 19.0, 16.0, 48.0, 45.0, 54.0, 62.0, 74.0, 80.0, 93.0, 72.0, 80.0, 63.0, 51.0, 34.0, 30.0, 20.0, 24.0, 24.0, 10.0, 13.0, 8.0, 7.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1802978515625, -0.17490768432617188, -0.16951751708984375, -0.16412734985351562, -0.1587371826171875, -0.15334701538085938, -0.14795684814453125, -0.14256668090820312, -0.137176513671875, -0.13178634643554688, -0.12639617919921875, -0.12100601196289062, -0.1156158447265625, -0.11022567749023438, -0.10483551025390625, -0.09944534301757812, -0.09405517578125, -0.08866500854492188, -0.08327484130859375, -0.07788467407226562, -0.0724945068359375, -0.06710433959960938, -0.06171417236328125, -0.056324005126953125, -0.050933837890625, -0.045543670654296875, -0.04015350341796875, -0.034763336181640625, -0.0293731689453125, -0.023983001708984375, -0.01859283447265625, -0.013202667236328125, -0.0078125, -0.002422332763671875, 0.00296783447265625, 0.008358001708984375, 0.0137481689453125, 0.019138336181640625, 0.02452850341796875, 0.029918670654296875, 0.035308837890625, 0.040699005126953125, 0.04608917236328125, 0.051479339599609375, 0.0568695068359375, 0.062259674072265625, 0.06764984130859375, 0.07304000854492188, 0.07843017578125, 0.08382034301757812, 0.08921051025390625, 0.09460067749023438, 0.0999908447265625, 0.10538101196289062, 0.11077117919921875, 0.11616134643554688, 0.121551513671875, 0.12694168090820312, 0.13233184814453125, 0.13772201538085938, 0.1431121826171875, 0.14850234985351562, 0.15389251708984375, 0.15928268432617188, 0.1646728515625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 14.0, 18.0, 36.0, 42.0, 83.0, 119.0, 113.0, 142.0, 119.0, 103.0, 74.0, 49.0, 17.0, 21.0, 11.0, 7.0, 2.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8853745460510254, -1.8137964010238647, -1.742218255996704, -1.670640230178833, -1.5990620851516724, -1.5274839401245117, -1.4559059143066406, -1.38432776927948, -1.3127496242523193, -1.2411714792251587, -1.169593334197998, -1.098015308380127, -1.0264371633529663, -0.9548590183258057, -0.8832809329032898, -0.8117028474807739, -0.7401247024536133, -0.6685465574264526, -0.5969684720039368, -0.5253903865814209, -0.45381224155426025, -0.382234126329422, -0.31065601110458374, -0.23907792568206787, -0.16749978065490723, -0.09592166543006897, -0.024343550205230713, 0.047234565019607544, 0.1188126802444458, 0.19039079546928406, 0.2619689106941223, 0.3335469961166382, 0.40512537956237793, 0.4767034947872162, 0.5482816100120544, 0.6198596954345703, 0.691437840461731, 0.7630159854888916, 0.8345940709114075, 0.9061721563339233, 0.977750301361084, 1.0493284463882446, 1.1209065914154053, 1.1924846172332764, 1.264062762260437, 1.3356409072875977, 1.4072189331054688, 1.4787970781326294, 1.55037522315979, 1.6219533681869507, 1.6935315132141113, 1.7651095390319824, 1.836687684059143, 1.9082658290863037, 1.9798438549041748, 2.051422119140625, 2.123000144958496, 2.194578170776367, 2.2661564350128174, 2.3377344608306885, 2.4093127250671387, 2.4808907508850098, 2.552468776702881, 2.624046802520752, 2.695625066757202]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 6.0, 17.0, 5.0, 8.0, 8.0, 11.0, 22.0, 25.0, 18.0, 20.0, 28.0, 33.0, 35.0, 33.0, 44.0, 37.0, 35.0, 42.0, 48.0, 44.0, 38.0, 42.0, 40.0, 38.0, 37.0, 33.0, 36.0, 32.0, 29.0, 30.0, 24.0, 23.0, 11.0, 11.0, 14.0, 8.0, 12.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6571247577667236, -1.5989245176315308, -1.540724277496338, -1.4825239181518555, -1.4243236780166626, -1.3661234378814697, -1.3079230785369873, -1.2497228384017944, -1.1915225982666016, -1.1333223581314087, -1.0751221179962158, -1.0169217586517334, -0.9587215185165405, -0.9005212783813477, -0.84232097864151, -0.7841206789016724, -0.7259204387664795, -0.6677201986312866, -0.609519898891449, -0.5513195991516113, -0.49311935901641846, -0.4349190890789032, -0.37671881914138794, -0.3185185492038727, -0.2603182792663574, -0.20211800932884216, -0.1439177393913269, -0.08571746945381165, -0.027517199516296387, 0.030683070421218872, 0.08888334035873413, 0.1470836102962494, 0.20528388023376465, 0.2634841501712799, 0.32168442010879517, 0.3798846900463104, 0.4380849599838257, 0.49628522992134094, 0.5544854998588562, 0.6126857995986938, 0.6708860397338867, 0.7290862798690796, 0.7872865796089172, 0.8454868793487549, 0.9036871194839478, 0.9618873596191406, 1.020087718963623, 1.078287959098816, 1.1364881992340088, 1.1946884393692017, 1.2528886795043945, 1.311089038848877, 1.3692892789840698, 1.4274895191192627, 1.4856898784637451, 1.543890118598938, 1.6020903587341309, 1.6602905988693237, 1.7184908390045166, 1.776691198348999, 1.834891438484192, 1.8930916786193848, 1.9512920379638672, 2.0094921588897705, 2.067692518234253]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 13.0, 15.0, 13.0, 18.0, 33.0, 46.0, 62.0, 92.0, 125.0, 224.0, 358.0, 536.0, 895.0, 1501.0, 2437.0, 4345.0, 7687.0, 14211.0, 27013.0, 52089.0, 100668.0, 187164.0, 328147.0, 527203.0, 718974.0, 755633.0, 598379.0, 387061.0, 220718.0, 119877.0, 64072.0, 33792.0, 18126.0, 9887.0, 5233.0, 2998.0, 1774.0, 1117.0, 624.0, 392.0, 264.0, 155.0, 107.0, 67.0, 49.0, 29.0, 21.0, 14.0, 10.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.1498546600341797, -0.14504623413085938, -0.14023780822753906, -0.13542938232421875, -0.13062095642089844, -0.12581253051757812, -0.12100410461425781, -0.1161956787109375, -0.11138725280761719, -0.10657882690429688, -0.10177040100097656, -0.09696197509765625, -0.09215354919433594, -0.08734512329101562, -0.08253669738769531, -0.077728271484375, -0.07291984558105469, -0.06811141967773438, -0.06330299377441406, -0.05849456787109375, -0.05368614196777344, -0.048877716064453125, -0.04406929016113281, -0.0392608642578125, -0.03445243835449219, -0.029644012451171875, -0.024835586547851562, -0.02002716064453125, -0.015218734741210938, -0.010410308837890625, -0.0056018829345703125, -0.00079345703125, 0.0040149688720703125, 0.008823394775390625, 0.013631820678710938, 0.01844024658203125, 0.023248672485351562, 0.028057098388671875, 0.03286552429199219, 0.0376739501953125, 0.04248237609863281, 0.047290802001953125, 0.05209922790527344, 0.05690765380859375, 0.06171607971191406, 0.06652450561523438, 0.07133293151855469, 0.076141357421875, 0.08094978332519531, 0.08575820922851562, 0.09056663513183594, 0.09537506103515625, 0.10018348693847656, 0.10499191284179688, 0.10980033874511719, 0.1146087646484375, 0.11941719055175781, 0.12422561645507812, 0.12903404235839844, 0.13384246826171875, 0.13865089416503906, 0.14345932006835938, 0.1482677459716797, 0.153076171875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 9.0, 9.0, 11.0, 12.0, 18.0, 19.0, 23.0, 25.0, 26.0, 42.0, 39.0, 44.0, 47.0, 49.0, 44.0, 34.0, 37.0, 51.0, 37.0, 45.0, 40.0, 48.0, 39.0, 34.0, 33.0, 27.0, 24.0, 16.0, 18.0, 12.0, 11.0, 9.0, 13.0, 7.0, 9.0, 6.0, 9.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.293212890625, -0.2842674255371094, -0.27532196044921875, -0.2663764953613281, -0.2574310302734375, -0.24848556518554688, -0.23954010009765625, -0.23059463500976562, -0.221649169921875, -0.21270370483398438, -0.20375823974609375, -0.19481277465820312, -0.1858673095703125, -0.17692184448242188, -0.16797637939453125, -0.15903091430664062, -0.15008544921875, -0.14113998413085938, -0.13219451904296875, -0.12324905395507812, -0.1143035888671875, -0.10535812377929688, -0.09641265869140625, -0.08746719360351562, -0.078521728515625, -0.06957626342773438, -0.06063079833984375, -0.051685333251953125, -0.0427398681640625, -0.033794403076171875, -0.02484893798828125, -0.015903472900390625, -0.0069580078125, 0.001987457275390625, 0.01093292236328125, 0.019878387451171875, 0.0288238525390625, 0.037769317626953125, 0.04671478271484375, 0.055660247802734375, 0.064605712890625, 0.07355117797851562, 0.08249664306640625, 0.09144210815429688, 0.1003875732421875, 0.10933303833007812, 0.11827850341796875, 0.12722396850585938, 0.13616943359375, 0.14511489868164062, 0.15406036376953125, 0.16300582885742188, 0.1719512939453125, 0.18089675903320312, 0.18984222412109375, 0.19878768920898438, 0.207733154296875, 0.21667861938476562, 0.22562408447265625, 0.23456954956054688, 0.2435150146484375, 0.2524604797363281, 0.26140594482421875, 0.2703514099121094, 0.279296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 11.0, 20.0, 35.0, 51.0, 68.0, 119.0, 248.0, 495.0, 1028.0, 2596.0, 7517.0, 28384.0, 141288.0, 1026129.0, 2440387.0, 449078.0, 72327.0, 16421.0, 4771.0, 1693.0, 750.0, 391.0, 174.0, 116.0, 70.0, 36.0, 23.0, 15.0, 15.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37060546875, -0.3539886474609375, -0.337371826171875, -0.3207550048828125, -0.30413818359375, -0.2875213623046875, -0.270904541015625, -0.2542877197265625, -0.2376708984375, -0.2210540771484375, -0.204437255859375, -0.1878204345703125, -0.17120361328125, -0.1545867919921875, -0.137969970703125, -0.1213531494140625, -0.104736328125, -0.0881195068359375, -0.071502685546875, -0.0548858642578125, -0.03826904296875, -0.0216522216796875, -0.005035400390625, 0.0115814208984375, 0.0281982421875, 0.0448150634765625, 0.061431884765625, 0.0780487060546875, 0.09466552734375, 0.1112823486328125, 0.127899169921875, 0.1445159912109375, 0.1611328125, 0.1777496337890625, 0.194366455078125, 0.2109832763671875, 0.22760009765625, 0.2442169189453125, 0.260833740234375, 0.2774505615234375, 0.2940673828125, 0.3106842041015625, 0.327301025390625, 0.3439178466796875, 0.36053466796875, 0.3771514892578125, 0.393768310546875, 0.4103851318359375, 0.427001953125, 0.4436187744140625, 0.460235595703125, 0.4768524169921875, 0.49346923828125, 0.5100860595703125, 0.526702880859375, 0.5433197021484375, 0.5599365234375, 0.5765533447265625, 0.593170166015625, 0.6097869873046875, 0.62640380859375, 0.6430206298828125, 0.659637451171875, 0.6762542724609375, 0.69287109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 10.0, 13.0, 23.0, 26.0, 38.0, 64.0, 70.0, 130.0, 183.0, 278.0, 405.0, 502.0, 573.0, 526.0, 399.0, 261.0, 190.0, 120.0, 74.0, 54.0, 42.0, 18.0, 23.0, 16.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.477783203125, -0.4609870910644531, -0.44419097900390625, -0.4273948669433594, -0.4105987548828125, -0.3938026428222656, -0.37700653076171875, -0.3602104187011719, -0.343414306640625, -0.3266181945800781, -0.30982208251953125, -0.2930259704589844, -0.2762298583984375, -0.2594337463378906, -0.24263763427734375, -0.22584152221679688, -0.20904541015625, -0.19224929809570312, -0.17545318603515625, -0.15865707397460938, -0.1418609619140625, -0.12506484985351562, -0.10826873779296875, -0.09147262573242188, -0.074676513671875, -0.057880401611328125, -0.04108428955078125, -0.024288177490234375, -0.0074920654296875, 0.009304046630859375, 0.02610015869140625, 0.042896270751953125, 0.0596923828125, 0.07648849487304688, 0.09328460693359375, 0.11008071899414062, 0.1268768310546875, 0.14367294311523438, 0.16046905517578125, 0.17726516723632812, 0.194061279296875, 0.21085739135742188, 0.22765350341796875, 0.24444961547851562, 0.2612457275390625, 0.2780418395996094, 0.29483795166015625, 0.3116340637207031, 0.32843017578125, 0.3452262878417969, 0.36202239990234375, 0.3788185119628906, 0.3956146240234375, 0.4124107360839844, 0.42920684814453125, 0.4460029602050781, 0.462799072265625, 0.4795951843261719, 0.49639129638671875, 0.5131874084472656, 0.5299835205078125, 0.5467796325683594, 0.5635757446289062, 0.5803718566894531, 0.59716796875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 12.0, 11.0, 27.0, 34.0, 58.0, 84.0, 125.0, 163.0, 168.0, 123.0, 90.0, 52.0, 21.0, 17.0, 13.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3478312492370605, -3.2429308891296387, -3.138030529022217, -3.033130168914795, -2.928229808807373, -2.823329448699951, -2.71842885017395, -2.6135284900665283, -2.5086281299591064, -2.4037277698516846, -2.2988274097442627, -2.193927049636841, -2.08902645111084, -1.9841262102127075, -1.879225730895996, -1.7743253707885742, -1.6694250106811523, -1.5645246505737305, -1.4596242904663086, -1.3547238111495972, -1.2498234510421753, -1.1449230909347534, -1.040022611618042, -0.9351222515106201, -0.8302218914031982, -0.7253215312957764, -0.6204211115837097, -0.5155206918716431, -0.4106203317642212, -0.3057199716567993, -0.20081955194473267, -0.09591913223266602, 0.00898122787475586, 0.11388161778450012, 0.21878200769424438, 0.32368239760398865, 0.4285827875137329, 0.5334831476211548, 0.6383835673332214, 0.7432839870452881, 0.84818434715271, 0.9530847072601318, 1.0579850673675537, 1.1628855466842651, 1.267785906791687, 1.3726862668991089, 1.4775867462158203, 1.5824871063232422, 1.687387466430664, 1.792287826538086, 1.8971881866455078, 2.0020885467529297, 2.1069889068603516, 2.2118892669677734, 2.3167898654937744, 2.4216902256011963, 2.526590585708618, 2.63149094581604, 2.736391305923462, 2.841291666030884, 2.9461922645568848, 3.0510926246643066, 3.1559929847717285, 3.2608933448791504, 3.3657937049865723]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 6.0, 10.0, 11.0, 11.0, 19.0, 19.0, 21.0, 23.0, 41.0, 33.0, 37.0, 25.0, 32.0, 35.0, 39.0, 50.0, 51.0, 43.0, 51.0, 44.0, 52.0, 37.0, 34.0, 35.0, 36.0, 28.0, 24.0, 29.0, 16.0, 22.0, 11.0, 17.0, 12.0, 13.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5104460716247559, -1.4645224809646606, -1.4185988903045654, -1.3726751804351807, -1.3267515897750854, -1.2808279991149902, -1.234904408454895, -1.1889808177947998, -1.143057107925415, -1.0971335172653198, -1.0512099266052246, -1.0052862167358398, -0.9593626260757446, -0.9134390354156494, -0.8675154447555542, -0.8215917944908142, -0.775668203830719, -0.7297446131706238, -0.6838209629058838, -0.6378973722457886, -0.5919737219810486, -0.5460501313209534, -0.5001264810562134, -0.45420289039611816, -0.40827926993370056, -0.36235564947128296, -0.31643202900886536, -0.27050840854644775, -0.22458480298519135, -0.17866118252277374, -0.13273757696151733, -0.08681395649909973, -0.04089033603668213, 0.005033280700445175, 0.05095689743757248, 0.09688051044940948, 0.1428041309118271, 0.1887277513742447, 0.2346513569355011, 0.2805749773979187, 0.3264985978603363, 0.3724222183227539, 0.4183458387851715, 0.4642694592475891, 0.5101930499076843, 0.5561167001724243, 0.6020402908325195, 0.6479638814926147, 0.6938875317573547, 0.73981112241745, 0.7857347726821899, 0.8316583633422852, 0.8775820136070251, 0.9235056042671204, 0.9694292545318604, 1.0153528451919556, 1.0612764358520508, 1.107200026512146, 1.1531236171722412, 1.199047327041626, 1.2449709177017212, 1.2908945083618164, 1.3368180990219116, 1.3827416896820068, 1.4286653995513916]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 12.0, 14.0, 22.0, 26.0, 34.0, 64.0, 68.0, 111.0, 156.0, 264.0, 372.0, 548.0, 894.0, 1423.0, 2395.0, 3858.0, 6015.0, 10329.0, 18778.0, 39944.0, 92291.0, 190668.0, 264150.0, 210255.0, 108484.0, 46834.0, 21245.0, 11313.0, 6827.0, 4031.0, 2654.0, 1738.0, 1028.0, 598.0, 375.0, 239.0, 146.0, 111.0, 79.0, 43.0, 37.0, 21.0, 22.0, 16.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.340576171875, -0.3301277160644531, -0.31967926025390625, -0.3092308044433594, -0.2987823486328125, -0.2883338928222656, -0.27788543701171875, -0.2674369812011719, -0.256988525390625, -0.24654006958007812, -0.23609161376953125, -0.22564315795898438, -0.2151947021484375, -0.20474624633789062, -0.19429779052734375, -0.18384933471679688, -0.17340087890625, -0.16295242309570312, -0.15250396728515625, -0.14205551147460938, -0.1316070556640625, -0.12115859985351562, -0.11071014404296875, -0.10026168823242188, -0.089813232421875, -0.07936477661132812, -0.06891632080078125, -0.058467864990234375, -0.0480194091796875, -0.037570953369140625, -0.02712249755859375, -0.016674041748046875, -0.0062255859375, 0.004222869873046875, 0.01467132568359375, 0.025119781494140625, 0.0355682373046875, 0.046016693115234375, 0.05646514892578125, 0.06691360473632812, 0.077362060546875, 0.08781051635742188, 0.09825897216796875, 0.10870742797851562, 0.1191558837890625, 0.12960433959960938, 0.14005279541015625, 0.15050125122070312, 0.16094970703125, 0.17139816284179688, 0.18184661865234375, 0.19229507446289062, 0.2027435302734375, 0.21319198608398438, 0.22364044189453125, 0.23408889770507812, 0.244537353515625, 0.2549858093261719, 0.26543426513671875, 0.2758827209472656, 0.2863311767578125, 0.2967796325683594, 0.30722808837890625, 0.3176765441894531, 0.328125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 5.0, 5.0, 7.0, 9.0, 16.0, 14.0, 14.0, 13.0, 28.0, 26.0, 30.0, 36.0, 32.0, 35.0, 45.0, 52.0, 46.0, 36.0, 40.0, 40.0, 41.0, 40.0, 38.0, 39.0, 42.0, 29.0, 35.0, 32.0, 27.0, 16.0, 24.0, 18.0, 18.0, 4.0, 15.0, 14.0, 11.0, 13.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.319580078125, -0.3108234405517578, -0.3020668029785156, -0.29331016540527344, -0.28455352783203125, -0.27579689025878906, -0.2670402526855469, -0.2582836151123047, -0.2495269775390625, -0.2407703399658203, -0.23201370239257812, -0.22325706481933594, -0.21450042724609375, -0.20574378967285156, -0.19698715209960938, -0.1882305145263672, -0.179473876953125, -0.1707172393798828, -0.16196060180664062, -0.15320396423339844, -0.14444732666015625, -0.13569068908691406, -0.12693405151367188, -0.11817741394042969, -0.1094207763671875, -0.10066413879394531, -0.09190750122070312, -0.08315086364746094, -0.07439422607421875, -0.06563758850097656, -0.056880950927734375, -0.04812431335449219, -0.03936767578125, -0.030611038208007812, -0.021854400634765625, -0.013097763061523438, -0.00434112548828125, 0.0044155120849609375, 0.013172149658203125, 0.021928787231445312, 0.0306854248046875, 0.03944206237792969, 0.048198699951171875, 0.05695533752441406, 0.06571197509765625, 0.07446861267089844, 0.08322525024414062, 0.09198188781738281, 0.100738525390625, 0.10949516296386719, 0.11825180053710938, 0.12700843811035156, 0.13576507568359375, 0.14452171325683594, 0.15327835083007812, 0.1620349884033203, 0.1707916259765625, 0.1795482635498047, 0.18830490112304688, 0.19706153869628906, 0.20581817626953125, 0.21457481384277344, 0.22333145141601562, 0.2320880889892578, 0.2408447265625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 8.0, 6.0, 11.0, 15.0, 17.0, 30.0, 42.0, 52.0, 109.0, 160.0, 283.0, 564.0, 1150.0, 2498.0, 5723.0, 13389.0, 35867.0, 119190.0, 369761.0, 341657.0, 103946.0, 31906.0, 12361.0, 5182.0, 2253.0, 1077.0, 522.0, 291.0, 175.0, 93.0, 61.0, 50.0, 26.0, 24.0, 19.0, 9.0, 6.0, 6.0, 9.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56005859375, -0.541961669921875, -0.52386474609375, -0.505767822265625, -0.4876708984375, -0.469573974609375, -0.45147705078125, -0.433380126953125, -0.415283203125, -0.397186279296875, -0.37908935546875, -0.360992431640625, -0.3428955078125, -0.324798583984375, -0.30670166015625, -0.288604736328125, -0.2705078125, -0.252410888671875, -0.23431396484375, -0.216217041015625, -0.1981201171875, -0.180023193359375, -0.16192626953125, -0.143829345703125, -0.125732421875, -0.107635498046875, -0.08953857421875, -0.071441650390625, -0.0533447265625, -0.035247802734375, -0.01715087890625, 0.000946044921875, 0.01904296875, 0.037139892578125, 0.05523681640625, 0.073333740234375, 0.0914306640625, 0.109527587890625, 0.12762451171875, 0.145721435546875, 0.163818359375, 0.181915283203125, 0.20001220703125, 0.218109130859375, 0.2362060546875, 0.254302978515625, 0.27239990234375, 0.290496826171875, 0.30859375, 0.326690673828125, 0.34478759765625, 0.362884521484375, 0.3809814453125, 0.399078369140625, 0.41717529296875, 0.435272216796875, 0.453369140625, 0.471466064453125, 0.48956298828125, 0.507659912109375, 0.5257568359375, 0.543853759765625, 0.56195068359375, 0.580047607421875, 0.59814453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 7.0, 6.0, 17.0, 13.0, 16.0, 16.0, 25.0, 23.0, 29.0, 30.0, 33.0, 30.0, 49.0, 37.0, 44.0, 52.0, 30.0, 46.0, 44.0, 38.0, 42.0, 37.0, 28.0, 30.0, 34.0, 32.0, 21.0, 27.0, 24.0, 30.0, 18.0, 16.0, 14.0, 10.0, 7.0, 8.0, 6.0, 6.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.84521484375, -0.8201141357421875, -0.795013427734375, -0.7699127197265625, -0.74481201171875, -0.7197113037109375, -0.694610595703125, -0.6695098876953125, -0.6444091796875, -0.6193084716796875, -0.594207763671875, -0.5691070556640625, -0.54400634765625, -0.5189056396484375, -0.493804931640625, -0.4687042236328125, -0.443603515625, -0.4185028076171875, -0.393402099609375, -0.3683013916015625, -0.34320068359375, -0.3180999755859375, -0.292999267578125, -0.2678985595703125, -0.2427978515625, -0.2176971435546875, -0.192596435546875, -0.1674957275390625, -0.14239501953125, -0.1172943115234375, -0.092193603515625, -0.0670928955078125, -0.0419921875, -0.0168914794921875, 0.008209228515625, 0.0333099365234375, 0.05841064453125, 0.0835113525390625, 0.108612060546875, 0.1337127685546875, 0.1588134765625, 0.1839141845703125, 0.209014892578125, 0.2341156005859375, 0.25921630859375, 0.2843170166015625, 0.309417724609375, 0.3345184326171875, 0.359619140625, 0.3847198486328125, 0.409820556640625, 0.4349212646484375, 0.46002197265625, 0.4851226806640625, 0.510223388671875, 0.5353240966796875, 0.5604248046875, 0.5855255126953125, 0.610626220703125, 0.6357269287109375, 0.66082763671875, 0.6859283447265625, 0.711029052734375, 0.7361297607421875, 0.76123046875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 2.0, 0.0, 1.0, 4.0, 4.0, 10.0, 6.0, 14.0, 31.0, 28.0, 25.0, 49.0, 73.0, 95.0, 129.0, 167.0, 280.0, 352.0, 475.0, 705.0, 1058.0, 1538.0, 2536.0, 4797.0, 12578.0, 56408.0, 542132.0, 366295.0, 37994.0, 9815.0, 3959.0, 2173.0, 1483.0, 1003.0, 672.0, 455.0, 349.0, 228.0, 187.0, 121.0, 104.0, 60.0, 45.0, 32.0, 19.0, 20.0, 14.0, 11.0, 13.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3623046875, -0.3497657775878906, -0.33722686767578125, -0.3246879577636719, -0.3121490478515625, -0.2996101379394531, -0.28707122802734375, -0.2745323181152344, -0.261993408203125, -0.24945449829101562, -0.23691558837890625, -0.22437667846679688, -0.2118377685546875, -0.19929885864257812, -0.18675994873046875, -0.17422103881835938, -0.16168212890625, -0.14914321899414062, -0.13660430908203125, -0.12406539916992188, -0.1115264892578125, -0.09898757934570312, -0.08644866943359375, -0.07390975952148438, -0.061370849609375, -0.048831939697265625, -0.03629302978515625, -0.023754119873046875, -0.0112152099609375, 0.001323699951171875, 0.01386260986328125, 0.026401519775390625, 0.0389404296875, 0.051479339599609375, 0.06401824951171875, 0.07655715942382812, 0.0890960693359375, 0.10163497924804688, 0.11417388916015625, 0.12671279907226562, 0.139251708984375, 0.15179061889648438, 0.16432952880859375, 0.17686843872070312, 0.1894073486328125, 0.20194625854492188, 0.21448516845703125, 0.22702407836914062, 0.23956298828125, 0.2521018981933594, 0.26464080810546875, 0.2771797180175781, 0.2897186279296875, 0.3022575378417969, 0.31479644775390625, 0.3273353576660156, 0.339874267578125, 0.3524131774902344, 0.36495208740234375, 0.3774909973144531, 0.3900299072265625, 0.4025688171386719, 0.41510772705078125, 0.4276466369628906, 0.440185546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 3.0, 8.0, 10.0, 17.0, 55.0, 179.0, 340.0, 236.0, 80.0, 32.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019919872283935547, -0.00019289925694465637, -0.00018659979104995728, -0.00018030032515525818, -0.00017400085926055908, -0.00016770139336585999, -0.0001614019274711609, -0.0001551024615764618, -0.0001488029956817627, -0.0001425035297870636, -0.0001362040638923645, -0.0001299045979976654, -0.0001236051321029663, -0.00011730566620826721, -0.00011100620031356812, -0.00010470673441886902, -9.840726852416992e-05, -9.210780262947083e-05, -8.580833673477173e-05, -7.950887084007263e-05, -7.320940494537354e-05, -6.690993905067444e-05, -6.061047315597534e-05, -5.4311007261276245e-05, -4.801154136657715e-05, -4.171207547187805e-05, -3.5412609577178955e-05, -2.911314368247986e-05, -2.2813677787780762e-05, -1.6514211893081665e-05, -1.0214745998382568e-05, -3.915280103683472e-06, 2.384185791015625e-06, 8.683651685714722e-06, 1.4983117580413818e-05, 2.1282583475112915e-05, 2.7582049369812012e-05, 3.388151526451111e-05, 4.0180981159210205e-05, 4.64804470539093e-05, 5.27799129486084e-05, 5.9079378843307495e-05, 6.537884473800659e-05, 7.167831063270569e-05, 7.797777652740479e-05, 8.427724242210388e-05, 9.057670831680298e-05, 9.687617421150208e-05, 0.00010317564010620117, 0.00010947510600090027, 0.00011577457189559937, 0.00012207403779029846, 0.00012837350368499756, 0.00013467296957969666, 0.00014097243547439575, 0.00014727190136909485, 0.00015357136726379395, 0.00015987083315849304, 0.00016617029905319214, 0.00017246976494789124, 0.00017876923084259033, 0.00018506869673728943, 0.00019136816263198853, 0.00019766762852668762, 0.00020396709442138672]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 5.0, 12.0, 14.0, 9.0, 21.0, 25.0, 41.0, 64.0, 132.0, 216.0, 321.0, 500.0, 832.0, 1457.0, 2904.0, 8540.0, 51444.0, 546223.0, 389462.0, 33754.0, 6634.0, 2590.0, 1284.0, 768.0, 475.0, 312.0, 179.0, 108.0, 62.0, 41.0, 28.0, 25.0, 14.0, 9.0, 10.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.451904296875, -0.43857574462890625, -0.4252471923828125, -0.41191864013671875, -0.398590087890625, -0.38526153564453125, -0.3719329833984375, -0.35860443115234375, -0.34527587890625, -0.33194732666015625, -0.3186187744140625, -0.30529022216796875, -0.291961669921875, -0.27863311767578125, -0.2653045654296875, -0.25197601318359375, -0.2386474609375, -0.22531890869140625, -0.2119903564453125, -0.19866180419921875, -0.185333251953125, -0.17200469970703125, -0.1586761474609375, -0.14534759521484375, -0.13201904296875, -0.11869049072265625, -0.1053619384765625, -0.09203338623046875, -0.078704833984375, -0.06537628173828125, -0.0520477294921875, -0.03871917724609375, -0.025390625, -0.01206207275390625, 0.0012664794921875, 0.01459503173828125, 0.027923583984375, 0.04125213623046875, 0.0545806884765625, 0.06790924072265625, 0.08123779296875, 0.09456634521484375, 0.1078948974609375, 0.12122344970703125, 0.134552001953125, 0.14788055419921875, 0.1612091064453125, 0.17453765869140625, 0.1878662109375, 0.20119476318359375, 0.2145233154296875, 0.22785186767578125, 0.241180419921875, 0.25450897216796875, 0.2678375244140625, 0.28116607666015625, 0.29449462890625, 0.30782318115234375, 0.3211517333984375, 0.33448028564453125, 0.347808837890625, 0.36113739013671875, 0.3744659423828125, 0.38779449462890625, 0.401123046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 7.0, 12.0, 23.0, 33.0, 58.0, 95.0, 137.0, 161.0, 134.0, 112.0, 79.0, 49.0, 37.0, 15.0, 7.0, 12.0, 5.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362548828125, -0.35039520263671875, -0.3382415771484375, -0.32608795166015625, -0.313934326171875, -0.30178070068359375, -0.2896270751953125, -0.27747344970703125, -0.26531982421875, -0.25316619873046875, -0.2410125732421875, -0.22885894775390625, -0.216705322265625, -0.20455169677734375, -0.1923980712890625, -0.18024444580078125, -0.1680908203125, -0.15593719482421875, -0.1437835693359375, -0.13162994384765625, -0.119476318359375, -0.10732269287109375, -0.0951690673828125, -0.08301544189453125, -0.07086181640625, -0.05870819091796875, -0.0465545654296875, -0.03440093994140625, -0.022247314453125, -0.01009368896484375, 0.0020599365234375, 0.01421356201171875, 0.0263671875, 0.03852081298828125, 0.0506744384765625, 0.06282806396484375, 0.074981689453125, 0.08713531494140625, 0.0992889404296875, 0.11144256591796875, 0.12359619140625, 0.13574981689453125, 0.1479034423828125, 0.16005706787109375, 0.172210693359375, 0.18436431884765625, 0.1965179443359375, 0.20867156982421875, 0.2208251953125, 0.23297882080078125, 0.2451324462890625, 0.25728607177734375, 0.269439697265625, 0.28159332275390625, 0.2937469482421875, 0.30590057373046875, 0.31805419921875, 0.33020782470703125, 0.3423614501953125, 0.35451507568359375, 0.366668701171875, 0.37882232666015625, 0.3909759521484375, 0.40312957763671875, 0.415283203125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 13.0, 23.0, 33.0, 64.0, 109.0, 189.0, 183.0, 165.0, 108.0, 49.0, 18.0, 10.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.606661319732666, -4.471972942352295, -4.337285041809082, -4.202596664428711, -4.06790828704834, -3.933220386505127, -3.798532009124756, -3.663843870162964, -3.529155731201172, -3.39446759223938, -3.259779453277588, -3.125091075897217, -2.990402936935425, -2.855714797973633, -2.7210264205932617, -2.5863382816314697, -2.4516501426696777, -2.3169620037078857, -2.1822738647460938, -2.0475854873657227, -1.9128973484039307, -1.7782092094421387, -1.6435209512710571, -1.5088326930999756, -1.3741445541381836, -1.2394564151763916, -1.10476815700531, -0.9700799584388733, -0.8353917598724365, -0.7007035613059998, -0.566015362739563, -0.4313271641731262, -0.29663896560668945, -0.16195076704025269, -0.027262568473815918, 0.10742563009262085, 0.24211382865905762, 0.3768020272254944, 0.5114902257919312, 0.6461784243583679, 0.7808666229248047, 0.9155548214912415, 1.0502430200576782, 1.1849312782287598, 1.3196194171905518, 1.4543075561523438, 1.5889958143234253, 1.7236840724945068, 1.8583722114562988, 1.9930603504180908, 2.127748489379883, 2.262436866760254, 2.397125005722046, 2.531813144683838, 2.666501522064209, 2.801189661026001, 2.935877799987793, 3.070565938949585, 3.205254077911377, 3.339942455291748, 3.47463059425354, 3.609318733215332, 3.744007110595703, 3.878695249557495, 4.013383388519287]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 2.0, 8.0, 11.0, 11.0, 7.0, 11.0, 13.0, 22.0, 26.0, 31.0, 20.0, 36.0, 31.0, 47.0, 37.0, 44.0, 34.0, 38.0, 55.0, 36.0, 47.0, 38.0, 43.0, 29.0, 26.0, 42.0, 45.0, 26.0, 21.0, 24.0, 23.0, 22.0, 15.0, 11.0, 9.0, 12.0, 9.0, 11.0, 6.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7436070442199707, -1.6839699745178223, -1.6243329048156738, -1.5646958351135254, -1.505058765411377, -1.4454216957092285, -1.38578462600708, -1.3261475563049316, -1.2665104866027832, -1.2068734169006348, -1.1472363471984863, -1.087599277496338, -1.0279622077941895, -0.968325138092041, -0.9086880683898926, -0.8490509986877441, -0.7894139289855957, -0.7297768592834473, -0.6701397895812988, -0.6105027198791504, -0.550865650177002, -0.4912285804748535, -0.4315915107727051, -0.37195444107055664, -0.3123173713684082, -0.25268030166625977, -0.19304323196411133, -0.1334061622619629, -0.07376909255981445, -0.014132022857666016, 0.04550504684448242, 0.10514211654663086, 0.1647791862487793, 0.22441625595092773, 0.28405332565307617, 0.3436903953552246, 0.40332746505737305, 0.4629645347595215, 0.5226016044616699, 0.5822386741638184, 0.6418757438659668, 0.7015128135681152, 0.7611498832702637, 0.8207869529724121, 0.8804240226745605, 0.940061092376709, 0.9996981620788574, 1.0593352317810059, 1.1189723014831543, 1.1786093711853027, 1.2382464408874512, 1.2978835105895996, 1.357520580291748, 1.4171576499938965, 1.476794719696045, 1.5364317893981934, 1.5960688591003418, 1.6557059288024902, 1.7153429985046387, 1.774980068206787, 1.8346171379089355, 1.894254207611084, 1.9538912773132324, 2.013528347015381, 2.0731654167175293]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 10.0, 10.0, 10.0, 16.0, 25.0, 49.0, 55.0, 81.0, 155.0, 253.0, 526.0, 1081.0, 1894.0, 4577.0, 12181.0, 38790.0, 145263.0, 516107.0, 1249145.0, 1348953.0, 622566.0, 180862.0, 47329.0, 14361.0, 5205.0, 2215.0, 1091.0, 591.0, 320.0, 192.0, 120.0, 68.0, 53.0, 33.0, 24.0, 28.0, 12.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.38037109375, -0.36920928955078125, -0.3580474853515625, -0.34688568115234375, -0.335723876953125, -0.32456207275390625, -0.3134002685546875, -0.30223846435546875, -0.29107666015625, -0.27991485595703125, -0.2687530517578125, -0.25759124755859375, -0.246429443359375, -0.23526763916015625, -0.2241058349609375, -0.21294403076171875, -0.2017822265625, -0.19062042236328125, -0.1794586181640625, -0.16829681396484375, -0.157135009765625, -0.14597320556640625, -0.1348114013671875, -0.12364959716796875, -0.11248779296875, -0.10132598876953125, -0.0901641845703125, -0.07900238037109375, -0.067840576171875, -0.05667877197265625, -0.0455169677734375, -0.03435516357421875, -0.023193359375, -0.01203155517578125, -0.0008697509765625, 0.01029205322265625, 0.021453857421875, 0.03261566162109375, 0.0437774658203125, 0.05493927001953125, 0.06610107421875, 0.07726287841796875, 0.0884246826171875, 0.09958648681640625, 0.110748291015625, 0.12191009521484375, 0.1330718994140625, 0.14423370361328125, 0.1553955078125, 0.16655731201171875, 0.1777191162109375, 0.18888092041015625, 0.200042724609375, 0.21120452880859375, 0.2223663330078125, 0.23352813720703125, 0.24468994140625, 0.25585174560546875, 0.2670135498046875, 0.27817535400390625, 0.289337158203125, 0.30049896240234375, 0.3116607666015625, 0.32282257080078125, 0.333984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 9.0, 17.0, 17.0, 22.0, 23.0, 38.0, 38.0, 45.0, 54.0, 51.0, 66.0, 75.0, 62.0, 69.0, 58.0, 66.0, 59.0, 54.0, 39.0, 40.0, 27.0, 16.0, 21.0, 10.0, 9.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4189453125, -0.40325164794921875, -0.3875579833984375, -0.37186431884765625, -0.356170654296875, -0.34047698974609375, -0.3247833251953125, -0.30908966064453125, -0.29339599609375, -0.27770233154296875, -0.2620086669921875, -0.24631500244140625, -0.230621337890625, -0.21492767333984375, -0.1992340087890625, -0.18354034423828125, -0.1678466796875, -0.15215301513671875, -0.1364593505859375, -0.12076568603515625, -0.105072021484375, -0.08937835693359375, -0.0736846923828125, -0.05799102783203125, -0.04229736328125, -0.02660369873046875, -0.0109100341796875, 0.00478363037109375, 0.020477294921875, 0.03617095947265625, 0.0518646240234375, 0.06755828857421875, 0.083251953125, 0.09894561767578125, 0.1146392822265625, 0.13033294677734375, 0.146026611328125, 0.16172027587890625, 0.1774139404296875, 0.19310760498046875, 0.20880126953125, 0.22449493408203125, 0.2401885986328125, 0.25588226318359375, 0.271575927734375, 0.28726959228515625, 0.3029632568359375, 0.31865692138671875, 0.3343505859375, 0.35004425048828125, 0.3657379150390625, 0.38143157958984375, 0.397125244140625, 0.41281890869140625, 0.4285125732421875, 0.44420623779296875, 0.45989990234375, 0.47559356689453125, 0.4912872314453125, 0.5069808959960938, 0.522674560546875, 0.5383682250976562, 0.5540618896484375, 0.5697555541992188, 0.58544921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 8.0, 15.0, 21.0, 31.0, 48.0, 75.0, 120.0, 208.0, 314.0, 656.0, 1429.0, 3989.0, 13795.0, 66542.0, 514598.0, 2702598.0, 772274.0, 92018.0, 17462.0, 4808.0, 1667.0, 692.0, 369.0, 212.0, 122.0, 71.0, 37.0, 26.0, 16.0, 18.0, 11.0, 8.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5458984375, -0.5268020629882812, -0.5077056884765625, -0.48860931396484375, -0.469512939453125, -0.45041656494140625, -0.4313201904296875, -0.41222381591796875, -0.39312744140625, -0.37403106689453125, -0.3549346923828125, -0.33583831787109375, -0.316741943359375, -0.29764556884765625, -0.2785491943359375, -0.25945281982421875, -0.2403564453125, -0.22126007080078125, -0.2021636962890625, -0.18306732177734375, -0.163970947265625, -0.14487457275390625, -0.1257781982421875, -0.10668182373046875, -0.08758544921875, -0.06848907470703125, -0.0493927001953125, -0.03029632568359375, -0.011199951171875, 0.00789642333984375, 0.0269927978515625, 0.04608917236328125, 0.065185546875, 0.08428192138671875, 0.1033782958984375, 0.12247467041015625, 0.141571044921875, 0.16066741943359375, 0.1797637939453125, 0.19886016845703125, 0.21795654296875, 0.23705291748046875, 0.2561492919921875, 0.27524566650390625, 0.294342041015625, 0.31343841552734375, 0.3325347900390625, 0.35163116455078125, 0.3707275390625, 0.38982391357421875, 0.4089202880859375, 0.42801666259765625, 0.447113037109375, 0.46620941162109375, 0.4853057861328125, 0.5044021606445312, 0.52349853515625, 0.5425949096679688, 0.5616912841796875, 0.5807876586914062, 0.599884033203125, 0.6189804077148438, 0.6380767822265625, 0.6571731567382812, 0.67626953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 4.0, 6.0, 18.0, 17.0, 29.0, 51.0, 78.0, 140.0, 228.0, 381.0, 529.0, 666.0, 677.0, 458.0, 297.0, 185.0, 101.0, 69.0, 43.0, 37.0, 12.0, 10.0, 11.0, 11.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5244140625, -0.5023651123046875, -0.480316162109375, -0.4582672119140625, -0.43621826171875, -0.4141693115234375, -0.392120361328125, -0.3700714111328125, -0.3480224609375, -0.3259735107421875, -0.303924560546875, -0.2818756103515625, -0.25982666015625, -0.2377777099609375, -0.215728759765625, -0.1936798095703125, -0.171630859375, -0.1495819091796875, -0.127532958984375, -0.1054840087890625, -0.08343505859375, -0.0613861083984375, -0.039337158203125, -0.0172882080078125, 0.0047607421875, 0.0268096923828125, 0.048858642578125, 0.0709075927734375, 0.09295654296875, 0.1150054931640625, 0.137054443359375, 0.1591033935546875, 0.18115234375, 0.2032012939453125, 0.225250244140625, 0.2472991943359375, 0.26934814453125, 0.2913970947265625, 0.313446044921875, 0.3354949951171875, 0.3575439453125, 0.3795928955078125, 0.401641845703125, 0.4236907958984375, 0.44573974609375, 0.4677886962890625, 0.489837646484375, 0.5118865966796875, 0.533935546875, 0.5559844970703125, 0.578033447265625, 0.6000823974609375, 0.62213134765625, 0.6441802978515625, 0.666229248046875, 0.6882781982421875, 0.7103271484375, 0.7323760986328125, 0.754425048828125, 0.7764739990234375, 0.79852294921875, 0.8205718994140625, 0.842620849609375, 0.8646697998046875, 0.88671875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 11.0, 15.0, 30.0, 48.0, 97.0, 121.0, 160.0, 149.0, 133.0, 98.0, 48.0, 41.0, 17.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.220745086669922, -3.1059622764587402, -2.9911797046661377, -2.876397132873535, -2.7616143226623535, -2.646831512451172, -2.5320489406585693, -2.417266368865967, -2.302483558654785, -2.1877007484436035, -2.072918176651001, -1.9581354856491089, -1.8433527946472168, -1.7285701036453247, -1.6137874126434326, -1.4990047216415405, -1.3842220306396484, -1.2694393396377563, -1.1546566486358643, -1.0398739576339722, -0.9250912666320801, -0.810308575630188, -0.6955258846282959, -0.5807431936264038, -0.4659605026245117, -0.35117781162261963, -0.23639512062072754, -0.12161242961883545, -0.006829738616943359, 0.10795295238494873, 0.22273564338684082, 0.3375183343887329, 0.452301025390625, 0.5670837163925171, 0.6818664073944092, 0.7966490983963013, 0.9114317893981934, 1.0262144804000854, 1.1409971714019775, 1.2557798624038696, 1.3705625534057617, 1.4853452444076538, 1.600127935409546, 1.714910626411438, 1.82969331741333, 1.9444760084152222, 2.0592586994171143, 2.174041271209717, 2.2888240814208984, 2.40360689163208, 2.5183894634246826, 2.633172035217285, 2.747954845428467, 2.8627376556396484, 2.977520227432251, 3.0923027992248535, 3.207085609436035, 3.321868419647217, 3.4366509914398193, 3.551433563232422, 3.6662163734436035, 3.780999183654785, 3.8957817554473877, 4.01056432723999, 4.125347137451172]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 8.0, 2.0, 8.0, 8.0, 6.0, 10.0, 12.0, 23.0, 22.0, 17.0, 25.0, 25.0, 21.0, 32.0, 23.0, 26.0, 36.0, 39.0, 38.0, 46.0, 44.0, 47.0, 42.0, 38.0, 45.0, 26.0, 31.0, 34.0, 28.0, 19.0, 23.0, 27.0, 16.0, 21.0, 22.0, 21.0, 12.0, 16.0, 7.0, 8.0, 8.0, 3.0, 8.0, 6.0, 5.0, 2.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.375675082206726, -1.3328278064727783, -1.2899805307388306, -1.2471332550048828, -1.2042860984802246, -1.1614388227462769, -1.118591547012329, -1.0757442712783813, -1.0328969955444336, -0.9900497198104858, -0.9472024440765381, -0.9043552279472351, -0.8615079522132874, -0.8186606764793396, -0.7758134603500366, -0.7329661846160889, -0.6901189088821411, -0.6472716331481934, -0.6044243574142456, -0.5615771412849426, -0.5187298655509949, -0.4758825898170471, -0.43303534388542175, -0.3901880979537964, -0.34734082221984863, -0.3044935464859009, -0.2616463005542755, -0.21879903972148895, -0.1759517788887024, -0.13310451805591583, -0.09025725722312927, -0.047410011291503906, -0.004562854766845703, 0.03828440606594086, 0.08113166689872742, 0.12397892773151398, 0.16682618856430054, 0.2096734493970871, 0.25252071022987366, 0.295367956161499, 0.3382152318954468, 0.38106250762939453, 0.4239097535610199, 0.46675699949264526, 0.509604275226593, 0.5524515509605408, 0.5952987670898438, 0.6381460428237915, 0.6809933185577393, 0.723840594291687, 0.7666878700256348, 0.8095350861549377, 0.8523823618888855, 0.8952296376228333, 0.9380768537521362, 0.980924129486084, 1.0237714052200317, 1.0666186809539795, 1.1094659566879272, 1.152313232421875, 1.1951603889465332, 1.238007664680481, 1.2808549404144287, 1.3237022161483765, 1.3665494918823242]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 4.0, 11.0, 7.0, 12.0, 32.0, 35.0, 59.0, 132.0, 273.0, 515.0, 1057.0, 2520.0, 6358.0, 21625.0, 132842.0, 564253.0, 265039.0, 38223.0, 9302.0, 3436.0, 1434.0, 659.0, 302.0, 193.0, 91.0, 52.0, 22.0, 22.0, 7.0, 6.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.9658203125, -0.9408493041992188, -0.9158782958984375, -0.8909072875976562, -0.865936279296875, -0.8409652709960938, -0.8159942626953125, -0.7910232543945312, -0.76605224609375, -0.7410812377929688, -0.7161102294921875, -0.6911392211914062, -0.666168212890625, -0.6411972045898438, -0.6162261962890625, -0.5912551879882812, -0.5662841796875, -0.5413131713867188, -0.5163421630859375, -0.49137115478515625, -0.466400146484375, -0.44142913818359375, -0.4164581298828125, -0.39148712158203125, -0.36651611328125, -0.34154510498046875, -0.3165740966796875, -0.29160308837890625, -0.266632080078125, -0.24166107177734375, -0.2166900634765625, -0.19171905517578125, -0.166748046875, -0.14177703857421875, -0.1168060302734375, -0.09183502197265625, -0.066864013671875, -0.04189300537109375, -0.0169219970703125, 0.00804901123046875, 0.03302001953125, 0.05799102783203125, 0.0829620361328125, 0.10793304443359375, 0.132904052734375, 0.15787506103515625, 0.1828460693359375, 0.20781707763671875, 0.2327880859375, 0.25775909423828125, 0.2827301025390625, 0.30770111083984375, 0.332672119140625, 0.35764312744140625, 0.3826141357421875, 0.40758514404296875, 0.43255615234375, 0.45752716064453125, 0.4824981689453125, 0.5074691772460938, 0.532440185546875, 0.5574111938476562, 0.5823822021484375, 0.6073532104492188, 0.63232421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 6.0, 11.0, 7.0, 11.0, 18.0, 11.0, 18.0, 22.0, 20.0, 22.0, 34.0, 35.0, 50.0, 62.0, 45.0, 44.0, 45.0, 58.0, 57.0, 44.0, 60.0, 48.0, 31.0, 40.0, 22.0, 21.0, 26.0, 29.0, 20.0, 15.0, 19.0, 17.0, 11.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4169921875, -0.40459442138671875, -0.3921966552734375, -0.37979888916015625, -0.367401123046875, -0.35500335693359375, -0.3426055908203125, -0.33020782470703125, -0.31781005859375, -0.30541229248046875, -0.2930145263671875, -0.28061676025390625, -0.268218994140625, -0.25582122802734375, -0.2434234619140625, -0.23102569580078125, -0.2186279296875, -0.20623016357421875, -0.1938323974609375, -0.18143463134765625, -0.169036865234375, -0.15663909912109375, -0.1442413330078125, -0.13184356689453125, -0.11944580078125, -0.10704803466796875, -0.0946502685546875, -0.08225250244140625, -0.069854736328125, -0.05745697021484375, -0.0450592041015625, -0.03266143798828125, -0.020263671875, -0.00786590576171875, 0.0045318603515625, 0.01692962646484375, 0.029327392578125, 0.04172515869140625, 0.0541229248046875, 0.06652069091796875, 0.07891845703125, 0.09131622314453125, 0.1037139892578125, 0.11611175537109375, 0.128509521484375, 0.14090728759765625, 0.1533050537109375, 0.16570281982421875, 0.1781005859375, 0.19049835205078125, 0.2028961181640625, 0.21529388427734375, 0.227691650390625, 0.24008941650390625, 0.2524871826171875, 0.26488494873046875, 0.27728271484375, 0.28968048095703125, 0.3020782470703125, 0.31447601318359375, 0.326873779296875, 0.33927154541015625, 0.3516693115234375, 0.36406707763671875, 0.37646484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 5.0, 15.0, 30.0, 30.0, 39.0, 65.0, 111.0, 203.0, 344.0, 640.0, 1248.0, 2473.0, 4750.0, 10224.0, 23227.0, 65226.0, 202243.0, 372765.0, 236605.0, 78691.0, 26925.0, 11401.0, 5500.0, 2742.0, 1376.0, 721.0, 393.0, 220.0, 120.0, 66.0, 54.0, 22.0, 19.0, 13.0, 7.0, 8.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.487548828125, -0.47303009033203125, -0.4585113525390625, -0.44399261474609375, -0.429473876953125, -0.41495513916015625, -0.4004364013671875, -0.38591766357421875, -0.37139892578125, -0.35688018798828125, -0.3423614501953125, -0.32784271240234375, -0.313323974609375, -0.29880523681640625, -0.2842864990234375, -0.26976776123046875, -0.2552490234375, -0.24073028564453125, -0.2262115478515625, -0.21169281005859375, -0.197174072265625, -0.18265533447265625, -0.1681365966796875, -0.15361785888671875, -0.13909912109375, -0.12458038330078125, -0.1100616455078125, -0.09554290771484375, -0.081024169921875, -0.06650543212890625, -0.0519866943359375, -0.03746795654296875, -0.02294921875, -0.00843048095703125, 0.0060882568359375, 0.02060699462890625, 0.035125732421875, 0.04964447021484375, 0.0641632080078125, 0.07868194580078125, 0.09320068359375, 0.10771942138671875, 0.1222381591796875, 0.13675689697265625, 0.151275634765625, 0.16579437255859375, 0.1803131103515625, 0.19483184814453125, 0.2093505859375, 0.22386932373046875, 0.2383880615234375, 0.25290679931640625, 0.267425537109375, 0.28194427490234375, 0.2964630126953125, 0.31098175048828125, 0.32550048828125, 0.34001922607421875, 0.3545379638671875, 0.36905670166015625, 0.383575439453125, 0.39809417724609375, 0.4126129150390625, 0.42713165283203125, 0.441650390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 4.0, 11.0, 8.0, 7.0, 8.0, 9.0, 28.0, 22.0, 12.0, 19.0, 33.0, 41.0, 40.0, 37.0, 38.0, 50.0, 54.0, 56.0, 39.0, 48.0, 48.0, 37.0, 42.0, 51.0, 42.0, 40.0, 35.0, 23.0, 22.0, 16.0, 11.0, 11.0, 8.0, 8.0, 6.0, 8.0, 5.0, 3.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.1376953125, -1.1070938110351562, -1.0764923095703125, -1.0458908081054688, -1.015289306640625, -0.9846878051757812, -0.9540863037109375, -0.9234848022460938, -0.89288330078125, -0.8622817993164062, -0.8316802978515625, -0.8010787963867188, -0.770477294921875, -0.7398757934570312, -0.7092742919921875, -0.6786727905273438, -0.6480712890625, -0.6174697875976562, -0.5868682861328125, -0.5562667846679688, -0.525665283203125, -0.49506378173828125, -0.4644622802734375, -0.43386077880859375, -0.40325927734375, -0.37265777587890625, -0.3420562744140625, -0.31145477294921875, -0.280853271484375, -0.25025177001953125, -0.2196502685546875, -0.18904876708984375, -0.158447265625, -0.12784576416015625, -0.0972442626953125, -0.06664276123046875, -0.036041259765625, -0.00543975830078125, 0.0251617431640625, 0.05576324462890625, 0.08636474609375, 0.11696624755859375, 0.1475677490234375, 0.17816925048828125, 0.208770751953125, 0.23937225341796875, 0.2699737548828125, 0.30057525634765625, 0.3311767578125, 0.36177825927734375, 0.3923797607421875, 0.42298126220703125, 0.453582763671875, 0.48418426513671875, 0.5147857666015625, 0.5453872680664062, 0.57598876953125, 0.6065902709960938, 0.6371917724609375, 0.6677932739257812, 0.698394775390625, 0.7289962768554688, 0.7595977783203125, 0.7901992797851562, 0.82080078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 2.0, 6.0, 6.0, 8.0, 13.0, 25.0, 39.0, 52.0, 71.0, 102.0, 167.0, 223.0, 378.0, 659.0, 1249.0, 2496.0, 5470.0, 14311.0, 51543.0, 329269.0, 516159.0, 91097.0, 20865.0, 7466.0, 3225.0, 1571.0, 813.0, 458.0, 291.0, 176.0, 112.0, 72.0, 52.0, 38.0, 27.0, 12.0, 14.0, 13.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.235107421875, -0.22731399536132812, -0.21952056884765625, -0.21172714233398438, -0.2039337158203125, -0.19614028930664062, -0.18834686279296875, -0.18055343627929688, -0.172760009765625, -0.16496658325195312, -0.15717315673828125, -0.14937973022460938, -0.1415863037109375, -0.13379287719726562, -0.12599945068359375, -0.11820602416992188, -0.11041259765625, -0.10261917114257812, -0.09482574462890625, -0.08703231811523438, -0.0792388916015625, -0.07144546508789062, -0.06365203857421875, -0.055858612060546875, -0.048065185546875, -0.040271759033203125, -0.03247833251953125, -0.024684906005859375, -0.0168914794921875, -0.009098052978515625, -0.00130462646484375, 0.006488800048828125, 0.0142822265625, 0.022075653076171875, 0.02986907958984375, 0.037662506103515625, 0.0454559326171875, 0.053249359130859375, 0.06104278564453125, 0.06883621215820312, 0.076629638671875, 0.08442306518554688, 0.09221649169921875, 0.10000991821289062, 0.1078033447265625, 0.11559677124023438, 0.12339019775390625, 0.13118362426757812, 0.13897705078125, 0.14677047729492188, 0.15456390380859375, 0.16235733032226562, 0.1701507568359375, 0.17794418334960938, 0.18573760986328125, 0.19353103637695312, 0.201324462890625, 0.20911788940429688, 0.21691131591796875, 0.22470474243164062, 0.2324981689453125, 0.24029159545898438, 0.24808502197265625, 0.2558784484863281, 0.263671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 7.0, 11.0, 10.0, 7.0, 21.0, 39.0, 76.0, 162.0, 212.0, 199.0, 122.0, 62.0, 17.0, 20.0, 9.0, 11.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.666515350341797e-05, -8.302740752696991e-05, -7.938966155052185e-05, -7.575191557407379e-05, -7.211416959762573e-05, -6.847642362117767e-05, -6.483867764472961e-05, -6.120093166828156e-05, -5.7563185691833496e-05, -5.392543971538544e-05, -5.028769373893738e-05, -4.664994776248932e-05, -4.301220178604126e-05, -3.93744558095932e-05, -3.573670983314514e-05, -3.209896385669708e-05, -2.8461217880249023e-05, -2.4823471903800964e-05, -2.1185725927352905e-05, -1.7547979950904846e-05, -1.3910233974456787e-05, -1.0272487998008728e-05, -6.634742021560669e-06, -2.99699604511261e-06, 6.407499313354492e-07, 4.278495907783508e-06, 7.916241884231567e-06, 1.1553987860679626e-05, 1.5191733837127686e-05, 1.8829479813575745e-05, 2.2467225790023804e-05, 2.6104971766471863e-05, 2.9742717742919922e-05, 3.338046371936798e-05, 3.701820969581604e-05, 4.06559556722641e-05, 4.429370164871216e-05, 4.793144762516022e-05, 5.1569193601608276e-05, 5.5206939578056335e-05, 5.8844685554504395e-05, 6.248243153095245e-05, 6.612017750740051e-05, 6.975792348384857e-05, 7.339566946029663e-05, 7.703341543674469e-05, 8.067116141319275e-05, 8.430890738964081e-05, 8.794665336608887e-05, 9.158439934253693e-05, 9.522214531898499e-05, 9.885989129543304e-05, 0.0001024976372718811, 0.00010613538324832916, 0.00010977312922477722, 0.00011341087520122528, 0.00011704862117767334, 0.0001206863671541214, 0.00012432411313056946, 0.00012796185910701752, 0.00013159960508346558, 0.00013523735105991364, 0.0001388750970363617, 0.00014251284301280975, 0.0001461505889892578]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 6.0, 18.0, 21.0, 37.0, 68.0, 119.0, 199.0, 409.0, 692.0, 1479.0, 4079.0, 12482.0, 50392.0, 255613.0, 516361.0, 159643.0, 32646.0, 8864.0, 3059.0, 1106.0, 558.0, 251.0, 151.0, 102.0, 64.0, 55.0, 23.0, 17.0, 12.0, 9.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.26318359375, -0.2561378479003906, -0.24909210205078125, -0.24204635620117188, -0.2350006103515625, -0.22795486450195312, -0.22090911865234375, -0.21386337280273438, -0.206817626953125, -0.19977188110351562, -0.19272613525390625, -0.18568038940429688, -0.1786346435546875, -0.17158889770507812, -0.16454315185546875, -0.15749740600585938, -0.15045166015625, -0.14340591430664062, -0.13636016845703125, -0.12931442260742188, -0.1222686767578125, -0.11522293090820312, -0.10817718505859375, -0.10113143920898438, -0.094085693359375, -0.08703994750976562, -0.07999420166015625, -0.07294845581054688, -0.0659027099609375, -0.058856964111328125, -0.05181121826171875, -0.044765472412109375, -0.0377197265625, -0.030673980712890625, -0.02362823486328125, -0.016582489013671875, -0.0095367431640625, -0.002490997314453125, 0.00455474853515625, 0.011600494384765625, 0.018646240234375, 0.025691986083984375, 0.03273773193359375, 0.039783477783203125, 0.0468292236328125, 0.053874969482421875, 0.06092071533203125, 0.06796646118164062, 0.07501220703125, 0.08205795288085938, 0.08910369873046875, 0.09614944458007812, 0.1031951904296875, 0.11024093627929688, 0.11728668212890625, 0.12433242797851562, 0.131378173828125, 0.13842391967773438, 0.14546966552734375, 0.15251541137695312, 0.1595611572265625, 0.16660690307617188, 0.17365264892578125, 0.18069839477539062, 0.187744140625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 11.0, 7.0, 13.0, 11.0, 16.0, 19.0, 42.0, 48.0, 78.0, 96.0, 97.0, 96.0, 93.0, 84.0, 64.0, 49.0, 48.0, 26.0, 25.0, 11.0, 21.0, 9.0, 9.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177001953125, -0.1699981689453125, -0.162994384765625, -0.1559906005859375, -0.14898681640625, -0.1419830322265625, -0.134979248046875, -0.1279754638671875, -0.1209716796875, -0.1139678955078125, -0.106964111328125, -0.0999603271484375, -0.09295654296875, -0.0859527587890625, -0.078948974609375, -0.0719451904296875, -0.06494140625, -0.0579376220703125, -0.050933837890625, -0.0439300537109375, -0.03692626953125, -0.0299224853515625, -0.022918701171875, -0.0159149169921875, -0.0089111328125, -0.0019073486328125, 0.005096435546875, 0.0121002197265625, 0.01910400390625, 0.0261077880859375, 0.033111572265625, 0.0401153564453125, 0.047119140625, 0.0541229248046875, 0.061126708984375, 0.0681304931640625, 0.07513427734375, 0.0821380615234375, 0.089141845703125, 0.0961456298828125, 0.1031494140625, 0.1101531982421875, 0.117156982421875, 0.1241607666015625, 0.13116455078125, 0.1381683349609375, 0.145172119140625, 0.1521759033203125, 0.1591796875, 0.1661834716796875, 0.173187255859375, 0.1801910400390625, 0.18719482421875, 0.1941986083984375, 0.201202392578125, 0.2082061767578125, 0.2152099609375, 0.2222137451171875, 0.229217529296875, 0.2362213134765625, 0.24322509765625, 0.2502288818359375, 0.257232666015625, 0.2642364501953125, 0.271240234375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 10.0, 12.0, 15.0, 37.0, 63.0, 91.0, 120.0, 182.0, 143.0, 114.0, 74.0, 49.0, 34.0, 14.0, 13.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.7111592292785645, -2.613602876663208, -2.5160465240478516, -2.418490171432495, -2.3209338188171387, -2.2233774662017822, -2.125821113586426, -2.0282645225524902, -1.9307082891464233, -1.833151936531067, -1.7355955839157104, -1.6380391120910645, -1.540482759475708, -1.4429264068603516, -1.3453700542449951, -1.2478137016296387, -1.1502573490142822, -1.0527009963989258, -0.9551446437835693, -0.8575882315635681, -0.7600318789482117, -0.6624755263328552, -0.564919114112854, -0.46736276149749756, -0.3698064088821411, -0.27225005626678467, -0.17469367384910583, -0.077137291431427, 0.020419061183929443, 0.11797541379928589, 0.2155318260192871, 0.31308817863464355, 0.4106447696685791, 0.5082011222839355, 0.605757474899292, 0.7033138871192932, 0.8008702397346497, 0.8984265923500061, 0.9959830045700073, 1.0935393571853638, 1.1910957098007202, 1.2886520624160767, 1.386208415031433, 1.483764886856079, 1.5813212394714355, 1.678877592086792, 1.7764339447021484, 1.8739902973175049, 1.9715466499328613, 2.0691030025482178, 2.166659355163574, 2.2642157077789307, 2.361772060394287, 2.4593284130096436, 2.556884765625, 2.6544413566589355, 2.751997470855713, 2.8495538234710693, 2.947110176086426, 3.0446665287017822, 3.1422228813171387, 3.239779233932495, 3.3373355865478516, 3.434892177581787, 3.5324485301971436]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 7.0, 5.0, 4.0, 6.0, 10.0, 15.0, 23.0, 15.0, 26.0, 30.0, 28.0, 40.0, 38.0, 39.0, 39.0, 40.0, 37.0, 44.0, 47.0, 51.0, 42.0, 33.0, 35.0, 36.0, 35.0, 40.0, 28.0, 28.0, 22.0, 30.0, 22.0, 11.0, 18.0, 17.0, 10.0, 10.0, 5.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.0485012531280518, -1.9815906286239624, -1.9146798849105835, -1.8477692604064941, -1.7808585166931152, -1.7139478921890259, -1.6470372676849365, -1.5801265239715576, -1.5132158994674683, -1.446305274963379, -1.37939453125, -1.3124839067459106, -1.2455732822418213, -1.1786625385284424, -1.111751914024353, -1.0448412895202637, -0.9779305458068848, -0.9110198616981506, -0.8441091775894165, -0.7771985530853271, -0.710287868976593, -0.6433771848678589, -0.5764665603637695, -0.5095558762550354, -0.44264519214630127, -0.37573450803756714, -0.3088238537311554, -0.24191318452358246, -0.17500251531600952, -0.10809183120727539, -0.04118117690086365, 0.025729477405548096, 0.09263992309570312, 0.15955059230327606, 0.226461261510849, 0.29337191581726074, 0.3602825999259949, 0.427193284034729, 0.49410393834114075, 0.5610145926475525, 0.6279252767562866, 0.6948359608650208, 0.7617466449737549, 0.8286572694778442, 0.8955679535865784, 0.9624786376953125, 1.0293892621994019, 1.0962998867034912, 1.1632106304168701, 1.2301212549209595, 1.2970319986343384, 1.3639426231384277, 1.4308533668518066, 1.497763991355896, 1.5646746158599854, 1.6315853595733643, 1.6984959840774536, 1.765406608581543, 1.8323173522949219, 1.8992279767990112, 1.9661386013031006, 2.0330493450164795, 2.0999600887298584, 2.166870594024658, 2.233781337738037]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 16.0, 16.0, 28.0, 39.0, 49.0, 101.0, 170.0, 373.0, 668.0, 1568.0, 4284.0, 14246.0, 57224.0, 238484.0, 810297.0, 1550324.0, 1056930.0, 346999.0, 82698.0, 19501.0, 5913.0, 2239.0, 976.0, 456.0, 235.0, 150.0, 88.0, 65.0, 43.0, 31.0, 22.0, 12.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.48779296875, -0.4757881164550781, -0.46378326416015625, -0.4517784118652344, -0.4397735595703125, -0.4277687072753906, -0.41576385498046875, -0.4037590026855469, -0.391754150390625, -0.3797492980957031, -0.36774444580078125, -0.3557395935058594, -0.3437347412109375, -0.3317298889160156, -0.31972503662109375, -0.3077201843261719, -0.29571533203125, -0.2837104797363281, -0.27170562744140625, -0.2597007751464844, -0.2476959228515625, -0.23569107055664062, -0.22368621826171875, -0.21168136596679688, -0.199676513671875, -0.18767166137695312, -0.17566680908203125, -0.16366195678710938, -0.1516571044921875, -0.13965225219726562, -0.12764739990234375, -0.11564254760742188, -0.1036376953125, -0.09163284301757812, -0.07962799072265625, -0.06762313842773438, -0.0556182861328125, -0.043613433837890625, -0.03160858154296875, -0.019603729248046875, -0.007598876953125, 0.004405975341796875, 0.01641082763671875, 0.028415679931640625, 0.0404205322265625, 0.052425384521484375, 0.06443023681640625, 0.07643508911132812, 0.08843994140625, 0.10044479370117188, 0.11244964599609375, 0.12445449829101562, 0.1364593505859375, 0.14846420288085938, 0.16046905517578125, 0.17247390747070312, 0.184478759765625, 0.19648361206054688, 0.20848846435546875, 0.22049331665039062, 0.2324981689453125, 0.24450302124023438, 0.25650787353515625, 0.2685127258300781, 0.280517578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 9.0, 3.0, 7.0, 7.0, 11.0, 11.0, 22.0, 13.0, 19.0, 19.0, 27.0, 28.0, 39.0, 36.0, 38.0, 36.0, 52.0, 46.0, 47.0, 45.0, 51.0, 47.0, 40.0, 41.0, 41.0, 38.0, 28.0, 23.0, 41.0, 19.0, 22.0, 19.0, 13.0, 12.0, 13.0, 6.0, 9.0, 9.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.394775390625, -0.384033203125, -0.373291015625, -0.362548828125, -0.351806640625, -0.341064453125, -0.330322265625, -0.319580078125, -0.308837890625, -0.298095703125, -0.287353515625, -0.276611328125, -0.265869140625, -0.255126953125, -0.244384765625, -0.233642578125, -0.222900390625, -0.212158203125, -0.201416015625, -0.190673828125, -0.179931640625, -0.169189453125, -0.158447265625, -0.147705078125, -0.136962890625, -0.126220703125, -0.115478515625, -0.104736328125, -0.093994140625, -0.083251953125, -0.072509765625, -0.061767578125, -0.051025390625, -0.040283203125, -0.029541015625, -0.018798828125, -0.008056640625, 0.002685546875, 0.013427734375, 0.024169921875, 0.034912109375, 0.045654296875, 0.056396484375, 0.067138671875, 0.077880859375, 0.088623046875, 0.099365234375, 0.110107421875, 0.120849609375, 0.131591796875, 0.142333984375, 0.153076171875, 0.163818359375, 0.174560546875, 0.185302734375, 0.196044921875, 0.206787109375, 0.217529296875, 0.228271484375, 0.239013671875, 0.249755859375, 0.260498046875, 0.271240234375, 0.281982421875, 0.292724609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 7.0, 5.0, 3.0, 14.0, 22.0, 30.0, 41.0, 63.0, 96.0, 173.0, 285.0, 461.0, 912.0, 1666.0, 3554.0, 8600.0, 26704.0, 124287.0, 948767.0, 2511069.0, 464978.0, 72250.0, 18226.0, 6205.0, 2754.0, 1373.0, 728.0, 408.0, 224.0, 156.0, 74.0, 48.0, 42.0, 28.0, 7.0, 10.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55615234375, -0.5404129028320312, -0.5246734619140625, -0.5089340209960938, -0.493194580078125, -0.47745513916015625, -0.4617156982421875, -0.44597625732421875, -0.43023681640625, -0.41449737548828125, -0.3987579345703125, -0.38301849365234375, -0.367279052734375, -0.35153961181640625, -0.3358001708984375, -0.32006072998046875, -0.3043212890625, -0.28858184814453125, -0.2728424072265625, -0.25710296630859375, -0.241363525390625, -0.22562408447265625, -0.2098846435546875, -0.19414520263671875, -0.17840576171875, -0.16266632080078125, -0.1469268798828125, -0.13118743896484375, -0.115447998046875, -0.09970855712890625, -0.0839691162109375, -0.06822967529296875, -0.052490234375, -0.03675079345703125, -0.0210113525390625, -0.00527191162109375, 0.010467529296875, 0.02620697021484375, 0.0419464111328125, 0.05768585205078125, 0.07342529296875, 0.08916473388671875, 0.1049041748046875, 0.12064361572265625, 0.136383056640625, 0.15212249755859375, 0.1678619384765625, 0.18360137939453125, 0.1993408203125, 0.21508026123046875, 0.2308197021484375, 0.24655914306640625, 0.262298583984375, 0.27803802490234375, 0.2937774658203125, 0.30951690673828125, 0.32525634765625, 0.34099578857421875, 0.3567352294921875, 0.37247467041015625, 0.388214111328125, 0.40395355224609375, 0.4196929931640625, 0.43543243408203125, 0.451171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 14.0, 7.0, 16.0, 14.0, 18.0, 38.0, 53.0, 69.0, 122.0, 184.0, 300.0, 428.0, 603.0, 669.0, 511.0, 345.0, 215.0, 146.0, 96.0, 79.0, 43.0, 34.0, 28.0, 9.0, 7.0, 0.0, 7.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.75390625, -0.7346878051757812, -0.7154693603515625, -0.6962509155273438, -0.677032470703125, -0.6578140258789062, -0.6385955810546875, -0.6193771362304688, -0.60015869140625, -0.5809402465820312, -0.5617218017578125, -0.5425033569335938, -0.523284912109375, -0.5040664672851562, -0.4848480224609375, -0.46562957763671875, -0.4464111328125, -0.42719268798828125, -0.4079742431640625, -0.38875579833984375, -0.369537353515625, -0.35031890869140625, -0.3311004638671875, -0.31188201904296875, -0.29266357421875, -0.27344512939453125, -0.2542266845703125, -0.23500823974609375, -0.215789794921875, -0.19657135009765625, -0.1773529052734375, -0.15813446044921875, -0.138916015625, -0.11969757080078125, -0.1004791259765625, -0.08126068115234375, -0.062042236328125, -0.04282379150390625, -0.0236053466796875, -0.00438690185546875, 0.01483154296875, 0.03404998779296875, 0.0532684326171875, 0.07248687744140625, 0.091705322265625, 0.11092376708984375, 0.1301422119140625, 0.14936065673828125, 0.1685791015625, 0.18779754638671875, 0.2070159912109375, 0.22623443603515625, 0.245452880859375, 0.26467132568359375, 0.2838897705078125, 0.30310821533203125, 0.32232666015625, 0.34154510498046875, 0.3607635498046875, 0.37998199462890625, 0.399200439453125, 0.41841888427734375, 0.4376373291015625, 0.45685577392578125, 0.47607421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 10.0, 22.0, 59.0, 144.0, 197.0, 273.0, 151.0, 78.0, 36.0, 11.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.9995903968811035, -6.806433200836182, -6.61327600479126, -6.420118808746338, -6.226961612701416, -6.033804416656494, -5.840646743774414, -5.647489547729492, -5.45433235168457, -5.261175155639648, -5.068017959594727, -4.874860763549805, -4.681703567504883, -4.488546371459961, -4.295389175415039, -4.102231979370117, -3.9090747833251953, -3.7159175872802734, -3.5227603912353516, -3.3296031951904297, -3.136445999145508, -2.943288803100586, -2.750131368637085, -2.556974172592163, -2.363816976547241, -2.1706597805023193, -1.9775025844573975, -1.784345269203186, -1.5911880731582642, -1.3980308771133423, -1.2048735618591309, -1.011716365814209, -0.8185586929321289, -0.625401496887207, -0.4322442412376404, -0.23908698558807373, -0.045929789543151855, 0.14722740650177002, 0.34038472175598145, 0.5335419178009033, 0.7266991138458252, 0.9198563098907471, 1.113013505935669, 1.3061708211898804, 1.4993280172348022, 1.6924852132797241, 1.8856425285339355, 2.0787997245788574, 2.2719569206237793, 2.465114116668701, 2.658271312713623, 2.851428508758545, 3.044585704803467, 3.2377429008483887, 3.4309003353118896, 3.6240575313568115, 3.8172147274017334, 4.010372161865234, 4.203529357910156, 4.396686553955078, 4.58984375, 4.783000946044922, 4.976158142089844, 5.169315338134766, 5.3624725341796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 14.0, 12.0, 11.0, 19.0, 20.0, 26.0, 40.0, 44.0, 38.0, 42.0, 56.0, 71.0, 58.0, 61.0, 75.0, 43.0, 55.0, 48.0, 43.0, 35.0, 24.0, 30.0, 25.0, 28.0, 17.0, 16.0, 11.0, 11.0, 8.0, 5.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.229010581970215, -2.1601381301879883, -2.091265916824341, -2.0223934650421143, -1.9535212516784668, -1.8846487998962402, -1.8157764673233032, -1.7469041347503662, -1.6780318021774292, -1.6091594696044922, -1.5402871370315552, -1.4714148044586182, -1.4025423526763916, -1.3336701393127441, -1.2647976875305176, -1.1959253549575806, -1.1270530223846436, -1.0581806898117065, -0.9893083572387695, -0.9204359650611877, -0.8515636324882507, -0.7826912999153137, -0.7138189077377319, -0.6449465751647949, -0.5760742425918579, -0.5072019100189209, -0.4383295476436615, -0.3694571852684021, -0.3005848526954651, -0.23171252012252808, -0.16284015774726868, -0.09396779537200928, -0.025095701217651367, 0.04377664625644684, 0.11264899373054504, 0.18152134120464325, 0.25039368867874146, 0.31926602125167847, 0.38813838362693787, 0.45701074600219727, 0.5258830785751343, 0.5947554111480713, 0.6636277437210083, 0.7325001358985901, 0.8013724684715271, 0.8702448010444641, 0.9391171932220459, 1.007989525794983, 1.07686185836792, 1.145734190940857, 1.214606523513794, 1.283478856086731, 1.352351188659668, 1.4212236404418945, 1.4900959730148315, 1.5589683055877686, 1.6278406381607056, 1.6967129707336426, 1.7655853033065796, 1.8344576358795166, 1.9033300876617432, 1.9722023010253906, 2.041074752807617, 2.1099472045898438, 2.178819417953491]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 0.0, 8.0, 11.0, 8.0, 6.0, 13.0, 12.0, 26.0, 35.0, 48.0, 82.0, 111.0, 190.0, 296.0, 585.0, 891.0, 1792.0, 3416.0, 6248.0, 12592.0, 24492.0, 48689.0, 91940.0, 160636.0, 217723.0, 200236.0, 130746.0, 71861.0, 36949.0, 18574.0, 9590.0, 4961.0, 2557.0, 1350.0, 776.0, 421.0, 262.0, 137.0, 93.0, 70.0, 50.0, 26.0, 14.0, 14.0, 8.0, 4.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.270263671875, -0.2617645263671875, -0.253265380859375, -0.2447662353515625, -0.23626708984375, -0.2277679443359375, -0.219268798828125, -0.2107696533203125, -0.2022705078125, -0.1937713623046875, -0.185272216796875, -0.1767730712890625, -0.16827392578125, -0.1597747802734375, -0.151275634765625, -0.1427764892578125, -0.13427734375, -0.1257781982421875, -0.117279052734375, -0.1087799072265625, -0.10028076171875, -0.0917816162109375, -0.083282470703125, -0.0747833251953125, -0.0662841796875, -0.0577850341796875, -0.049285888671875, -0.0407867431640625, -0.03228759765625, -0.0237884521484375, -0.015289306640625, -0.0067901611328125, 0.001708984375, 0.0102081298828125, 0.018707275390625, 0.0272064208984375, 0.03570556640625, 0.0442047119140625, 0.052703857421875, 0.0612030029296875, 0.0697021484375, 0.0782012939453125, 0.086700439453125, 0.0951995849609375, 0.10369873046875, 0.1121978759765625, 0.120697021484375, 0.1291961669921875, 0.1376953125, 0.1461944580078125, 0.154693603515625, 0.1631927490234375, 0.17169189453125, 0.1801910400390625, 0.188690185546875, 0.1971893310546875, 0.2056884765625, 0.2141876220703125, 0.222686767578125, 0.2311859130859375, 0.23968505859375, 0.2481842041015625, 0.256683349609375, 0.2651824951171875, 0.273681640625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 12.0, 4.0, 5.0, 15.0, 19.0, 25.0, 25.0, 27.0, 40.0, 29.0, 47.0, 42.0, 47.0, 62.0, 50.0, 46.0, 50.0, 52.0, 41.0, 50.0, 47.0, 43.0, 38.0, 28.0, 30.0, 24.0, 17.0, 17.0, 17.0, 10.0, 8.0, 12.0, 7.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.34830474853515625, -0.3355255126953125, -0.32274627685546875, -0.309967041015625, -0.29718780517578125, -0.2844085693359375, -0.27162933349609375, -0.25885009765625, -0.24607086181640625, -0.2332916259765625, -0.22051239013671875, -0.207733154296875, -0.19495391845703125, -0.1821746826171875, -0.16939544677734375, -0.1566162109375, -0.14383697509765625, -0.1310577392578125, -0.11827850341796875, -0.105499267578125, -0.09272003173828125, -0.0799407958984375, -0.06716156005859375, -0.05438232421875, -0.04160308837890625, -0.0288238525390625, -0.01604461669921875, -0.003265380859375, 0.00951385498046875, 0.0222930908203125, 0.03507232666015625, 0.0478515625, 0.06063079833984375, 0.0734100341796875, 0.08618927001953125, 0.098968505859375, 0.11174774169921875, 0.1245269775390625, 0.13730621337890625, 0.15008544921875, 0.16286468505859375, 0.1756439208984375, 0.18842315673828125, 0.201202392578125, 0.21398162841796875, 0.2267608642578125, 0.23954010009765625, 0.2523193359375, 0.26509857177734375, 0.2778778076171875, 0.29065704345703125, 0.303436279296875, 0.31621551513671875, 0.3289947509765625, 0.34177398681640625, 0.35455322265625, 0.36733245849609375, 0.3801116943359375, 0.39289093017578125, 0.405670166015625, 0.41844940185546875, 0.4312286376953125, 0.44400787353515625, 0.456787109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 6.0, 8.0, 12.0, 13.0, 26.0, 32.0, 47.0, 75.0, 124.0, 217.0, 397.0, 821.0, 1532.0, 3532.0, 8267.0, 20644.0, 54851.0, 143575.0, 319427.0, 285607.0, 128629.0, 48502.0, 18468.0, 7548.0, 3148.0, 1395.0, 760.0, 397.0, 206.0, 99.0, 72.0, 37.0, 18.0, 19.0, 11.0, 7.0, 4.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.451904296875, -0.4396705627441406, -0.42743682861328125, -0.4152030944824219, -0.4029693603515625, -0.3907356262207031, -0.37850189208984375, -0.3662681579589844, -0.354034423828125, -0.3418006896972656, -0.32956695556640625, -0.3173332214355469, -0.3050994873046875, -0.2928657531738281, -0.28063201904296875, -0.2683982849121094, -0.25616455078125, -0.24393081665039062, -0.23169708251953125, -0.21946334838867188, -0.2072296142578125, -0.19499588012695312, -0.18276214599609375, -0.17052841186523438, -0.158294677734375, -0.14606094360351562, -0.13382720947265625, -0.12159347534179688, -0.1093597412109375, -0.09712600708007812, -0.08489227294921875, -0.07265853881835938, -0.0604248046875, -0.048191070556640625, -0.03595733642578125, -0.023723602294921875, -0.0114898681640625, 0.000743865966796875, 0.01297760009765625, 0.025211334228515625, 0.037445068359375, 0.049678802490234375, 0.06191253662109375, 0.07414627075195312, 0.0863800048828125, 0.09861373901367188, 0.11084747314453125, 0.12308120727539062, 0.13531494140625, 0.14754867553710938, 0.15978240966796875, 0.17201614379882812, 0.1842498779296875, 0.19648361206054688, 0.20871734619140625, 0.22095108032226562, 0.233184814453125, 0.24541854858398438, 0.25765228271484375, 0.2698860168457031, 0.2821197509765625, 0.2943534851074219, 0.30658721923828125, 0.3188209533691406, 0.3310546875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 7.0, 7.0, 18.0, 15.0, 17.0, 24.0, 23.0, 25.0, 24.0, 28.0, 44.0, 34.0, 37.0, 34.0, 52.0, 51.0, 42.0, 40.0, 41.0, 44.0, 39.0, 45.0, 30.0, 24.0, 30.0, 30.0, 34.0, 18.0, 27.0, 18.0, 13.0, 15.0, 12.0, 10.0, 10.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.9443359375, -0.91766357421875, -0.8909912109375, -0.86431884765625, -0.837646484375, -0.81097412109375, -0.7843017578125, -0.75762939453125, -0.73095703125, -0.70428466796875, -0.6776123046875, -0.65093994140625, -0.624267578125, -0.59759521484375, -0.5709228515625, -0.54425048828125, -0.517578125, -0.49090576171875, -0.4642333984375, -0.43756103515625, -0.410888671875, -0.38421630859375, -0.3575439453125, -0.33087158203125, -0.30419921875, -0.27752685546875, -0.2508544921875, -0.22418212890625, -0.197509765625, -0.17083740234375, -0.1441650390625, -0.11749267578125, -0.0908203125, -0.06414794921875, -0.0374755859375, -0.01080322265625, 0.015869140625, 0.04254150390625, 0.0692138671875, 0.09588623046875, 0.12255859375, 0.14923095703125, 0.1759033203125, 0.20257568359375, 0.229248046875, 0.25592041015625, 0.2825927734375, 0.30926513671875, 0.3359375, 0.36260986328125, 0.3892822265625, 0.41595458984375, 0.442626953125, 0.46929931640625, 0.4959716796875, 0.52264404296875, 0.54931640625, 0.57598876953125, 0.6026611328125, 0.62933349609375, 0.656005859375, 0.68267822265625, 0.7093505859375, 0.73602294921875, 0.7626953125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 3.0, 11.0, 10.0, 11.0, 27.0, 23.0, 58.0, 68.0, 101.0, 150.0, 175.0, 316.0, 560.0, 776.0, 1294.0, 2371.0, 5211.0, 15488.0, 66316.0, 301233.0, 480478.0, 130498.0, 27864.0, 7881.0, 3316.0, 1634.0, 923.0, 585.0, 354.0, 257.0, 160.0, 139.0, 88.0, 47.0, 36.0, 21.0, 16.0, 16.0, 14.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.17822265625, -0.1734333038330078, -0.16864395141601562, -0.16385459899902344, -0.15906524658203125, -0.15427589416503906, -0.14948654174804688, -0.1446971893310547, -0.1399078369140625, -0.1351184844970703, -0.13032913208007812, -0.12553977966308594, -0.12075042724609375, -0.11596107482910156, -0.11117172241210938, -0.10638236999511719, -0.101593017578125, -0.09680366516113281, -0.09201431274414062, -0.08722496032714844, -0.08243560791015625, -0.07764625549316406, -0.07285690307617188, -0.06806755065917969, -0.0632781982421875, -0.05848884582519531, -0.053699493408203125, -0.04891014099121094, -0.04412078857421875, -0.03933143615722656, -0.034542083740234375, -0.029752731323242188, -0.02496337890625, -0.020174026489257812, -0.015384674072265625, -0.010595321655273438, -0.00580596923828125, -0.0010166168212890625, 0.003772735595703125, 0.008562088012695312, 0.0133514404296875, 0.018140792846679688, 0.022930145263671875, 0.027719497680664062, 0.03250885009765625, 0.03729820251464844, 0.042087554931640625, 0.04687690734863281, 0.051666259765625, 0.05645561218261719, 0.061244964599609375, 0.06603431701660156, 0.07082366943359375, 0.07561302185058594, 0.08040237426757812, 0.08519172668457031, 0.0899810791015625, 0.09477043151855469, 0.09955978393554688, 0.10434913635253906, 0.10913848876953125, 0.11392784118652344, 0.11871719360351562, 0.12350654602050781, 0.1282958984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 24.0, 31.0, 89.0, 122.0, 196.0, 206.0, 137.0, 70.0, 32.0, 19.0, 12.0, 6.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.709596633911133e-05, -9.406637400388718e-05, -9.103678166866302e-05, -8.800718933343887e-05, -8.497759699821472e-05, -8.194800466299057e-05, -7.891841232776642e-05, -7.588881999254227e-05, -7.285922765731812e-05, -6.982963532209396e-05, -6.680004298686981e-05, -6.377045065164566e-05, -6.074085831642151e-05, -5.771126598119736e-05, -5.4681673645973206e-05, -5.1652081310749054e-05, -4.86224889755249e-05, -4.559289664030075e-05, -4.25633043050766e-05, -3.953371196985245e-05, -3.6504119634628296e-05, -3.3474527299404144e-05, -3.0444934964179993e-05, -2.741534262895584e-05, -2.438575029373169e-05, -2.1356157958507538e-05, -1.8326565623283386e-05, -1.5296973288059235e-05, -1.2267380952835083e-05, -9.237788617610931e-06, -6.20819628238678e-06, -3.178603947162628e-06, -1.4901161193847656e-07, 2.880580723285675e-06, 5.910173058509827e-06, 8.939765393733978e-06, 1.196935772895813e-05, 1.4998950064182281e-05, 1.8028542399406433e-05, 2.1058134734630585e-05, 2.4087727069854736e-05, 2.7117319405078888e-05, 3.014691174030304e-05, 3.317650407552719e-05, 3.620609641075134e-05, 3.9235688745975494e-05, 4.2265281081199646e-05, 4.52948734164238e-05, 4.832446575164795e-05, 5.13540580868721e-05, 5.438365042209625e-05, 5.7413242757320404e-05, 6.0442835092544556e-05, 6.347242742776871e-05, 6.650201976299286e-05, 6.953161209821701e-05, 7.256120443344116e-05, 7.559079676866531e-05, 7.862038910388947e-05, 8.164998143911362e-05, 8.467957377433777e-05, 8.770916610956192e-05, 9.073875844478607e-05, 9.376835078001022e-05, 9.679794311523438e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 10.0, 9.0, 13.0, 16.0, 18.0, 36.0, 33.0, 69.0, 107.0, 150.0, 234.0, 460.0, 857.0, 1719.0, 3588.0, 10118.0, 45605.0, 253515.0, 537217.0, 153965.0, 27527.0, 7237.0, 2902.0, 1394.0, 713.0, 377.0, 219.0, 156.0, 96.0, 74.0, 37.0, 32.0, 15.0, 11.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2232666015625, -0.2175922393798828, -0.21191787719726562, -0.20624351501464844, -0.20056915283203125, -0.19489479064941406, -0.18922042846679688, -0.1835460662841797, -0.1778717041015625, -0.1721973419189453, -0.16652297973632812, -0.16084861755371094, -0.15517425537109375, -0.14949989318847656, -0.14382553100585938, -0.1381511688232422, -0.132476806640625, -0.1268024444580078, -0.12112808227539062, -0.11545372009277344, -0.10977935791015625, -0.10410499572753906, -0.09843063354492188, -0.09275627136230469, -0.0870819091796875, -0.08140754699707031, -0.07573318481445312, -0.07005882263183594, -0.06438446044921875, -0.05871009826660156, -0.053035736083984375, -0.04736137390136719, -0.04168701171875, -0.03601264953613281, -0.030338287353515625, -0.024663925170898438, -0.01898956298828125, -0.013315200805664062, -0.007640838623046875, -0.0019664764404296875, 0.0037078857421875, 0.009382247924804688, 0.015056610107421875, 0.020730972290039062, 0.02640533447265625, 0.03207969665527344, 0.037754058837890625, 0.04342842102050781, 0.049102783203125, 0.05477714538574219, 0.060451507568359375, 0.06612586975097656, 0.07180023193359375, 0.07747459411621094, 0.08314895629882812, 0.08882331848144531, 0.0944976806640625, 0.10017204284667969, 0.10584640502929688, 0.11152076721191406, 0.11719512939453125, 0.12286949157714844, 0.12854385375976562, 0.1342182159423828, 0.139892578125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 3.0, 7.0, 10.0, 9.0, 21.0, 30.0, 48.0, 59.0, 92.0, 96.0, 137.0, 112.0, 119.0, 87.0, 68.0, 38.0, 23.0, 10.0, 15.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.333251953125, -0.32563018798828125, -0.3180084228515625, -0.31038665771484375, -0.302764892578125, -0.29514312744140625, -0.2875213623046875, -0.27989959716796875, -0.27227783203125, -0.26465606689453125, -0.2570343017578125, -0.24941253662109375, -0.241790771484375, -0.23416900634765625, -0.2265472412109375, -0.21892547607421875, -0.2113037109375, -0.20368194580078125, -0.1960601806640625, -0.18843841552734375, -0.180816650390625, -0.17319488525390625, -0.1655731201171875, -0.15795135498046875, -0.15032958984375, -0.14270782470703125, -0.1350860595703125, -0.12746429443359375, -0.119842529296875, -0.11222076416015625, -0.1045989990234375, -0.09697723388671875, -0.08935546875, -0.08173370361328125, -0.0741119384765625, -0.06649017333984375, -0.058868408203125, -0.05124664306640625, -0.0436248779296875, -0.03600311279296875, -0.02838134765625, -0.02075958251953125, -0.0131378173828125, -0.00551605224609375, 0.002105712890625, 0.00972747802734375, 0.0173492431640625, 0.02497100830078125, 0.0325927734375, 0.04021453857421875, 0.0478363037109375, 0.05545806884765625, 0.063079833984375, 0.07070159912109375, 0.0783233642578125, 0.08594512939453125, 0.09356689453125, 0.10118865966796875, 0.1088104248046875, 0.11643218994140625, 0.124053955078125, 0.13167572021484375, 0.1392974853515625, 0.14691925048828125, 0.154541015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 8.0, 20.0, 47.0, 128.0, 232.0, 268.0, 170.0, 70.0, 27.0, 15.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.990912914276123, -3.83859920501709, -3.6862857341766357, -3.5339720249176025, -3.3816585540771484, -3.2293448448181152, -3.077031135559082, -2.924717426300049, -2.7724039554595947, -2.6200902462005615, -2.4677767753601074, -2.315463066101074, -2.163149356842041, -2.010835886001587, -1.8585221767425537, -1.70620858669281, -1.5538949966430664, -1.4015814065933228, -1.249267816543579, -1.096954107284546, -0.9446405172348022, -0.7923269271850586, -0.6400132775306702, -0.48769962787628174, -0.3353860378265381, -0.18307241797447205, -0.030758798122406006, 0.12155482172966003, 0.2738684415817261, 0.4261820316314697, 0.5784956812858582, 0.7308093309402466, 0.883122444152832, 1.0354360342025757, 1.1877496242523193, 1.3400633335113525, 1.4923769235610962, 1.6446905136108398, 1.797004222869873, 1.9493178129196167, 2.1016314029693604, 2.2539451122283936, 2.4062585830688477, 2.558572292327881, 2.710886001586914, 2.863199472427368, 3.0155131816864014, 3.1678266525268555, 3.3201403617858887, 3.472454071044922, 3.624767541885376, 3.777081251144409, 3.9293947219848633, 4.0817084312438965, 4.23402214050293, 4.386335849761963, 4.538649559020996, 4.690963268280029, 4.8432769775390625, 4.9955902099609375, 5.147903919219971, 5.300217628479004, 5.452531337738037, 5.60484504699707, 5.757158279418945]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 9.0, 7.0, 13.0, 10.0, 12.0, 13.0, 15.0, 23.0, 37.0, 25.0, 37.0, 60.0, 44.0, 40.0, 56.0, 51.0, 47.0, 53.0, 44.0, 49.0, 52.0, 58.0, 31.0, 36.0, 29.0, 28.0, 29.0, 12.0, 20.0, 13.0, 8.0, 10.0, 5.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6188805103302, -2.541846513748169, -2.4648125171661377, -2.3877785205841064, -2.310744524002075, -2.233710289001465, -2.1566762924194336, -2.0796422958374023, -2.002608299255371, -1.9255743026733398, -1.8485403060913086, -1.7715063095092773, -1.6944721937179565, -1.6174381971359253, -1.540404200553894, -1.4633700847625732, -1.3863362073898315, -1.3093022108078003, -1.232268214225769, -1.1552340984344482, -1.078200101852417, -1.0011661052703857, -0.9241321086883545, -0.8470980525016785, -0.7700640559196472, -0.693030059337616, -0.6159960031509399, -0.5389620065689087, -0.46192798018455505, -0.3848939538002014, -0.30785995721817017, -0.23082590103149414, -0.1537919044494629, -0.07675788551568985, 0.0002761334180831909, 0.07731014490127563, 0.15434417128562927, 0.2313781976699829, 0.30841219425201416, 0.3854462504386902, 0.46248024702072144, 0.5395142436027527, 0.6165482997894287, 0.69358229637146, 0.7706162929534912, 0.8476503491401672, 0.9246843457221985, 1.0017184019088745, 1.0787523984909058, 1.155786395072937, 1.2328203916549683, 1.309854507446289, 1.3868885040283203, 1.4639225006103516, 1.5409564971923828, 1.617990493774414, 1.6950244903564453, 1.7720584869384766, 1.8490924835205078, 1.926126480102539, 2.0031604766845703, 2.0801944732666016, 2.157228469848633, 2.234262704849243, 2.3112967014312744]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 8.0, 3.0, 8.0, 4.0, 19.0, 22.0, 30.0, 42.0, 53.0, 88.0, 131.0, 202.0, 353.0, 609.0, 1184.0, 2099.0, 4436.0, 10247.0, 26539.0, 70497.0, 175380.0, 370424.0, 635041.0, 852552.0, 835167.0, 605699.0, 345880.0, 154858.0, 59745.0, 23058.0, 9884.0, 4731.0, 2249.0, 1176.0, 701.0, 472.0, 272.0, 150.0, 108.0, 57.0, 32.0, 18.0, 22.0, 8.0, 13.0, 8.0, 8.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23318862915039062, -0.22565460205078125, -0.21812057495117188, -0.2105865478515625, -0.20305252075195312, -0.19551849365234375, -0.18798446655273438, -0.180450439453125, -0.17291641235351562, -0.16538238525390625, -0.15784835815429688, -0.1503143310546875, -0.14278030395507812, -0.13524627685546875, -0.12771224975585938, -0.12017822265625, -0.11264419555664062, -0.10511016845703125, -0.09757614135742188, -0.0900421142578125, -0.08250808715820312, -0.07497406005859375, -0.06744003295898438, -0.059906005859375, -0.052371978759765625, -0.04483795166015625, -0.037303924560546875, -0.0297698974609375, -0.022235870361328125, -0.01470184326171875, -0.007167816162109375, 0.0003662109375, 0.007900238037109375, 0.01543426513671875, 0.022968292236328125, 0.0305023193359375, 0.038036346435546875, 0.04557037353515625, 0.053104400634765625, 0.060638427734375, 0.06817245483398438, 0.07570648193359375, 0.08324050903320312, 0.0907745361328125, 0.09830856323242188, 0.10584259033203125, 0.11337661743164062, 0.12091064453125, 0.12844467163085938, 0.13597869873046875, 0.14351272583007812, 0.1510467529296875, 0.15858078002929688, 0.16611480712890625, 0.17364883422851562, 0.181182861328125, 0.18871688842773438, 0.19625091552734375, 0.20378494262695312, 0.2113189697265625, 0.21885299682617188, 0.22638702392578125, 0.23392105102539062, 0.241455078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 14.0, 18.0, 15.0, 18.0, 17.0, 20.0, 25.0, 31.0, 28.0, 33.0, 33.0, 27.0, 31.0, 44.0, 53.0, 43.0, 57.0, 44.0, 40.0, 47.0, 35.0, 41.0, 29.0, 35.0, 34.0, 22.0, 26.0, 21.0, 21.0, 16.0, 14.0, 16.0, 11.0, 6.0, 4.0, 12.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.364013671875, -0.3537712097167969, -0.34352874755859375, -0.3332862854003906, -0.3230438232421875, -0.3128013610839844, -0.30255889892578125, -0.2923164367675781, -0.282073974609375, -0.2718315124511719, -0.26158905029296875, -0.2513465881347656, -0.2411041259765625, -0.23086166381835938, -0.22061920166015625, -0.21037673950195312, -0.20013427734375, -0.18989181518554688, -0.17964935302734375, -0.16940689086914062, -0.1591644287109375, -0.14892196655273438, -0.13867950439453125, -0.12843704223632812, -0.118194580078125, -0.10795211791992188, -0.09770965576171875, -0.08746719360351562, -0.0772247314453125, -0.06698226928710938, -0.05673980712890625, -0.046497344970703125, -0.0362548828125, -0.026012420654296875, -0.01576995849609375, -0.005527496337890625, 0.0047149658203125, 0.014957427978515625, 0.02519989013671875, 0.035442352294921875, 0.045684814453125, 0.055927276611328125, 0.06616973876953125, 0.07641220092773438, 0.0866546630859375, 0.09689712524414062, 0.10713958740234375, 0.11738204956054688, 0.12762451171875, 0.13786697387695312, 0.14810943603515625, 0.15835189819335938, 0.1685943603515625, 0.17883682250976562, 0.18907928466796875, 0.19932174682617188, 0.209564208984375, 0.21980667114257812, 0.23004913330078125, 0.24029159545898438, 0.2505340576171875, 0.2607765197753906, 0.27101898193359375, 0.2812614440917969, 0.29150390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 10.0, 4.0, 12.0, 24.0, 28.0, 40.0, 112.0, 186.0, 333.0, 720.0, 1787.0, 5994.0, 35727.0, 776931.0, 3214548.0, 138491.0, 13690.0, 3311.0, 1158.0, 517.0, 257.0, 147.0, 84.0, 49.0, 33.0, 21.0, 14.0, 6.0, 5.0, 13.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.810546875, -0.7818603515625, -0.753173828125, -0.7244873046875, -0.69580078125, -0.6671142578125, -0.638427734375, -0.6097412109375, -0.5810546875, -0.5523681640625, -0.523681640625, -0.4949951171875, -0.46630859375, -0.4376220703125, -0.408935546875, -0.3802490234375, -0.3515625, -0.3228759765625, -0.294189453125, -0.2655029296875, -0.23681640625, -0.2081298828125, -0.179443359375, -0.1507568359375, -0.1220703125, -0.0933837890625, -0.064697265625, -0.0360107421875, -0.00732421875, 0.0213623046875, 0.050048828125, 0.0787353515625, 0.107421875, 0.1361083984375, 0.164794921875, 0.1934814453125, 0.22216796875, 0.2508544921875, 0.279541015625, 0.3082275390625, 0.3369140625, 0.3656005859375, 0.394287109375, 0.4229736328125, 0.45166015625, 0.4803466796875, 0.509033203125, 0.5377197265625, 0.56640625, 0.5950927734375, 0.623779296875, 0.6524658203125, 0.68115234375, 0.7098388671875, 0.738525390625, 0.7672119140625, 0.7958984375, 0.8245849609375, 0.853271484375, 0.8819580078125, 0.91064453125, 0.9393310546875, 0.968017578125, 0.9967041015625, 1.025390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 8.0, 14.0, 15.0, 22.0, 28.0, 56.0, 85.0, 120.0, 196.0, 265.0, 383.0, 470.0, 506.0, 537.0, 405.0, 285.0, 211.0, 163.0, 93.0, 73.0, 45.0, 26.0, 22.0, 9.0, 8.0, 9.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.794921875, -0.77069091796875, -0.7464599609375, -0.72222900390625, -0.697998046875, -0.67376708984375, -0.6495361328125, -0.62530517578125, -0.60107421875, -0.57684326171875, -0.5526123046875, -0.52838134765625, -0.504150390625, -0.47991943359375, -0.4556884765625, -0.43145751953125, -0.4072265625, -0.38299560546875, -0.3587646484375, -0.33453369140625, -0.310302734375, -0.28607177734375, -0.2618408203125, -0.23760986328125, -0.21337890625, -0.18914794921875, -0.1649169921875, -0.14068603515625, -0.116455078125, -0.09222412109375, -0.0679931640625, -0.04376220703125, -0.01953125, 0.00469970703125, 0.0289306640625, 0.05316162109375, 0.077392578125, 0.10162353515625, 0.1258544921875, 0.15008544921875, 0.17431640625, 0.19854736328125, 0.2227783203125, 0.24700927734375, 0.271240234375, 0.29547119140625, 0.3197021484375, 0.34393310546875, 0.3681640625, 0.39239501953125, 0.4166259765625, 0.44085693359375, 0.465087890625, 0.48931884765625, 0.5135498046875, 0.53778076171875, 0.56201171875, 0.58624267578125, 0.6104736328125, 0.63470458984375, 0.658935546875, 0.68316650390625, 0.7073974609375, 0.73162841796875, 0.755859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 18.0, 15.0, 31.0, 39.0, 83.0, 129.0, 164.0, 148.0, 127.0, 92.0, 50.0, 38.0, 20.0, 15.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.603601455688477, -5.3700971603393555, -5.136593341827393, -4.90308952331543, -4.669585227966309, -4.4360809326171875, -4.202577114105225, -3.9690730571746826, -3.7355690002441406, -3.5020649433135986, -3.2685608863830566, -3.0350568294525146, -2.8015527725219727, -2.5680487155914307, -2.3345446586608887, -2.1010406017303467, -1.8675365447998047, -1.6340324878692627, -1.4005284309387207, -1.1670243740081787, -0.9335203170776367, -0.7000162601470947, -0.46651220321655273, -0.23300814628601074, 0.00049591064453125, 0.23399996757507324, 0.46750402450561523, 0.7010080814361572, 0.9345121383666992, 1.1680161952972412, 1.4015202522277832, 1.6350243091583252, 1.8685283660888672, 2.102032423019409, 2.335536479949951, 2.569040536880493, 2.802544593811035, 3.036048650741577, 3.269552707672119, 3.503056764602661, 3.736560821533203, 3.970064878463745, 4.203568935394287, 4.43707275390625, 4.670577049255371, 4.904081344604492, 5.137585163116455, 5.371088981628418, 5.604593276977539, 5.83809757232666, 6.071601390838623, 6.305105209350586, 6.538609504699707, 6.772113800048828, 7.005617618560791, 7.239121437072754, 7.472625732421875, 7.706130027770996, 7.939633846282959, 8.173137664794922, 8.406641960144043, 8.640146255493164, 8.873649597167969, 9.10715389251709, 9.340658187866211]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 5.0, 8.0, 7.0, 9.0, 22.0, 13.0, 26.0, 33.0, 24.0, 31.0, 33.0, 40.0, 42.0, 40.0, 52.0, 64.0, 43.0, 52.0, 47.0, 47.0, 41.0, 44.0, 37.0, 34.0, 21.0, 32.0, 16.0, 20.0, 19.0, 13.0, 11.0, 11.0, 11.0, 9.0, 9.0, 6.0, 5.0, 1.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.7309513092041016, -2.641127347946167, -2.5513033866882324, -2.461479425430298, -2.3716554641723633, -2.2818312644958496, -2.192007541656494, -2.1021833419799805, -2.012359380722046, -1.9225354194641113, -1.8327114582061768, -1.7428874969482422, -1.653063416481018, -1.5632394552230835, -1.473415493965149, -1.3835914134979248, -1.2937675714492798, -1.2039436101913452, -1.1141196489334106, -1.0242955684661865, -0.934471607208252, -0.8446476459503174, -0.7548236846923828, -0.6649996638298035, -0.5751757025718689, -0.48535171151161194, -0.395527720451355, -0.3057037591934204, -0.21587976813316345, -0.1260557770729065, -0.036231815814971924, 0.05359220504760742, 0.143416166305542, 0.23324015736579895, 0.3230641484260559, 0.4128881096839905, 0.5027121305465698, 0.5925360918045044, 0.682360053062439, 0.7721840739250183, 0.8620080351829529, 0.9518319964408875, 1.0416560173034668, 1.1314799785614014, 1.221303939819336, 1.3111279010772705, 1.400951862335205, 1.4907759428024292, 1.5805999040603638, 1.6704238653182983, 1.760247826576233, 1.850071907043457, 1.9398958683013916, 2.029719829559326, 2.1195437908172607, 2.2093677520751953, 2.29919171333313, 2.3890156745910645, 2.478839635848999, 2.5686635971069336, 2.658487558364868, 2.7483115196228027, 2.8381357192993164, 2.927959680557251, 3.0177836418151855]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 18.0, 11.0, 15.0, 37.0, 64.0, 89.0, 125.0, 214.0, 443.0, 809.0, 1662.0, 4231.0, 12736.0, 50390.0, 275546.0, 545249.0, 118969.0, 25404.0, 7272.0, 2659.0, 1204.0, 593.0, 307.0, 186.0, 111.0, 73.0, 42.0, 35.0, 14.0, 9.0, 10.0, 2.0, 5.0, 4.0, 6.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499755859375, -0.4826774597167969, -0.46559906005859375, -0.4485206604003906, -0.4314422607421875, -0.4143638610839844, -0.39728546142578125, -0.3802070617675781, -0.363128662109375, -0.3460502624511719, -0.32897186279296875, -0.3118934631347656, -0.2948150634765625, -0.2777366638183594, -0.26065826416015625, -0.24357986450195312, -0.22650146484375, -0.20942306518554688, -0.19234466552734375, -0.17526626586914062, -0.1581878662109375, -0.14110946655273438, -0.12403106689453125, -0.10695266723632812, -0.089874267578125, -0.07279586791992188, -0.05571746826171875, -0.038639068603515625, -0.0215606689453125, -0.004482269287109375, 0.01259613037109375, 0.029674530029296875, 0.0467529296875, 0.06383132934570312, 0.08090972900390625, 0.09798812866210938, 0.1150665283203125, 0.13214492797851562, 0.14922332763671875, 0.16630172729492188, 0.183380126953125, 0.20045852661132812, 0.21753692626953125, 0.23461532592773438, 0.2516937255859375, 0.2687721252441406, 0.28585052490234375, 0.3029289245605469, 0.32000732421875, 0.3370857238769531, 0.35416412353515625, 0.3712425231933594, 0.3883209228515625, 0.4053993225097656, 0.42247772216796875, 0.4395561218261719, 0.456634521484375, 0.4737129211425781, 0.49079132080078125, 0.5078697204589844, 0.5249481201171875, 0.5420265197753906, 0.5591049194335938, 0.5761833190917969, 0.59326171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 7.0, 10.0, 18.0, 14.0, 21.0, 42.0, 43.0, 39.0, 51.0, 54.0, 64.0, 82.0, 83.0, 71.0, 69.0, 70.0, 45.0, 46.0, 43.0, 36.0, 23.0, 15.0, 16.0, 8.0, 7.0, 12.0, 2.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.83154296875, -0.8104934692382812, -0.7894439697265625, -0.7683944702148438, -0.747344970703125, -0.7262954711914062, -0.7052459716796875, -0.6841964721679688, -0.66314697265625, -0.6420974731445312, -0.6210479736328125, -0.5999984741210938, -0.578948974609375, -0.5578994750976562, -0.5368499755859375, -0.5158004760742188, -0.4947509765625, -0.47370147705078125, -0.4526519775390625, -0.43160247802734375, -0.410552978515625, -0.38950347900390625, -0.3684539794921875, -0.34740447998046875, -0.32635498046875, -0.30530548095703125, -0.2842559814453125, -0.26320648193359375, -0.242156982421875, -0.22110748291015625, -0.2000579833984375, -0.17900848388671875, -0.157958984375, -0.13690948486328125, -0.1158599853515625, -0.09481048583984375, -0.073760986328125, -0.05271148681640625, -0.0316619873046875, -0.01061248779296875, 0.01043701171875, 0.03148651123046875, 0.0525360107421875, 0.07358551025390625, 0.094635009765625, 0.11568450927734375, 0.1367340087890625, 0.15778350830078125, 0.1788330078125, 0.19988250732421875, 0.2209320068359375, 0.24198150634765625, 0.263031005859375, 0.28408050537109375, 0.3051300048828125, 0.32617950439453125, 0.34722900390625, 0.36827850341796875, 0.3893280029296875, 0.41037750244140625, 0.431427001953125, 0.45247650146484375, 0.4735260009765625, 0.49457550048828125, 0.515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 3.0, 10.0, 14.0, 15.0, 13.0, 20.0, 36.0, 56.0, 74.0, 107.0, 151.0, 201.0, 387.0, 666.0, 1127.0, 2011.0, 3889.0, 8036.0, 17483.0, 43236.0, 125842.0, 419149.0, 282836.0, 85935.0, 30981.0, 12938.0, 6147.0, 3067.0, 1653.0, 951.0, 520.0, 320.0, 221.0, 149.0, 89.0, 63.0, 55.0, 23.0, 24.0, 18.0, 7.0, 10.0, 10.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2457275390625, -0.2374897003173828, -0.22925186157226562, -0.22101402282714844, -0.21277618408203125, -0.20453834533691406, -0.19630050659179688, -0.1880626678466797, -0.1798248291015625, -0.1715869903564453, -0.16334915161132812, -0.15511131286621094, -0.14687347412109375, -0.13863563537597656, -0.13039779663085938, -0.12215995788574219, -0.113922119140625, -0.10568428039550781, -0.09744644165039062, -0.08920860290527344, -0.08097076416015625, -0.07273292541503906, -0.06449508666992188, -0.05625724792480469, -0.0480194091796875, -0.03978157043457031, -0.031543731689453125, -0.023305892944335938, -0.01506805419921875, -0.0068302154541015625, 0.001407623291015625, 0.009645462036132812, 0.01788330078125, 0.026121139526367188, 0.034358978271484375, 0.04259681701660156, 0.05083465576171875, 0.05907249450683594, 0.06731033325195312, 0.07554817199707031, 0.0837860107421875, 0.09202384948730469, 0.10026168823242188, 0.10849952697753906, 0.11673736572265625, 0.12497520446777344, 0.13321304321289062, 0.1414508819580078, 0.149688720703125, 0.1579265594482422, 0.16616439819335938, 0.17440223693847656, 0.18264007568359375, 0.19087791442871094, 0.19911575317382812, 0.2073535919189453, 0.2155914306640625, 0.2238292694091797, 0.23206710815429688, 0.24030494689941406, 0.24854278564453125, 0.25678062438964844, 0.2650184631347656, 0.2732563018798828, 0.281494140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 9.0, 9.0, 10.0, 14.0, 22.0, 14.0, 21.0, 30.0, 37.0, 39.0, 59.0, 58.0, 65.0, 69.0, 78.0, 89.0, 63.0, 62.0, 47.0, 47.0, 36.0, 30.0, 22.0, 17.0, 15.0, 16.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.23046875, -1.186737060546875, -1.14300537109375, -1.099273681640625, -1.0555419921875, -1.011810302734375, -0.96807861328125, -0.924346923828125, -0.880615234375, -0.836883544921875, -0.79315185546875, -0.749420166015625, -0.7056884765625, -0.661956787109375, -0.61822509765625, -0.574493408203125, -0.53076171875, -0.487030029296875, -0.44329833984375, -0.399566650390625, -0.3558349609375, -0.312103271484375, -0.26837158203125, -0.224639892578125, -0.180908203125, -0.137176513671875, -0.09344482421875, -0.049713134765625, -0.0059814453125, 0.037750244140625, 0.08148193359375, 0.125213623046875, 0.1689453125, 0.212677001953125, 0.25640869140625, 0.300140380859375, 0.3438720703125, 0.387603759765625, 0.43133544921875, 0.475067138671875, 0.518798828125, 0.562530517578125, 0.60626220703125, 0.649993896484375, 0.6937255859375, 0.737457275390625, 0.78118896484375, 0.824920654296875, 0.86865234375, 0.912384033203125, 0.95611572265625, 0.999847412109375, 1.0435791015625, 1.087310791015625, 1.13104248046875, 1.174774169921875, 1.218505859375, 1.262237548828125, 1.30596923828125, 1.349700927734375, 1.3934326171875, 1.437164306640625, 1.48089599609375, 1.524627685546875, 1.568359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 6.0, 9.0, 10.0, 26.0, 51.0, 141.0, 336.0, 1314.0, 8616.0, 1004994.0, 29612.0, 2521.0, 577.0, 170.0, 82.0, 48.0, 21.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50537109375, -0.4899024963378906, -0.47443389892578125, -0.4589653015136719, -0.4434967041015625, -0.4280281066894531, -0.41255950927734375, -0.3970909118652344, -0.381622314453125, -0.3661537170410156, -0.35068511962890625, -0.3352165222167969, -0.3197479248046875, -0.3042793273925781, -0.28881072998046875, -0.2733421325683594, -0.25787353515625, -0.24240493774414062, -0.22693634033203125, -0.21146774291992188, -0.1959991455078125, -0.18053054809570312, -0.16506195068359375, -0.14959335327148438, -0.134124755859375, -0.11865615844726562, -0.10318756103515625, -0.08771896362304688, -0.0722503662109375, -0.056781768798828125, -0.04131317138671875, -0.025844573974609375, -0.0103759765625, 0.005092620849609375, 0.02056121826171875, 0.036029815673828125, 0.0514984130859375, 0.06696701049804688, 0.08243560791015625, 0.09790420532226562, 0.113372802734375, 0.12884140014648438, 0.14430999755859375, 0.15977859497070312, 0.1752471923828125, 0.19071578979492188, 0.20618438720703125, 0.22165298461914062, 0.23712158203125, 0.2525901794433594, 0.26805877685546875, 0.2835273742675781, 0.2989959716796875, 0.3144645690917969, 0.32993316650390625, 0.3454017639160156, 0.360870361328125, 0.3763389587402344, 0.39180755615234375, 0.4072761535644531, 0.4227447509765625, 0.4382133483886719, 0.45368194580078125, 0.4691505432128906, 0.484619140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 24.0, 40.0, 92.0, 148.0, 200.0, 196.0, 137.0, 78.0, 35.0, 10.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2319297790527344e-05, -4.074256867170334e-05, -3.9165839552879333e-05, -3.758911043405533e-05, -3.601238131523132e-05, -3.443565219640732e-05, -3.285892307758331e-05, -3.128219395875931e-05, -2.9705464839935303e-05, -2.8128735721111298e-05, -2.6552006602287292e-05, -2.4975277483463287e-05, -2.3398548364639282e-05, -2.1821819245815277e-05, -2.0245090126991272e-05, -1.8668361008167267e-05, -1.7091631889343262e-05, -1.5514902770519257e-05, -1.3938173651695251e-05, -1.2361444532871246e-05, -1.0784715414047241e-05, -9.207986295223236e-06, -7.631257176399231e-06, -6.054528057575226e-06, -4.477798938751221e-06, -2.9010698199272156e-06, -1.3243407011032104e-06, 2.523884177207947e-07, 1.8291175365447998e-06, 3.405846655368805e-06, 4.98257577419281e-06, 6.559304893016815e-06, 8.13603401184082e-06, 9.712763130664825e-06, 1.128949224948883e-05, 1.2866221368312836e-05, 1.444295048713684e-05, 1.6019679605960846e-05, 1.759640872478485e-05, 1.9173137843608856e-05, 2.074986696243286e-05, 2.2326596081256866e-05, 2.390332520008087e-05, 2.5480054318904877e-05, 2.7056783437728882e-05, 2.8633512556552887e-05, 3.0210241675376892e-05, 3.17869707942009e-05, 3.33636999130249e-05, 3.494042903184891e-05, 3.651715815067291e-05, 3.809388726949692e-05, 3.967061638832092e-05, 4.124734550714493e-05, 4.282407462596893e-05, 4.440080374479294e-05, 4.597753286361694e-05, 4.755426198244095e-05, 4.9130991101264954e-05, 5.070772022008896e-05, 5.2284449338912964e-05, 5.386117845773697e-05, 5.5437907576560974e-05, 5.701463669538498e-05, 5.8591365814208984e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 4.0, 4.0, 8.0, 8.0, 8.0, 7.0, 10.0, 21.0, 25.0, 57.0, 111.0, 129.0, 233.0, 396.0, 814.0, 1665.0, 4045.0, 14688.0, 132038.0, 788536.0, 88034.0, 11451.0, 3230.0, 1267.0, 664.0, 423.0, 234.0, 163.0, 108.0, 48.0, 35.0, 30.0, 13.0, 10.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1663818359375, -0.16140365600585938, -0.15642547607421875, -0.15144729614257812, -0.1464691162109375, -0.14149093627929688, -0.13651275634765625, -0.13153457641601562, -0.126556396484375, -0.12157821655273438, -0.11660003662109375, -0.11162185668945312, -0.1066436767578125, -0.10166549682617188, -0.09668731689453125, -0.09170913696289062, -0.08673095703125, -0.08175277709960938, -0.07677459716796875, -0.07179641723632812, -0.0668182373046875, -0.061840057373046875, -0.05686187744140625, -0.051883697509765625, -0.046905517578125, -0.041927337646484375, -0.03694915771484375, -0.031970977783203125, -0.0269927978515625, -0.022014617919921875, -0.01703643798828125, -0.012058258056640625, -0.007080078125, -0.002101898193359375, 0.00287628173828125, 0.007854461669921875, 0.0128326416015625, 0.017810821533203125, 0.02278900146484375, 0.027767181396484375, 0.032745361328125, 0.037723541259765625, 0.04270172119140625, 0.047679901123046875, 0.0526580810546875, 0.057636260986328125, 0.06261444091796875, 0.06759262084960938, 0.07257080078125, 0.07754898071289062, 0.08252716064453125, 0.08750534057617188, 0.0924835205078125, 0.09746170043945312, 0.10243988037109375, 0.10741806030273438, 0.112396240234375, 0.11737442016601562, 0.12235260009765625, 0.12733078002929688, 0.1323089599609375, 0.13728713989257812, 0.14226531982421875, 0.14724349975585938, 0.1522216796875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 16.0, 18.0, 33.0, 43.0, 116.0, 193.0, 209.0, 167.0, 79.0, 40.0, 25.0, 18.0, 2.0, 7.0, 4.0, 11.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41845703125, -0.407806396484375, -0.39715576171875, -0.386505126953125, -0.3758544921875, -0.365203857421875, -0.35455322265625, -0.343902587890625, -0.333251953125, -0.322601318359375, -0.31195068359375, -0.301300048828125, -0.2906494140625, -0.279998779296875, -0.26934814453125, -0.258697509765625, -0.248046875, -0.237396240234375, -0.22674560546875, -0.216094970703125, -0.2054443359375, -0.194793701171875, -0.18414306640625, -0.173492431640625, -0.162841796875, -0.152191162109375, -0.14154052734375, -0.130889892578125, -0.1202392578125, -0.109588623046875, -0.09893798828125, -0.088287353515625, -0.07763671875, -0.066986083984375, -0.05633544921875, -0.045684814453125, -0.0350341796875, -0.024383544921875, -0.01373291015625, -0.003082275390625, 0.007568359375, 0.018218994140625, 0.02886962890625, 0.039520263671875, 0.0501708984375, 0.060821533203125, 0.07147216796875, 0.082122802734375, 0.0927734375, 0.103424072265625, 0.11407470703125, 0.124725341796875, 0.1353759765625, 0.146026611328125, 0.15667724609375, 0.167327880859375, 0.177978515625, 0.188629150390625, 0.19927978515625, 0.209930419921875, 0.2205810546875, 0.231231689453125, 0.24188232421875, 0.252532958984375, 0.26318359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 6.0, 12.0, 29.0, 60.0, 131.0, 323.0, 251.0, 102.0, 38.0, 18.0, 10.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.016511917114258, -6.821351528167725, -6.626190662384033, -6.4310302734375, -6.235869407653809, -6.040709018707275, -5.845548629760742, -5.650387763977051, -5.455226898193359, -5.260066509246826, -5.064905643463135, -4.869745254516602, -4.67458438873291, -4.479423999786377, -4.284263610839844, -4.089102745056152, -3.893942356109619, -3.698781728744507, -3.5036211013793945, -3.3084607124328613, -3.11329984664917, -2.9181394577026367, -2.7229788303375244, -2.527818202972412, -2.3326575756073, -2.1374969482421875, -1.9423363208770752, -1.7471758127212524, -1.5520151853561401, -1.3568545579910278, -1.161694049835205, -0.9665334224700928, -0.7713727951049805, -0.5762121677398682, -0.38105159997940063, -0.1858910322189331, 0.0092695951461792, 0.2044302225112915, 0.39959073066711426, 0.5947513580322266, 0.7899119853973389, 0.9850726127624512, 1.1802332401275635, 1.3753937482833862, 1.5705543756484985, 1.7657150030136108, 1.9608755111694336, 2.156036138534546, 2.351196765899658, 2.5463573932647705, 2.741518020629883, 2.936678409576416, 3.1318392753601074, 3.3269996643066406, 3.522160291671753, 3.7173209190368652, 3.9124815464019775, 4.10764217376709, 4.302802562713623, 4.4979634284973145, 4.693123817443848, 4.888284683227539, 5.083445072174072, 5.2786054611206055, 5.473766326904297]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 12.0, 14.0, 17.0, 31.0, 28.0, 49.0, 65.0, 67.0, 83.0, 134.0, 103.0, 83.0, 54.0, 59.0, 45.0, 34.0, 38.0, 18.0, 14.0, 17.0, 9.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.387158393859863, -4.253346920013428, -4.11953592300415, -3.985724687576294, -3.8519134521484375, -3.718101978302002, -3.5842907428741455, -3.450479507446289, -3.3166682720184326, -3.182857036590576, -3.0490458011627197, -2.9152345657348633, -2.7814230918884277, -2.6476120948791504, -2.513800621032715, -2.3799893856048584, -2.246178150177002, -2.1123669147491455, -1.978555679321289, -1.844744324684143, -1.7109330892562866, -1.5771218538284302, -1.4433104991912842, -1.3094992637634277, -1.1756880283355713, -1.0418767929077148, -0.9080654978752136, -0.7742542028427124, -0.640442967414856, -0.5066317319869995, -0.3728204369544983, -0.23900914192199707, -0.10519838333129883, 0.028612881898880005, 0.16242414712905884, 0.29623541235923767, 0.4300466775894165, 0.563857913017273, 0.6976692080497742, 0.8314805030822754, 0.9652917385101318, 1.0991029739379883, 1.2329142093658447, 1.3667255640029907, 1.5005367994308472, 1.6343480348587036, 1.7681593894958496, 1.901970624923706, 2.0357818603515625, 2.169593095779419, 2.3034043312072754, 2.437215566635132, 2.5710268020629883, 2.704838275909424, 2.8386495113372803, 2.9724607467651367, 3.106271982192993, 3.2400832176208496, 3.373894453048706, 3.5077056884765625, 3.641517162322998, 3.7753281593322754, 3.909139633178711, 4.042950630187988, 4.176762104034424]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 5.0, 6.0, 9.0, 9.0, 12.0, 16.0, 29.0, 29.0, 32.0, 37.0, 54.0, 284.0, 194.0, 65.0, 50.0, 30.0, 29.0, 24.0, 19.0, 12.0, 8.0, 10.0, 8.0, 6.0, 7.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.720703125, -0.6966018676757812, -0.6725006103515625, -0.6483993530273438, -0.624298095703125, -0.6001968383789062, -0.5760955810546875, -0.5519943237304688, -0.52789306640625, -0.5037918090820312, -0.4796905517578125, -0.45558929443359375, -0.431488037109375, -0.40738677978515625, -0.3832855224609375, -0.35918426513671875, -0.3350830078125, -0.31098175048828125, -0.2868804931640625, -0.26277923583984375, -0.238677978515625, -0.21457672119140625, -0.1904754638671875, -0.16637420654296875, -0.14227294921875, -0.11817169189453125, -0.0940704345703125, -0.06996917724609375, -0.045867919921875, -0.02176666259765625, 0.0023345947265625, 0.02643585205078125, 0.050537109375, 0.07463836669921875, 0.0987396240234375, 0.12284088134765625, 0.146942138671875, 0.17104339599609375, 0.1951446533203125, 0.21924591064453125, 0.24334716796875, 0.26744842529296875, 0.2915496826171875, 0.31565093994140625, 0.339752197265625, 0.36385345458984375, 0.3879547119140625, 0.41205596923828125, 0.4361572265625, 0.46025848388671875, 0.4843597412109375, 0.5084609985351562, 0.532562255859375, 0.5566635131835938, 0.5807647705078125, 0.6048660278320312, 0.62896728515625, 0.6530685424804688, 0.6771697998046875, 0.7012710571289062, 0.725372314453125, 0.7494735717773438, 0.7735748291015625, 0.7976760864257812, 0.82177734375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 5.0, 17.0, 16.0, 24.0, 28.0, 30.0, 50.0, 78.0, 132.0, 156.0, 308.0, 555.0, 1098.0, 2526.0, 7333.0, 40323.0, 8280694.0, 43003.0, 7512.0, 2445.0, 1000.0, 503.0, 279.0, 160.0, 103.0, 47.0, 37.0, 37.0, 19.0, 20.0, 6.0, 10.0, 9.0, 7.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.582430362701416, -1.5390931367874146, -1.4957560300827026, -1.4524188041687012, -1.4090816974639893, -1.3657444715499878, -1.3224072456359863, -1.2790701389312744, -1.2357330322265625, -1.192395806312561, -1.1490586996078491, -1.1057214736938477, -1.0623843669891357, -1.0190471410751343, -0.9757099747657776, -0.9323728084564209, -0.8890355825424194, -0.8456984162330627, -0.802361249923706, -0.7590240240097046, -0.7156869173049927, -0.6723496913909912, -0.6290125250816345, -0.5856753587722778, -0.5423381924629211, -0.49900102615356445, -0.45566385984420776, -0.4123266637325287, -0.368989497423172, -0.3256523311138153, -0.28231513500213623, -0.23897796869277954, -0.1956409215927124, -0.1523037552833557, -0.10896657407283783, -0.06562939286231995, -0.022292226552963257, 0.021044939756393433, 0.06438213586807251, 0.1077193021774292, 0.1510564684867859, 0.19439363479614258, 0.23773081600666046, 0.28106799721717834, 0.32440516352653503, 0.3677423298358917, 0.4110795259475708, 0.4544166922569275, 0.4977538585662842, 0.5410910248756409, 0.5844281911849976, 0.627765417098999, 0.6711025238037109, 0.7144397497177124, 0.7577769160270691, 0.8011140823364258, 0.8444512486457825, 0.8877884149551392, 0.9311255812644958, 0.9744627475738525, 1.017799973487854, 1.061137080192566, 1.1044743061065674, 1.1478114128112793, 1.1911486387252808]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 2.0, 8.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 8.0, 6.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 7.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.5420992374420166, -3.4338197708129883, -3.32554030418396, -3.2172608375549316, -3.1089813709259033, -3.000701904296875, -2.8924221992492676, -2.7841427326202393, -2.675863265991211, -2.5675837993621826, -2.4593043327331543, -2.351024866104126, -2.2427453994750977, -2.1344656944274902, -2.026186466217041, -1.9179067611694336, -1.8096274137496948, -1.7013479471206665, -1.5930684804916382, -1.4847888946533203, -1.376509428024292, -1.2682299613952637, -1.1599504947662354, -1.051671028137207, -0.9433915019035339, -0.8351120352745056, -0.7268325090408325, -0.6185530424118042, -0.5102735757827759, -0.4019940495491028, -0.29371458292007446, -0.18543505668640137, -0.07715559005737305, 0.031123898923397064, 0.13940338790416718, 0.2476828694343567, 0.3559623658657074, 0.4642418622970581, 0.5725213289260864, 0.6808008551597595, 0.7890803217887878, 0.8973597884178162, 1.0056393146514893, 1.1139187812805176, 1.222198247909546, 1.3304777145385742, 1.4387571811676025, 1.5470367670059204, 1.6553162336349487, 1.763595700263977, 1.8718751668930054, 1.9801547527313232, 2.0884342193603516, 2.19671368598938, 2.304993152618408, 2.4132726192474365, 2.521552085876465, 2.629831552505493, 2.7381110191345215, 2.84639048576355, 2.954669952392578, 3.0629496574401855, 3.1712288856506348, 3.279508590698242, 3.3877880573272705]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 6.0, 13.0, 16.0, 19.0, 36.0, 52.0, 56.0, 67.0, 77.0, 70.0, 92.0, 87.0, 78.0, 56.0, 74.0, 56.0, 30.0, 38.0, 19.0, 15.0, 10.0, 15.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.68994140625, -0.6705474853515625, -0.651153564453125, -0.6317596435546875, -0.61236572265625, -0.5929718017578125, -0.573577880859375, -0.5541839599609375, -0.5347900390625, -0.5153961181640625, -0.496002197265625, -0.4766082763671875, -0.45721435546875, -0.4378204345703125, -0.418426513671875, -0.3990325927734375, -0.379638671875, -0.3602447509765625, -0.340850830078125, -0.3214569091796875, -0.30206298828125, -0.2826690673828125, -0.263275146484375, -0.2438812255859375, -0.2244873046875, -0.2050933837890625, -0.185699462890625, -0.1663055419921875, -0.14691162109375, -0.1275177001953125, -0.108123779296875, -0.0887298583984375, -0.0693359375, -0.0499420166015625, -0.030548095703125, -0.0111541748046875, 0.00823974609375, 0.0276336669921875, 0.047027587890625, 0.0664215087890625, 0.0858154296875, 0.1052093505859375, 0.124603271484375, 0.1439971923828125, 0.16339111328125, 0.1827850341796875, 0.202178955078125, 0.2215728759765625, 0.240966796875, 0.2603607177734375, 0.279754638671875, 0.2991485595703125, 0.31854248046875, 0.3379364013671875, 0.357330322265625, 0.3767242431640625, 0.3961181640625, 0.4155120849609375, 0.434906005859375, 0.4542999267578125, 0.47369384765625, 0.4930877685546875, 0.512481689453125, 0.5318756103515625, 0.55126953125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 17.0, 21.0, 45.0, 60.0, 119.0, 246.0, 410.0, 806.0, 1630.0, 3421.0, 7580.0, 18343.0, 53593.0, 202068.0, 165953.0, 42039.0, 15357.0, 6363.0, 3032.0, 1497.0, 734.0, 394.0, 225.0, 123.0, 59.0, 46.0, 25.0, 21.0, 7.0, 4.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.3515625, -4.21514892578125, -4.0787353515625, -3.94232177734375, -3.805908203125, -3.66949462890625, -3.5330810546875, -3.39666748046875, -3.26025390625, -3.12384033203125, -2.9874267578125, -2.85101318359375, -2.714599609375, -2.57818603515625, -2.4417724609375, -2.30535888671875, -2.1689453125, -2.03253173828125, -1.8961181640625, -1.75970458984375, -1.623291015625, -1.48687744140625, -1.3504638671875, -1.21405029296875, -1.07763671875, -0.94122314453125, -0.8048095703125, -0.66839599609375, -0.531982421875, -0.39556884765625, -0.2591552734375, -0.12274169921875, 0.013671875, 0.15008544921875, 0.2864990234375, 0.42291259765625, 0.559326171875, 0.69573974609375, 0.8321533203125, 0.96856689453125, 1.10498046875, 1.24139404296875, 1.3778076171875, 1.51422119140625, 1.650634765625, 1.78704833984375, 1.9234619140625, 2.05987548828125, 2.1962890625, 2.33270263671875, 2.4691162109375, 2.60552978515625, 2.741943359375, 2.87835693359375, 3.0147705078125, 3.15118408203125, 3.28759765625, 3.42401123046875, 3.5604248046875, 3.69683837890625, 3.833251953125, 3.96966552734375, 4.1060791015625, 4.24249267578125, 4.37890625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 13.0, 7.0, 6.0, 14.0, 18.0, 26.0, 43.0, 40.0, 43.0, 64.0, 64.0, 68.0, 77.0, 79.0, 87.0, 63.0, 61.0, 48.0, 40.0, 38.0, 30.0, 27.0, 9.0, 10.0, 8.0, 9.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46435546875, -0.44618988037109375, -0.4280242919921875, -0.40985870361328125, -0.391693115234375, -0.37352752685546875, -0.3553619384765625, -0.33719635009765625, -0.31903076171875, -0.30086517333984375, -0.2826995849609375, -0.26453399658203125, -0.246368408203125, -0.22820281982421875, -0.2100372314453125, -0.19187164306640625, -0.1737060546875, -0.15554046630859375, -0.1373748779296875, -0.11920928955078125, -0.101043701171875, -0.08287811279296875, -0.0647125244140625, -0.04654693603515625, -0.02838134765625, -0.01021575927734375, 0.0079498291015625, 0.02611541748046875, 0.044281005859375, 0.06244659423828125, 0.0806121826171875, 0.09877777099609375, 0.116943359375, 0.13510894775390625, 0.1532745361328125, 0.17144012451171875, 0.189605712890625, 0.20777130126953125, 0.2259368896484375, 0.24410247802734375, 0.26226806640625, 0.28043365478515625, 0.2985992431640625, 0.31676483154296875, 0.334930419921875, 0.35309600830078125, 0.3712615966796875, 0.38942718505859375, 0.4075927734375, 0.42575836181640625, 0.4439239501953125, 0.46208953857421875, 0.480255126953125, 0.49842071533203125, 0.5165863037109375, 0.5347518920898438, 0.55291748046875, 0.5710830688476562, 0.5892486572265625, 0.6074142456054688, 0.625579833984375, 0.6437454223632812, 0.6619110107421875, 0.6800765991210938, 0.6982421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 5.0, 6.0, 10.0, 5.0, 16.0, 24.0, 30.0, 59.0, 90.0, 96.0, 58.0, 33.0, 18.0, 15.0, 7.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.364755392074585, -2.3110127449035645, -2.257270097732544, -2.2035274505615234, -2.149784803390503, -2.0960421562194824, -2.042299747467041, -1.9885571002960205, -1.934814453125, -1.8810718059539795, -1.827329158782959, -1.773586630821228, -1.7198439836502075, -1.666101336479187, -1.6123586893081665, -1.5586161613464355, -1.504873514175415, -1.4511308670043945, -1.397388219833374, -1.343645691871643, -1.2899030447006226, -1.236160397529602, -1.1824177503585815, -1.1286752223968506, -1.0749324560165405, -1.02118980884552, -0.9674472212791443, -0.9137045741081238, -0.859961986541748, -0.8062193393707275, -0.752476692199707, -0.6987341046333313, -0.6449915170669556, -0.5912488698959351, -0.5375062823295593, -0.4837636351585388, -0.4300210475921631, -0.3762784004211426, -0.32253578305244446, -0.26879316568374634, -0.21505054831504822, -0.1613079309463501, -0.10756530612707138, -0.053822681307792664, -8.006393909454346e-05, 0.05366256833076477, 0.10740518569946289, 0.161147803068161, 0.21489042043685913, 0.26863303780555725, 0.32237565517425537, 0.3761183023452759, 0.4298608899116516, 0.4836035370826721, 0.5373461246490479, 0.5910887718200684, 0.6448314189910889, 0.6985740661621094, 0.7523166537284851, 0.8060593008995056, 0.8598018884658813, 0.9135445356369019, 0.9672871828079224, 1.0210297107696533, 1.0747723579406738]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 3.0, 7.0, 6.0, 11.0, 14.0, 15.0, 25.0, 32.0, 86.0, 116.0, 69.0, 17.0, 17.0, 19.0, 4.0, 9.0, 7.0, 7.0, 10.0, 10.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7380106449127197, -3.6531708240509033, -3.568331003189087, -3.4834909439086914, -3.398651123046875, -3.3138113021850586, -3.228971481323242, -3.144131660461426, -3.0592918395996094, -2.974452018737793, -2.8896121978759766, -2.80477237701416, -2.7199323177337646, -2.6350924968719482, -2.550252676010132, -2.4654128551483154, -2.38057279586792, -2.2957329750061035, -2.210893154144287, -2.1260533332824707, -2.041213274002075, -1.9563734531402588, -1.8715336322784424, -1.786693811416626, -1.70185387134552, -1.6170140504837036, -1.5321741104125977, -1.4473342895507812, -1.3624944686889648, -1.2776545286178589, -1.1928147077560425, -1.1079747676849365, -1.0231349468231201, -0.9382950663566589, -0.8534551858901978, -0.7686153650283813, -0.6837754845619202, -0.598935604095459, -0.5140957832336426, -0.4292559027671814, -0.3444160223007202, -0.25957614183425903, -0.17473629117012024, -0.08989644050598145, -0.005056560039520264, 0.07978332042694092, 0.16462314128875732, 0.2494630217552185, 0.3343029022216797, 0.41914278268814087, 0.503982663154602, 0.5888224840164185, 0.6736623644828796, 0.7585022449493408, 0.8433420658111572, 0.9281819462776184, 1.0130218267440796, 1.097861647605896, 1.182701587677002, 1.2675414085388184, 1.3523812294006348, 1.4372211694717407, 1.5220609903335571, 1.606900930404663, 1.6917407512664795]}, "eval/loss": 2.135566473007202, "eval/bleu": 1.0140224330923163e-13, "eval/runtime": 2535.9584, "eval/samples_per_second": 5.82, "eval/steps_per_second": 0.728} \ No newline at end of file