diff --git "a/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" "b/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" --- "a/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" +++ "b/wandb/run-20220325_193848-1sz5964i/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.1399, "train/learning_rate": 5.804878048780487e-05, "train/epoch": 4.48, "train/global_step": 1000, "_runtime": 23379, "_timestamp": 1648260507, "_step": 1001, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 12.0, 33.0, 69.0, 114.0, 204.0, 218.0, 169.0, 114.0, 54.0, 24.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6282283663749695, -0.5442143082618713, -0.4602002799510956, -0.3761862516403198, -0.2921721935272217, -0.20815813541412354, -0.12414413690567017, -0.04013007879257202, 0.04388397932052612, 0.12789802253246307, 0.21191206574440002, 0.2959260940551758, 0.3799401521682739, 0.46395421028137207, 0.5479682087898254, 0.6319822669029236, 0.7159963250160217, 0.8000103831291199, 0.8840243816375732, 0.9680384397506714, 1.0520524978637695, 1.1360665559768677, 1.2200806140899658, 1.3040945529937744, 1.388108730316162, 1.4721227884292603, 1.5561368465423584, 1.640150785446167, 1.7241649627685547, 1.8081789016723633, 1.8921929597854614, 1.9762070178985596, 2.0602211952209473, 2.144235134124756, 2.2282493114471436, 2.312263250350952, 2.39627742767334, 2.4802913665771484, 2.564305305480957, 2.6483194828033447, 2.7323336601257324, 2.816347599029541, 2.9003617763519287, 2.9843757152557373, 3.068389892578125, 3.1524038314819336, 3.236417770385742, 3.32043194770813, 3.4044458866119385, 3.488459825515747, 3.5724740028381348, 3.6564879417419434, 3.740502119064331, 3.8245160579681396, 3.9085302352905273, 3.992544174194336, 4.0765581130981445, 4.160572052001953, 4.244585990905762, 4.3286004066467285, 4.412614345550537, 4.496628284454346, 4.580642223358154, 4.664656639099121, 4.74867057800293]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 3.0, 11.0, 8.0, 13.0, 15.0, 12.0, 15.0, 19.0, 21.0, 26.0, 26.0, 30.0, 16.0, 37.0, 48.0, 41.0, 30.0, 29.0, 34.0, 33.0, 45.0, 37.0, 35.0, 32.0, 36.0, 31.0, 24.0, 26.0, 30.0, 25.0, 25.0, 26.0, 22.0, 21.0, 19.0, 10.0, 14.0, 11.0, 7.0, 10.0, 5.0, 9.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.6512007117271423, -0.6314267516136169, -0.6116528511047363, -0.5918788909912109, -0.5721049308776855, -0.5523310303688049, -0.5325570702552795, -0.5127831697463989, -0.49300920963287354, -0.47323527932167053, -0.45346134901046753, -0.43368738889694214, -0.41391345858573914, -0.39413952827453613, -0.37436556816101074, -0.35459163784980774, -0.33481770753860474, -0.31504377722740173, -0.29526984691619873, -0.27549588680267334, -0.25572195649147034, -0.23594802618026733, -0.21617408096790314, -0.19640013575553894, -0.17662620544433594, -0.15685227513313293, -0.13707832992076874, -0.11730439215898514, -0.09753045439720154, -0.07775651663541794, -0.05798257887363434, -0.03820863366127014, -0.01843470335006714, 0.0013392344117164612, 0.02111317217350006, 0.04088710993528366, 0.06066104769706726, 0.08043498545885086, 0.10020892322063446, 0.11998286843299866, 0.13975679874420166, 0.15953072905540466, 0.17930467426776886, 0.19907861948013306, 0.21885254979133606, 0.23862648010253906, 0.25840044021606445, 0.27817437052726746, 0.29794830083847046, 0.31772223114967346, 0.33749616146087646, 0.35727012157440186, 0.37704405188560486, 0.39681798219680786, 0.41659194231033325, 0.43636587262153625, 0.45613980293273926, 0.47591373324394226, 0.49568766355514526, 0.5154616236686707, 0.5352355241775513, 0.5550094842910767, 0.574783444404602, 0.5945574045181274, 0.6143313050270081]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 8.0, 11.0, 17.0, 20.0, 25.0, 41.0, 57.0, 78.0, 97.0, 144.0, 157.0, 242.0, 361.0, 536.0, 812.0, 1261.0, 2350.0, 5105.0, 14067.0, 54606.0, 330245.0, 1770445.0, 1647513.0, 290964.0, 50858.0, 13409.0, 4942.0, 2230.0, 1237.0, 719.0, 453.0, 345.0, 234.0, 185.0, 131.0, 96.0, 73.0, 62.0, 39.0, 23.0, 24.0, 22.0, 9.0, 12.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.2042236328125, -2.133056640625, -2.0618896484375, -1.99072265625, -1.9195556640625, -1.848388671875, -1.7772216796875, -1.7060546875, -1.6348876953125, -1.563720703125, -1.4925537109375, -1.42138671875, -1.3502197265625, -1.279052734375, -1.2078857421875, -1.13671875, -1.0655517578125, -0.994384765625, -0.9232177734375, -0.85205078125, -0.7808837890625, -0.709716796875, -0.6385498046875, -0.5673828125, -0.4962158203125, -0.425048828125, -0.3538818359375, -0.28271484375, -0.2115478515625, -0.140380859375, -0.0692138671875, 0.001953125, 0.0731201171875, 0.144287109375, 0.2154541015625, 0.28662109375, 0.3577880859375, 0.428955078125, 0.5001220703125, 0.5712890625, 0.6424560546875, 0.713623046875, 0.7847900390625, 0.85595703125, 0.9271240234375, 0.998291015625, 1.0694580078125, 1.140625, 1.2117919921875, 1.282958984375, 1.3541259765625, 1.42529296875, 1.4964599609375, 1.567626953125, 1.6387939453125, 1.7099609375, 1.7811279296875, 1.852294921875, 1.9234619140625, 1.99462890625, 2.0657958984375, 2.136962890625, 2.2081298828125, 2.279296875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 2.0, 2.0, 9.0, 7.0, 5.0, 12.0, 13.0, 16.0, 14.0, 25.0, 20.0, 19.0, 22.0, 27.0, 20.0, 38.0, 38.0, 30.0, 38.0, 52.0, 34.0, 42.0, 32.0, 44.0, 30.0, 37.0, 42.0, 38.0, 43.0, 25.0, 33.0, 16.0, 31.0, 16.0, 15.0, 17.0, 15.0, 14.0, 9.0, 10.0, 7.0, 7.0, 5.0, 8.0, 3.0, 3.0, 0.0, 3.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0], "bins": [-1.220703125, -1.1827545166015625, -1.144805908203125, -1.1068572998046875, -1.06890869140625, -1.0309600830078125, -0.993011474609375, -0.9550628662109375, -0.9171142578125, -0.8791656494140625, -0.841217041015625, -0.8032684326171875, -0.76531982421875, -0.7273712158203125, -0.689422607421875, -0.6514739990234375, -0.613525390625, -0.5755767822265625, -0.537628173828125, -0.4996795654296875, -0.46173095703125, -0.4237823486328125, -0.385833740234375, -0.3478851318359375, -0.3099365234375, -0.2719879150390625, -0.234039306640625, -0.1960906982421875, -0.15814208984375, -0.1201934814453125, -0.082244873046875, -0.0442962646484375, -0.00634765625, 0.0316009521484375, 0.069549560546875, 0.1074981689453125, 0.14544677734375, 0.1833953857421875, 0.221343994140625, 0.2592926025390625, 0.2972412109375, 0.3351898193359375, 0.373138427734375, 0.4110870361328125, 0.44903564453125, 0.4869842529296875, 0.524932861328125, 0.5628814697265625, 0.600830078125, 0.6387786865234375, 0.676727294921875, 0.7146759033203125, 0.75262451171875, 0.7905731201171875, 0.828521728515625, 0.8664703369140625, 0.9044189453125, 0.9423675537109375, 0.980316162109375, 1.0182647705078125, 1.05621337890625, 1.0941619873046875, 1.132110595703125, 1.1700592041015625, 1.2080078125]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 4.0, 10.0, 12.0, 13.0, 27.0, 34.0, 50.0, 104.0, 235.0, 659.0, 4144.0, 4156266.0, 31072.0, 1025.0, 298.0, 115.0, 76.0, 47.0, 29.0, 20.0, 15.0, 11.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.656494140625, -17.18798828125, -16.719482421875, -16.2509765625, -15.782470703125, -15.31396484375, -14.845458984375, -14.376953125, -13.908447265625, -13.43994140625, -12.971435546875, -12.5029296875, -12.034423828125, -11.56591796875, -11.097412109375, -10.62890625, -10.160400390625, -9.69189453125, -9.223388671875, -8.7548828125, -8.286376953125, -7.81787109375, -7.349365234375, -6.880859375, -6.412353515625, -5.94384765625, -5.475341796875, -5.0068359375, -4.538330078125, -4.06982421875, -3.601318359375, -3.1328125, -2.664306640625, -2.19580078125, -1.727294921875, -1.2587890625, -0.790283203125, -0.32177734375, 0.146728515625, 0.615234375, 1.083740234375, 1.55224609375, 2.020751953125, 2.4892578125, 2.957763671875, 3.42626953125, 3.894775390625, 4.36328125, 4.831787109375, 5.30029296875, 5.768798828125, 6.2373046875, 6.705810546875, 7.17431640625, 7.642822265625, 8.111328125, 8.579833984375, 9.04833984375, 9.516845703125, 9.9853515625, 10.453857421875, 10.92236328125, 11.390869140625, 11.859375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 9.0, 15.0, 12.0, 18.0, 33.0, 56.0, 67.0, 106.0, 173.0, 327.0, 650.0, 990.0, 718.0, 375.0, 189.0, 129.0, 74.0, 47.0, 23.0, 28.0, 9.0, 10.0, 7.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.1572265625, -1.1300506591796875, -1.102874755859375, -1.0756988525390625, -1.04852294921875, -1.0213470458984375, -0.994171142578125, -0.9669952392578125, -0.9398193359375, -0.9126434326171875, -0.885467529296875, -0.8582916259765625, -0.83111572265625, -0.8039398193359375, -0.776763916015625, -0.7495880126953125, -0.722412109375, -0.6952362060546875, -0.668060302734375, -0.6408843994140625, -0.61370849609375, -0.5865325927734375, -0.559356689453125, -0.5321807861328125, -0.5050048828125, -0.4778289794921875, -0.450653076171875, -0.4234771728515625, -0.39630126953125, -0.3691253662109375, -0.341949462890625, -0.3147735595703125, -0.28759765625, -0.2604217529296875, -0.233245849609375, -0.2060699462890625, -0.17889404296875, -0.1517181396484375, -0.124542236328125, -0.0973663330078125, -0.0701904296875, -0.0430145263671875, -0.015838623046875, 0.0113372802734375, 0.03851318359375, 0.0656890869140625, 0.092864990234375, 0.1200408935546875, 0.147216796875, 0.1743927001953125, 0.201568603515625, 0.2287445068359375, 0.25592041015625, 0.2830963134765625, 0.310272216796875, 0.3374481201171875, 0.3646240234375, 0.3917999267578125, 0.418975830078125, 0.4461517333984375, 0.47332763671875, 0.5005035400390625, 0.527679443359375, 0.5548553466796875, 0.58203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 7.0, 7.0, 17.0, 13.0, 18.0, 14.0, 23.0, 27.0, 27.0, 36.0, 51.0, 63.0, 63.0, 67.0, 62.0, 67.0, 53.0, 68.0, 55.0, 44.0, 43.0, 30.0, 30.0, 31.0, 19.0, 18.0, 10.0, 11.0, 6.0, 9.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.607733130455017, -1.5505421161651611, -1.4933512210845947, -1.4361602067947388, -1.3789691925048828, -1.3217781782150269, -1.264587163925171, -1.2073962688446045, -1.1502052545547485, -1.0930142402648926, -1.0358233451843262, -0.9786323308944702, -0.9214413166046143, -0.8642503023147583, -0.8070593476295471, -0.7498683929443359, -0.69267737865448, -0.635486364364624, -0.5782954096794128, -0.5211044549942017, -0.4639134407043457, -0.40672245621681213, -0.34953147172927856, -0.292340487241745, -0.23514950275421143, -0.17795851826667786, -0.12076753377914429, -0.06357654929161072, -0.0063855648040771484, 0.05080541968345642, 0.10799640417098999, 0.16518738865852356, 0.22237825393676758, 0.27956923842430115, 0.3367602229118347, 0.3939512073993683, 0.45114219188690186, 0.5083332061767578, 0.565524160861969, 0.6227151155471802, 0.6799061298370361, 0.7370971441268921, 0.7942880988121033, 0.8514790534973145, 0.9086700677871704, 0.9658610820770264, 1.0230519771575928, 1.0802429914474487, 1.1374340057373047, 1.1946250200271606, 1.2518160343170166, 1.309006929397583, 1.366197943687439, 1.423388957977295, 1.4805798530578613, 1.5377708673477173, 1.5949618816375732, 1.6521528959274292, 1.7093439102172852, 1.7665348052978516, 1.8237258195877075, 1.8809168338775635, 1.9381077289581299, 1.9952987432479858, 2.052489757537842]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 7.0, 7.0, 6.0, 6.0, 12.0, 12.0, 12.0, 12.0, 17.0, 24.0, 28.0, 23.0, 30.0, 29.0, 31.0, 40.0, 32.0, 50.0, 42.0, 47.0, 37.0, 37.0, 42.0, 37.0, 41.0, 30.0, 30.0, 37.0, 34.0, 32.0, 31.0, 27.0, 19.0, 11.0, 12.0, 18.0, 10.0, 13.0, 8.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3626282215118408, -1.3228709697723389, -1.283113718032837, -1.243356466293335, -1.203599214553833, -1.163841962814331, -1.124084711074829, -1.0843275785446167, -1.0445703268051147, -1.0048130750656128, -0.9650558233261108, -0.9252985715866089, -0.8855413794517517, -0.8457841277122498, -0.8060268759727478, -0.7662696838378906, -0.7265123724937439, -0.6867551207542419, -0.64699786901474, -0.6072406768798828, -0.5674834251403809, -0.5277261734008789, -0.48796892166137695, -0.4482116997241974, -0.40845444798469543, -0.3686971962451935, -0.3289399743080139, -0.28918272256851196, -0.2494254857301712, -0.20966824889183044, -0.1699109971523285, -0.13015377521514893, -0.09039652347564697, -0.050639282912015915, -0.010882042348384857, 0.0288752019405365, 0.06863243877887726, 0.10838967561721802, 0.14814692735671997, 0.18790414929389954, 0.2276614010334015, 0.26741865277290344, 0.307175874710083, 0.34693312644958496, 0.3866903781890869, 0.4264476001262665, 0.46620485186576843, 0.505962073802948, 0.54571932554245, 0.5854765772819519, 0.6252338290214539, 0.664991021156311, 0.704748272895813, 0.7445055246353149, 0.7842627763748169, 0.8240200281143188, 0.8637772798538208, 0.9035345315933228, 0.9432917833328247, 0.9830490350723267, 1.0228062868118286, 1.062563419342041, 1.102320671081543, 1.142077922821045, 1.1818351745605469]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 10.0, 16.0, 9.0, 13.0, 35.0, 36.0, 57.0, 76.0, 112.0, 163.0, 257.0, 356.0, 495.0, 755.0, 1166.0, 1832.0, 2828.0, 4551.0, 7334.0, 11790.0, 19237.0, 31382.0, 49733.0, 75503.0, 109138.0, 149427.0, 167305.0, 136680.0, 97392.0, 66818.0, 43133.0, 26990.0, 16337.0, 10206.0, 6393.0, 3887.0, 2407.0, 1551.0, 1034.0, 682.0, 445.0, 307.0, 191.0, 163.0, 87.0, 68.0, 49.0, 38.0, 26.0, 21.0, 16.0, 6.0, 0.0, 6.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.45068359375, -0.4367485046386719, -0.42281341552734375, -0.4088783264160156, -0.3949432373046875, -0.3810081481933594, -0.36707305908203125, -0.3531379699707031, -0.339202880859375, -0.3252677917480469, -0.31133270263671875, -0.2973976135253906, -0.2834625244140625, -0.2695274353027344, -0.25559234619140625, -0.24165725708007812, -0.22772216796875, -0.21378707885742188, -0.19985198974609375, -0.18591690063476562, -0.1719818115234375, -0.15804672241210938, -0.14411163330078125, -0.13017654418945312, -0.116241455078125, -0.10230636596679688, -0.08837127685546875, -0.07443618774414062, -0.0605010986328125, -0.046566009521484375, -0.03263092041015625, -0.018695831298828125, -0.0047607421875, 0.009174346923828125, 0.02310943603515625, 0.037044525146484375, 0.0509796142578125, 0.06491470336914062, 0.07884979248046875, 0.09278488159179688, 0.106719970703125, 0.12065505981445312, 0.13459014892578125, 0.14852523803710938, 0.1624603271484375, 0.17639541625976562, 0.19033050537109375, 0.20426559448242188, 0.21820068359375, 0.23213577270507812, 0.24607086181640625, 0.2600059509277344, 0.2739410400390625, 0.2878761291503906, 0.30181121826171875, 0.3157463073730469, 0.329681396484375, 0.3436164855957031, 0.35755157470703125, 0.3714866638183594, 0.3854217529296875, 0.3993568420410156, 0.41329193115234375, 0.4272270202636719, 0.441162109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 9.0, 6.0, 3.0, 13.0, 10.0, 14.0, 18.0, 12.0, 23.0, 34.0, 33.0, 31.0, 40.0, 35.0, 44.0, 34.0, 40.0, 34.0, 46.0, 39.0, 44.0, 43.0, 43.0, 44.0, 35.0, 33.0, 32.0, 29.0, 25.0, 24.0, 16.0, 27.0, 10.0, 18.0, 10.0, 10.0, 5.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79296875, -0.76776123046875, -0.7425537109375, -0.71734619140625, -0.692138671875, -0.66693115234375, -0.6417236328125, -0.61651611328125, -0.59130859375, -0.56610107421875, -0.5408935546875, -0.51568603515625, -0.490478515625, -0.46527099609375, -0.4400634765625, -0.41485595703125, -0.3896484375, -0.36444091796875, -0.3392333984375, -0.31402587890625, -0.288818359375, -0.26361083984375, -0.2384033203125, -0.21319580078125, -0.18798828125, -0.16278076171875, -0.1375732421875, -0.11236572265625, -0.087158203125, -0.06195068359375, -0.0367431640625, -0.01153564453125, 0.013671875, 0.03887939453125, 0.0640869140625, 0.08929443359375, 0.114501953125, 0.13970947265625, 0.1649169921875, 0.19012451171875, 0.21533203125, 0.24053955078125, 0.2657470703125, 0.29095458984375, 0.316162109375, 0.34136962890625, 0.3665771484375, 0.39178466796875, 0.4169921875, 0.44219970703125, 0.4674072265625, 0.49261474609375, 0.517822265625, 0.54302978515625, 0.5682373046875, 0.59344482421875, 0.61865234375, 0.64385986328125, 0.6690673828125, 0.69427490234375, 0.719482421875, 0.74468994140625, 0.7698974609375, 0.79510498046875, 0.8203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 4.0, 11.0, 5.0, 12.0, 17.0, 30.0, 33.0, 66.0, 86.0, 120.0, 265.0, 464.0, 856.0, 1821.0, 4691.0, 13456.0, 42485.0, 134809.0, 336255.0, 324697.0, 127626.0, 40222.0, 12479.0, 4443.0, 1736.0, 833.0, 406.0, 208.0, 152.0, 92.0, 52.0, 39.0, 27.0, 15.0, 14.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8916015625, -0.8628158569335938, -0.8340301513671875, -0.8052444458007812, -0.776458740234375, -0.7476730346679688, -0.7188873291015625, -0.6901016235351562, -0.66131591796875, -0.6325302124023438, -0.6037445068359375, -0.5749588012695312, -0.546173095703125, -0.5173873901367188, -0.4886016845703125, -0.45981597900390625, -0.4310302734375, -0.40224456787109375, -0.3734588623046875, -0.34467315673828125, -0.315887451171875, -0.28710174560546875, -0.2583160400390625, -0.22953033447265625, -0.20074462890625, -0.17195892333984375, -0.1431732177734375, -0.11438751220703125, -0.085601806640625, -0.05681610107421875, -0.0280303955078125, 0.00075531005859375, 0.029541015625, 0.05832672119140625, 0.0871124267578125, 0.11589813232421875, 0.144683837890625, 0.17346954345703125, 0.2022552490234375, 0.23104095458984375, 0.25982666015625, 0.28861236572265625, 0.3173980712890625, 0.34618377685546875, 0.374969482421875, 0.40375518798828125, 0.4325408935546875, 0.46132659912109375, 0.4901123046875, 0.5188980102539062, 0.5476837158203125, 0.5764694213867188, 0.605255126953125, 0.6340408325195312, 0.6628265380859375, 0.6916122436523438, 0.72039794921875, 0.7491836547851562, 0.7779693603515625, 0.8067550659179688, 0.835540771484375, 0.8643264770507812, 0.8931121826171875, 0.9218978881835938, 0.95068359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 5.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 7.0, 10.0, 8.0, 8.0, 12.0, 15.0, 15.0, 15.0, 23.0, 26.0, 17.0, 24.0, 31.0, 43.0, 40.0, 42.0, 43.0, 44.0, 48.0, 48.0, 48.0, 30.0, 32.0, 49.0, 39.0, 37.0, 31.0, 30.0, 27.0, 24.0, 20.0, 14.0, 16.0, 11.0, 16.0, 11.0, 6.0, 6.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4814453125, -1.430389404296875, -1.37933349609375, -1.328277587890625, -1.2772216796875, -1.226165771484375, -1.17510986328125, -1.124053955078125, -1.072998046875, -1.021942138671875, -0.97088623046875, -0.919830322265625, -0.8687744140625, -0.817718505859375, -0.76666259765625, -0.715606689453125, -0.66455078125, -0.613494873046875, -0.56243896484375, -0.511383056640625, -0.4603271484375, -0.409271240234375, -0.35821533203125, -0.307159423828125, -0.256103515625, -0.205047607421875, -0.15399169921875, -0.102935791015625, -0.0518798828125, -0.000823974609375, 0.05023193359375, 0.101287841796875, 0.15234375, 0.203399658203125, 0.25445556640625, 0.305511474609375, 0.3565673828125, 0.407623291015625, 0.45867919921875, 0.509735107421875, 0.560791015625, 0.611846923828125, 0.66290283203125, 0.713958740234375, 0.7650146484375, 0.816070556640625, 0.86712646484375, 0.918182373046875, 0.96923828125, 1.020294189453125, 1.07135009765625, 1.122406005859375, 1.1734619140625, 1.224517822265625, 1.27557373046875, 1.326629638671875, 1.377685546875, 1.428741455078125, 1.47979736328125, 1.530853271484375, 1.5819091796875, 1.632965087890625, 1.68402099609375, 1.735076904296875, 1.7861328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 6.0, 7.0, 4.0, 8.0, 17.0, 21.0, 25.0, 36.0, 62.0, 104.0, 174.0, 280.0, 508.0, 918.0, 1944.0, 4003.0, 9654.0, 27748.0, 96089.0, 344551.0, 392403.0, 116751.0, 32795.0, 11363.0, 4627.0, 2030.0, 1033.0, 564.0, 340.0, 172.0, 116.0, 63.0, 44.0, 20.0, 23.0, 16.0, 12.0, 15.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.21630859375, -0.21047401428222656, -0.20463943481445312, -0.1988048553466797, -0.19297027587890625, -0.1871356964111328, -0.18130111694335938, -0.17546653747558594, -0.1696319580078125, -0.16379737854003906, -0.15796279907226562, -0.1521282196044922, -0.14629364013671875, -0.1404590606689453, -0.13462448120117188, -0.12878990173339844, -0.122955322265625, -0.11712074279785156, -0.11128616333007812, -0.10545158386230469, -0.09961700439453125, -0.09378242492675781, -0.08794784545898438, -0.08211326599121094, -0.0762786865234375, -0.07044410705566406, -0.06460952758789062, -0.05877494812011719, -0.05294036865234375, -0.04710578918457031, -0.041271209716796875, -0.03543663024902344, -0.02960205078125, -0.023767471313476562, -0.017932891845703125, -0.012098312377929688, -0.00626373291015625, -0.0004291534423828125, 0.005405426025390625, 0.011240005493164062, 0.0170745849609375, 0.022909164428710938, 0.028743743896484375, 0.03457832336425781, 0.04041290283203125, 0.04624748229980469, 0.052082061767578125, 0.05791664123535156, 0.063751220703125, 0.06958580017089844, 0.07542037963867188, 0.08125495910644531, 0.08708953857421875, 0.09292411804199219, 0.09875869750976562, 0.10459327697753906, 0.1104278564453125, 0.11626243591308594, 0.12209701538085938, 0.1279315948486328, 0.13376617431640625, 0.1396007537841797, 0.14543533325195312, 0.15126991271972656, 0.1571044921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 9.0, 10.0, 15.0, 13.0, 14.0, 28.0, 28.0, 44.0, 48.0, 59.0, 91.0, 103.0, 95.0, 81.0, 70.0, 56.0, 36.0, 40.0, 27.0, 22.0, 20.0, 15.0, 12.0, 6.0, 5.0, 9.0, 3.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00012302398681640625, -0.00011891871690750122, -0.00011481344699859619, -0.00011070817708969116, -0.00010660290718078613, -0.0001024976372718811, -9.839236736297607e-05, -9.428709745407104e-05, -9.018182754516602e-05, -8.607655763626099e-05, -8.197128772735596e-05, -7.786601781845093e-05, -7.37607479095459e-05, -6.965547800064087e-05, -6.555020809173584e-05, -6.144493818283081e-05, -5.733966827392578e-05, -5.323439836502075e-05, -4.912912845611572e-05, -4.502385854721069e-05, -4.0918588638305664e-05, -3.6813318729400635e-05, -3.2708048820495605e-05, -2.8602778911590576e-05, -2.4497509002685547e-05, -2.0392239093780518e-05, -1.6286969184875488e-05, -1.2181699275970459e-05, -8.07642936706543e-06, -3.9711594581604e-06, 1.341104507446289e-07, 4.239380359649658e-06, 8.344650268554688e-06, 1.2449920177459717e-05, 1.6555190086364746e-05, 2.0660459995269775e-05, 2.4765729904174805e-05, 2.8870999813079834e-05, 3.297626972198486e-05, 3.708153963088989e-05, 4.118680953979492e-05, 4.529207944869995e-05, 4.939734935760498e-05, 5.350261926651001e-05, 5.760788917541504e-05, 6.171315908432007e-05, 6.58184289932251e-05, 6.992369890213013e-05, 7.402896881103516e-05, 7.813423871994019e-05, 8.223950862884521e-05, 8.634477853775024e-05, 9.045004844665527e-05, 9.45553183555603e-05, 9.866058826446533e-05, 0.00010276585817337036, 0.00010687112808227539, 0.00011097639799118042, 0.00011508166790008545, 0.00011918693780899048, 0.0001232922077178955, 0.00012739747762680054, 0.00013150274753570557, 0.0001356080174446106, 0.00013971328735351562]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 7.0, 15.0, 17.0, 43.0, 61.0, 137.0, 288.0, 1027.0, 5710.0, 118456.0, 869512.0, 48432.0, 3619.0, 771.0, 217.0, 100.0, 45.0, 18.0, 24.0, 14.0, 11.0, 8.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4765625, -0.45915985107421875, -0.4417572021484375, -0.42435455322265625, -0.406951904296875, -0.38954925537109375, -0.3721466064453125, -0.35474395751953125, -0.33734130859375, -0.31993865966796875, -0.3025360107421875, -0.28513336181640625, -0.267730712890625, -0.25032806396484375, -0.2329254150390625, -0.21552276611328125, -0.1981201171875, -0.18071746826171875, -0.1633148193359375, -0.14591217041015625, -0.128509521484375, -0.11110687255859375, -0.0937042236328125, -0.07630157470703125, -0.05889892578125, -0.04149627685546875, -0.0240936279296875, -0.00669097900390625, 0.010711669921875, 0.02811431884765625, 0.0455169677734375, 0.06291961669921875, 0.080322265625, 0.09772491455078125, 0.1151275634765625, 0.13253021240234375, 0.149932861328125, 0.16733551025390625, 0.1847381591796875, 0.20214080810546875, 0.21954345703125, 0.23694610595703125, 0.2543487548828125, 0.27175140380859375, 0.289154052734375, 0.30655670166015625, 0.3239593505859375, 0.34136199951171875, 0.3587646484375, 0.37616729736328125, 0.3935699462890625, 0.41097259521484375, 0.428375244140625, 0.44577789306640625, 0.4631805419921875, 0.48058319091796875, 0.49798583984375, 0.5153884887695312, 0.5327911376953125, 0.5501937866210938, 0.567596435546875, 0.5849990844726562, 0.6024017333984375, 0.6198043823242188, 0.63720703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 10.0, 14.0, 16.0, 21.0, 31.0, 58.0, 56.0, 73.0, 81.0, 138.0, 113.0, 100.0, 88.0, 59.0, 44.0, 32.0, 20.0, 13.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080078125, -0.07722663879394531, -0.07437515258789062, -0.07152366638183594, -0.06867218017578125, -0.06582069396972656, -0.06296920776367188, -0.06011772155761719, -0.0572662353515625, -0.05441474914550781, -0.051563262939453125, -0.04871177673339844, -0.04586029052734375, -0.04300880432128906, -0.040157318115234375, -0.03730583190917969, -0.034454345703125, -0.03160285949707031, -0.028751373291015625, -0.025899887084960938, -0.02304840087890625, -0.020196914672851562, -0.017345428466796875, -0.014493942260742188, -0.0116424560546875, -0.008790969848632812, -0.005939483642578125, -0.0030879974365234375, -0.00023651123046875, 0.0026149749755859375, 0.005466461181640625, 0.008317947387695312, 0.01116943359375, 0.014020919799804688, 0.016872406005859375, 0.019723892211914062, 0.02257537841796875, 0.025426864624023438, 0.028278350830078125, 0.031129837036132812, 0.0339813232421875, 0.03683280944824219, 0.039684295654296875, 0.04253578186035156, 0.04538726806640625, 0.04823875427246094, 0.051090240478515625, 0.05394172668457031, 0.056793212890625, 0.05964469909667969, 0.062496185302734375, 0.06534767150878906, 0.06819915771484375, 0.07105064392089844, 0.07390213012695312, 0.07675361633300781, 0.0796051025390625, 0.08245658874511719, 0.08530807495117188, 0.08815956115722656, 0.09101104736328125, 0.09386253356933594, 0.09671401977539062, 0.09956550598144531, 0.1024169921875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 15.0, 33.0, 74.0, 158.0, 217.0, 215.0, 164.0, 69.0, 29.0, 19.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.363602638244629, -2.260921001434326, -2.1582393646240234, -2.0555577278137207, -1.952876091003418, -1.8501944541931152, -1.747512698173523, -1.6448310613632202, -1.5421494245529175, -1.4394677877426147, -1.336786150932312, -1.2341043949127197, -1.131422758102417, -1.0287411212921143, -0.9260594844818115, -0.8233778476715088, -0.720696210861206, -0.6180145740509033, -0.5153329372406006, -0.4126512408256531, -0.30996960401535034, -0.2072879672050476, -0.1046062707901001, -0.0019246339797973633, 0.10075700283050537, 0.2034386545419693, 0.3061203062534332, 0.40880197286605835, 0.5114836096763611, 0.6141652464866638, 0.7168469429016113, 0.8195285797119141, 0.9222102165222168, 1.0248918533325195, 1.1275734901428223, 1.230255126953125, 1.3329367637634277, 1.4356184005737305, 1.5383001565933228, 1.6409817934036255, 1.7436634302139282, 1.846345067024231, 1.9490267038345337, 2.051708459854126, 2.1543900966644287, 2.2570717334747314, 2.359753370285034, 2.462435007095337, 2.5651166439056396, 2.6677982807159424, 2.770479917526245, 2.873161554336548, 2.9758431911468506, 3.0785248279571533, 3.181206703186035, 3.283888339996338, 3.3865699768066406, 3.4892516136169434, 3.591933250427246, 3.694614887237549, 3.7972965240478516, 3.8999781608581543, 4.002659797668457, 4.10534143447876, 4.2080230712890625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 7.0, 10.0, 8.0, 9.0, 12.0, 18.0, 24.0, 24.0, 33.0, 21.0, 31.0, 36.0, 35.0, 45.0, 33.0, 64.0, 39.0, 45.0, 45.0, 45.0, 40.0, 30.0, 41.0, 45.0, 23.0, 36.0, 40.0, 25.0, 21.0, 18.0, 16.0, 15.0, 13.0, 12.0, 9.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7979270219802856, -0.7721570134162903, -0.7463870644569397, -0.7206170558929443, -0.6948471069335938, -0.6690770983695984, -0.643307089805603, -0.6175371408462524, -0.5917671322822571, -0.5659971237182617, -0.5402271747589111, -0.5144571661949158, -0.4886871874332428, -0.4629172086715698, -0.43714720010757446, -0.4113772213459015, -0.3856072425842285, -0.35983726382255554, -0.33406728506088257, -0.3082972764968872, -0.28252729773521423, -0.25675731897354126, -0.2309873253107071, -0.20521733164787292, -0.17944735288619995, -0.15367737412452698, -0.1279073804616928, -0.10213739424943924, -0.07636740803718567, -0.050597429275512695, -0.024827435612678528, 0.0009425580501556396, 0.02671259641647339, 0.05248258262872696, 0.07825256884098053, 0.1040225550532341, 0.12979254126548767, 0.15556252002716064, 0.1813325136899948, 0.20710250735282898, 0.23287248611450195, 0.2586424648761749, 0.2844124436378479, 0.31018245220184326, 0.33595243096351624, 0.3617224097251892, 0.38749241828918457, 0.41326239705085754, 0.4390323758125305, 0.4648023545742035, 0.49057233333587646, 0.5163423418998718, 0.5421123504638672, 0.5678822994232178, 0.5936523079872131, 0.6194223165512085, 0.6451922655105591, 0.6709622740745544, 0.696732223033905, 0.7225022315979004, 0.748272180557251, 0.7740421891212463, 0.7998121976852417, 0.8255821466445923, 0.8513521552085876]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 8.0, 3.0, 8.0, 14.0, 21.0, 27.0, 45.0, 68.0, 114.0, 137.0, 202.0, 338.0, 510.0, 824.0, 1433.0, 2427.0, 3846.0, 6787.0, 12136.0, 21624.0, 39585.0, 73263.0, 131965.0, 215522.0, 222356.0, 140589.0, 78571.0, 42610.0, 23151.0, 12772.0, 7202.0, 4062.0, 2405.0, 1472.0, 856.0, 550.0, 349.0, 246.0, 145.0, 107.0, 79.0, 39.0, 22.0, 26.0, 14.0, 9.0, 6.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.26392364501953125, -0.2551422119140625, -0.24636077880859375, -0.237579345703125, -0.22879791259765625, -0.2200164794921875, -0.21123504638671875, -0.20245361328125, -0.19367218017578125, -0.1848907470703125, -0.17610931396484375, -0.167327880859375, -0.15854644775390625, -0.1497650146484375, -0.14098358154296875, -0.1322021484375, -0.12342071533203125, -0.1146392822265625, -0.10585784912109375, -0.097076416015625, -0.08829498291015625, -0.0795135498046875, -0.07073211669921875, -0.06195068359375, -0.05316925048828125, -0.0443878173828125, -0.03560638427734375, -0.026824951171875, -0.01804351806640625, -0.0092620849609375, -0.00048065185546875, 0.00830078125, 0.01708221435546875, 0.0258636474609375, 0.03464508056640625, 0.043426513671875, 0.05220794677734375, 0.0609893798828125, 0.06977081298828125, 0.07855224609375, 0.08733367919921875, 0.0961151123046875, 0.10489654541015625, 0.113677978515625, 0.12245941162109375, 0.1312408447265625, 0.14002227783203125, 0.1488037109375, 0.15758514404296875, 0.1663665771484375, 0.17514801025390625, 0.183929443359375, 0.19271087646484375, 0.2014923095703125, 0.21027374267578125, 0.21905517578125, 0.22783660888671875, 0.2366180419921875, 0.24539947509765625, 0.254180908203125, 0.26296234130859375, 0.2717437744140625, 0.28052520751953125, 0.289306640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 6.0, 9.0, 7.0, 11.0, 13.0, 14.0, 22.0, 21.0, 34.0, 24.0, 41.0, 26.0, 35.0, 40.0, 52.0, 51.0, 45.0, 47.0, 49.0, 50.0, 46.0, 37.0, 38.0, 35.0, 37.0, 37.0, 30.0, 22.0, 14.0, 18.0, 14.0, 20.0, 12.0, 8.0, 6.0, 11.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.47265625, -4.33587646484375, -4.1990966796875, -4.06231689453125, -3.925537109375, -3.78875732421875, -3.6519775390625, -3.51519775390625, -3.37841796875, -3.24163818359375, -3.1048583984375, -2.96807861328125, -2.831298828125, -2.69451904296875, -2.5577392578125, -2.42095947265625, -2.2841796875, -2.14739990234375, -2.0106201171875, -1.87384033203125, -1.737060546875, -1.60028076171875, -1.4635009765625, -1.32672119140625, -1.18994140625, -1.05316162109375, -0.9163818359375, -0.77960205078125, -0.642822265625, -0.50604248046875, -0.3692626953125, -0.23248291015625, -0.095703125, 0.04107666015625, 0.1778564453125, 0.31463623046875, 0.451416015625, 0.58819580078125, 0.7249755859375, 0.86175537109375, 0.99853515625, 1.13531494140625, 1.2720947265625, 1.40887451171875, 1.545654296875, 1.68243408203125, 1.8192138671875, 1.95599365234375, 2.0927734375, 2.22955322265625, 2.3663330078125, 2.50311279296875, 2.639892578125, 2.77667236328125, 2.9134521484375, 3.05023193359375, 3.18701171875, 3.32379150390625, 3.4605712890625, 3.59735107421875, 3.734130859375, 3.87091064453125, 4.0076904296875, 4.14447021484375, 4.28125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 8.0, 7.0, 8.0, 8.0, 11.0, 13.0, 25.0, 15.0, 25.0, 32.0, 50.0, 47.0, 60.0, 75.0, 100.0, 138.0, 228.0, 386.0, 1035.0, 7498.0, 693518.0, 338703.0, 4590.0, 839.0, 382.0, 206.0, 126.0, 91.0, 62.0, 44.0, 46.0, 32.0, 36.0, 35.0, 15.0, 8.0, 9.0, 8.0, 11.0, 5.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.328125, -2.24761962890625, -2.1671142578125, -2.08660888671875, -2.006103515625, -1.92559814453125, -1.8450927734375, -1.76458740234375, -1.68408203125, -1.60357666015625, -1.5230712890625, -1.44256591796875, -1.362060546875, -1.28155517578125, -1.2010498046875, -1.12054443359375, -1.0400390625, -0.95953369140625, -0.8790283203125, -0.79852294921875, -0.718017578125, -0.63751220703125, -0.5570068359375, -0.47650146484375, -0.39599609375, -0.31549072265625, -0.2349853515625, -0.15447998046875, -0.073974609375, 0.00653076171875, 0.0870361328125, 0.16754150390625, 0.248046875, 0.32855224609375, 0.4090576171875, 0.48956298828125, 0.570068359375, 0.65057373046875, 0.7310791015625, 0.81158447265625, 0.89208984375, 0.97259521484375, 1.0531005859375, 1.13360595703125, 1.214111328125, 1.29461669921875, 1.3751220703125, 1.45562744140625, 1.5361328125, 1.61663818359375, 1.6971435546875, 1.77764892578125, 1.858154296875, 1.93865966796875, 2.0191650390625, 2.09967041015625, 2.18017578125, 2.26068115234375, 2.3411865234375, 2.42169189453125, 2.502197265625, 2.58270263671875, 2.6632080078125, 2.74371337890625, 2.82421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 9.0, 13.0, 12.0, 17.0, 17.0, 21.0, 28.0, 32.0, 24.0, 31.0, 24.0, 38.0, 40.0, 43.0, 42.0, 38.0, 39.0, 42.0, 40.0, 38.0, 34.0, 41.0, 44.0, 27.0, 36.0, 24.0, 23.0, 22.0, 24.0, 26.0, 24.0, 10.0, 8.0, 6.0, 9.0, 12.0, 9.0, 3.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.609375, -3.483642578125, -3.35791015625, -3.232177734375, -3.1064453125, -2.980712890625, -2.85498046875, -2.729248046875, -2.603515625, -2.477783203125, -2.35205078125, -2.226318359375, -2.1005859375, -1.974853515625, -1.84912109375, -1.723388671875, -1.59765625, -1.471923828125, -1.34619140625, -1.220458984375, -1.0947265625, -0.968994140625, -0.84326171875, -0.717529296875, -0.591796875, -0.466064453125, -0.34033203125, -0.214599609375, -0.0888671875, 0.036865234375, 0.16259765625, 0.288330078125, 0.4140625, 0.539794921875, 0.66552734375, 0.791259765625, 0.9169921875, 1.042724609375, 1.16845703125, 1.294189453125, 1.419921875, 1.545654296875, 1.67138671875, 1.797119140625, 1.9228515625, 2.048583984375, 2.17431640625, 2.300048828125, 2.42578125, 2.551513671875, 2.67724609375, 2.802978515625, 2.9287109375, 3.054443359375, 3.18017578125, 3.305908203125, 3.431640625, 3.557373046875, 3.68310546875, 3.808837890625, 3.9345703125, 4.060302734375, 4.18603515625, 4.311767578125, 4.4375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 0.0, 2.0, 8.0, 12.0, 12.0, 23.0, 33.0, 46.0, 73.0, 93.0, 186.0, 273.0, 543.0, 1068.0, 2299.0, 5643.0, 18151.0, 77801.0, 642498.0, 241609.0, 40055.0, 10814.0, 3850.0, 1591.0, 795.0, 430.0, 255.0, 152.0, 63.0, 57.0, 42.0, 24.0, 15.0, 13.0, 13.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1363525390625, -0.1320629119873047, -0.12777328491210938, -0.12348365783691406, -0.11919403076171875, -0.11490440368652344, -0.11061477661132812, -0.10632514953613281, -0.1020355224609375, -0.09774589538574219, -0.09345626831054688, -0.08916664123535156, -0.08487701416015625, -0.08058738708496094, -0.07629776000976562, -0.07200813293457031, -0.067718505859375, -0.06342887878417969, -0.059139251708984375, -0.05484962463378906, -0.05055999755859375, -0.04627037048339844, -0.041980743408203125, -0.03769111633300781, -0.0334014892578125, -0.029111862182617188, -0.024822235107421875, -0.020532608032226562, -0.01624298095703125, -0.011953353881835938, -0.007663726806640625, -0.0033740997314453125, 0.00091552734375, 0.0052051544189453125, 0.009494781494140625, 0.013784408569335938, 0.01807403564453125, 0.022363662719726562, 0.026653289794921875, 0.030942916870117188, 0.0352325439453125, 0.03952217102050781, 0.043811798095703125, 0.04810142517089844, 0.05239105224609375, 0.05668067932128906, 0.060970306396484375, 0.06525993347167969, 0.069549560546875, 0.07383918762207031, 0.07812881469726562, 0.08241844177246094, 0.08670806884765625, 0.09099769592285156, 0.09528732299804688, 0.09957695007324219, 0.1038665771484375, 0.10815620422363281, 0.11244583129882812, 0.11673545837402344, 0.12102508544921875, 0.12531471252441406, 0.12960433959960938, 0.1338939666748047, 0.13818359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 9.0, 16.0, 26.0, 39.0, 60.0, 128.0, 240.0, 217.0, 114.0, 55.0, 30.0, 21.0, 17.0, 7.0, 6.0, 0.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2988529205322266e-05, -5.1625072956085205e-05, -5.0261616706848145e-05, -4.8898160457611084e-05, -4.7534704208374023e-05, -4.617124795913696e-05, -4.48077917098999e-05, -4.344433546066284e-05, -4.208087921142578e-05, -4.071742296218872e-05, -3.935396671295166e-05, -3.79905104637146e-05, -3.662705421447754e-05, -3.526359796524048e-05, -3.390014171600342e-05, -3.253668546676636e-05, -3.11732292175293e-05, -2.9809772968292236e-05, -2.8446316719055176e-05, -2.7082860469818115e-05, -2.5719404220581055e-05, -2.4355947971343994e-05, -2.2992491722106934e-05, -2.1629035472869873e-05, -2.0265579223632812e-05, -1.8902122974395752e-05, -1.753866672515869e-05, -1.617521047592163e-05, -1.481175422668457e-05, -1.344829797744751e-05, -1.208484172821045e-05, -1.0721385478973389e-05, -9.357929229736328e-06, -7.994472980499268e-06, -6.631016731262207e-06, -5.2675604820251465e-06, -3.904104232788086e-06, -2.5406479835510254e-06, -1.1771917343139648e-06, 1.862645149230957e-07, 1.5497207641601562e-06, 2.913177013397217e-06, 4.276633262634277e-06, 5.640089511871338e-06, 7.0035457611083984e-06, 8.367002010345459e-06, 9.73045825958252e-06, 1.109391450881958e-05, 1.245737075805664e-05, 1.3820827007293701e-05, 1.5184283256530762e-05, 1.6547739505767822e-05, 1.7911195755004883e-05, 1.9274652004241943e-05, 2.0638108253479004e-05, 2.2001564502716064e-05, 2.3365020751953125e-05, 2.4728477001190186e-05, 2.6091933250427246e-05, 2.7455389499664307e-05, 2.8818845748901367e-05, 3.0182301998138428e-05, 3.154575824737549e-05, 3.290921449661255e-05, 3.427267074584961e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 10.0, 22.0, 32.0, 32.0, 53.0, 61.0, 114.0, 150.0, 253.0, 411.0, 757.0, 1712.0, 4209.0, 13126.0, 49936.0, 349796.0, 538678.0, 63976.0, 16055.0, 4979.0, 1981.0, 929.0, 450.0, 298.0, 161.0, 127.0, 66.0, 43.0, 54.0, 24.0, 14.0, 13.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.1336517333984375, -0.129486083984375, -0.1253204345703125, -0.12115478515625, -0.1169891357421875, -0.112823486328125, -0.1086578369140625, -0.1044921875, -0.1003265380859375, -0.096160888671875, -0.0919952392578125, -0.08782958984375, -0.0836639404296875, -0.079498291015625, -0.0753326416015625, -0.0711669921875, -0.0670013427734375, -0.062835693359375, -0.0586700439453125, -0.05450439453125, -0.0503387451171875, -0.046173095703125, -0.0420074462890625, -0.037841796875, -0.0336761474609375, -0.029510498046875, -0.0253448486328125, -0.02117919921875, -0.0170135498046875, -0.012847900390625, -0.0086822509765625, -0.0045166015625, -0.0003509521484375, 0.003814697265625, 0.0079803466796875, 0.01214599609375, 0.0163116455078125, 0.020477294921875, 0.0246429443359375, 0.02880859375, 0.0329742431640625, 0.037139892578125, 0.0413055419921875, 0.04547119140625, 0.0496368408203125, 0.053802490234375, 0.0579681396484375, 0.0621337890625, 0.0662994384765625, 0.070465087890625, 0.0746307373046875, 0.07879638671875, 0.0829620361328125, 0.087127685546875, 0.0912933349609375, 0.095458984375, 0.0996246337890625, 0.103790283203125, 0.1079559326171875, 0.11212158203125, 0.1162872314453125, 0.120452880859375, 0.1246185302734375, 0.1287841796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 6.0, 5.0, 7.0, 15.0, 16.0, 25.0, 15.0, 30.0, 23.0, 46.0, 71.0, 96.0, 134.0, 132.0, 107.0, 71.0, 43.0, 28.0, 29.0, 15.0, 12.0, 9.0, 13.0, 12.0, 4.0, 9.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04718017578125, -0.04583597183227539, -0.04449176788330078, -0.04314756393432617, -0.04180335998535156, -0.04045915603637695, -0.039114952087402344, -0.037770748138427734, -0.036426544189453125, -0.035082340240478516, -0.033738136291503906, -0.0323939323425293, -0.031049728393554688, -0.029705524444580078, -0.02836132049560547, -0.02701711654663086, -0.02567291259765625, -0.02432870864868164, -0.02298450469970703, -0.021640300750732422, -0.020296096801757812, -0.018951892852783203, -0.017607688903808594, -0.016263484954833984, -0.014919281005859375, -0.013575077056884766, -0.012230873107910156, -0.010886669158935547, -0.009542465209960938, -0.008198261260986328, -0.006854057312011719, -0.005509853363037109, -0.0041656494140625, -0.0028214454650878906, -0.0014772415161132812, -0.00013303756713867188, 0.0012111663818359375, 0.002555370330810547, 0.0038995742797851562, 0.005243778228759766, 0.006587982177734375, 0.007932186126708984, 0.009276390075683594, 0.010620594024658203, 0.011964797973632812, 0.013309001922607422, 0.014653205871582031, 0.01599740982055664, 0.01734161376953125, 0.01868581771850586, 0.02003002166748047, 0.021374225616455078, 0.022718429565429688, 0.024062633514404297, 0.025406837463378906, 0.026751041412353516, 0.028095245361328125, 0.029439449310302734, 0.030783653259277344, 0.03212785720825195, 0.03347206115722656, 0.03481626510620117, 0.03616046905517578, 0.03750467300415039, 0.038848876953125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 50.0, 629.0, 325.0, 17.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.586158752441406, -35.9533805847168, -35.32060241699219, -34.68782424926758, -34.05504608154297, -33.422271728515625, -32.789493560791016, -32.156715393066406, -31.523937225341797, -30.891159057617188, -30.258380889892578, -29.6256046295166, -28.992826461791992, -28.360048294067383, -27.727270126342773, -27.094491958618164, -26.461713790893555, -25.828935623168945, -25.196157455444336, -24.56338119506836, -23.93060302734375, -23.29782485961914, -22.66504669189453, -22.032268524169922, -21.399490356445312, -20.766712188720703, -20.133934020996094, -19.501157760620117, -18.868379592895508, -18.2356014251709, -17.60282325744629, -16.97004508972168, -16.33726692199707, -15.704488754272461, -15.071711540222168, -14.438933372497559, -13.806156158447266, -13.173377990722656, -12.540599822998047, -11.907821655273438, -11.275044441223145, -10.642266273498535, -10.009489059448242, -9.376710891723633, -8.743932723999023, -8.11115550994873, -7.478377342224121, -6.84559965133667, -6.212821960449219, -5.580044269561768, -4.947266578674316, -4.314488410949707, -3.681710720062256, -3.0489330291748047, -2.4161550998687744, -1.7833771705627441, -1.150599479675293, -0.5178216695785522, 0.11495614051818848, 0.7477339506149292, 1.38051176071167, 2.013289451599121, 2.6460673809051514, 3.2788453102111816, 3.911623001098633]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 3.0, 5.0, 0.0, 4.0, 10.0, 6.0, 19.0, 13.0, 20.0, 16.0, 12.0, 22.0, 21.0, 34.0, 37.0, 40.0, 25.0, 31.0, 34.0, 33.0, 38.0, 48.0, 39.0, 36.0, 32.0, 36.0, 45.0, 37.0, 36.0, 36.0, 31.0, 16.0, 23.0, 31.0, 22.0, 27.0, 15.0, 11.0, 13.0, 6.0, 5.0, 3.0, 2.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.821846961975098, -5.630846977233887, -5.439846992492676, -5.248847007751465, -5.057846546173096, -4.866846561431885, -4.675846576690674, -4.484846591949463, -4.293846130371094, -4.102846145629883, -3.9118459224700928, -3.720845937728882, -3.529845714569092, -3.338845729827881, -3.14784574508667, -2.956845760345459, -2.765845775604248, -2.574845790863037, -2.383845567703247, -2.192845582962036, -2.001845359802246, -1.8108453750610352, -1.6198453903198242, -1.4288452863693237, -1.2378451824188232, -1.0468450784683228, -0.855845034122467, -0.6648449897766113, -0.47384488582611084, -0.28284478187561035, -0.09184479713439941, 0.09915530681610107, 0.29015541076660156, 0.48115548491477966, 0.6721555590629578, 0.8631556034088135, 1.054155707359314, 1.2451558113098145, 1.4361557960510254, 1.6271559000015259, 1.8181560039520264, 2.0091559886932373, 2.2001562118530273, 2.3911561965942383, 2.582156181335449, 2.7731564044952393, 2.96415638923645, 3.1551566123962402, 3.346156597137451, 3.537156581878662, 3.728156805038452, 3.919156789779663, 4.110157012939453, 4.301156997680664, 4.492156982421875, 4.683156967163086, 4.874156951904297, 5.065156936645508, 5.256156921386719, 5.44715690612793, 5.638157367706299, 5.82915735244751, 6.020157337188721, 6.211157321929932, 6.402157783508301]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 9.0, 1.0, 8.0, 4.0, 10.0, 9.0, 16.0, 14.0, 14.0, 29.0, 23.0, 30.0, 65.0, 89.0, 148.0, 277.0, 697.0, 1816.0, 7267.0, 35438.0, 429631.0, 2797194.0, 845991.0, 61685.0, 9562.0, 2529.0, 855.0, 348.0, 174.0, 90.0, 44.0, 39.0, 35.0, 34.0, 22.0, 16.0, 13.0, 11.0, 6.0, 6.0, 9.0, 5.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.923828125, -1.8666229248046875, -1.809417724609375, -1.7522125244140625, -1.69500732421875, -1.6378021240234375, -1.580596923828125, -1.5233917236328125, -1.4661865234375, -1.4089813232421875, -1.351776123046875, -1.2945709228515625, -1.23736572265625, -1.1801605224609375, -1.122955322265625, -1.0657501220703125, -1.008544921875, -0.9513397216796875, -0.894134521484375, -0.8369293212890625, -0.77972412109375, -0.7225189208984375, -0.665313720703125, -0.6081085205078125, -0.5509033203125, -0.4936981201171875, -0.436492919921875, -0.3792877197265625, -0.32208251953125, -0.2648773193359375, -0.207672119140625, -0.1504669189453125, -0.09326171875, -0.0360565185546875, 0.021148681640625, 0.0783538818359375, 0.13555908203125, 0.1927642822265625, 0.249969482421875, 0.3071746826171875, 0.3643798828125, 0.4215850830078125, 0.478790283203125, 0.5359954833984375, 0.59320068359375, 0.6504058837890625, 0.707611083984375, 0.7648162841796875, 0.822021484375, 0.8792266845703125, 0.936431884765625, 0.9936370849609375, 1.05084228515625, 1.1080474853515625, 1.165252685546875, 1.2224578857421875, 1.2796630859375, 1.3368682861328125, 1.394073486328125, 1.4512786865234375, 1.50848388671875, 1.5656890869140625, 1.622894287109375, 1.6800994873046875, 1.7373046875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 11.0, 13.0, 9.0, 15.0, 28.0, 30.0, 38.0, 53.0, 47.0, 55.0, 58.0, 52.0, 74.0, 60.0, 57.0, 57.0, 55.0, 57.0, 46.0, 41.0, 28.0, 25.0, 22.0, 11.0, 16.0, 13.0, 4.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94140625, -0.9024200439453125, -0.863433837890625, -0.8244476318359375, -0.78546142578125, -0.7464752197265625, -0.707489013671875, -0.6685028076171875, -0.6295166015625, -0.5905303955078125, -0.551544189453125, -0.5125579833984375, -0.47357177734375, -0.4345855712890625, -0.395599365234375, -0.3566131591796875, -0.317626953125, -0.2786407470703125, -0.239654541015625, -0.2006683349609375, -0.16168212890625, -0.1226959228515625, -0.083709716796875, -0.0447235107421875, -0.0057373046875, 0.0332489013671875, 0.072235107421875, 0.1112213134765625, 0.15020751953125, 0.1891937255859375, 0.228179931640625, 0.2671661376953125, 0.30615234375, 0.3451385498046875, 0.384124755859375, 0.4231109619140625, 0.46209716796875, 0.5010833740234375, 0.540069580078125, 0.5790557861328125, 0.6180419921875, 0.6570281982421875, 0.696014404296875, 0.7350006103515625, 0.77398681640625, 0.8129730224609375, 0.851959228515625, 0.8909454345703125, 0.929931640625, 0.9689178466796875, 1.007904052734375, 1.0468902587890625, 1.08587646484375, 1.1248626708984375, 1.163848876953125, 1.2028350830078125, 1.2418212890625, 1.2808074951171875, 1.319793701171875, 1.3587799072265625, 1.39776611328125, 1.4367523193359375, 1.475738525390625, 1.5147247314453125, 1.5537109375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 27.0, 48.0, 179.0, 2471573.0, 1722150.0, 178.0, 52.0, 18.0, 16.0, 7.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.1875, -38.25439453125, -37.3212890625, -36.38818359375, -35.455078125, -34.52197265625, -33.5888671875, -32.65576171875, -31.72265625, -30.78955078125, -29.8564453125, -28.92333984375, -27.990234375, -27.05712890625, -26.1240234375, -25.19091796875, -24.2578125, -23.32470703125, -22.3916015625, -21.45849609375, -20.525390625, -19.59228515625, -18.6591796875, -17.72607421875, -16.79296875, -15.85986328125, -14.9267578125, -13.99365234375, -13.060546875, -12.12744140625, -11.1943359375, -10.26123046875, -9.328125, -8.39501953125, -7.4619140625, -6.52880859375, -5.595703125, -4.66259765625, -3.7294921875, -2.79638671875, -1.86328125, -0.93017578125, 0.0029296875, 0.93603515625, 1.869140625, 2.80224609375, 3.7353515625, 4.66845703125, 5.6015625, 6.53466796875, 7.4677734375, 8.40087890625, 9.333984375, 10.26708984375, 11.2001953125, 12.13330078125, 13.06640625, 13.99951171875, 14.9326171875, 15.86572265625, 16.798828125, 17.73193359375, 18.6650390625, 19.59814453125, 20.53125]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 17.0, 22.0, 43.0, 77.0, 144.0, 313.0, 789.0, 1232.0, 767.0, 323.0, 170.0, 72.0, 35.0, 28.0, 13.0, 8.0, 5.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94873046875, -0.9240646362304688, -0.8993988037109375, -0.8747329711914062, -0.850067138671875, -0.8254013061523438, -0.8007354736328125, -0.7760696411132812, -0.75140380859375, -0.7267379760742188, -0.7020721435546875, -0.6774063110351562, -0.652740478515625, -0.6280746459960938, -0.6034088134765625, -0.5787429809570312, -0.5540771484375, -0.5294113159179688, -0.5047454833984375, -0.48007965087890625, -0.455413818359375, -0.43074798583984375, -0.4060821533203125, -0.38141632080078125, -0.35675048828125, -0.33208465576171875, -0.3074188232421875, -0.28275299072265625, -0.258087158203125, -0.23342132568359375, -0.2087554931640625, -0.18408966064453125, -0.159423828125, -0.13475799560546875, -0.1100921630859375, -0.08542633056640625, -0.060760498046875, -0.03609466552734375, -0.0114288330078125, 0.01323699951171875, 0.03790283203125, 0.06256866455078125, 0.0872344970703125, 0.11190032958984375, 0.136566162109375, 0.16123199462890625, 0.1858978271484375, 0.21056365966796875, 0.2352294921875, 0.25989532470703125, 0.2845611572265625, 0.30922698974609375, 0.333892822265625, 0.35855865478515625, 0.3832244873046875, 0.40789031982421875, 0.43255615234375, 0.45722198486328125, 0.4818878173828125, 0.5065536499023438, 0.531219482421875, 0.5558853149414062, 0.5805511474609375, 0.6052169799804688, 0.6298828125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 14.0, 11.0, 17.0, 36.0, 34.0, 41.0, 70.0, 72.0, 66.0, 92.0, 88.0, 80.0, 89.0, 71.0, 55.0, 47.0, 17.0, 28.0, 20.0, 13.0, 12.0, 8.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4012956619262695, -1.3553353548049927, -1.3093749284744263, -1.2634146213531494, -1.217454195022583, -1.1714938879013062, -1.1255335807800293, -1.079573154449463, -1.0336127281188965, -0.9876523613929749, -0.9416919946670532, -0.8957316875457764, -0.84977126121521, -0.8038109540939331, -0.7578505873680115, -0.7118902206420898, -0.665929913520813, -0.6199695467948914, -0.5740091800689697, -0.5280488729476929, -0.48208847641944885, -0.4361281096935272, -0.390167772769928, -0.34420740604400635, -0.2982470393180847, -0.2522866725921631, -0.20632632076740265, -0.1603659689426422, -0.11440560221672058, -0.06844523549079895, -0.022484898567199707, 0.023475468158721924, 0.0694359540939331, 0.11539631336927414, 0.16135667264461517, 0.2073170244693756, 0.25327739119529724, 0.29923775792121887, 0.3451980948448181, 0.39115846157073975, 0.4371188282966614, 0.483079195022583, 0.5290395617485046, 0.5749999284744263, 0.6209602355957031, 0.6669206619262695, 0.7128809690475464, 0.758841335773468, 0.8048017024993896, 0.8507620692253113, 0.8967224359512329, 0.9426827430725098, 0.9886431694030762, 1.034603476524353, 1.0805637836456299, 1.1265242099761963, 1.1724846363067627, 1.2184449434280396, 1.264405369758606, 1.3103656768798828, 1.3563261032104492, 1.402286410331726, 1.448246717453003, 1.4942071437835693, 1.5401674509048462]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 15.0, 18.0, 15.0, 18.0, 18.0, 20.0, 30.0, 39.0, 30.0, 30.0, 21.0, 37.0, 34.0, 48.0, 43.0, 49.0, 46.0, 48.0, 52.0, 41.0, 52.0, 30.0, 35.0, 19.0, 25.0, 38.0, 22.0, 19.0, 15.0, 15.0, 18.0, 8.0, 10.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8428260684013367, -0.8140411972999573, -0.7852563261985779, -0.7564714550971985, -0.7276865839958191, -0.6989017128944397, -0.6701167821884155, -0.6413319110870361, -0.6125470399856567, -0.5837621688842773, -0.554977297782898, -0.5261924266815186, -0.49740755558013916, -0.46862268447875977, -0.439837783575058, -0.4110529124736786, -0.3822680711746216, -0.3534832000732422, -0.3246983289718628, -0.2959134578704834, -0.267128586769104, -0.23834370076656342, -0.20955881476402283, -0.18077394366264343, -0.15198907256126404, -0.12320420145988464, -0.09441932290792465, -0.06563444435596466, -0.036849573254585266, -0.008064702153205872, 0.020720183849334717, 0.04950505495071411, 0.0782899260520935, 0.1070747971534729, 0.1358596682548523, 0.16464455425739288, 0.19342942535877228, 0.22221429646015167, 0.25099918246269226, 0.27978405356407166, 0.30856892466545105, 0.33735379576683044, 0.36613866686820984, 0.3949235677719116, 0.423708438873291, 0.4524933099746704, 0.4812781810760498, 0.5100630521774292, 0.5388479232788086, 0.567632794380188, 0.5964176654815674, 0.6252025365829468, 0.6539874076843262, 0.6827722787857056, 0.711557149887085, 0.7403420209884644, 0.7691268920898438, 0.7979117631912231, 0.8266966342926025, 0.8554815053939819, 0.8842663764953613, 0.9130512475967407, 0.9418361186981201, 0.9706209897994995, 0.9994059205055237]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 5.0, 6.0, 11.0, 17.0, 30.0, 45.0, 55.0, 76.0, 143.0, 225.0, 405.0, 660.0, 1075.0, 1864.0, 3419.0, 6358.0, 12090.0, 23906.0, 49893.0, 110366.0, 242432.0, 300603.0, 157497.0, 69962.0, 32661.0, 16078.0, 8386.0, 4567.0, 2396.0, 1345.0, 773.0, 456.0, 279.0, 173.0, 106.0, 74.0, 48.0, 20.0, 20.0, 8.0, 10.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362548828125, -0.3492279052734375, -0.335906982421875, -0.3225860595703125, -0.30926513671875, -0.2959442138671875, -0.282623291015625, -0.2693023681640625, -0.2559814453125, -0.2426605224609375, -0.229339599609375, -0.2160186767578125, -0.20269775390625, -0.1893768310546875, -0.176055908203125, -0.1627349853515625, -0.1494140625, -0.1360931396484375, -0.122772216796875, -0.1094512939453125, -0.09613037109375, -0.0828094482421875, -0.069488525390625, -0.0561676025390625, -0.0428466796875, -0.0295257568359375, -0.016204833984375, -0.0028839111328125, 0.01043701171875, 0.0237579345703125, 0.037078857421875, 0.0503997802734375, 0.063720703125, 0.0770416259765625, 0.090362548828125, 0.1036834716796875, 0.11700439453125, 0.1303253173828125, 0.143646240234375, 0.1569671630859375, 0.1702880859375, 0.1836090087890625, 0.196929931640625, 0.2102508544921875, 0.22357177734375, 0.2368927001953125, 0.250213623046875, 0.2635345458984375, 0.27685546875, 0.2901763916015625, 0.303497314453125, 0.3168182373046875, 0.33013916015625, 0.3434600830078125, 0.356781005859375, 0.3701019287109375, 0.3834228515625, 0.3967437744140625, 0.410064697265625, 0.4233856201171875, 0.43670654296875, 0.4500274658203125, 0.463348388671875, 0.4766693115234375, 0.489990234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 13.0, 14.0, 17.0, 17.0, 19.0, 25.0, 24.0, 38.0, 34.0, 50.0, 56.0, 38.0, 39.0, 51.0, 44.0, 60.0, 57.0, 47.0, 46.0, 38.0, 46.0, 37.0, 31.0, 26.0, 26.0, 20.0, 18.0, 19.0, 9.0, 12.0, 5.0, 7.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60595703125, -0.5836029052734375, -0.561248779296875, -0.5388946533203125, -0.51654052734375, -0.4941864013671875, -0.471832275390625, -0.4494781494140625, -0.4271240234375, -0.4047698974609375, -0.382415771484375, -0.3600616455078125, -0.33770751953125, -0.3153533935546875, -0.292999267578125, -0.2706451416015625, -0.248291015625, -0.2259368896484375, -0.203582763671875, -0.1812286376953125, -0.15887451171875, -0.1365203857421875, -0.114166259765625, -0.0918121337890625, -0.0694580078125, -0.0471038818359375, -0.024749755859375, -0.0023956298828125, 0.01995849609375, 0.0423126220703125, 0.064666748046875, 0.0870208740234375, 0.109375, 0.1317291259765625, 0.154083251953125, 0.1764373779296875, 0.19879150390625, 0.2211456298828125, 0.243499755859375, 0.2658538818359375, 0.2882080078125, 0.3105621337890625, 0.332916259765625, 0.3552703857421875, 0.37762451171875, 0.3999786376953125, 0.422332763671875, 0.4446868896484375, 0.467041015625, 0.4893951416015625, 0.511749267578125, 0.5341033935546875, 0.55645751953125, 0.5788116455078125, 0.601165771484375, 0.6235198974609375, 0.6458740234375, 0.6682281494140625, 0.690582275390625, 0.7129364013671875, 0.73529052734375, 0.7576446533203125, 0.779998779296875, 0.8023529052734375, 0.82470703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 14.0, 8.0, 12.0, 25.0, 24.0, 45.0, 83.0, 106.0, 185.0, 280.0, 490.0, 972.0, 1872.0, 4010.0, 9404.0, 23813.0, 66248.0, 188819.0, 373466.0, 240522.0, 85921.0, 30576.0, 11867.0, 4976.0, 2229.0, 1080.0, 581.0, 353.0, 205.0, 133.0, 85.0, 52.0, 31.0, 25.0, 15.0, 8.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.54296875, -0.5281448364257812, -0.5133209228515625, -0.49849700927734375, -0.483673095703125, -0.46884918212890625, -0.4540252685546875, -0.43920135498046875, -0.42437744140625, -0.40955352783203125, -0.3947296142578125, -0.37990570068359375, -0.365081787109375, -0.35025787353515625, -0.3354339599609375, -0.32061004638671875, -0.3057861328125, -0.29096221923828125, -0.2761383056640625, -0.26131439208984375, -0.246490478515625, -0.23166656494140625, -0.2168426513671875, -0.20201873779296875, -0.18719482421875, -0.17237091064453125, -0.1575469970703125, -0.14272308349609375, -0.127899169921875, -0.11307525634765625, -0.0982513427734375, -0.08342742919921875, -0.068603515625, -0.05377960205078125, -0.0389556884765625, -0.02413177490234375, -0.009307861328125, 0.00551605224609375, 0.0203399658203125, 0.03516387939453125, 0.04998779296875, 0.06481170654296875, 0.0796356201171875, 0.09445953369140625, 0.109283447265625, 0.12410736083984375, 0.1389312744140625, 0.15375518798828125, 0.1685791015625, 0.18340301513671875, 0.1982269287109375, 0.21305084228515625, 0.227874755859375, 0.24269866943359375, 0.2575225830078125, 0.27234649658203125, 0.28717041015625, 0.30199432373046875, 0.3168182373046875, 0.33164215087890625, 0.346466064453125, 0.36128997802734375, 0.3761138916015625, 0.39093780517578125, 0.40576171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 6.0, 13.0, 9.0, 11.0, 21.0, 30.0, 23.0, 31.0, 29.0, 25.0, 51.0, 36.0, 35.0, 50.0, 59.0, 55.0, 54.0, 45.0, 33.0, 42.0, 40.0, 39.0, 41.0, 48.0, 24.0, 20.0, 23.0, 18.0, 11.0, 17.0, 13.0, 10.0, 4.0, 8.0, 2.0, 5.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0927734375, -1.0533294677734375, -1.013885498046875, -0.9744415283203125, -0.93499755859375, -0.8955535888671875, -0.856109619140625, -0.8166656494140625, -0.7772216796875, -0.7377777099609375, -0.698333740234375, -0.6588897705078125, -0.61944580078125, -0.5800018310546875, -0.540557861328125, -0.5011138916015625, -0.461669921875, -0.4222259521484375, -0.382781982421875, -0.3433380126953125, -0.30389404296875, -0.2644500732421875, -0.225006103515625, -0.1855621337890625, -0.1461181640625, -0.1066741943359375, -0.067230224609375, -0.0277862548828125, 0.01165771484375, 0.0511016845703125, 0.090545654296875, 0.1299896240234375, 0.16943359375, 0.2088775634765625, 0.248321533203125, 0.2877655029296875, 0.32720947265625, 0.3666534423828125, 0.406097412109375, 0.4455413818359375, 0.4849853515625, 0.5244293212890625, 0.563873291015625, 0.6033172607421875, 0.64276123046875, 0.6822052001953125, 0.721649169921875, 0.7610931396484375, 0.800537109375, 0.8399810791015625, 0.879425048828125, 0.9188690185546875, 0.95831298828125, 0.9977569580078125, 1.037200927734375, 1.0766448974609375, 1.1160888671875, 1.1555328369140625, 1.194976806640625, 1.2344207763671875, 1.27386474609375, 1.3133087158203125, 1.352752685546875, 1.3921966552734375, 1.431640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 7.0, 13.0, 10.0, 19.0, 11.0, 32.0, 35.0, 45.0, 99.0, 149.0, 253.0, 380.0, 588.0, 955.0, 1747.0, 3359.0, 6390.0, 13362.0, 30336.0, 73600.0, 174878.0, 313032.0, 240968.0, 107368.0, 43852.0, 18589.0, 8668.0, 4332.0, 2187.0, 1310.0, 730.0, 476.0, 284.0, 144.0, 91.0, 81.0, 55.0, 39.0, 28.0, 21.0, 11.0, 11.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.0863037109375, -0.0838174819946289, -0.08133125305175781, -0.07884502410888672, -0.07635879516601562, -0.07387256622314453, -0.07138633728027344, -0.06890010833740234, -0.06641387939453125, -0.06392765045166016, -0.06144142150878906, -0.05895519256591797, -0.056468963623046875, -0.05398273468017578, -0.05149650573730469, -0.049010276794433594, -0.0465240478515625, -0.044037818908691406, -0.04155158996582031, -0.03906536102294922, -0.036579132080078125, -0.03409290313720703, -0.03160667419433594, -0.029120445251464844, -0.02663421630859375, -0.024147987365722656, -0.021661758422851562, -0.01917552947998047, -0.016689300537109375, -0.014203071594238281, -0.011716842651367188, -0.009230613708496094, -0.006744384765625, -0.004258155822753906, -0.0017719268798828125, 0.0007143020629882812, 0.003200531005859375, 0.005686759948730469, 0.008172988891601562, 0.010659217834472656, 0.01314544677734375, 0.015631675720214844, 0.018117904663085938, 0.02060413360595703, 0.023090362548828125, 0.02557659149169922, 0.028062820434570312, 0.030549049377441406, 0.0330352783203125, 0.035521507263183594, 0.03800773620605469, 0.04049396514892578, 0.042980194091796875, 0.04546642303466797, 0.04795265197753906, 0.050438880920410156, 0.05292510986328125, 0.055411338806152344, 0.05789756774902344, 0.06038379669189453, 0.06287002563476562, 0.06535625457763672, 0.06784248352050781, 0.0703287124633789, 0.07281494140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 6.0, 9.0, 10.0, 13.0, 18.0, 22.0, 40.0, 50.0, 64.0, 80.0, 98.0, 105.0, 95.0, 94.0, 70.0, 54.0, 40.0, 26.0, 34.0, 22.0, 10.0, 10.0, 5.0, 3.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.441375732421875e-05, -9.152665734291077e-05, -8.863955736160278e-05, -8.57524573802948e-05, -8.286535739898682e-05, -7.997825741767883e-05, -7.709115743637085e-05, -7.420405745506287e-05, -7.131695747375488e-05, -6.84298574924469e-05, -6.554275751113892e-05, -6.265565752983093e-05, -5.976855754852295e-05, -5.6881457567214966e-05, -5.399435758590698e-05, -5.1107257604599e-05, -4.8220157623291016e-05, -4.533305764198303e-05, -4.244595766067505e-05, -3.9558857679367065e-05, -3.667175769805908e-05, -3.37846577167511e-05, -3.0897557735443115e-05, -2.8010457754135132e-05, -2.512335777282715e-05, -2.2236257791519165e-05, -1.934915781021118e-05, -1.6462057828903198e-05, -1.3574957847595215e-05, -1.0687857866287231e-05, -7.800757884979248e-06, -4.913657903671265e-06, -2.0265579223632812e-06, 8.605420589447021e-07, 3.7476420402526855e-06, 6.634742021560669e-06, 9.521842002868652e-06, 1.2408941984176636e-05, 1.529604196548462e-05, 1.8183141946792603e-05, 2.1070241928100586e-05, 2.395734190940857e-05, 2.6844441890716553e-05, 2.9731541872024536e-05, 3.261864185333252e-05, 3.55057418346405e-05, 3.8392841815948486e-05, 4.127994179725647e-05, 4.416704177856445e-05, 4.7054141759872437e-05, 4.994124174118042e-05, 5.28283417224884e-05, 5.571544170379639e-05, 5.860254168510437e-05, 6.148964166641235e-05, 6.437674164772034e-05, 6.726384162902832e-05, 7.01509416103363e-05, 7.303804159164429e-05, 7.592514157295227e-05, 7.881224155426025e-05, 8.169934153556824e-05, 8.458644151687622e-05, 8.74735414981842e-05, 9.036064147949219e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 12.0, 13.0, 27.0, 29.0, 32.0, 64.0, 98.0, 360.0, 4012.0, 312282.0, 720970.0, 9691.0, 556.0, 141.0, 71.0, 42.0, 40.0, 18.0, 18.0, 15.0, 14.0, 3.0, 4.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.40380859375, -0.3916168212890625, -0.379425048828125, -0.3672332763671875, -0.35504150390625, -0.3428497314453125, -0.330657958984375, -0.3184661865234375, -0.3062744140625, -0.2940826416015625, -0.281890869140625, -0.2696990966796875, -0.25750732421875, -0.2453155517578125, -0.233123779296875, -0.2209320068359375, -0.208740234375, -0.1965484619140625, -0.184356689453125, -0.1721649169921875, -0.15997314453125, -0.1477813720703125, -0.135589599609375, -0.1233978271484375, -0.1112060546875, -0.0990142822265625, -0.086822509765625, -0.0746307373046875, -0.06243896484375, -0.0502471923828125, -0.038055419921875, -0.0258636474609375, -0.013671875, -0.0014801025390625, 0.010711669921875, 0.0229034423828125, 0.03509521484375, 0.0472869873046875, 0.059478759765625, 0.0716705322265625, 0.0838623046875, 0.0960540771484375, 0.108245849609375, 0.1204376220703125, 0.13262939453125, 0.1448211669921875, 0.157012939453125, 0.1692047119140625, 0.181396484375, 0.1935882568359375, 0.205780029296875, 0.2179718017578125, 0.23016357421875, 0.2423553466796875, 0.254547119140625, 0.2667388916015625, 0.2789306640625, 0.2911224365234375, 0.303314208984375, 0.3155059814453125, 0.32769775390625, 0.3398895263671875, 0.352081298828125, 0.3642730712890625, 0.37646484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 7.0, 5.0, 9.0, 14.0, 19.0, 20.0, 19.0, 13.0, 26.0, 25.0, 39.0, 39.0, 30.0, 32.0, 40.0, 40.0, 48.0, 47.0, 57.0, 39.0, 39.0, 40.0, 42.0, 34.0, 33.0, 34.0, 25.0, 23.0, 18.0, 22.0, 18.0, 13.0, 15.0, 9.0, 7.0, 6.0, 7.0, 4.0, 9.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0205841064453125, -0.019893646240234375, -0.01920318603515625, -0.018512725830078125, -0.017822265625, -0.017131805419921875, -0.01644134521484375, -0.015750885009765625, -0.0150604248046875, -0.014369964599609375, -0.01367950439453125, -0.012989044189453125, -0.012298583984375, -0.011608123779296875, -0.01091766357421875, -0.010227203369140625, -0.0095367431640625, -0.008846282958984375, -0.00815582275390625, -0.007465362548828125, -0.00677490234375, -0.006084442138671875, -0.00539398193359375, -0.004703521728515625, -0.0040130615234375, -0.003322601318359375, -0.00263214111328125, -0.001941680908203125, -0.001251220703125, -0.000560760498046875, 0.00012969970703125, 0.000820159912109375, 0.0015106201171875, 0.002201080322265625, 0.00289154052734375, 0.003582000732421875, 0.0042724609375, 0.004962921142578125, 0.00565338134765625, 0.006343841552734375, 0.0070343017578125, 0.007724761962890625, 0.00841522216796875, 0.009105682373046875, 0.009796142578125, 0.010486602783203125, 0.01117706298828125, 0.011867523193359375, 0.0125579833984375, 0.013248443603515625, 0.01393890380859375, 0.014629364013671875, 0.01531982421875, 0.016010284423828125, 0.01670074462890625, 0.017391204833984375, 0.0180816650390625, 0.018772125244140625, 0.01946258544921875, 0.020153045654296875, 0.020843505859375, 0.021533966064453125, 0.02222442626953125, 0.022914886474609375, 0.0236053466796875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 19.0, 26.0, 34.0, 79.0, 98.0, 110.0, 145.0, 152.0, 103.0, 85.0, 56.0, 40.0, 21.0, 7.0, 9.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9421945214271545, -0.9026233553886414, -0.8630521297454834, -0.8234809637069702, -0.7839097380638123, -0.7443385720252991, -0.7047673463821411, -0.6651961803436279, -0.6256250143051147, -0.5860538482666016, -0.5464826226234436, -0.5069114565849304, -0.46734023094177246, -0.4277690649032593, -0.3881978690624237, -0.34862667322158813, -0.3090554475784302, -0.2694842517375946, -0.22991305589675903, -0.19034187495708466, -0.15077067911624908, -0.11119948327541351, -0.07162830233573914, -0.032057106494903564, 0.007514089345932007, 0.04708528146147728, 0.08665647357702255, 0.12622766196727753, 0.1657988578081131, 0.20537005364894867, 0.24494123458862305, 0.2845124304294586, 0.3240835666656494, 0.363654762506485, 0.40322595834732056, 0.44279712438583374, 0.4823683500289917, 0.5219395160675049, 0.5615106821060181, 0.601081907749176, 0.640653133392334, 0.6802242994308472, 0.7197955250740051, 0.7593666911125183, 0.7989379167556763, 0.8385090827941895, 0.8780802488327026, 0.9176514744758606, 0.9572226405143738, 0.996793806552887, 1.036365032196045, 1.075936198234558, 1.1155073642730713, 1.155078649520874, 1.1946498155593872, 1.2342209815979004, 1.2737921476364136, 1.3133633136749268, 1.35293447971344, 1.3925057649612427, 1.4320769309997559, 1.471648097038269, 1.5112192630767822, 1.550790548324585, 1.5903617143630981]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 5.0, 9.0, 19.0, 23.0, 17.0, 30.0, 22.0, 36.0, 28.0, 37.0, 44.0, 43.0, 45.0, 38.0, 58.0, 37.0, 50.0, 65.0, 50.0, 45.0, 39.0, 32.0, 41.0, 34.0, 21.0, 26.0, 18.0, 15.0, 10.0, 7.0, 7.0, 12.0, 6.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6159753203392029, -0.5949367880821228, -0.5738983154296875, -0.5528597831726074, -0.5318212509155273, -0.5107827186584473, -0.48974424600601196, -0.4687057137489319, -0.4476671814918518, -0.4266286790370941, -0.40559014678001404, -0.38455164432525635, -0.36351311206817627, -0.3424746096134186, -0.3214361071586609, -0.3003975749015808, -0.2793590724468231, -0.25832056999206543, -0.23728203773498535, -0.21624353528022766, -0.19520500302314758, -0.1741665005683899, -0.153127983212471, -0.13208946585655212, -0.11105094850063324, -0.09001243114471436, -0.06897391378879547, -0.047935403883457184, -0.0268968865275383, -0.005858369171619415, 0.015180140733718872, 0.036218658089637756, 0.05725717544555664, 0.07829569280147552, 0.09933421015739441, 0.1203727200627327, 0.14141124486923218, 0.16244974732398987, 0.18348826467990875, 0.20452678203582764, 0.22556529939174652, 0.2466038167476654, 0.2676423192024231, 0.2886808514595032, 0.30971935391426086, 0.33075788617134094, 0.35179638862609863, 0.3728349208831787, 0.3938734233379364, 0.4149119257926941, 0.43595045804977417, 0.45698896050453186, 0.47802749276161194, 0.49906599521636963, 0.5201045274734497, 0.5411430597305298, 0.5621815323829651, 0.5832200646400452, 0.6042585372924805, 0.6252970695495605, 0.6463356018066406, 0.6673741340637207, 0.688412606716156, 0.7094511389732361, 0.7304896712303162]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 5.0, 12.0, 17.0, 20.0, 12.0, 26.0, 55.0, 69.0, 78.0, 99.0, 164.0, 245.0, 401.0, 648.0, 1058.0, 1854.0, 3333.0, 6735.0, 14911.0, 40206.0, 148845.0, 541373.0, 203766.0, 49653.0, 18109.0, 7821.0, 3838.0, 2069.0, 1147.0, 632.0, 479.0, 239.0, 204.0, 122.0, 81.0, 55.0, 37.0, 26.0, 25.0, 17.0, 13.0, 11.0, 9.0, 5.0, 8.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5546875, -0.5371322631835938, -0.5195770263671875, -0.5020217895507812, -0.484466552734375, -0.46691131591796875, -0.4493560791015625, -0.43180084228515625, -0.41424560546875, -0.39669036865234375, -0.3791351318359375, -0.36157989501953125, -0.344024658203125, -0.32646942138671875, -0.3089141845703125, -0.29135894775390625, -0.2738037109375, -0.25624847412109375, -0.2386932373046875, -0.22113800048828125, -0.203582763671875, -0.18602752685546875, -0.1684722900390625, -0.15091705322265625, -0.13336181640625, -0.11580657958984375, -0.0982513427734375, -0.08069610595703125, -0.063140869140625, -0.04558563232421875, -0.0280303955078125, -0.01047515869140625, 0.007080078125, 0.02463531494140625, 0.0421905517578125, 0.05974578857421875, 0.077301025390625, 0.09485626220703125, 0.1124114990234375, 0.12996673583984375, 0.14752197265625, 0.16507720947265625, 0.1826324462890625, 0.20018768310546875, 0.217742919921875, 0.23529815673828125, 0.2528533935546875, 0.27040863037109375, 0.2879638671875, 0.30551910400390625, 0.3230743408203125, 0.34062957763671875, 0.358184814453125, 0.37574005126953125, 0.3932952880859375, 0.41085052490234375, 0.42840576171875, 0.44596099853515625, 0.4635162353515625, 0.48107147216796875, 0.498626708984375, 0.5161819458007812, 0.5337371826171875, 0.5512924194335938, 0.56884765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 8.0, 5.0, 6.0, 16.0, 12.0, 13.0, 13.0, 22.0, 8.0, 29.0, 25.0, 25.0, 32.0, 34.0, 36.0, 37.0, 35.0, 55.0, 38.0, 43.0, 54.0, 57.0, 47.0, 49.0, 40.0, 45.0, 34.0, 32.0, 32.0, 26.0, 23.0, 12.0, 13.0, 20.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8193359375, -1.762969970703125, -1.70660400390625, -1.650238037109375, -1.5938720703125, -1.537506103515625, -1.48114013671875, -1.424774169921875, -1.368408203125, -1.312042236328125, -1.25567626953125, -1.199310302734375, -1.1429443359375, -1.086578369140625, -1.03021240234375, -0.973846435546875, -0.91748046875, -0.861114501953125, -0.80474853515625, -0.748382568359375, -0.6920166015625, -0.635650634765625, -0.57928466796875, -0.522918701171875, -0.466552734375, -0.410186767578125, -0.35382080078125, -0.297454833984375, -0.2410888671875, -0.184722900390625, -0.12835693359375, -0.071990966796875, -0.015625, 0.040740966796875, 0.09710693359375, 0.153472900390625, 0.2098388671875, 0.266204833984375, 0.32257080078125, 0.378936767578125, 0.435302734375, 0.491668701171875, 0.54803466796875, 0.604400634765625, 0.6607666015625, 0.717132568359375, 0.77349853515625, 0.829864501953125, 0.88623046875, 0.942596435546875, 0.99896240234375, 1.055328369140625, 1.1116943359375, 1.168060302734375, 1.22442626953125, 1.280792236328125, 1.337158203125, 1.393524169921875, 1.44989013671875, 1.506256103515625, 1.5626220703125, 1.618988037109375, 1.67535400390625, 1.731719970703125, 1.7880859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 4.0, 7.0, 16.0, 17.0, 24.0, 25.0, 30.0, 48.0, 77.0, 67.0, 99.0, 223.0, 3021.0, 1043090.0, 1194.0, 177.0, 103.0, 77.0, 53.0, 51.0, 39.0, 21.0, 19.0, 16.0, 13.0, 9.0, 7.0, 5.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.228515625, -7.99609375, -7.763671875, -7.53125, -7.298828125, -7.06640625, -6.833984375, -6.6015625, -6.369140625, -6.13671875, -5.904296875, -5.671875, -5.439453125, -5.20703125, -4.974609375, -4.7421875, -4.509765625, -4.27734375, -4.044921875, -3.8125, -3.580078125, -3.34765625, -3.115234375, -2.8828125, -2.650390625, -2.41796875, -2.185546875, -1.953125, -1.720703125, -1.48828125, -1.255859375, -1.0234375, -0.791015625, -0.55859375, -0.326171875, -0.09375, 0.138671875, 0.37109375, 0.603515625, 0.8359375, 1.068359375, 1.30078125, 1.533203125, 1.765625, 1.998046875, 2.23046875, 2.462890625, 2.6953125, 2.927734375, 3.16015625, 3.392578125, 3.625, 3.857421875, 4.08984375, 4.322265625, 4.5546875, 4.787109375, 5.01953125, 5.251953125, 5.484375, 5.716796875, 5.94921875, 6.181640625, 6.4140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 10.0, 14.0, 18.0, 21.0, 25.0, 30.0, 35.0, 55.0, 46.0, 53.0, 67.0, 70.0, 58.0, 72.0, 74.0, 67.0, 54.0, 41.0, 42.0, 25.0, 30.0, 19.0, 16.0, 10.0, 10.0, 7.0, 7.0, 6.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.322265625, -3.23101806640625, -3.1397705078125, -3.04852294921875, -2.957275390625, -2.86602783203125, -2.7747802734375, -2.68353271484375, -2.59228515625, -2.50103759765625, -2.4097900390625, -2.31854248046875, -2.227294921875, -2.13604736328125, -2.0447998046875, -1.95355224609375, -1.8623046875, -1.77105712890625, -1.6798095703125, -1.58856201171875, -1.497314453125, -1.40606689453125, -1.3148193359375, -1.22357177734375, -1.13232421875, -1.04107666015625, -0.9498291015625, -0.85858154296875, -0.767333984375, -0.67608642578125, -0.5848388671875, -0.49359130859375, -0.40234375, -0.31109619140625, -0.2198486328125, -0.12860107421875, -0.037353515625, 0.05389404296875, 0.1451416015625, 0.23638916015625, 0.32763671875, 0.41888427734375, 0.5101318359375, 0.60137939453125, 0.692626953125, 0.78387451171875, 0.8751220703125, 0.96636962890625, 1.0576171875, 1.14886474609375, 1.2401123046875, 1.33135986328125, 1.422607421875, 1.51385498046875, 1.6051025390625, 1.69635009765625, 1.78759765625, 1.87884521484375, 1.9700927734375, 2.06134033203125, 2.152587890625, 2.24383544921875, 2.3350830078125, 2.42633056640625, 2.517578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 3.0, 9.0, 11.0, 18.0, 38.0, 93.0, 370.0, 4585.0, 1012531.0, 29838.0, 745.0, 150.0, 61.0, 35.0, 15.0, 17.0, 9.0, 3.0, 3.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4306640625, -1.380828857421875, -1.33099365234375, -1.281158447265625, -1.2313232421875, -1.181488037109375, -1.13165283203125, -1.081817626953125, -1.031982421875, -0.982147216796875, -0.93231201171875, -0.882476806640625, -0.8326416015625, -0.782806396484375, -0.73297119140625, -0.683135986328125, -0.63330078125, -0.583465576171875, -0.53363037109375, -0.483795166015625, -0.4339599609375, -0.384124755859375, -0.33428955078125, -0.284454345703125, -0.234619140625, -0.184783935546875, -0.13494873046875, -0.085113525390625, -0.0352783203125, 0.014556884765625, 0.06439208984375, 0.114227294921875, 0.1640625, 0.213897705078125, 0.26373291015625, 0.313568115234375, 0.3634033203125, 0.413238525390625, 0.46307373046875, 0.512908935546875, 0.562744140625, 0.612579345703125, 0.66241455078125, 0.712249755859375, 0.7620849609375, 0.811920166015625, 0.86175537109375, 0.911590576171875, 0.96142578125, 1.011260986328125, 1.06109619140625, 1.110931396484375, 1.1607666015625, 1.210601806640625, 1.26043701171875, 1.310272216796875, 1.360107421875, 1.409942626953125, 1.45977783203125, 1.509613037109375, 1.5594482421875, 1.609283447265625, 1.65911865234375, 1.708953857421875, 1.7587890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 1.0, 1.0, 2.0, 7.0, 4.0, 5.0, 11.0, 14.0, 17.0, 39.0, 50.0, 84.0, 166.0, 247.0, 137.0, 93.0, 36.0, 20.0, 25.0, 23.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.113550186157227e-05, -8.908286690711975e-05, -8.703023195266724e-05, -8.497759699821472e-05, -8.292496204376221e-05, -8.087232708930969e-05, -7.881969213485718e-05, -7.676705718040466e-05, -7.471442222595215e-05, -7.266178727149963e-05, -7.060915231704712e-05, -6.85565173625946e-05, -6.650388240814209e-05, -6.445124745368958e-05, -6.239861249923706e-05, -6.0345977544784546e-05, -5.829334259033203e-05, -5.6240707635879517e-05, -5.4188072681427e-05, -5.213543772697449e-05, -5.008280277252197e-05, -4.803016781806946e-05, -4.597753286361694e-05, -4.392489790916443e-05, -4.1872262954711914e-05, -3.98196280002594e-05, -3.7766993045806885e-05, -3.571435809135437e-05, -3.3661723136901855e-05, -3.160908818244934e-05, -2.9556453227996826e-05, -2.750381827354431e-05, -2.5451183319091797e-05, -2.3398548364639282e-05, -2.1345913410186768e-05, -1.9293278455734253e-05, -1.7240643501281738e-05, -1.5188008546829224e-05, -1.3135373592376709e-05, -1.1082738637924194e-05, -9.03010368347168e-06, -6.977468729019165e-06, -4.92483377456665e-06, -2.8721988201141357e-06, -8.195638656616211e-07, 1.2330710887908936e-06, 3.285706043243408e-06, 5.338340997695923e-06, 7.3909759521484375e-06, 9.443610906600952e-06, 1.1496245861053467e-05, 1.3548880815505981e-05, 1.5601515769958496e-05, 1.765415072441101e-05, 1.9706785678863525e-05, 2.175942063331604e-05, 2.3812055587768555e-05, 2.586469054222107e-05, 2.7917325496673584e-05, 2.99699604511261e-05, 3.202259540557861e-05, 3.407523036003113e-05, 3.612786531448364e-05, 3.818050026893616e-05, 4.023313522338867e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 11.0, 13.0, 18.0, 23.0, 38.0, 74.0, 205.0, 932.0, 18461.0, 1008751.0, 18538.0, 1070.0, 231.0, 69.0, 39.0, 22.0, 15.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.47265625, -1.4371719360351562, -1.4016876220703125, -1.3662033081054688, -1.330718994140625, -1.2952346801757812, -1.2597503662109375, -1.2242660522460938, -1.18878173828125, -1.1532974243164062, -1.1178131103515625, -1.0823287963867188, -1.046844482421875, -1.0113601684570312, -0.9758758544921875, -0.9403915405273438, -0.9049072265625, -0.8694229125976562, -0.8339385986328125, -0.7984542846679688, -0.762969970703125, -0.7274856567382812, -0.6920013427734375, -0.6565170288085938, -0.62103271484375, -0.5855484008789062, -0.5500640869140625, -0.5145797729492188, -0.479095458984375, -0.44361114501953125, -0.4081268310546875, -0.37264251708984375, -0.337158203125, -0.30167388916015625, -0.2661895751953125, -0.23070526123046875, -0.195220947265625, -0.15973663330078125, -0.1242523193359375, -0.08876800537109375, -0.05328369140625, -0.01779937744140625, 0.0176849365234375, 0.05316925048828125, 0.088653564453125, 0.12413787841796875, 0.1596221923828125, 0.19510650634765625, 0.2305908203125, 0.26607513427734375, 0.3015594482421875, 0.33704376220703125, 0.372528076171875, 0.40801239013671875, 0.4434967041015625, 0.47898101806640625, 0.51446533203125, 0.5499496459960938, 0.5854339599609375, 0.6209182739257812, 0.656402587890625, 0.6918869018554688, 0.7273712158203125, 0.7628555297851562, 0.79833984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 7.0, 7.0, 11.0, 17.0, 16.0, 48.0, 60.0, 83.0, 169.0, 224.0, 118.0, 75.0, 37.0, 30.0, 25.0, 13.0, 16.0, 10.0, 6.0, 5.0, 8.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1075439453125, -0.10291671752929688, -0.09828948974609375, -0.09366226196289062, -0.0890350341796875, -0.08440780639648438, -0.07978057861328125, -0.07515335083007812, -0.070526123046875, -0.06589889526367188, -0.06127166748046875, -0.056644439697265625, -0.0520172119140625, -0.047389984130859375, -0.04276275634765625, -0.038135528564453125, -0.03350830078125, -0.028881072998046875, -0.02425384521484375, -0.019626617431640625, -0.0149993896484375, -0.010372161865234375, -0.00574493408203125, -0.001117706298828125, 0.003509521484375, 0.008136749267578125, 0.01276397705078125, 0.017391204833984375, 0.0220184326171875, 0.026645660400390625, 0.03127288818359375, 0.035900115966796875, 0.04052734375, 0.045154571533203125, 0.04978179931640625, 0.054409027099609375, 0.0590362548828125, 0.06366348266601562, 0.06829071044921875, 0.07291793823242188, 0.077545166015625, 0.08217239379882812, 0.08679962158203125, 0.09142684936523438, 0.0960540771484375, 0.10068130493164062, 0.10530853271484375, 0.10993576049804688, 0.11456298828125, 0.11919021606445312, 0.12381744384765625, 0.12844467163085938, 0.1330718994140625, 0.13769912719726562, 0.14232635498046875, 0.14695358276367188, 0.151580810546875, 0.15620803833007812, 0.16083526611328125, 0.16546249389648438, 0.1700897216796875, 0.17471694946289062, 0.17934417724609375, 0.18397140502929688, 0.1885986328125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 63.0, 460.0, 441.0, 46.0, 3.0, 1.0], "bins": [-21.95492935180664, -21.588531494140625, -21.22213363647461, -20.855735778808594, -20.489337921142578, -20.122940063476562, -19.756542205810547, -19.39014434814453, -19.023746490478516, -18.6573486328125, -18.290950775146484, -17.92455291748047, -17.558155059814453, -17.191757202148438, -16.825359344482422, -16.458961486816406, -16.092565536499023, -15.726167678833008, -15.359769821166992, -14.993371963500977, -14.626974105834961, -14.260577201843262, -13.894179344177246, -13.52778148651123, -13.161383628845215, -12.7949857711792, -12.428587913513184, -12.062190055847168, -11.695793151855469, -11.329395294189453, -10.962997436523438, -10.596599578857422, -10.230201721191406, -9.86380386352539, -9.497406005859375, -9.13100814819336, -8.764610290527344, -8.398213386535645, -8.031815528869629, -7.665417671203613, -7.299019813537598, -6.932621955871582, -6.566224098205566, -6.199826717376709, -5.833428859710693, -5.467031002044678, -5.10063362121582, -4.734235763549805, -4.367837905883789, -4.001440048217773, -3.635042428970337, -3.2686448097229004, -2.9022469520568848, -2.535849094390869, -2.1694514751434326, -1.803053855895996, -1.4366559982299805, -1.0702582597732544, -0.7038605213165283, -0.33746278285980225, 0.028934955596923828, 0.3953326940536499, 0.761730432510376, 1.1281280517578125, 1.4945259094238281]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 8.0, 8.0, 12.0, 10.0, 12.0, 17.0, 21.0, 20.0, 26.0, 27.0, 20.0, 36.0, 42.0, 40.0, 35.0, 44.0, 49.0, 50.0, 42.0, 45.0, 46.0, 52.0, 35.0, 43.0, 34.0, 42.0, 37.0, 22.0, 25.0, 12.0, 21.0, 16.0, 9.0, 7.0, 5.0, 6.0, 8.0, 5.0, 6.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.004420280456543, -2.91115140914917, -2.817882776260376, -2.724614143371582, -2.631345272064209, -2.538076400756836, -2.444807767868042, -2.351539134979248, -2.258270263671875, -2.165001392364502, -2.071732759475708, -1.9784640073776245, -1.885195255279541, -1.7919265031814575, -1.698657751083374, -1.6053889989852905, -1.512120246887207, -1.4188514947891235, -1.32558274269104, -1.2323139905929565, -1.139045238494873, -1.0457764863967896, -0.952507734298706, -0.8592389822006226, -0.7659702301025391, -0.6727014780044556, -0.5794327259063721, -0.4861639738082886, -0.3928952217102051, -0.2996264696121216, -0.20635771751403809, -0.11308896541595459, -0.019820451736450195, 0.0734483003616333, 0.1667170524597168, 0.2599858045578003, 0.3532545566558838, 0.4465233087539673, 0.5397920608520508, 0.6330608129501343, 0.7263295650482178, 0.8195983171463013, 0.9128670692443848, 1.0061358213424683, 1.0994045734405518, 1.1926733255386353, 1.2859420776367188, 1.3792108297348022, 1.4724795818328857, 1.5657483339309692, 1.6590170860290527, 1.7522858381271362, 1.8455545902252197, 1.9388233423233032, 2.0320920944213867, 2.1253609657287598, 2.2186295986175537, 2.3118982315063477, 2.4051671028137207, 2.4984359741210938, 2.5917046070098877, 2.6849732398986816, 2.7782421112060547, 2.8715109825134277, 2.9647796154022217]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 6.0, 3.0, 4.0, 8.0, 6.0, 17.0, 13.0, 14.0, 14.0, 21.0, 25.0, 24.0, 26.0, 23.0, 33.0, 50.0, 106.0, 355.0, 1991.0, 23901.0, 2346223.0, 1798905.0, 20144.0, 1698.0, 294.0, 86.0, 57.0, 41.0, 34.0, 22.0, 22.0, 20.0, 23.0, 12.0, 15.0, 10.0, 10.0, 5.0, 8.0, 4.0, 0.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.680877685546875, -2.58831787109375, -2.495758056640625, -2.4031982421875, -2.310638427734375, -2.21807861328125, -2.125518798828125, -2.032958984375, -1.940399169921875, -1.84783935546875, -1.755279541015625, -1.6627197265625, -1.570159912109375, -1.47760009765625, -1.385040283203125, -1.29248046875, -1.199920654296875, -1.10736083984375, -1.014801025390625, -0.9222412109375, -0.829681396484375, -0.73712158203125, -0.644561767578125, -0.552001953125, -0.459442138671875, -0.36688232421875, -0.274322509765625, -0.1817626953125, -0.089202880859375, 0.00335693359375, 0.095916748046875, 0.1884765625, 0.281036376953125, 0.37359619140625, 0.466156005859375, 0.5587158203125, 0.651275634765625, 0.74383544921875, 0.836395263671875, 0.928955078125, 1.021514892578125, 1.11407470703125, 1.206634521484375, 1.2991943359375, 1.391754150390625, 1.48431396484375, 1.576873779296875, 1.66943359375, 1.761993408203125, 1.85455322265625, 1.947113037109375, 2.0396728515625, 2.132232666015625, 2.22479248046875, 2.317352294921875, 2.409912109375, 2.502471923828125, 2.59503173828125, 2.687591552734375, 2.7801513671875, 2.872711181640625, 2.96527099609375, 3.057830810546875, 3.150390625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 14.0, 8.0, 14.0, 13.0, 16.0, 24.0, 27.0, 28.0, 34.0, 40.0, 41.0, 37.0, 50.0, 51.0, 50.0, 45.0, 60.0, 51.0, 48.0, 43.0, 53.0, 35.0, 40.0, 33.0, 25.0, 24.0, 17.0, 16.0, 13.0, 8.0, 11.0, 8.0, 3.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74365234375, -0.7209320068359375, -0.698211669921875, -0.6754913330078125, -0.65277099609375, -0.6300506591796875, -0.607330322265625, -0.5846099853515625, -0.5618896484375, -0.5391693115234375, -0.516448974609375, -0.4937286376953125, -0.47100830078125, -0.4482879638671875, -0.425567626953125, -0.4028472900390625, -0.380126953125, -0.3574066162109375, -0.334686279296875, -0.3119659423828125, -0.28924560546875, -0.2665252685546875, -0.243804931640625, -0.2210845947265625, -0.1983642578125, -0.1756439208984375, -0.152923583984375, -0.1302032470703125, -0.10748291015625, -0.0847625732421875, -0.062042236328125, -0.0393218994140625, -0.0166015625, 0.0061187744140625, 0.028839111328125, 0.0515594482421875, 0.07427978515625, 0.0970001220703125, 0.119720458984375, 0.1424407958984375, 0.1651611328125, 0.1878814697265625, 0.210601806640625, 0.2333221435546875, 0.25604248046875, 0.2787628173828125, 0.301483154296875, 0.3242034912109375, 0.346923828125, 0.3696441650390625, 0.392364501953125, 0.4150848388671875, 0.43780517578125, 0.4605255126953125, 0.483245849609375, 0.5059661865234375, 0.5286865234375, 0.5514068603515625, 0.574127197265625, 0.5968475341796875, 0.61956787109375, 0.6422882080078125, 0.665008544921875, 0.6877288818359375, 0.71044921875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 8.0, 14.0, 14.0, 37.0, 52.0, 100.0, 189.0, 373.0, 1424.0, 1751784.0, 2437976.0, 1413.0, 413.0, 190.0, 112.0, 72.0, 29.0, 19.0, 14.0, 17.0, 3.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.5, -7.241455078125, -6.98291015625, -6.724365234375, -6.4658203125, -6.207275390625, -5.94873046875, -5.690185546875, -5.431640625, -5.173095703125, -4.91455078125, -4.656005859375, -4.3974609375, -4.138916015625, -3.88037109375, -3.621826171875, -3.36328125, -3.104736328125, -2.84619140625, -2.587646484375, -2.3291015625, -2.070556640625, -1.81201171875, -1.553466796875, -1.294921875, -1.036376953125, -0.77783203125, -0.519287109375, -0.2607421875, -0.002197265625, 0.25634765625, 0.514892578125, 0.7734375, 1.031982421875, 1.29052734375, 1.549072265625, 1.8076171875, 2.066162109375, 2.32470703125, 2.583251953125, 2.841796875, 3.100341796875, 3.35888671875, 3.617431640625, 3.8759765625, 4.134521484375, 4.39306640625, 4.651611328125, 4.91015625, 5.168701171875, 5.42724609375, 5.685791015625, 5.9443359375, 6.202880859375, 6.46142578125, 6.719970703125, 6.978515625, 7.237060546875, 7.49560546875, 7.754150390625, 8.0126953125, 8.271240234375, 8.52978515625, 8.788330078125, 9.046875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 9.0, 20.0, 15.0, 22.0, 42.0, 78.0, 116.0, 206.0, 419.0, 740.0, 979.0, 635.0, 338.0, 185.0, 100.0, 54.0, 42.0, 19.0, 15.0, 5.0, 8.0, 7.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5556640625, -0.5385055541992188, -0.5213470458984375, -0.5041885375976562, -0.487030029296875, -0.46987152099609375, -0.4527130126953125, -0.43555450439453125, -0.41839599609375, -0.40123748779296875, -0.3840789794921875, -0.36692047119140625, -0.349761962890625, -0.33260345458984375, -0.3154449462890625, -0.29828643798828125, -0.2811279296875, -0.26396942138671875, -0.2468109130859375, -0.22965240478515625, -0.212493896484375, -0.19533538818359375, -0.1781768798828125, -0.16101837158203125, -0.14385986328125, -0.12670135498046875, -0.1095428466796875, -0.09238433837890625, -0.075225830078125, -0.05806732177734375, -0.0409088134765625, -0.02375030517578125, -0.006591796875, 0.01056671142578125, 0.0277252197265625, 0.04488372802734375, 0.062042236328125, 0.07920074462890625, 0.0963592529296875, 0.11351776123046875, 0.13067626953125, 0.14783477783203125, 0.1649932861328125, 0.18215179443359375, 0.199310302734375, 0.21646881103515625, 0.2336273193359375, 0.25078582763671875, 0.2679443359375, 0.28510284423828125, 0.3022613525390625, 0.31941986083984375, 0.336578369140625, 0.35373687744140625, 0.3708953857421875, 0.38805389404296875, 0.40521240234375, 0.42237091064453125, 0.4395294189453125, 0.45668792724609375, 0.473846435546875, 0.49100494384765625, 0.5081634521484375, 0.5253219604492188, 0.54248046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 9.0, 22.0, 15.0, 10.0, 35.0, 35.0, 36.0, 49.0, 56.0, 77.0, 69.0, 67.0, 82.0, 70.0, 53.0, 54.0, 54.0, 32.0, 30.0, 27.0, 21.0, 17.0, 9.0, 10.0, 13.0, 6.0, 1.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9879431128501892, -0.9588159918785095, -0.9296888113021851, -0.9005616903305054, -0.8714345693588257, -0.842307448387146, -0.8131802678108215, -0.7840531468391418, -0.7549259662628174, -0.7257988452911377, -0.6966716647148132, -0.6675445437431335, -0.6384174227714539, -0.6092902421951294, -0.5801631212234497, -0.55103600025177, -0.5219088792800903, -0.49278172850608826, -0.46365460753440857, -0.4345274567604065, -0.4054003357887268, -0.37627318501472473, -0.34714603424072266, -0.31801891326904297, -0.2888917624950409, -0.2597646117210388, -0.23063749074935913, -0.20151033997535706, -0.17238320410251617, -0.1432560682296753, -0.11412891745567322, -0.08500178158283234, -0.05587470531463623, -0.02674756571650505, 0.002379573881626129, 0.03150671720504761, 0.06063385307788849, 0.08976098895072937, 0.11888813972473145, 0.14801527559757233, 0.1771424114704132, 0.2062695473432541, 0.23539668321609497, 0.26452383399009705, 0.2936509847640991, 0.3227781057357788, 0.3519052565097809, 0.38103240728378296, 0.41015952825546265, 0.4392866790294647, 0.4684138000011444, 0.4975409507751465, 0.5266680717468262, 0.5557951927185059, 0.5849223732948303, 0.61404949426651, 0.6431766748428345, 0.6723037958145142, 0.7014309763908386, 0.7305580973625183, 0.759685218334198, 0.7888123989105225, 0.8179395198822021, 0.8470666408538818, 0.8761937618255615]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 7.0, 14.0, 19.0, 20.0, 12.0, 24.0, 23.0, 16.0, 33.0, 29.0, 36.0, 45.0, 33.0, 30.0, 42.0, 41.0, 52.0, 46.0, 36.0, 36.0, 40.0, 37.0, 38.0, 34.0, 29.0, 25.0, 30.0, 21.0, 28.0, 20.0, 15.0, 18.0, 12.0, 13.0, 7.0, 3.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6997560262680054, -0.6777433753013611, -0.655730664730072, -0.6337180137634277, -0.6117053031921387, -0.5896926522254944, -0.5676800012588501, -0.545667290687561, -0.523654580116272, -0.5016419291496277, -0.4796292185783386, -0.45761656761169434, -0.4356038570404053, -0.413591206073761, -0.3915785253047943, -0.36956584453582764, -0.34755319356918335, -0.3255405128002167, -0.30352783203125, -0.2815151810646057, -0.25950247049331665, -0.23748980462551117, -0.2154771387577057, -0.193464457988739, -0.17145177721977234, -0.14943909645080566, -0.127426415681839, -0.10541374981403351, -0.08340106904506683, -0.06138838827610016, -0.03937572240829468, -0.017363041639328003, 0.0046495795249938965, 0.026662256568670273, 0.04867493361234665, 0.07068760693073273, 0.0927002876996994, 0.11471296846866608, 0.13672563433647156, 0.15873831510543823, 0.1807509958744049, 0.20276367664337158, 0.22477635741233826, 0.24678902328014374, 0.2688016891479492, 0.2908143997192383, 0.31282705068588257, 0.33483973145484924, 0.3568524122238159, 0.3788650929927826, 0.40087777376174927, 0.42289042472839355, 0.4449031352996826, 0.4669157862663269, 0.4889284670352936, 0.5109411478042603, 0.5329538583755493, 0.5549665093421936, 0.5769792199134827, 0.598991870880127, 0.621004581451416, 0.6430172324180603, 0.6650298833847046, 0.6870425939559937, 0.7090552449226379]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 8.0, 10.0, 15.0, 21.0, 35.0, 41.0, 76.0, 122.0, 205.0, 376.0, 804.0, 1462.0, 3225.0, 6902.0, 15143.0, 38639.0, 123677.0, 442241.0, 293221.0, 74988.0, 26281.0, 11143.0, 5072.0, 2332.0, 1169.0, 569.0, 300.0, 162.0, 102.0, 62.0, 45.0, 20.0, 22.0, 11.0, 6.0, 9.0, 8.0, 4.0, 5.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.477294921875, -0.4635810852050781, -0.44986724853515625, -0.4361534118652344, -0.4224395751953125, -0.4087257385253906, -0.39501190185546875, -0.3812980651855469, -0.367584228515625, -0.3538703918457031, -0.34015655517578125, -0.3264427185058594, -0.3127288818359375, -0.2990150451660156, -0.28530120849609375, -0.2715873718261719, -0.25787353515625, -0.24415969848632812, -0.23044586181640625, -0.21673202514648438, -0.2030181884765625, -0.18930435180664062, -0.17559051513671875, -0.16187667846679688, -0.148162841796875, -0.13444900512695312, -0.12073516845703125, -0.10702133178710938, -0.0933074951171875, -0.07959365844726562, -0.06587982177734375, -0.052165985107421875, -0.0384521484375, -0.024738311767578125, -0.01102447509765625, 0.002689361572265625, 0.0164031982421875, 0.030117034912109375, 0.04383087158203125, 0.057544708251953125, 0.071258544921875, 0.08497238159179688, 0.09868621826171875, 0.11240005493164062, 0.1261138916015625, 0.13982772827148438, 0.15354156494140625, 0.16725540161132812, 0.18096923828125, 0.19468307495117188, 0.20839691162109375, 0.22211074829101562, 0.2358245849609375, 0.24953842163085938, 0.26325225830078125, 0.2769660949707031, 0.290679931640625, 0.3043937683105469, 0.31810760498046875, 0.3318214416503906, 0.3455352783203125, 0.3592491149902344, 0.37296295166015625, 0.3866767883300781, 0.400390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 5.0, 12.0, 13.0, 21.0, 26.0, 26.0, 26.0, 30.0, 33.0, 38.0, 43.0, 40.0, 46.0, 50.0, 45.0, 41.0, 48.0, 49.0, 39.0, 48.0, 39.0, 48.0, 41.0, 26.0, 26.0, 20.0, 18.0, 19.0, 8.0, 19.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.435546875, -0.42089080810546875, -0.4062347412109375, -0.39157867431640625, -0.376922607421875, -0.36226654052734375, -0.3476104736328125, -0.33295440673828125, -0.31829833984375, -0.30364227294921875, -0.2889862060546875, -0.27433013916015625, -0.259674072265625, -0.24501800537109375, -0.2303619384765625, -0.21570587158203125, -0.2010498046875, -0.18639373779296875, -0.1717376708984375, -0.15708160400390625, -0.142425537109375, -0.12776947021484375, -0.1131134033203125, -0.09845733642578125, -0.08380126953125, -0.06914520263671875, -0.0544891357421875, -0.03983306884765625, -0.025177001953125, -0.01052093505859375, 0.0041351318359375, 0.01879119873046875, 0.033447265625, 0.04810333251953125, 0.0627593994140625, 0.07741546630859375, 0.092071533203125, 0.10672760009765625, 0.1213836669921875, 0.13603973388671875, 0.15069580078125, 0.16535186767578125, 0.1800079345703125, 0.19466400146484375, 0.209320068359375, 0.22397613525390625, 0.2386322021484375, 0.25328826904296875, 0.2679443359375, 0.28260040283203125, 0.2972564697265625, 0.31191253662109375, 0.326568603515625, 0.34122467041015625, 0.3558807373046875, 0.37053680419921875, 0.38519287109375, 0.39984893798828125, 0.4145050048828125, 0.42916107177734375, 0.443817138671875, 0.45847320556640625, 0.4731292724609375, 0.48778533935546875, 0.50244140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 8.0, 13.0, 14.0, 22.0, 24.0, 43.0, 66.0, 102.0, 120.0, 205.0, 309.0, 484.0, 849.0, 1423.0, 2479.0, 4573.0, 8801.0, 17623.0, 37446.0, 88961.0, 222174.0, 339829.0, 185494.0, 73340.0, 32065.0, 14990.0, 7583.0, 3996.0, 2187.0, 1281.0, 738.0, 472.0, 277.0, 182.0, 117.0, 87.0, 64.0, 27.0, 25.0, 20.0, 13.0, 10.0, 7.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.26318359375, -0.2557487487792969, -0.24831390380859375, -0.24087905883789062, -0.2334442138671875, -0.22600936889648438, -0.21857452392578125, -0.21113967895507812, -0.203704833984375, -0.19626998901367188, -0.18883514404296875, -0.18140029907226562, -0.1739654541015625, -0.16653060913085938, -0.15909576416015625, -0.15166091918945312, -0.14422607421875, -0.13679122924804688, -0.12935638427734375, -0.12192153930664062, -0.1144866943359375, -0.10705184936523438, -0.09961700439453125, -0.09218215942382812, -0.084747314453125, -0.07731246948242188, -0.06987762451171875, -0.062442779541015625, -0.0550079345703125, -0.047573089599609375, -0.04013824462890625, -0.032703399658203125, -0.0252685546875, -0.017833709716796875, -0.01039886474609375, -0.002964019775390625, 0.0044708251953125, 0.011905670166015625, 0.01934051513671875, 0.026775360107421875, 0.034210205078125, 0.041645050048828125, 0.04907989501953125, 0.056514739990234375, 0.0639495849609375, 0.07138442993164062, 0.07881927490234375, 0.08625411987304688, 0.09368896484375, 0.10112380981445312, 0.10855865478515625, 0.11599349975585938, 0.1234283447265625, 0.13086318969726562, 0.13829803466796875, 0.14573287963867188, 0.153167724609375, 0.16060256958007812, 0.16803741455078125, 0.17547225952148438, 0.1829071044921875, 0.19034194946289062, 0.19777679443359375, 0.20521163940429688, 0.212646484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 11.0, 13.0, 16.0, 19.0, 19.0, 20.0, 40.0, 46.0, 64.0, 60.0, 60.0, 64.0, 65.0, 63.0, 65.0, 57.0, 48.0, 59.0, 38.0, 36.0, 33.0, 25.0, 12.0, 15.0, 12.0, 10.0, 3.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84130859375, -0.8064498901367188, -0.7715911865234375, -0.7367324829101562, -0.701873779296875, -0.6670150756835938, -0.6321563720703125, -0.5972976684570312, -0.56243896484375, -0.5275802612304688, -0.4927215576171875, -0.45786285400390625, -0.423004150390625, -0.38814544677734375, -0.3532867431640625, -0.31842803955078125, -0.2835693359375, -0.24871063232421875, -0.2138519287109375, -0.17899322509765625, -0.144134521484375, -0.10927581787109375, -0.0744171142578125, -0.03955841064453125, -0.00469970703125, 0.03015899658203125, 0.0650177001953125, 0.09987640380859375, 0.134735107421875, 0.16959381103515625, 0.2044525146484375, 0.23931121826171875, 0.274169921875, 0.30902862548828125, 0.3438873291015625, 0.37874603271484375, 0.413604736328125, 0.44846343994140625, 0.4833221435546875, 0.5181808471679688, 0.55303955078125, 0.5878982543945312, 0.6227569580078125, 0.6576156616210938, 0.692474365234375, 0.7273330688476562, 0.7621917724609375, 0.7970504760742188, 0.8319091796875, 0.8667678833007812, 0.9016265869140625, 0.9364852905273438, 0.971343994140625, 1.0062026977539062, 1.0410614013671875, 1.0759201049804688, 1.11077880859375, 1.1456375122070312, 1.1804962158203125, 1.2153549194335938, 1.250213623046875, 1.2850723266601562, 1.3199310302734375, 1.3547897338867188, 1.3896484375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 11.0, 13.0, 13.0, 16.0, 35.0, 58.0, 70.0, 115.0, 174.0, 279.0, 489.0, 833.0, 1419.0, 2620.0, 4893.0, 10517.0, 24441.0, 67428.0, 220571.0, 416991.0, 194806.0, 60025.0, 22443.0, 9761.0, 4806.0, 2457.0, 1334.0, 735.0, 456.0, 283.0, 149.0, 95.0, 61.0, 61.0, 36.0, 25.0, 11.0, 10.0, 3.0, 5.0, 6.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.098876953125, -0.09600639343261719, -0.09313583374023438, -0.09026527404785156, -0.08739471435546875, -0.08452415466308594, -0.08165359497070312, -0.07878303527832031, -0.0759124755859375, -0.07304191589355469, -0.07017135620117188, -0.06730079650878906, -0.06443023681640625, -0.06155967712402344, -0.058689117431640625, -0.05581855773925781, -0.052947998046875, -0.05007743835449219, -0.047206878662109375, -0.04433631896972656, -0.04146575927734375, -0.03859519958496094, -0.035724639892578125, -0.03285408020019531, -0.0299835205078125, -0.027112960815429688, -0.024242401123046875, -0.021371841430664062, -0.01850128173828125, -0.015630722045898438, -0.012760162353515625, -0.009889602661132812, -0.00701904296875, -0.0041484832763671875, -0.001277923583984375, 0.0015926361083984375, 0.00446319580078125, 0.0073337554931640625, 0.010204315185546875, 0.013074874877929688, 0.0159454345703125, 0.018815994262695312, 0.021686553955078125, 0.024557113647460938, 0.02742767333984375, 0.030298233032226562, 0.033168792724609375, 0.03603935241699219, 0.038909912109375, 0.04178047180175781, 0.044651031494140625, 0.04752159118652344, 0.05039215087890625, 0.05326271057128906, 0.056133270263671875, 0.05900382995605469, 0.0618743896484375, 0.06474494934082031, 0.06761550903320312, 0.07048606872558594, 0.07335662841796875, 0.07622718811035156, 0.07909774780273438, 0.08196830749511719, 0.0848388671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 5.0, 6.0, 8.0, 14.0, 16.0, 27.0, 29.0, 59.0, 62.0, 75.0, 113.0, 147.0, 131.0, 91.0, 64.0, 25.0, 28.0, 18.0, 13.0, 14.0, 7.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.00010854005813598633, -0.00010555237531661987, -0.00010256469249725342, -9.957700967788696e-05, -9.658932685852051e-05, -9.360164403915405e-05, -9.06139612197876e-05, -8.762627840042114e-05, -8.463859558105469e-05, -8.165091276168823e-05, -7.866322994232178e-05, -7.567554712295532e-05, -7.268786430358887e-05, -6.970018148422241e-05, -6.671249866485596e-05, -6.37248158454895e-05, -6.073713302612305e-05, -5.774945020675659e-05, -5.476176738739014e-05, -5.177408456802368e-05, -4.8786401748657227e-05, -4.579871892929077e-05, -4.2811036109924316e-05, -3.982335329055786e-05, -3.6835670471191406e-05, -3.384798765182495e-05, -3.0860304832458496e-05, -2.787262201309204e-05, -2.4884939193725586e-05, -2.189725637435913e-05, -1.8909573554992676e-05, -1.592189073562622e-05, -1.2934207916259766e-05, -9.94652509689331e-06, -6.9588422775268555e-06, -3.9711594581604e-06, -9.834766387939453e-07, 2.0042061805725098e-06, 4.991888999938965e-06, 7.97957181930542e-06, 1.0967254638671875e-05, 1.395493745803833e-05, 1.6942620277404785e-05, 1.993030309677124e-05, 2.2917985916137695e-05, 2.590566873550415e-05, 2.8893351554870605e-05, 3.188103437423706e-05, 3.4868717193603516e-05, 3.785640001296997e-05, 4.0844082832336426e-05, 4.383176565170288e-05, 4.6819448471069336e-05, 4.980713129043579e-05, 5.2794814109802246e-05, 5.57824969291687e-05, 5.8770179748535156e-05, 6.175786256790161e-05, 6.474554538726807e-05, 6.773322820663452e-05, 7.072091102600098e-05, 7.370859384536743e-05, 7.669627666473389e-05, 7.968395948410034e-05, 8.26716423034668e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 19.0, 11.0, 21.0, 41.0, 39.0, 81.0, 120.0, 273.0, 483.0, 1058.0, 2800.0, 9518.0, 51849.0, 448429.0, 464127.0, 54783.0, 9855.0, 2825.0, 1072.0, 511.0, 251.0, 131.0, 67.0, 44.0, 36.0, 27.0, 17.0, 13.0, 8.0, 6.0, 3.0, 7.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.164794921875, -0.15964698791503906, -0.15449905395507812, -0.1493511199951172, -0.14420318603515625, -0.1390552520751953, -0.13390731811523438, -0.12875938415527344, -0.1236114501953125, -0.11846351623535156, -0.11331558227539062, -0.10816764831542969, -0.10301971435546875, -0.09787178039550781, -0.09272384643554688, -0.08757591247558594, -0.082427978515625, -0.07728004455566406, -0.07213211059570312, -0.06698417663574219, -0.06183624267578125, -0.05668830871582031, -0.051540374755859375, -0.04639244079589844, -0.0412445068359375, -0.03609657287597656, -0.030948638916015625, -0.025800704956054688, -0.02065277099609375, -0.015504837036132812, -0.010356903076171875, -0.0052089691162109375, -6.103515625e-05, 0.0050868988037109375, 0.010234832763671875, 0.015382766723632812, 0.02053070068359375, 0.025678634643554688, 0.030826568603515625, 0.03597450256347656, 0.0411224365234375, 0.04627037048339844, 0.051418304443359375, 0.05656623840332031, 0.06171417236328125, 0.06686210632324219, 0.07201004028320312, 0.07715797424316406, 0.082305908203125, 0.08745384216308594, 0.09260177612304688, 0.09774971008300781, 0.10289764404296875, 0.10804557800292969, 0.11319351196289062, 0.11834144592285156, 0.1234893798828125, 0.12863731384277344, 0.13378524780273438, 0.1389331817626953, 0.14408111572265625, 0.1492290496826172, 0.15437698364257812, 0.15952491760253906, 0.1646728515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 6.0, 7.0, 8.0, 14.0, 19.0, 11.0, 31.0, 24.0, 49.0, 60.0, 66.0, 67.0, 82.0, 69.0, 83.0, 68.0, 76.0, 54.0, 45.0, 34.0, 25.0, 23.0, 19.0, 13.0, 7.0, 9.0, 5.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.02825927734375, -0.02743816375732422, -0.026617050170898438, -0.025795936584472656, -0.024974822998046875, -0.024153709411621094, -0.023332595825195312, -0.02251148223876953, -0.02169036865234375, -0.02086925506591797, -0.020048141479492188, -0.019227027893066406, -0.018405914306640625, -0.017584800720214844, -0.016763687133789062, -0.01594257354736328, -0.0151214599609375, -0.014300346374511719, -0.013479232788085938, -0.012658119201660156, -0.011837005615234375, -0.011015892028808594, -0.010194778442382812, -0.009373664855957031, -0.00855255126953125, -0.007731437683105469, -0.0069103240966796875, -0.006089210510253906, -0.005268096923828125, -0.004446983337402344, -0.0036258697509765625, -0.0028047561645507812, -0.001983642578125, -0.0011625289916992188, -0.0003414154052734375, 0.00047969818115234375, 0.001300811767578125, 0.0021219253540039062, 0.0029430389404296875, 0.0037641525268554688, 0.00458526611328125, 0.005406379699707031, 0.0062274932861328125, 0.007048606872558594, 0.007869720458984375, 0.008690834045410156, 0.009511947631835938, 0.010333061218261719, 0.0111541748046875, 0.011975288391113281, 0.012796401977539062, 0.013617515563964844, 0.014438629150390625, 0.015259742736816406, 0.016080856323242188, 0.01690196990966797, 0.01772308349609375, 0.01854419708251953, 0.019365310668945312, 0.020186424255371094, 0.021007537841796875, 0.021828651428222656, 0.022649765014648438, 0.02347087860107422, 0.0242919921875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 14.0, 16.0, 34.0, 65.0, 126.0, 144.0, 196.0, 155.0, 104.0, 67.0, 29.0, 25.0, 6.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5643506050109863, -1.5246598720550537, -1.484969139099121, -1.4452784061431885, -1.4055876731872559, -1.3658969402313232, -1.3262062072753906, -1.286515474319458, -1.2468247413635254, -1.2071340084075928, -1.1674432754516602, -1.1277525424957275, -1.088061809539795, -1.0483710765838623, -1.0086803436279297, -0.9689896106719971, -0.9292988777160645, -0.8896081447601318, -0.8499174118041992, -0.8102266788482666, -0.770535945892334, -0.7308452129364014, -0.6911544799804688, -0.6514637470245361, -0.6117730140686035, -0.5720822811126709, -0.5323915481567383, -0.49270081520080566, -0.45301008224487305, -0.41331934928894043, -0.3736286163330078, -0.3339378833770752, -0.2942470908164978, -0.2545563578605652, -0.21486562490463257, -0.17517489194869995, -0.13548415899276733, -0.09579342603683472, -0.0561026930809021, -0.016411960124969482, 0.023278772830963135, 0.06296950578689575, 0.10266023874282837, 0.142350971698761, 0.1820417046546936, 0.22173243761062622, 0.26142317056655884, 0.30111390352249146, 0.3408046364784241, 0.3804953694343567, 0.4201861023902893, 0.4598768353462219, 0.49956756830215454, 0.5392583012580872, 0.5789490342140198, 0.6186397671699524, 0.658330500125885, 0.6980212330818176, 0.7377119660377502, 0.7774026989936829, 0.8170934319496155, 0.8567841649055481, 0.8964748978614807, 0.9361656308174133, 0.975856363773346]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 6.0, 5.0, 9.0, 12.0, 5.0, 21.0, 17.0, 22.0, 20.0, 21.0, 30.0, 25.0, 32.0, 34.0, 32.0, 41.0, 44.0, 34.0, 48.0, 46.0, 37.0, 41.0, 41.0, 34.0, 42.0, 36.0, 40.0, 24.0, 22.0, 25.0, 29.0, 23.0, 12.0, 16.0, 11.0, 13.0, 10.0, 11.0, 5.0, 2.0, 7.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.39865368604660034, -0.38615572452545166, -0.3736577332019806, -0.3611597716808319, -0.34866178035736084, -0.33616381883621216, -0.3236658573150635, -0.3111678659915924, -0.2986699044704437, -0.28617194294929504, -0.273673951625824, -0.2611759901046753, -0.24867801368236542, -0.23618003726005554, -0.22368206083774567, -0.2111840844154358, -0.19868610799312592, -0.18618813157081604, -0.17369015514850616, -0.1611921787261963, -0.1486942172050476, -0.13619624078273773, -0.12369826436042786, -0.11120029538869858, -0.0987023189663887, -0.08620434254407883, -0.07370637357234955, -0.06120839715003967, -0.048710424453020096, -0.03621245175600052, -0.023714475333690643, -0.011216506361961365, 0.0012814700603485107, 0.013779443688690662, 0.026277417317032814, 0.03877539187669754, 0.05127336457371712, 0.0637713372707367, 0.07626931369304657, 0.08876728266477585, 0.10126525908708572, 0.1137632355093956, 0.12626120448112488, 0.13875918090343475, 0.15125715732574463, 0.1637551188468933, 0.17625311017036438, 0.18875107169151306, 0.20124904811382294, 0.2137470245361328, 0.2262450009584427, 0.23874297738075256, 0.25124093890190125, 0.2637389302253723, 0.276236891746521, 0.2887348532676697, 0.30123284459114075, 0.31373080611228943, 0.3262287974357605, 0.3387267589569092, 0.35122475028038025, 0.36372271180152893, 0.376220703125, 0.3887186646461487, 0.40121662616729736]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 9.0, 12.0, 15.0, 18.0, 25.0, 49.0, 77.0, 106.0, 162.0, 212.0, 371.0, 621.0, 1061.0, 1719.0, 2998.0, 5419.0, 10299.0, 19949.0, 41034.0, 95475.0, 307930.0, 367556.0, 103787.0, 44041.0, 21144.0, 10878.0, 5699.0, 3178.0, 1831.0, 1088.0, 623.0, 411.0, 260.0, 147.0, 117.0, 72.0, 58.0, 19.0, 22.0, 11.0, 10.0, 10.0, 12.0, 3.0, 4.0, 2.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.471435546875, -0.4571685791015625, -0.442901611328125, -0.4286346435546875, -0.41436767578125, -0.4001007080078125, -0.385833740234375, -0.3715667724609375, -0.3572998046875, -0.3430328369140625, -0.328765869140625, -0.3144989013671875, -0.30023193359375, -0.2859649658203125, -0.271697998046875, -0.2574310302734375, -0.2431640625, -0.2288970947265625, -0.214630126953125, -0.2003631591796875, -0.18609619140625, -0.1718292236328125, -0.157562255859375, -0.1432952880859375, -0.1290283203125, -0.1147613525390625, -0.100494384765625, -0.0862274169921875, -0.07196044921875, -0.0576934814453125, -0.043426513671875, -0.0291595458984375, -0.014892578125, -0.0006256103515625, 0.013641357421875, 0.0279083251953125, 0.04217529296875, 0.0564422607421875, 0.070709228515625, 0.0849761962890625, 0.0992431640625, 0.1135101318359375, 0.127777099609375, 0.1420440673828125, 0.15631103515625, 0.1705780029296875, 0.184844970703125, 0.1991119384765625, 0.21337890625, 0.2276458740234375, 0.241912841796875, 0.2561798095703125, 0.27044677734375, 0.2847137451171875, 0.298980712890625, 0.3132476806640625, 0.3275146484375, 0.3417816162109375, 0.356048583984375, 0.3703155517578125, 0.38458251953125, 0.3988494873046875, 0.413116455078125, 0.4273834228515625, 0.441650390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 7.0, 7.0, 12.0, 11.0, 12.0, 19.0, 17.0, 20.0, 29.0, 28.0, 33.0, 30.0, 48.0, 43.0, 37.0, 38.0, 49.0, 50.0, 52.0, 42.0, 52.0, 40.0, 51.0, 36.0, 32.0, 27.0, 33.0, 18.0, 26.0, 21.0, 18.0, 8.0, 9.0, 11.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.998046875, -0.967803955078125, -0.93756103515625, -0.907318115234375, -0.8770751953125, -0.846832275390625, -0.81658935546875, -0.786346435546875, -0.756103515625, -0.725860595703125, -0.69561767578125, -0.665374755859375, -0.6351318359375, -0.604888916015625, -0.57464599609375, -0.544403076171875, -0.51416015625, -0.483917236328125, -0.45367431640625, -0.423431396484375, -0.3931884765625, -0.362945556640625, -0.33270263671875, -0.302459716796875, -0.272216796875, -0.241973876953125, -0.21173095703125, -0.181488037109375, -0.1512451171875, -0.121002197265625, -0.09075927734375, -0.060516357421875, -0.0302734375, -3.0517578125e-05, 0.03021240234375, 0.060455322265625, 0.0906982421875, 0.120941162109375, 0.15118408203125, 0.181427001953125, 0.211669921875, 0.241912841796875, 0.27215576171875, 0.302398681640625, 0.3326416015625, 0.362884521484375, 0.39312744140625, 0.423370361328125, 0.45361328125, 0.483856201171875, 0.51409912109375, 0.544342041015625, 0.5745849609375, 0.604827880859375, 0.63507080078125, 0.665313720703125, 0.695556640625, 0.725799560546875, 0.75604248046875, 0.786285400390625, 0.8165283203125, 0.846771240234375, 0.87701416015625, 0.907257080078125, 0.9375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 4.0, 7.0, 10.0, 12.0, 17.0, 29.0, 23.0, 23.0, 22.0, 28.0, 36.0, 62.0, 95.0, 149.0, 571.0, 20638.0, 1021067.0, 4841.0, 409.0, 134.0, 65.0, 51.0, 48.0, 34.0, 29.0, 30.0, 14.0, 25.0, 17.0, 10.0, 16.0, 12.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.66015625, -4.528411865234375, -4.39666748046875, -4.264923095703125, -4.1331787109375, -4.001434326171875, -3.86968994140625, -3.737945556640625, -3.606201171875, -3.474456787109375, -3.34271240234375, -3.210968017578125, -3.0792236328125, -2.947479248046875, -2.81573486328125, -2.683990478515625, -2.55224609375, -2.420501708984375, -2.28875732421875, -2.157012939453125, -2.0252685546875, -1.893524169921875, -1.76177978515625, -1.630035400390625, -1.498291015625, -1.366546630859375, -1.23480224609375, -1.103057861328125, -0.9713134765625, -0.839569091796875, -0.70782470703125, -0.576080322265625, -0.4443359375, -0.312591552734375, -0.18084716796875, -0.049102783203125, 0.0826416015625, 0.214385986328125, 0.34613037109375, 0.477874755859375, 0.609619140625, 0.741363525390625, 0.87310791015625, 1.004852294921875, 1.1365966796875, 1.268341064453125, 1.40008544921875, 1.531829833984375, 1.66357421875, 1.795318603515625, 1.92706298828125, 2.058807373046875, 2.1905517578125, 2.322296142578125, 2.45404052734375, 2.585784912109375, 2.717529296875, 2.849273681640625, 2.98101806640625, 3.112762451171875, 3.2445068359375, 3.376251220703125, 3.50799560546875, 3.639739990234375, 3.771484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 7.0, 5.0, 10.0, 5.0, 9.0, 15.0, 19.0, 17.0, 19.0, 32.0, 29.0, 25.0, 30.0, 31.0, 55.0, 47.0, 48.0, 37.0, 47.0, 52.0, 47.0, 46.0, 40.0, 39.0, 37.0, 32.0, 32.0, 16.0, 38.0, 16.0, 21.0, 19.0, 16.0, 16.0, 10.0, 13.0, 6.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.072265625, -1.0425643920898438, -1.0128631591796875, -0.9831619262695312, -0.953460693359375, -0.9237594604492188, -0.8940582275390625, -0.8643569946289062, -0.83465576171875, -0.8049545288085938, -0.7752532958984375, -0.7455520629882812, -0.715850830078125, -0.6861495971679688, -0.6564483642578125, -0.6267471313476562, -0.5970458984375, -0.5673446655273438, -0.5376434326171875, -0.5079421997070312, -0.478240966796875, -0.44853973388671875, -0.4188385009765625, -0.38913726806640625, -0.35943603515625, -0.32973480224609375, -0.3000335693359375, -0.27033233642578125, -0.240631103515625, -0.21092987060546875, -0.1812286376953125, -0.15152740478515625, -0.121826171875, -0.09212493896484375, -0.0624237060546875, -0.03272247314453125, -0.003021240234375, 0.02667999267578125, 0.0563812255859375, 0.08608245849609375, 0.11578369140625, 0.14548492431640625, 0.1751861572265625, 0.20488739013671875, 0.234588623046875, 0.26428985595703125, 0.2939910888671875, 0.32369232177734375, 0.3533935546875, 0.38309478759765625, 0.4127960205078125, 0.44249725341796875, 0.472198486328125, 0.5018997192382812, 0.5316009521484375, 0.5613021850585938, 0.59100341796875, 0.6207046508789062, 0.6504058837890625, 0.6801071166992188, 0.709808349609375, 0.7395095825195312, 0.7692108154296875, 0.7989120483398438, 0.82861328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 5.0, 10.0, 27.0, 36.0, 45.0, 94.0, 157.0, 322.0, 782.0, 2374.0, 10781.0, 97184.0, 872326.0, 53836.0, 7479.0, 1837.0, 634.0, 280.0, 152.0, 71.0, 45.0, 30.0, 13.0, 7.0, 10.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6005859375, -0.5831222534179688, -0.5656585693359375, -0.5481948852539062, -0.530731201171875, -0.5132675170898438, -0.4958038330078125, -0.47834014892578125, -0.46087646484375, -0.44341278076171875, -0.4259490966796875, -0.40848541259765625, -0.391021728515625, -0.37355804443359375, -0.3560943603515625, -0.33863067626953125, -0.3211669921875, -0.30370330810546875, -0.2862396240234375, -0.26877593994140625, -0.251312255859375, -0.23384857177734375, -0.2163848876953125, -0.19892120361328125, -0.18145751953125, -0.16399383544921875, -0.1465301513671875, -0.12906646728515625, -0.111602783203125, -0.09413909912109375, -0.0766754150390625, -0.05921173095703125, -0.041748046875, -0.02428436279296875, -0.0068206787109375, 0.01064300537109375, 0.028106689453125, 0.04557037353515625, 0.0630340576171875, 0.08049774169921875, 0.09796142578125, 0.11542510986328125, 0.1328887939453125, 0.15035247802734375, 0.167816162109375, 0.18527984619140625, 0.2027435302734375, 0.22020721435546875, 0.2376708984375, 0.25513458251953125, 0.2725982666015625, 0.29006195068359375, 0.307525634765625, 0.32498931884765625, 0.3424530029296875, 0.35991668701171875, 0.37738037109375, 0.39484405517578125, 0.4123077392578125, 0.42977142333984375, 0.447235107421875, 0.46469879150390625, 0.4821624755859375, 0.49962615966796875, 0.51708984375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 2.0, 8.0, 2.0, 9.0, 8.0, 11.0, 18.0, 25.0, 34.0, 49.0, 37.0, 82.0, 110.0, 201.0, 118.0, 81.0, 53.0, 32.0, 26.0, 18.0, 9.0, 10.0, 12.0, 9.0, 7.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.571676254272461e-05, -4.416331648826599e-05, -4.260987043380737e-05, -4.1056424379348755e-05, -3.950297832489014e-05, -3.794953227043152e-05, -3.63960862159729e-05, -3.484264016151428e-05, -3.3289194107055664e-05, -3.1735748052597046e-05, -3.0182301998138428e-05, -2.862885594367981e-05, -2.707540988922119e-05, -2.5521963834762573e-05, -2.3968517780303955e-05, -2.2415071725845337e-05, -2.086162567138672e-05, -1.93081796169281e-05, -1.7754733562469482e-05, -1.6201287508010864e-05, -1.4647841453552246e-05, -1.3094395399093628e-05, -1.154094934463501e-05, -9.987503290176392e-06, -8.434057235717773e-06, -6.880611181259155e-06, -5.327165126800537e-06, -3.773719072341919e-06, -2.2202730178833008e-06, -6.668269634246826e-07, 8.866190910339355e-07, 2.4400651454925537e-06, 3.993511199951172e-06, 5.54695725440979e-06, 7.100403308868408e-06, 8.653849363327026e-06, 1.0207295417785645e-05, 1.1760741472244263e-05, 1.3314187526702881e-05, 1.4867633581161499e-05, 1.6421079635620117e-05, 1.7974525690078735e-05, 1.9527971744537354e-05, 2.108141779899597e-05, 2.263486385345459e-05, 2.4188309907913208e-05, 2.5741755962371826e-05, 2.7295202016830444e-05, 2.8848648071289062e-05, 3.040209412574768e-05, 3.19555401802063e-05, 3.350898623466492e-05, 3.5062432289123535e-05, 3.661587834358215e-05, 3.816932439804077e-05, 3.972277045249939e-05, 4.127621650695801e-05, 4.2829662561416626e-05, 4.4383108615875244e-05, 4.593655467033386e-05, 4.749000072479248e-05, 4.90434467792511e-05, 5.059689283370972e-05, 5.2150338888168335e-05, 5.370378494262695e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 4.0, 12.0, 11.0, 20.0, 21.0, 42.0, 63.0, 94.0, 177.0, 339.0, 702.0, 1778.0, 5772.0, 23101.0, 160505.0, 761148.0, 74663.0, 13884.0, 3758.0, 1243.0, 546.0, 294.0, 134.0, 81.0, 47.0, 37.0, 24.0, 23.0, 13.0, 6.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.333740234375, -0.32196044921875, -0.3101806640625, -0.29840087890625, -0.28662109375, -0.27484130859375, -0.2630615234375, -0.25128173828125, -0.239501953125, -0.22772216796875, -0.2159423828125, -0.20416259765625, -0.1923828125, -0.18060302734375, -0.1688232421875, -0.15704345703125, -0.145263671875, -0.13348388671875, -0.1217041015625, -0.10992431640625, -0.09814453125, -0.08636474609375, -0.0745849609375, -0.06280517578125, -0.051025390625, -0.03924560546875, -0.0274658203125, -0.01568603515625, -0.00390625, 0.00787353515625, 0.0196533203125, 0.03143310546875, 0.043212890625, 0.05499267578125, 0.0667724609375, 0.07855224609375, 0.09033203125, 0.10211181640625, 0.1138916015625, 0.12567138671875, 0.137451171875, 0.14923095703125, 0.1610107421875, 0.17279052734375, 0.1845703125, 0.19635009765625, 0.2081298828125, 0.21990966796875, 0.231689453125, 0.24346923828125, 0.2552490234375, 0.26702880859375, 0.27880859375, 0.29058837890625, 0.3023681640625, 0.31414794921875, 0.325927734375, 0.33770751953125, 0.3494873046875, 0.36126708984375, 0.373046875, 0.38482666015625, 0.3966064453125, 0.40838623046875, 0.420166015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 8.0, 7.0, 12.0, 15.0, 23.0, 23.0, 26.0, 38.0, 66.0, 66.0, 124.0, 172.0, 117.0, 66.0, 62.0, 36.0, 28.0, 18.0, 12.0, 10.0, 10.0, 14.0, 5.0, 8.0, 7.0, 2.0, 0.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1099853515625, -0.10611724853515625, -0.1022491455078125, -0.09838104248046875, -0.094512939453125, -0.09064483642578125, -0.0867767333984375, -0.08290863037109375, -0.07904052734375, -0.07517242431640625, -0.0713043212890625, -0.06743621826171875, -0.063568115234375, -0.05970001220703125, -0.0558319091796875, -0.05196380615234375, -0.048095703125, -0.04422760009765625, -0.0403594970703125, -0.03649139404296875, -0.032623291015625, -0.02875518798828125, -0.0248870849609375, -0.02101898193359375, -0.01715087890625, -0.01328277587890625, -0.0094146728515625, -0.00554656982421875, -0.001678466796875, 0.00218963623046875, 0.0060577392578125, 0.00992584228515625, 0.0137939453125, 0.01766204833984375, 0.0215301513671875, 0.02539825439453125, 0.029266357421875, 0.03313446044921875, 0.0370025634765625, 0.04087066650390625, 0.04473876953125, 0.04860687255859375, 0.0524749755859375, 0.05634307861328125, 0.060211181640625, 0.06407928466796875, 0.0679473876953125, 0.07181549072265625, 0.07568359375, 0.07955169677734375, 0.0834197998046875, 0.08728790283203125, 0.091156005859375, 0.09502410888671875, 0.0988922119140625, 0.10276031494140625, 0.10662841796875, 0.11049652099609375, 0.1143646240234375, 0.11823272705078125, 0.122100830078125, 0.12596893310546875, 0.1298370361328125, 0.13370513916015625, 0.1375732421875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 29.0, 52.0, 150.0, 237.0, 264.0, 172.0, 69.0, 24.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.7317328453063965, -6.605012893676758, -6.478292465209961, -6.351572036743164, -6.224852085113525, -6.098132133483887, -5.97141170501709, -5.844691276550293, -5.717971324920654, -5.591251373291016, -5.464530944824219, -5.337810516357422, -5.211090564727783, -5.0843706130981445, -4.957650184631348, -4.830929756164551, -4.704209804534912, -4.577489852905273, -4.450769424438477, -4.32404899597168, -4.197329044342041, -4.070609092712402, -3.9438886642456055, -3.8171684741973877, -3.69044828414917, -3.563728094100952, -3.4370079040527344, -3.3102877140045166, -3.183567523956299, -3.056847333908081, -2.9301271438598633, -2.8034069538116455, -2.676687240600586, -2.549967050552368, -2.4232468605041504, -2.2965266704559326, -2.169806480407715, -2.043086290359497, -1.9163661003112793, -1.7896459102630615, -1.6629256010055542, -1.5362054109573364, -1.4094852209091187, -1.2827650308609009, -1.156044840812683, -1.0293246507644653, -0.9026044607162476, -0.7758842706680298, -0.649164080619812, -0.5224438905715942, -0.39572370052337646, -0.2690035104751587, -0.14228332042694092, -0.015563130378723145, 0.11115705966949463, 0.2378772497177124, 0.3645974397659302, 0.49131762981414795, 0.6180378198623657, 0.7447580099105835, 0.8714781999588013, 0.998198390007019, 1.1249185800552368, 1.2516387701034546, 1.3783589601516724]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 5.0, 8.0, 10.0, 11.0, 26.0, 19.0, 20.0, 19.0, 23.0, 33.0, 41.0, 37.0, 56.0, 44.0, 56.0, 46.0, 60.0, 63.0, 57.0, 53.0, 52.0, 42.0, 29.0, 37.0, 36.0, 23.0, 23.0, 24.0, 14.0, 9.0, 3.0, 12.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7252743244171143, -1.6719555854797363, -1.618636965751648, -1.56531822681427, -1.5119996070861816, -1.4586808681488037, -1.4053621292114258, -1.3520435094833374, -1.298724889755249, -1.245406150817871, -1.1920875310897827, -1.1387687921524048, -1.0854501724243164, -1.0321314334869385, -0.9788127541542053, -0.9254940748214722, -0.8721753358840942, -0.8188566565513611, -0.7655379772186279, -0.71221923828125, -0.6589006185531616, -0.6055818796157837, -0.5522632002830505, -0.4989445209503174, -0.44562584161758423, -0.3923071622848511, -0.3389884829521179, -0.2856697738170624, -0.23235109448432922, -0.17903241515159607, -0.12571370601654053, -0.07239502668380737, -0.01907634735107422, 0.03424233943223953, 0.08756102621555328, 0.14087972044944763, 0.1941983997821808, 0.24751707911491394, 0.3008357882499695, 0.35415446758270264, 0.4074731469154358, 0.46079182624816895, 0.5141105055809021, 0.5674291849136353, 0.6207479238510132, 0.6740665435791016, 0.7273852825164795, 0.7807039618492126, 0.8340226411819458, 0.887341320514679, 0.9406599998474121, 0.99397873878479, 1.0472973585128784, 1.1006160974502563, 1.1539347171783447, 1.2072534561157227, 1.2605721950531006, 1.3138909339904785, 1.367209553718567, 1.4205282926559448, 1.4738469123840332, 1.5271656513214111, 1.580484390258789, 1.6338030099868774, 1.6871216297149658]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 11.0, 17.0, 16.0, 26.0, 48.0, 83.0, 119.0, 200.0, 334.0, 601.0, 1136.0, 2304.0, 5282.0, 14796.0, 54261.0, 297547.0, 1568596.0, 1781274.0, 376908.0, 63946.0, 16164.0, 5655.0, 2355.0, 1118.0, 594.0, 280.0, 206.0, 134.0, 84.0, 57.0, 37.0, 31.0, 20.0, 9.0, 4.0, 9.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.845703125, -0.8193206787109375, -0.792938232421875, -0.7665557861328125, -0.74017333984375, -0.7137908935546875, -0.687408447265625, -0.6610260009765625, -0.6346435546875, -0.6082611083984375, -0.581878662109375, -0.5554962158203125, -0.52911376953125, -0.5027313232421875, -0.476348876953125, -0.4499664306640625, -0.423583984375, -0.3972015380859375, -0.370819091796875, -0.3444366455078125, -0.31805419921875, -0.2916717529296875, -0.265289306640625, -0.2389068603515625, -0.2125244140625, -0.1861419677734375, -0.159759521484375, -0.1333770751953125, -0.10699462890625, -0.0806121826171875, -0.054229736328125, -0.0278472900390625, -0.00146484375, 0.0249176025390625, 0.051300048828125, 0.0776824951171875, 0.10406494140625, 0.1304473876953125, 0.156829833984375, 0.1832122802734375, 0.2095947265625, 0.2359771728515625, 0.262359619140625, 0.2887420654296875, 0.31512451171875, 0.3415069580078125, 0.367889404296875, 0.3942718505859375, 0.420654296875, 0.4470367431640625, 0.473419189453125, 0.4998016357421875, 0.52618408203125, 0.5525665283203125, 0.578948974609375, 0.6053314208984375, 0.6317138671875, 0.6580963134765625, 0.684478759765625, 0.7108612060546875, 0.73724365234375, 0.7636260986328125, 0.790008544921875, 0.8163909912109375, 0.8427734375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 7.0, 8.0, 10.0, 16.0, 13.0, 18.0, 15.0, 24.0, 27.0, 35.0, 28.0, 34.0, 43.0, 45.0, 43.0, 50.0, 42.0, 45.0, 39.0, 54.0, 43.0, 38.0, 43.0, 45.0, 26.0, 29.0, 32.0, 22.0, 26.0, 10.0, 19.0, 14.0, 7.0, 11.0, 5.0, 12.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.646484375, -0.6278533935546875, -0.609222412109375, -0.5905914306640625, -0.57196044921875, -0.5533294677734375, -0.534698486328125, -0.5160675048828125, -0.4974365234375, -0.4788055419921875, -0.460174560546875, -0.4415435791015625, -0.42291259765625, -0.4042816162109375, -0.385650634765625, -0.3670196533203125, -0.348388671875, -0.3297576904296875, -0.311126708984375, -0.2924957275390625, -0.27386474609375, -0.2552337646484375, -0.236602783203125, -0.2179718017578125, -0.1993408203125, -0.1807098388671875, -0.162078857421875, -0.1434478759765625, -0.12481689453125, -0.1061859130859375, -0.087554931640625, -0.0689239501953125, -0.05029296875, -0.0316619873046875, -0.013031005859375, 0.0055999755859375, 0.02423095703125, 0.0428619384765625, 0.061492919921875, 0.0801239013671875, 0.0987548828125, 0.1173858642578125, 0.136016845703125, 0.1546478271484375, 0.17327880859375, 0.1919097900390625, 0.210540771484375, 0.2291717529296875, 0.247802734375, 0.2664337158203125, 0.285064697265625, 0.3036956787109375, 0.32232666015625, 0.3409576416015625, 0.359588623046875, 0.3782196044921875, 0.3968505859375, 0.4154815673828125, 0.434112548828125, 0.4527435302734375, 0.47137451171875, 0.4900054931640625, 0.508636474609375, 0.5272674560546875, 0.5458984375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 6.0, 7.0, 7.0, 8.0, 13.0, 19.0, 23.0, 44.0, 75.0, 154.0, 205.0, 471.0, 1299.0, 4671.0, 38342.0, 2397500.0, 1712165.0, 32552.0, 4486.0, 1242.0, 451.0, 183.0, 109.0, 74.0, 47.0, 36.0, 23.0, 21.0, 5.0, 9.0, 10.0, 5.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.064453125, -2.00860595703125, -1.9527587890625, -1.89691162109375, -1.841064453125, -1.78521728515625, -1.7293701171875, -1.67352294921875, -1.61767578125, -1.56182861328125, -1.5059814453125, -1.45013427734375, -1.394287109375, -1.33843994140625, -1.2825927734375, -1.22674560546875, -1.1708984375, -1.11505126953125, -1.0592041015625, -1.00335693359375, -0.947509765625, -0.89166259765625, -0.8358154296875, -0.77996826171875, -0.72412109375, -0.66827392578125, -0.6124267578125, -0.55657958984375, -0.500732421875, -0.44488525390625, -0.3890380859375, -0.33319091796875, -0.27734375, -0.22149658203125, -0.1656494140625, -0.10980224609375, -0.053955078125, 0.00189208984375, 0.0577392578125, 0.11358642578125, 0.16943359375, 0.22528076171875, 0.2811279296875, 0.33697509765625, 0.392822265625, 0.44866943359375, 0.5045166015625, 0.56036376953125, 0.6162109375, 0.67205810546875, 0.7279052734375, 0.78375244140625, 0.839599609375, 0.89544677734375, 0.9512939453125, 1.00714111328125, 1.06298828125, 1.11883544921875, 1.1746826171875, 1.23052978515625, 1.286376953125, 1.34222412109375, 1.3980712890625, 1.45391845703125, 1.509765625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 6.0, 10.0, 16.0, 20.0, 22.0, 34.0, 59.0, 89.0, 118.0, 185.0, 306.0, 437.0, 582.0, 672.0, 515.0, 332.0, 216.0, 141.0, 94.0, 64.0, 51.0, 24.0, 21.0, 12.0, 11.0, 6.0, 1.0, 9.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.24585342407226562, -0.23609161376953125, -0.22632980346679688, -0.2165679931640625, -0.20680618286132812, -0.19704437255859375, -0.18728256225585938, -0.177520751953125, -0.16775894165039062, -0.15799713134765625, -0.14823532104492188, -0.1384735107421875, -0.12871170043945312, -0.11894989013671875, -0.10918807983398438, -0.09942626953125, -0.08966445922851562, -0.07990264892578125, -0.07014083862304688, -0.0603790283203125, -0.050617218017578125, -0.04085540771484375, -0.031093597412109375, -0.021331787109375, -0.011569976806640625, -0.00180816650390625, 0.007953643798828125, 0.0177154541015625, 0.027477264404296875, 0.03723907470703125, 0.047000885009765625, 0.0567626953125, 0.06652450561523438, 0.07628631591796875, 0.08604812622070312, 0.0958099365234375, 0.10557174682617188, 0.11533355712890625, 0.12509536743164062, 0.134857177734375, 0.14461898803710938, 0.15438079833984375, 0.16414260864257812, 0.1739044189453125, 0.18366622924804688, 0.19342803955078125, 0.20318984985351562, 0.21295166015625, 0.22271347045898438, 0.23247528076171875, 0.24223709106445312, 0.2519989013671875, 0.2617607116699219, 0.27152252197265625, 0.2812843322753906, 0.291046142578125, 0.3008079528808594, 0.31056976318359375, 0.3203315734863281, 0.3300933837890625, 0.3398551940917969, 0.34961700439453125, 0.3593788146972656, 0.369140625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 5.0, 10.0, 21.0, 34.0, 34.0, 62.0, 93.0, 116.0, 133.0, 117.0, 98.0, 91.0, 71.0, 50.0, 25.0, 14.0, 11.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.818373441696167, -1.772924780845642, -1.7274761199951172, -1.6820274591445923, -1.6365787982940674, -1.5911301374435425, -1.5456814765930176, -1.5002328157424927, -1.4547841548919678, -1.4093354940414429, -1.363886833190918, -1.318438172340393, -1.2729895114898682, -1.2275408506393433, -1.1820921897888184, -1.1366435289382935, -1.0911948680877686, -1.0457462072372437, -1.0002975463867188, -0.9548488855361938, -0.909400224685669, -0.863951563835144, -0.8185029029846191, -0.7730542421340942, -0.7276055812835693, -0.6821569204330444, -0.6367082595825195, -0.5912595987319946, -0.5458109378814697, -0.5003622770309448, -0.4549136161804199, -0.409464955329895, -0.3640162944793701, -0.3185676336288452, -0.2731189727783203, -0.2276703119277954, -0.1822216510772705, -0.1367729902267456, -0.0913243293762207, -0.0458756685256958, -0.00042700767517089844, 0.045021653175354004, 0.0904703140258789, 0.1359189748764038, 0.1813676357269287, 0.2268162965774536, 0.2722649574279785, 0.3177136182785034, 0.3631622791290283, 0.4086109399795532, 0.4540596008300781, 0.499508261680603, 0.5449569225311279, 0.5904055833816528, 0.6358542442321777, 0.6813029050827026, 0.7267515659332275, 0.7722002267837524, 0.8176488876342773, 0.8630975484848022, 0.9085462093353271, 0.953994870185852, 0.999443531036377, 1.0448921918869019, 1.0903408527374268]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 2.0, 1.0, 9.0, 3.0, 8.0, 8.0, 10.0, 13.0, 19.0, 18.0, 20.0, 26.0, 27.0, 24.0, 30.0, 38.0, 49.0, 40.0, 42.0, 49.0, 55.0, 52.0, 40.0, 42.0, 44.0, 38.0, 35.0, 29.0, 35.0, 38.0, 30.0, 25.0, 19.0, 12.0, 14.0, 11.0, 7.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6541244387626648, -0.6333881616592407, -0.6126518845558167, -0.5919156074523926, -0.5711793303489685, -0.5504430532455444, -0.5297067761421204, -0.5089704990386963, -0.4882342517375946, -0.46749797463417053, -0.44676169753074646, -0.4260254204273224, -0.4052891731262207, -0.38455289602279663, -0.36381661891937256, -0.3430803418159485, -0.3223440647125244, -0.30160778760910034, -0.28087151050567627, -0.2601352334022522, -0.23939897119998932, -0.21866269409656525, -0.19792643189430237, -0.1771901547908783, -0.15645387768745422, -0.13571760058403015, -0.11498133093118668, -0.0942450612783432, -0.07350878417491913, -0.052772507071495056, -0.03203623741865158, -0.011299967765808105, 0.009436309337615967, 0.03017258271574974, 0.050908856093883514, 0.07164512574672699, 0.09238140285015106, 0.11311767995357513, 0.133853942155838, 0.15459021925926208, 0.17532649636268616, 0.19606277346611023, 0.2167990505695343, 0.23753531277179718, 0.25827157497406006, 0.27900785207748413, 0.2997441291809082, 0.3204804062843323, 0.34121668338775635, 0.3619529604911804, 0.3826892375946045, 0.40342551469802856, 0.42416179180145264, 0.4448980689048767, 0.4656343162059784, 0.48637059330940247, 0.5071069002151489, 0.527843177318573, 0.5485794544219971, 0.5693157315254211, 0.5900520086288452, 0.6107882857322693, 0.6315245628356934, 0.6522607803344727, 0.6729970574378967]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 12.0, 15.0, 32.0, 78.0, 156.0, 429.0, 1588.0, 5814.0, 26786.0, 356382.0, 610154.0, 36789.0, 7485.0, 1899.0, 549.0, 192.0, 72.0, 30.0, 32.0, 11.0, 9.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8251953125, -0.8002548217773438, -0.7753143310546875, -0.7503738403320312, -0.725433349609375, -0.7004928588867188, -0.6755523681640625, -0.6506118774414062, -0.62567138671875, -0.6007308959960938, -0.5757904052734375, -0.5508499145507812, -0.525909423828125, -0.5009689331054688, -0.4760284423828125, -0.45108795166015625, -0.4261474609375, -0.40120697021484375, -0.3762664794921875, -0.35132598876953125, -0.326385498046875, -0.30144500732421875, -0.2765045166015625, -0.25156402587890625, -0.22662353515625, -0.20168304443359375, -0.1767425537109375, -0.15180206298828125, -0.126861572265625, -0.10192108154296875, -0.0769805908203125, -0.05204010009765625, -0.027099609375, -0.00215911865234375, 0.0227813720703125, 0.04772186279296875, 0.072662353515625, 0.09760284423828125, 0.1225433349609375, 0.14748382568359375, 0.17242431640625, 0.19736480712890625, 0.2223052978515625, 0.24724578857421875, 0.272186279296875, 0.29712677001953125, 0.3220672607421875, 0.34700775146484375, 0.3719482421875, 0.39688873291015625, 0.4218292236328125, 0.44676971435546875, 0.471710205078125, 0.49665069580078125, 0.5215911865234375, 0.5465316772460938, 0.57147216796875, 0.5964126586914062, 0.6213531494140625, 0.6462936401367188, 0.671234130859375, 0.6961746215820312, 0.7211151123046875, 0.7460556030273438, 0.77099609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 4.0, 7.0, 2.0, 18.0, 11.0, 15.0, 23.0, 28.0, 34.0, 41.0, 37.0, 49.0, 56.0, 67.0, 70.0, 63.0, 65.0, 58.0, 49.0, 48.0, 53.0, 36.0, 41.0, 23.0, 25.0, 18.0, 17.0, 12.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3955078125, -0.3795318603515625, -0.363555908203125, -0.3475799560546875, -0.33160400390625, -0.3156280517578125, -0.299652099609375, -0.2836761474609375, -0.2677001953125, -0.2517242431640625, -0.235748291015625, -0.2197723388671875, -0.20379638671875, -0.1878204345703125, -0.171844482421875, -0.1558685302734375, -0.139892578125, -0.1239166259765625, -0.107940673828125, -0.0919647216796875, -0.07598876953125, -0.0600128173828125, -0.044036865234375, -0.0280609130859375, -0.0120849609375, 0.0038909912109375, 0.019866943359375, 0.0358428955078125, 0.05181884765625, 0.0677947998046875, 0.083770751953125, 0.0997467041015625, 0.11572265625, 0.1316986083984375, 0.147674560546875, 0.1636505126953125, 0.17962646484375, 0.1956024169921875, 0.211578369140625, 0.2275543212890625, 0.2435302734375, 0.2595062255859375, 0.275482177734375, 0.2914581298828125, 0.30743408203125, 0.3234100341796875, 0.339385986328125, 0.3553619384765625, 0.371337890625, 0.3873138427734375, 0.403289794921875, 0.4192657470703125, 0.43524169921875, 0.4512176513671875, 0.467193603515625, 0.4831695556640625, 0.4991455078125, 0.5151214599609375, 0.531097412109375, 0.5470733642578125, 0.56304931640625, 0.5790252685546875, 0.595001220703125, 0.6109771728515625, 0.626953125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 11.0, 16.0, 17.0, 17.0, 42.0, 56.0, 62.0, 100.0, 159.0, 241.0, 357.0, 554.0, 919.0, 1515.0, 2636.0, 4955.0, 9650.0, 18957.0, 41613.0, 102555.0, 259863.0, 331754.0, 157890.0, 60422.0, 26368.0, 12604.0, 6546.0, 3534.0, 1960.0, 1110.0, 697.0, 440.0, 317.0, 191.0, 123.0, 98.0, 51.0, 44.0, 32.0, 17.0, 15.0, 10.0, 12.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.1614990234375, -0.15615463256835938, -0.15081024169921875, -0.14546585083007812, -0.1401214599609375, -0.13477706909179688, -0.12943267822265625, -0.12408828735351562, -0.118743896484375, -0.11339950561523438, -0.10805511474609375, -0.10271072387695312, -0.0973663330078125, -0.09202194213867188, -0.08667755126953125, -0.08133316040039062, -0.07598876953125, -0.07064437866210938, -0.06529998779296875, -0.059955596923828125, -0.0546112060546875, -0.049266815185546875, -0.04392242431640625, -0.038578033447265625, -0.033233642578125, -0.027889251708984375, -0.02254486083984375, -0.017200469970703125, -0.0118560791015625, -0.006511688232421875, -0.00116729736328125, 0.004177093505859375, 0.009521484375, 0.014865875244140625, 0.02021026611328125, 0.025554656982421875, 0.0308990478515625, 0.036243438720703125, 0.04158782958984375, 0.046932220458984375, 0.052276611328125, 0.057621002197265625, 0.06296539306640625, 0.06830978393554688, 0.0736541748046875, 0.07899856567382812, 0.08434295654296875, 0.08968734741210938, 0.09503173828125, 0.10037612915039062, 0.10572052001953125, 0.11106491088867188, 0.1164093017578125, 0.12175369262695312, 0.12709808349609375, 0.13244247436523438, 0.137786865234375, 0.14313125610351562, 0.14847564697265625, 0.15382003784179688, 0.1591644287109375, 0.16450881958007812, 0.16985321044921875, 0.17519760131835938, 0.1805419921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 12.0, 9.0, 11.0, 9.0, 15.0, 25.0, 18.0, 24.0, 35.0, 35.0, 26.0, 48.0, 44.0, 39.0, 44.0, 47.0, 47.0, 48.0, 54.0, 55.0, 41.0, 39.0, 39.0, 38.0, 35.0, 32.0, 24.0, 21.0, 9.0, 17.0, 5.0, 11.0, 10.0, 7.0, 4.0, 6.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.849609375, -0.8239212036132812, -0.7982330322265625, -0.7725448608398438, -0.746856689453125, -0.7211685180664062, -0.6954803466796875, -0.6697921752929688, -0.64410400390625, -0.6184158325195312, -0.5927276611328125, -0.5670394897460938, -0.541351318359375, -0.5156631469726562, -0.4899749755859375, -0.46428680419921875, -0.4385986328125, -0.41291046142578125, -0.3872222900390625, -0.36153411865234375, -0.335845947265625, -0.31015777587890625, -0.2844696044921875, -0.25878143310546875, -0.23309326171875, -0.20740509033203125, -0.1817169189453125, -0.15602874755859375, -0.130340576171875, -0.10465240478515625, -0.0789642333984375, -0.05327606201171875, -0.027587890625, -0.00189971923828125, 0.0237884521484375, 0.04947662353515625, 0.075164794921875, 0.10085296630859375, 0.1265411376953125, 0.15222930908203125, 0.17791748046875, 0.20360565185546875, 0.2292938232421875, 0.25498199462890625, 0.280670166015625, 0.30635833740234375, 0.3320465087890625, 0.35773468017578125, 0.3834228515625, 0.40911102294921875, 0.4347991943359375, 0.46048736572265625, 0.486175537109375, 0.5118637084960938, 0.5375518798828125, 0.5632400512695312, 0.58892822265625, 0.6146163940429688, 0.6403045654296875, 0.6659927368164062, 0.691680908203125, 0.7173690795898438, 0.7430572509765625, 0.7687454223632812, 0.79443359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 11.0, 18.0, 17.0, 29.0, 57.0, 81.0, 155.0, 291.0, 591.0, 1199.0, 2858.0, 7305.0, 21363.0, 79683.0, 327958.0, 434804.0, 123545.0, 31667.0, 10162.0, 3553.0, 1590.0, 747.0, 376.0, 209.0, 101.0, 79.0, 33.0, 28.0, 16.0, 10.0, 7.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07183837890625, -0.06960391998291016, -0.06736946105957031, -0.06513500213623047, -0.06290054321289062, -0.06066608428955078, -0.05843162536621094, -0.056197166442871094, -0.05396270751953125, -0.051728248596191406, -0.04949378967285156, -0.04725933074951172, -0.045024871826171875, -0.04279041290283203, -0.04055595397949219, -0.038321495056152344, -0.0360870361328125, -0.033852577209472656, -0.03161811828613281, -0.02938365936279297, -0.027149200439453125, -0.02491474151611328, -0.022680282592773438, -0.020445823669433594, -0.01821136474609375, -0.015976905822753906, -0.013742446899414062, -0.011507987976074219, -0.009273529052734375, -0.007039070129394531, -0.0048046112060546875, -0.0025701522827148438, -0.000335693359375, 0.0018987655639648438, 0.0041332244873046875, 0.006367683410644531, 0.008602142333984375, 0.010836601257324219, 0.013071060180664062, 0.015305519104003906, 0.01753997802734375, 0.019774436950683594, 0.022008895874023438, 0.02424335479736328, 0.026477813720703125, 0.02871227264404297, 0.030946731567382812, 0.033181190490722656, 0.0354156494140625, 0.037650108337402344, 0.03988456726074219, 0.04211902618408203, 0.044353485107421875, 0.04658794403076172, 0.04882240295410156, 0.051056861877441406, 0.05329132080078125, 0.055525779724121094, 0.05776023864746094, 0.05999469757080078, 0.062229156494140625, 0.06446361541748047, 0.06669807434082031, 0.06893253326416016, 0.0711669921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 7.0, 5.0, 9.0, 6.0, 12.0, 17.0, 29.0, 19.0, 40.0, 57.0, 84.0, 94.0, 113.0, 123.0, 90.0, 101.0, 55.0, 39.0, 24.0, 15.0, 14.0, 15.0, 8.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.337860107421875e-05, -3.192480653524399e-05, -3.0471011996269226e-05, -2.9017217457294464e-05, -2.7563422918319702e-05, -2.610962837934494e-05, -2.4655833840370178e-05, -2.3202039301395416e-05, -2.1748244762420654e-05, -2.0294450223445892e-05, -1.884065568447113e-05, -1.738686114549637e-05, -1.5933066606521606e-05, -1.4479272067546844e-05, -1.3025477528572083e-05, -1.157168298959732e-05, -1.0117888450622559e-05, -8.664093911647797e-06, -7.210299372673035e-06, -5.756504833698273e-06, -4.302710294723511e-06, -2.8489157557487488e-06, -1.3951212167739868e-06, 5.8673322200775146e-08, 1.5124678611755371e-06, 2.966262400150299e-06, 4.420056939125061e-06, 5.873851478099823e-06, 7.327646017074585e-06, 8.781440556049347e-06, 1.0235235095024109e-05, 1.1689029633998871e-05, 1.3142824172973633e-05, 1.4596618711948395e-05, 1.6050413250923157e-05, 1.750420778989792e-05, 1.895800232887268e-05, 2.0411796867847443e-05, 2.1865591406822205e-05, 2.3319385945796967e-05, 2.477318048477173e-05, 2.622697502374649e-05, 2.7680769562721252e-05, 2.9134564101696014e-05, 3.0588358640670776e-05, 3.204215317964554e-05, 3.34959477186203e-05, 3.494974225759506e-05, 3.6403536796569824e-05, 3.7857331335544586e-05, 3.931112587451935e-05, 4.076492041349411e-05, 4.221871495246887e-05, 4.3672509491443634e-05, 4.5126304030418396e-05, 4.658009856939316e-05, 4.803389310836792e-05, 4.948768764734268e-05, 5.0941482186317444e-05, 5.2395276725292206e-05, 5.384907126426697e-05, 5.530286580324173e-05, 5.675666034221649e-05, 5.8210454881191254e-05, 5.9664249420166016e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 11.0, 29.0, 48.0, 91.0, 165.0, 414.0, 1247.0, 4424.0, 20379.0, 164937.0, 692577.0, 140040.0, 18233.0, 4042.0, 1143.0, 394.0, 133.0, 89.0, 56.0, 19.0, 23.0, 11.0, 9.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.120361328125, -0.11653614044189453, -0.11271095275878906, -0.1088857650756836, -0.10506057739257812, -0.10123538970947266, -0.09741020202636719, -0.09358501434326172, -0.08975982666015625, -0.08593463897705078, -0.08210945129394531, -0.07828426361083984, -0.07445907592773438, -0.0706338882446289, -0.06680870056152344, -0.06298351287841797, -0.0591583251953125, -0.05533313751220703, -0.05150794982910156, -0.047682762145996094, -0.043857574462890625, -0.040032386779785156, -0.03620719909667969, -0.03238201141357422, -0.02855682373046875, -0.02473163604736328, -0.020906448364257812, -0.017081260681152344, -0.013256072998046875, -0.009430885314941406, -0.0056056976318359375, -0.0017805099487304688, 0.002044677734375, 0.005869865417480469, 0.009695053100585938, 0.013520240783691406, 0.017345428466796875, 0.021170616149902344, 0.024995803833007812, 0.02882099151611328, 0.03264617919921875, 0.03647136688232422, 0.04029655456542969, 0.044121742248535156, 0.047946929931640625, 0.051772117614746094, 0.05559730529785156, 0.05942249298095703, 0.0632476806640625, 0.06707286834716797, 0.07089805603027344, 0.0747232437133789, 0.07854843139648438, 0.08237361907958984, 0.08619880676269531, 0.09002399444580078, 0.09384918212890625, 0.09767436981201172, 0.10149955749511719, 0.10532474517822266, 0.10914993286132812, 0.1129751205444336, 0.11680030822753906, 0.12062549591064453, 0.12445068359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 2.0, 5.0, 6.0, 9.0, 19.0, 21.0, 29.0, 35.0, 35.0, 57.0, 51.0, 80.0, 96.0, 91.0, 85.0, 75.0, 59.0, 58.0, 48.0, 28.0, 21.0, 15.0, 9.0, 14.0, 10.0, 8.0, 4.0, 3.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0178070068359375, -0.017240524291992188, -0.016674041748046875, -0.016107559204101562, -0.01554107666015625, -0.014974594116210938, -0.014408111572265625, -0.013841629028320312, -0.013275146484375, -0.012708663940429688, -0.012142181396484375, -0.011575698852539062, -0.01100921630859375, -0.010442733764648438, -0.009876251220703125, -0.009309768676757812, -0.0087432861328125, -0.008176803588867188, -0.007610321044921875, -0.0070438385009765625, -0.00647735595703125, -0.0059108734130859375, -0.005344390869140625, -0.0047779083251953125, -0.00421142578125, -0.0036449432373046875, -0.003078460693359375, -0.0025119781494140625, -0.00194549560546875, -0.0013790130615234375, -0.000812530517578125, -0.0002460479736328125, 0.0003204345703125, 0.0008869171142578125, 0.001453399658203125, 0.0020198822021484375, 0.00258636474609375, 0.0031528472900390625, 0.003719329833984375, 0.0042858123779296875, 0.004852294921875, 0.0054187774658203125, 0.005985260009765625, 0.0065517425537109375, 0.00711822509765625, 0.0076847076416015625, 0.008251190185546875, 0.008817672729492188, 0.0093841552734375, 0.009950637817382812, 0.010517120361328125, 0.011083602905273438, 0.01165008544921875, 0.012216567993164062, 0.012783050537109375, 0.013349533081054688, 0.013916015625, 0.014482498168945312, 0.015048980712890625, 0.015615463256835938, 0.01618194580078125, 0.016748428344726562, 0.017314910888671875, 0.017881393432617188, 0.0184478759765625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 11.0, 16.0, 39.0, 97.0, 209.0, 236.0, 204.0, 104.0, 58.0, 17.0, 12.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0388071537017822, -1.9919952154159546, -1.9451831579208374, -1.8983712196350098, -1.8515591621398926, -1.804747223854065, -1.7579352855682373, -1.7111232280731201, -1.6643112897872925, -1.6174993515014648, -1.5706872940063477, -1.52387535572052, -1.4770632982254028, -1.4302513599395752, -1.383439302444458, -1.3366273641586304, -1.2898154258728027, -1.243003487586975, -1.196191430091858, -1.1493794918060303, -1.102567434310913, -1.0557554960250854, -1.0089435577392578, -0.9621315002441406, -0.9153194427490234, -0.868507444858551, -0.8216954469680786, -0.774883508682251, -0.7280715107917786, -0.6812595129013062, -0.6344475150108337, -0.5876355171203613, -0.5408235788345337, -0.4940115809440613, -0.44719961285591125, -0.40038761496543884, -0.3535756468772888, -0.3067636489868164, -0.259951651096344, -0.21313968300819397, -0.16632768511772156, -0.11951570212841034, -0.07270371168851852, -0.02589172124862671, 0.02092026174068451, 0.06773224472999573, 0.11454424262046814, 0.16135621070861816, 0.20816820859909058, 0.254980206489563, 0.301792174577713, 0.3486041724681854, 0.39541614055633545, 0.44222813844680786, 0.4890401363372803, 0.5358520746231079, 0.5826641321182251, 0.6294761300086975, 0.6762881278991699, 0.7231000661849976, 0.76991206407547, 0.8167240619659424, 0.8635360598564148, 0.9103480577468872, 0.9571599960327148]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 4.0, 1.0, 5.0, 3.0, 2.0, 6.0, 5.0, 5.0, 8.0, 16.0, 15.0, 22.0, 22.0, 30.0, 25.0, 38.0, 35.0, 41.0, 63.0, 34.0, 64.0, 54.0, 61.0, 48.0, 58.0, 44.0, 46.0, 29.0, 39.0, 33.0, 35.0, 26.0, 18.0, 15.0, 11.0, 11.0, 10.0, 6.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3494338393211365, -0.3361285626888275, -0.32282325625419617, -0.3095179796218872, -0.29621270298957825, -0.2829073965549469, -0.26960211992263794, -0.2562968134880066, -0.24299153685569763, -0.22968624532222748, -0.21638096868991852, -0.20307567715644836, -0.1897703856229782, -0.17646509408950806, -0.1631598174571991, -0.14985452592372894, -0.13654924929141998, -0.12324396520853043, -0.10993867367506027, -0.09663338959217072, -0.08332809805870056, -0.070022813975811, -0.05671752989292145, -0.043412238359451294, -0.030106954276561737, -0.01680166646838188, -0.0034963805228471756, 0.00980890542268753, 0.023114193230867386, 0.03641948103904724, 0.0497247651219368, 0.06303005665540695, 0.07633534073829651, 0.08964062482118607, 0.10294591635465622, 0.11625120043754578, 0.12955649197101593, 0.14286178350448608, 0.15616706013679504, 0.1694723516702652, 0.18277764320373535, 0.1960829347372055, 0.20938821136951447, 0.22269350290298462, 0.23599879443645477, 0.24930408596992493, 0.2626093626022339, 0.27591466903686523, 0.2892199158668518, 0.30252519249916077, 0.3158304989337921, 0.3291357755661011, 0.34244105219841003, 0.3557463586330414, 0.36905163526535034, 0.3823569416999817, 0.39566221833229065, 0.4089674949645996, 0.42227280139923096, 0.4355780780315399, 0.4488833546638489, 0.4621886610984802, 0.4754939377307892, 0.48879921436309814, 0.5021045207977295]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 7.0, 5.0, 12.0, 16.0, 35.0, 48.0, 88.0, 158.0, 334.0, 584.0, 1163.0, 2463.0, 5847.0, 15189.0, 48055.0, 213310.0, 565713.0, 140299.0, 34796.0, 11593.0, 4702.0, 2144.0, 917.0, 464.0, 237.0, 161.0, 85.0, 46.0, 29.0, 18.0, 17.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87060546875, -0.8459930419921875, -0.821380615234375, -0.7967681884765625, -0.77215576171875, -0.7475433349609375, -0.722930908203125, -0.6983184814453125, -0.6737060546875, -0.6490936279296875, -0.624481201171875, -0.5998687744140625, -0.57525634765625, -0.5506439208984375, -0.526031494140625, -0.5014190673828125, -0.476806640625, -0.4521942138671875, -0.427581787109375, -0.4029693603515625, -0.37835693359375, -0.3537445068359375, -0.329132080078125, -0.3045196533203125, -0.2799072265625, -0.2552947998046875, -0.230682373046875, -0.2060699462890625, -0.18145751953125, -0.1568450927734375, -0.132232666015625, -0.1076202392578125, -0.0830078125, -0.0583953857421875, -0.033782958984375, -0.0091705322265625, 0.01544189453125, 0.0400543212890625, 0.064666748046875, 0.0892791748046875, 0.1138916015625, 0.1385040283203125, 0.163116455078125, 0.1877288818359375, 0.21234130859375, 0.2369537353515625, 0.261566162109375, 0.2861785888671875, 0.310791015625, 0.3354034423828125, 0.360015869140625, 0.3846282958984375, 0.40924072265625, 0.4338531494140625, 0.458465576171875, 0.4830780029296875, 0.5076904296875, 0.5323028564453125, 0.556915283203125, 0.5815277099609375, 0.60614013671875, 0.6307525634765625, 0.655364990234375, 0.6799774169921875, 0.70458984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 1.0, 9.0, 1.0, 5.0, 3.0, 10.0, 10.0, 12.0, 26.0, 16.0, 42.0, 32.0, 34.0, 33.0, 42.0, 42.0, 45.0, 60.0, 64.0, 48.0, 54.0, 40.0, 44.0, 42.0, 41.0, 44.0, 37.0, 27.0, 29.0, 23.0, 11.0, 16.0, 12.0, 7.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61279296875, -0.5895843505859375, -0.566375732421875, -0.5431671142578125, -0.51995849609375, -0.4967498779296875, -0.473541259765625, -0.4503326416015625, -0.4271240234375, -0.4039154052734375, -0.380706787109375, -0.3574981689453125, -0.33428955078125, -0.3110809326171875, -0.287872314453125, -0.2646636962890625, -0.241455078125, -0.2182464599609375, -0.195037841796875, -0.1718292236328125, -0.14862060546875, -0.1254119873046875, -0.102203369140625, -0.0789947509765625, -0.0557861328125, -0.0325775146484375, -0.009368896484375, 0.0138397216796875, 0.03704833984375, 0.0602569580078125, 0.083465576171875, 0.1066741943359375, 0.1298828125, 0.1530914306640625, 0.176300048828125, 0.1995086669921875, 0.22271728515625, 0.2459259033203125, 0.269134521484375, 0.2923431396484375, 0.3155517578125, 0.3387603759765625, 0.361968994140625, 0.3851776123046875, 0.40838623046875, 0.4315948486328125, 0.454803466796875, 0.4780120849609375, 0.501220703125, 0.5244293212890625, 0.547637939453125, 0.5708465576171875, 0.59405517578125, 0.6172637939453125, 0.640472412109375, 0.6636810302734375, 0.6868896484375, 0.7100982666015625, 0.733306884765625, 0.7565155029296875, 0.77972412109375, 0.8029327392578125, 0.826141357421875, 0.8493499755859375, 0.87255859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 4.0, 6.0, 8.0, 18.0, 18.0, 20.0, 21.0, 25.0, 22.0, 29.0, 43.0, 57.0, 67.0, 98.0, 138.0, 220.0, 492.0, 1987.0, 21672.0, 795846.0, 217275.0, 8336.0, 1095.0, 374.0, 162.0, 126.0, 77.0, 64.0, 46.0, 46.0, 25.0, 20.0, 24.0, 19.0, 16.0, 11.0, 11.0, 3.0, 7.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8251953125, -1.7639923095703125, -1.702789306640625, -1.6415863037109375, -1.58038330078125, -1.5191802978515625, -1.457977294921875, -1.3967742919921875, -1.3355712890625, -1.2743682861328125, -1.213165283203125, -1.1519622802734375, -1.09075927734375, -1.0295562744140625, -0.968353271484375, -0.9071502685546875, -0.845947265625, -0.7847442626953125, -0.723541259765625, -0.6623382568359375, -0.60113525390625, -0.5399322509765625, -0.478729248046875, -0.4175262451171875, -0.3563232421875, -0.2951202392578125, -0.233917236328125, -0.1727142333984375, -0.11151123046875, -0.0503082275390625, 0.010894775390625, 0.0720977783203125, 0.13330078125, 0.1945037841796875, 0.255706787109375, 0.3169097900390625, 0.37811279296875, 0.4393157958984375, 0.500518798828125, 0.5617218017578125, 0.6229248046875, 0.6841278076171875, 0.745330810546875, 0.8065338134765625, 0.86773681640625, 0.9289398193359375, 0.990142822265625, 1.0513458251953125, 1.112548828125, 1.1737518310546875, 1.234954833984375, 1.2961578369140625, 1.35736083984375, 1.4185638427734375, 1.479766845703125, 1.5409698486328125, 1.6021728515625, 1.6633758544921875, 1.724578857421875, 1.7857818603515625, 1.84698486328125, 1.9081878662109375, 1.969390869140625, 2.0305938720703125, 2.091796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 7.0, 7.0, 19.0, 18.0, 13.0, 22.0, 34.0, 35.0, 34.0, 36.0, 31.0, 42.0, 44.0, 35.0, 40.0, 50.0, 53.0, 39.0, 45.0, 53.0, 43.0, 36.0, 32.0, 33.0, 21.0, 31.0, 17.0, 14.0, 17.0, 15.0, 9.0, 11.0, 13.0, 5.0, 10.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.794921875, -0.7722625732421875, -0.749603271484375, -0.7269439697265625, -0.70428466796875, -0.6816253662109375, -0.658966064453125, -0.6363067626953125, -0.6136474609375, -0.5909881591796875, -0.568328857421875, -0.5456695556640625, -0.52301025390625, -0.5003509521484375, -0.477691650390625, -0.4550323486328125, -0.432373046875, -0.4097137451171875, -0.387054443359375, -0.3643951416015625, -0.34173583984375, -0.3190765380859375, -0.296417236328125, -0.2737579345703125, -0.2510986328125, -0.2284393310546875, -0.205780029296875, -0.1831207275390625, -0.16046142578125, -0.1378021240234375, -0.115142822265625, -0.0924835205078125, -0.06982421875, -0.0471649169921875, -0.024505615234375, -0.0018463134765625, 0.02081298828125, 0.0434722900390625, 0.066131591796875, 0.0887908935546875, 0.1114501953125, 0.1341094970703125, 0.156768798828125, 0.1794281005859375, 0.20208740234375, 0.2247467041015625, 0.247406005859375, 0.2700653076171875, 0.292724609375, 0.3153839111328125, 0.338043212890625, 0.3607025146484375, 0.38336181640625, 0.4060211181640625, 0.428680419921875, 0.4513397216796875, 0.4739990234375, 0.4966583251953125, 0.519317626953125, 0.5419769287109375, 0.56463623046875, 0.5872955322265625, 0.609954833984375, 0.6326141357421875, 0.6552734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 3.0, 13.0, 17.0, 30.0, 46.0, 75.0, 152.0, 356.0, 884.0, 2851.0, 14760.0, 344134.0, 658290.0, 21598.0, 3485.0, 1017.0, 427.0, 163.0, 98.0, 47.0, 31.0, 10.0, 17.0, 9.0, 7.0, 7.0, 5.0, 10.0, 0.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41064453125, -0.39490509033203125, -0.3791656494140625, -0.36342620849609375, -0.347686767578125, -0.33194732666015625, -0.3162078857421875, -0.30046844482421875, -0.28472900390625, -0.26898956298828125, -0.2532501220703125, -0.23751068115234375, -0.221771240234375, -0.20603179931640625, -0.1902923583984375, -0.17455291748046875, -0.1588134765625, -0.14307403564453125, -0.1273345947265625, -0.11159515380859375, -0.095855712890625, -0.08011627197265625, -0.0643768310546875, -0.04863739013671875, -0.03289794921875, -0.01715850830078125, -0.0014190673828125, 0.01432037353515625, 0.030059814453125, 0.04579925537109375, 0.0615386962890625, 0.07727813720703125, 0.093017578125, 0.10875701904296875, 0.1244964599609375, 0.14023590087890625, 0.155975341796875, 0.17171478271484375, 0.1874542236328125, 0.20319366455078125, 0.21893310546875, 0.23467254638671875, 0.2504119873046875, 0.26615142822265625, 0.281890869140625, 0.29763031005859375, 0.3133697509765625, 0.32910919189453125, 0.3448486328125, 0.36058807373046875, 0.3763275146484375, 0.39206695556640625, 0.407806396484375, 0.42354583740234375, 0.4392852783203125, 0.45502471923828125, 0.47076416015625, 0.48650360107421875, 0.5022430419921875, 0.5179824829101562, 0.533721923828125, 0.5494613647460938, 0.5652008056640625, 0.5809402465820312, 0.5966796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 4.0, 8.0, 18.0, 10.0, 40.0, 47.0, 76.0, 102.0, 162.0, 157.0, 123.0, 79.0, 45.0, 46.0, 19.0, 14.0, 13.0, 9.0, 6.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.106760025024414e-05, -3.943406045436859e-05, -3.780052065849304e-05, -3.616698086261749e-05, -3.453344106674194e-05, -3.2899901270866394e-05, -3.1266361474990845e-05, -2.9632821679115295e-05, -2.7999281883239746e-05, -2.6365742087364197e-05, -2.4732202291488647e-05, -2.3098662495613098e-05, -2.146512269973755e-05, -1.9831582903862e-05, -1.819804310798645e-05, -1.65645033121109e-05, -1.4930963516235352e-05, -1.3297423720359802e-05, -1.1663883924484253e-05, -1.0030344128608704e-05, -8.396804332733154e-06, -6.763264536857605e-06, -5.129724740982056e-06, -3.4961849451065063e-06, -1.862645149230957e-06, -2.2910535335540771e-07, 1.4044344425201416e-06, 3.037974238395691e-06, 4.67151403427124e-06, 6.3050538301467896e-06, 7.938593626022339e-06, 9.572133421897888e-06, 1.1205673217773438e-05, 1.2839213013648987e-05, 1.4472752809524536e-05, 1.6106292605400085e-05, 1.7739832401275635e-05, 1.9373372197151184e-05, 2.1006911993026733e-05, 2.2640451788902283e-05, 2.4273991584777832e-05, 2.590753138065338e-05, 2.754107117652893e-05, 2.917461097240448e-05, 3.080815076828003e-05, 3.244169056415558e-05, 3.407523036003113e-05, 3.570877015590668e-05, 3.7342309951782227e-05, 3.8975849747657776e-05, 4.0609389543533325e-05, 4.2242929339408875e-05, 4.3876469135284424e-05, 4.551000893115997e-05, 4.714354872703552e-05, 4.877708852291107e-05, 5.041062831878662e-05, 5.204416811466217e-05, 5.367770791053772e-05, 5.531124770641327e-05, 5.694478750228882e-05, 5.857832729816437e-05, 6.021186709403992e-05, 6.184540688991547e-05, 6.347894668579102e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 4.0, 14.0, 19.0, 43.0, 77.0, 195.0, 602.0, 2852.0, 43139.0, 962127.0, 35944.0, 2577.0, 590.0, 203.0, 82.0, 39.0, 18.0, 12.0, 8.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8824310302734375, -0.860076904296875, -0.8377227783203125, -0.81536865234375, -0.7930145263671875, -0.770660400390625, -0.7483062744140625, -0.7259521484375, -0.7035980224609375, -0.681243896484375, -0.6588897705078125, -0.63653564453125, -0.6141815185546875, -0.591827392578125, -0.5694732666015625, -0.547119140625, -0.5247650146484375, -0.502410888671875, -0.4800567626953125, -0.45770263671875, -0.4353485107421875, -0.412994384765625, -0.3906402587890625, -0.3682861328125, -0.3459320068359375, -0.323577880859375, -0.3012237548828125, -0.27886962890625, -0.2565155029296875, -0.234161376953125, -0.2118072509765625, -0.189453125, -0.1670989990234375, -0.144744873046875, -0.1223907470703125, -0.10003662109375, -0.0776824951171875, -0.055328369140625, -0.0329742431640625, -0.0106201171875, 0.0117340087890625, 0.034088134765625, 0.0564422607421875, 0.07879638671875, 0.1011505126953125, 0.123504638671875, 0.1458587646484375, 0.168212890625, 0.1905670166015625, 0.212921142578125, 0.2352752685546875, 0.25762939453125, 0.2799835205078125, 0.302337646484375, 0.3246917724609375, 0.3470458984375, 0.3694000244140625, 0.391754150390625, 0.4141082763671875, 0.43646240234375, 0.4588165283203125, 0.481170654296875, 0.5035247802734375, 0.52587890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 9.0, 12.0, 27.0, 52.0, 86.0, 135.0, 207.0, 188.0, 116.0, 68.0, 34.0, 20.0, 12.0, 6.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.119873046875, -0.11352157592773438, -0.10717010498046875, -0.10081863403320312, -0.0944671630859375, -0.08811569213867188, -0.08176422119140625, -0.07541275024414062, -0.069061279296875, -0.06270980834960938, -0.05635833740234375, -0.050006866455078125, -0.0436553955078125, -0.037303924560546875, -0.03095245361328125, -0.024600982666015625, -0.01824951171875, -0.011898040771484375, -0.00554656982421875, 0.000804901123046875, 0.0071563720703125, 0.013507843017578125, 0.01985931396484375, 0.026210784912109375, 0.032562255859375, 0.038913726806640625, 0.04526519775390625, 0.051616668701171875, 0.0579681396484375, 0.06431961059570312, 0.07067108154296875, 0.07702255249023438, 0.0833740234375, 0.08972549438476562, 0.09607696533203125, 0.10242843627929688, 0.1087799072265625, 0.11513137817382812, 0.12148284912109375, 0.12783432006835938, 0.134185791015625, 0.14053726196289062, 0.14688873291015625, 0.15324020385742188, 0.1595916748046875, 0.16594314575195312, 0.17229461669921875, 0.17864608764648438, 0.18499755859375, 0.19134902954101562, 0.19770050048828125, 0.20405197143554688, 0.2104034423828125, 0.21675491333007812, 0.22310638427734375, 0.22945785522460938, 0.235809326171875, 0.24216079711914062, 0.24851226806640625, 0.2548637390136719, 0.2612152099609375, 0.2675666809082031, 0.27391815185546875, 0.2802696228027344, 0.28662109375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 16.0, 43.0, 98.0, 177.0, 241.0, 222.0, 109.0, 52.0, 30.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3290119171142578, -1.2319542169570923, -1.1348965167999268, -1.0378386974334717, -0.9407809972763062, -0.8437232971191406, -0.7466655373573303, -0.64960777759552, -0.5525500774383545, -0.4554923474788666, -0.35843461751937866, -0.26137688755989075, -0.16431915760040283, -0.06726142764091492, 0.029796302318572998, 0.1268540620803833, 0.22391176223754883, 0.32096949219703674, 0.41802722215652466, 0.515084981918335, 0.6121426820755005, 0.709200382232666, 0.8062581419944763, 0.9033159017562866, 1.0003736019134521, 1.0974313020706177, 1.1944890022277832, 1.2915468215942383, 1.3886045217514038, 1.4856622219085693, 1.5827200412750244, 1.67977774143219, 1.7768354415893555, 1.873893141746521, 1.9709508419036865, 2.0680086612701416, 2.1650662422180176, 2.2621240615844727, 2.3591818809509277, 2.456239700317383, 2.553297281265259, 2.650355100631714, 2.74741268157959, 2.844470500946045, 2.9415283203125, 3.038585901260376, 3.135643720626831, 3.232701301574707, 3.329759120941162, 3.426816940307617, 3.523874521255493, 3.6209323406219482, 3.717989921569824, 3.8150477409362793, 3.9121055603027344, 4.0091633796691895, 4.1062211990356445, 4.2032790184021, 4.300336837768555, 4.397394180297852, 4.494451999664307, 4.591509819030762, 4.688567638397217, 4.785625457763672, 4.882682800292969]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 10.0, 9.0, 11.0, 18.0, 23.0, 21.0, 28.0, 33.0, 41.0, 45.0, 42.0, 41.0, 43.0, 57.0, 50.0, 50.0, 34.0, 52.0, 50.0, 41.0, 38.0, 43.0, 27.0, 29.0, 25.0, 20.0, 16.0, 20.0, 6.0, 14.0, 14.0, 13.0, 3.0, 3.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.309946894645691, -1.2691545486450195, -1.2283622026443481, -1.1875699758529663, -1.146777629852295, -1.1059852838516235, -1.0651929378509521, -1.0244007110595703, -0.9836083650588989, -0.9428160190582275, -0.9020237326622009, -0.8612313866615295, -0.8204391002655029, -0.7796467542648315, -0.7388544082641602, -0.6980621218681335, -0.6572697758674622, -0.6164774298667908, -0.5756851434707642, -0.5348927974700928, -0.49410051107406616, -0.4533081650733948, -0.4125158488750458, -0.3717235326766968, -0.3309312164783478, -0.2901389002799988, -0.24934658408164978, -0.2085542529821396, -0.1677619367837906, -0.1269696205854416, -0.0861772894859314, -0.0453849732875824, -0.0045926570892333984, 0.0361996628344059, 0.0769919827580452, 0.11778430640697479, 0.1585766226053238, 0.1993689388036728, 0.24016126990318298, 0.280953586101532, 0.321745902299881, 0.36253821849823, 0.403330534696579, 0.444122850894928, 0.48491519689559937, 0.525707483291626, 0.5664998292922974, 0.6072921752929688, 0.6480844616889954, 0.6888768076896667, 0.7296690940856934, 0.7704614400863647, 0.8112537264823914, 0.8520460724830627, 0.8928383588790894, 0.9336307048797607, 0.9744230508804321, 1.0152153968811035, 1.056007742881775, 1.0967999696731567, 1.1375923156738281, 1.1783846616744995, 1.219177007675171, 1.2599692344665527, 1.3007615804672241]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 10.0, 7.0, 18.0, 15.0, 22.0, 32.0, 72.0, 108.0, 228.0, 462.0, 1021.0, 3003.0, 13824.0, 145568.0, 2609292.0, 1349423.0, 60258.0, 7634.0, 1918.0, 650.0, 305.0, 182.0, 86.0, 60.0, 21.0, 18.0, 13.0, 12.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.150390625, -1.1090850830078125, -1.067779541015625, -1.0264739990234375, -0.98516845703125, -0.9438629150390625, -0.902557373046875, -0.8612518310546875, -0.8199462890625, -0.7786407470703125, -0.737335205078125, -0.6960296630859375, -0.65472412109375, -0.6134185791015625, -0.572113037109375, -0.5308074951171875, -0.489501953125, -0.4481964111328125, -0.406890869140625, -0.3655853271484375, -0.32427978515625, -0.2829742431640625, -0.241668701171875, -0.2003631591796875, -0.1590576171875, -0.1177520751953125, -0.076446533203125, -0.0351409912109375, 0.00616455078125, 0.0474700927734375, 0.088775634765625, 0.1300811767578125, 0.17138671875, 0.2126922607421875, 0.253997802734375, 0.2953033447265625, 0.33660888671875, 0.3779144287109375, 0.419219970703125, 0.4605255126953125, 0.5018310546875, 0.5431365966796875, 0.584442138671875, 0.6257476806640625, 0.66705322265625, 0.7083587646484375, 0.749664306640625, 0.7909698486328125, 0.832275390625, 0.8735809326171875, 0.914886474609375, 0.9561920166015625, 0.99749755859375, 1.0388031005859375, 1.080108642578125, 1.1214141845703125, 1.1627197265625, 1.2040252685546875, 1.245330810546875, 1.2866363525390625, 1.32794189453125, 1.3692474365234375, 1.410552978515625, 1.4518585205078125, 1.4931640625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 6.0, 20.0, 16.0, 13.0, 27.0, 30.0, 36.0, 34.0, 42.0, 34.0, 50.0, 52.0, 71.0, 72.0, 44.0, 61.0, 49.0, 56.0, 56.0, 38.0, 28.0, 31.0, 17.0, 15.0, 16.0, 14.0, 11.0, 11.0, 12.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5185165405273438, -0.4984588623046875, -0.47840118408203125, -0.458343505859375, -0.43828582763671875, -0.4182281494140625, -0.39817047119140625, -0.37811279296875, -0.35805511474609375, -0.3379974365234375, -0.31793975830078125, -0.297882080078125, -0.27782440185546875, -0.2577667236328125, -0.23770904541015625, -0.2176513671875, -0.19759368896484375, -0.1775360107421875, -0.15747833251953125, -0.137420654296875, -0.11736297607421875, -0.0973052978515625, -0.07724761962890625, -0.05718994140625, -0.03713226318359375, -0.0170745849609375, 0.00298309326171875, 0.023040771484375, 0.04309844970703125, 0.0631561279296875, 0.08321380615234375, 0.103271484375, 0.12332916259765625, 0.1433868408203125, 0.16344451904296875, 0.183502197265625, 0.20355987548828125, 0.2236175537109375, 0.24367523193359375, 0.26373291015625, 0.28379058837890625, 0.3038482666015625, 0.32390594482421875, 0.343963623046875, 0.36402130126953125, 0.3840789794921875, 0.40413665771484375, 0.4241943359375, 0.44425201416015625, 0.4643096923828125, 0.48436737060546875, 0.504425048828125, 0.5244827270507812, 0.5445404052734375, 0.5645980834960938, 0.58465576171875, 0.6047134399414062, 0.6247711181640625, 0.6448287963867188, 0.664886474609375, 0.6849441528320312, 0.7050018310546875, 0.7250595092773438, 0.7451171875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 6.0, 10.0, 21.0, 53.0, 99.0, 195.0, 468.0, 2220.0, 41941.0, 4080995.0, 64738.0, 2561.0, 540.0, 219.0, 92.0, 51.0, 36.0, 22.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.99993896484375, -2.9178466796875, -2.83575439453125, -2.753662109375, -2.67156982421875, -2.5894775390625, -2.50738525390625, -2.42529296875, -2.34320068359375, -2.2611083984375, -2.17901611328125, -2.096923828125, -2.01483154296875, -1.9327392578125, -1.85064697265625, -1.7685546875, -1.68646240234375, -1.6043701171875, -1.52227783203125, -1.440185546875, -1.35809326171875, -1.2760009765625, -1.19390869140625, -1.11181640625, -1.02972412109375, -0.9476318359375, -0.86553955078125, -0.783447265625, -0.70135498046875, -0.6192626953125, -0.53717041015625, -0.455078125, -0.37298583984375, -0.2908935546875, -0.20880126953125, -0.126708984375, -0.04461669921875, 0.0374755859375, 0.11956787109375, 0.20166015625, 0.28375244140625, 0.3658447265625, 0.44793701171875, 0.530029296875, 0.61212158203125, 0.6942138671875, 0.77630615234375, 0.8583984375, 0.94049072265625, 1.0225830078125, 1.10467529296875, 1.186767578125, 1.26885986328125, 1.3509521484375, 1.43304443359375, 1.51513671875, 1.59722900390625, 1.6793212890625, 1.76141357421875, 1.843505859375, 1.92559814453125, 2.0076904296875, 2.08978271484375, 2.171875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 2.0, 7.0, 4.0, 10.0, 28.0, 22.0, 53.0, 63.0, 92.0, 151.0, 270.0, 423.0, 674.0, 745.0, 603.0, 348.0, 216.0, 122.0, 82.0, 45.0, 43.0, 25.0, 9.0, 10.0, 9.0, 2.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289794921875, -0.2802391052246094, -0.27068328857421875, -0.2611274719238281, -0.2515716552734375, -0.24201583862304688, -0.23246002197265625, -0.22290420532226562, -0.213348388671875, -0.20379257202148438, -0.19423675537109375, -0.18468093872070312, -0.1751251220703125, -0.16556930541992188, -0.15601348876953125, -0.14645767211914062, -0.13690185546875, -0.12734603881835938, -0.11779022216796875, -0.10823440551757812, -0.0986785888671875, -0.08912277221679688, -0.07956695556640625, -0.07001113891601562, -0.060455322265625, -0.050899505615234375, -0.04134368896484375, -0.031787872314453125, -0.0222320556640625, -0.012676239013671875, -0.00312042236328125, 0.006435394287109375, 0.0159912109375, 0.025547027587890625, 0.03510284423828125, 0.044658660888671875, 0.0542144775390625, 0.06377029418945312, 0.07332611083984375, 0.08288192749023438, 0.092437744140625, 0.10199356079101562, 0.11154937744140625, 0.12110519409179688, 0.1306610107421875, 0.14021682739257812, 0.14977264404296875, 0.15932846069335938, 0.16888427734375, 0.17844009399414062, 0.18799591064453125, 0.19755172729492188, 0.2071075439453125, 0.21666336059570312, 0.22621917724609375, 0.23577499389648438, 0.245330810546875, 0.2548866271972656, 0.26444244384765625, 0.2739982604980469, 0.2835540771484375, 0.2931098937988281, 0.30266571044921875, 0.3122215270996094, 0.32177734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 9.0, 26.0, 37.0, 67.0, 77.0, 140.0, 142.0, 116.0, 109.0, 87.0, 72.0, 47.0, 28.0, 12.0, 10.0, 8.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6545131206512451, -1.6121437549591064, -1.5697743892669678, -1.527405023574829, -1.4850356578826904, -1.4426661729812622, -1.4002968072891235, -1.3579274415969849, -1.3155580759048462, -1.2731887102127075, -1.2308193445205688, -1.1884499788284302, -1.146080493927002, -1.1037111282348633, -1.0613417625427246, -1.018972396850586, -0.9766030311584473, -0.9342336654663086, -0.8918642997741699, -0.8494948744773865, -0.8071255087852478, -0.7647561430931091, -0.7223867177963257, -0.680017352104187, -0.6376479864120483, -0.5952786207199097, -0.552909255027771, -0.5105398297309875, -0.4681704640388489, -0.4258010983467102, -0.38343170285224915, -0.3410623073577881, -0.29869282245635986, -0.2563234567642212, -0.21395406126976013, -0.17158468067646027, -0.1292153000831604, -0.08684591948986053, -0.04447653889656067, -0.0021071434020996094, 0.04026222229003906, 0.08263160288333893, 0.1250009834766388, 0.16737036406993866, 0.20973974466323853, 0.2521091103553772, 0.29447850584983826, 0.3368479013442993, 0.379217267036438, 0.42158663272857666, 0.4639560282230377, 0.5063254237174988, 0.5486947894096375, 0.5910641551017761, 0.6334335803985596, 0.6758029460906982, 0.7181723117828369, 0.7605416774749756, 0.8029110431671143, 0.8452804684638977, 0.8876498341560364, 0.930019199848175, 0.9723886251449585, 1.0147579908370972, 1.0571273565292358]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 3.0, 8.0, 9.0, 9.0, 20.0, 10.0, 24.0, 32.0, 33.0, 34.0, 43.0, 51.0, 45.0, 52.0, 51.0, 37.0, 45.0, 61.0, 46.0, 48.0, 34.0, 48.0, 28.0, 37.0, 30.0, 23.0, 15.0, 26.0, 19.0, 19.0, 12.0, 8.0, 8.0, 6.0, 4.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6787095069885254, -0.6585495471954346, -0.638389527797699, -0.6182295680046082, -0.5980696082115173, -0.5779095888137817, -0.5577496290206909, -0.5375896692276001, -0.5174297094345093, -0.49726971983909607, -0.47710976004600525, -0.45694977045059204, -0.4367898106575012, -0.416629821062088, -0.3964698314666748, -0.376309871673584, -0.3561498522758484, -0.3359898626804352, -0.31582990288734436, -0.29566991329193115, -0.27550995349884033, -0.2553499639034271, -0.23518997430801392, -0.2150299996137619, -0.1948700249195099, -0.17471005022525787, -0.15455007553100586, -0.13439008593559265, -0.11423011124134064, -0.09407013654708862, -0.07391015440225601, -0.0537501722574234, -0.03359025716781616, -0.01343027874827385, 0.006729699671268463, 0.026889678090810776, 0.04704965651035309, 0.0672096312046051, 0.08736961334943771, 0.10752959549427032, 0.12768957018852234, 0.14784954488277435, 0.16800951957702637, 0.18816950917243958, 0.2083294838666916, 0.2284894585609436, 0.2486494481563568, 0.26880943775177, 0.28896939754486084, 0.30912938714027405, 0.32928934693336487, 0.3494493365287781, 0.3696092963218689, 0.3897692859172821, 0.4099292755126953, 0.43008923530578613, 0.45024922490119934, 0.47040921449661255, 0.49056917428970337, 0.5107291340827942, 0.5308891534805298, 0.5510491132736206, 0.5712090730667114, 0.591369092464447, 0.6115290522575378]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 7.0, 7.0, 12.0, 16.0, 19.0, 32.0, 47.0, 84.0, 141.0, 368.0, 783.0, 1810.0, 5224.0, 17306.0, 71349.0, 344864.0, 460338.0, 110064.0, 24613.0, 7204.0, 2453.0, 985.0, 380.0, 183.0, 99.0, 52.0, 32.0, 17.0, 13.0, 10.0, 9.0, 9.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.176025390625, -0.169769287109375, -0.16351318359375, -0.157257080078125, -0.1510009765625, -0.144744873046875, -0.13848876953125, -0.132232666015625, -0.1259765625, -0.119720458984375, -0.11346435546875, -0.107208251953125, -0.1009521484375, -0.094696044921875, -0.08843994140625, -0.082183837890625, -0.075927734375, -0.069671630859375, -0.06341552734375, -0.057159423828125, -0.0509033203125, -0.044647216796875, -0.03839111328125, -0.032135009765625, -0.02587890625, -0.019622802734375, -0.01336669921875, -0.007110595703125, -0.0008544921875, 0.005401611328125, 0.01165771484375, 0.017913818359375, 0.024169921875, 0.030426025390625, 0.03668212890625, 0.042938232421875, 0.0491943359375, 0.055450439453125, 0.06170654296875, 0.067962646484375, 0.07421875, 0.080474853515625, 0.08673095703125, 0.092987060546875, 0.0992431640625, 0.105499267578125, 0.11175537109375, 0.118011474609375, 0.124267578125, 0.130523681640625, 0.13677978515625, 0.143035888671875, 0.1492919921875, 0.155548095703125, 0.16180419921875, 0.168060302734375, 0.17431640625, 0.180572509765625, 0.18682861328125, 0.193084716796875, 0.1993408203125, 0.205596923828125, 0.21185302734375, 0.218109130859375, 0.224365234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 6.0, 6.0, 5.0, 7.0, 8.0, 9.0, 20.0, 21.0, 27.0, 30.0, 32.0, 32.0, 47.0, 56.0, 56.0, 59.0, 45.0, 61.0, 55.0, 60.0, 41.0, 44.0, 45.0, 35.0, 27.0, 32.0, 30.0, 16.0, 20.0, 18.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.50146484375, -0.4869537353515625, -0.472442626953125, -0.4579315185546875, -0.44342041015625, -0.4289093017578125, -0.414398193359375, -0.3998870849609375, -0.3853759765625, -0.3708648681640625, -0.356353759765625, -0.3418426513671875, -0.32733154296875, -0.3128204345703125, -0.298309326171875, -0.2837982177734375, -0.269287109375, -0.2547760009765625, -0.240264892578125, -0.2257537841796875, -0.21124267578125, -0.1967315673828125, -0.182220458984375, -0.1677093505859375, -0.1531982421875, -0.1386871337890625, -0.124176025390625, -0.1096649169921875, -0.09515380859375, -0.0806427001953125, -0.066131591796875, -0.0516204833984375, -0.037109375, -0.0225982666015625, -0.008087158203125, 0.0064239501953125, 0.02093505859375, 0.0354461669921875, 0.049957275390625, 0.0644683837890625, 0.0789794921875, 0.0934906005859375, 0.108001708984375, 0.1225128173828125, 0.13702392578125, 0.1515350341796875, 0.166046142578125, 0.1805572509765625, 0.195068359375, 0.2095794677734375, 0.224090576171875, 0.2386016845703125, 0.25311279296875, 0.2676239013671875, 0.282135009765625, 0.2966461181640625, 0.3111572265625, 0.3256683349609375, 0.340179443359375, 0.3546905517578125, 0.36920166015625, 0.3837127685546875, 0.398223876953125, 0.4127349853515625, 0.42724609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 7.0, 16.0, 28.0, 26.0, 34.0, 58.0, 98.0, 163.0, 233.0, 400.0, 715.0, 1184.0, 2348.0, 4990.0, 11864.0, 30611.0, 86475.0, 228827.0, 350043.0, 205630.0, 76733.0, 27539.0, 10845.0, 4670.0, 2147.0, 1138.0, 669.0, 361.0, 270.0, 133.0, 110.0, 57.0, 45.0, 23.0, 16.0, 11.0, 8.0, 6.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1441650390625, -0.14020919799804688, -0.13625335693359375, -0.13229751586914062, -0.1283416748046875, -0.12438583374023438, -0.12042999267578125, -0.11647415161132812, -0.112518310546875, -0.10856246948242188, -0.10460662841796875, -0.10065078735351562, -0.0966949462890625, -0.09273910522460938, -0.08878326416015625, -0.08482742309570312, -0.08087158203125, -0.07691574096679688, -0.07295989990234375, -0.06900405883789062, -0.0650482177734375, -0.061092376708984375, -0.05713653564453125, -0.053180694580078125, -0.049224853515625, -0.045269012451171875, -0.04131317138671875, -0.037357330322265625, -0.0334014892578125, -0.029445648193359375, -0.02548980712890625, -0.021533966064453125, -0.017578125, -0.013622283935546875, -0.00966644287109375, -0.005710601806640625, -0.0017547607421875, 0.002201080322265625, 0.00615692138671875, 0.010112762451171875, 0.014068603515625, 0.018024444580078125, 0.02198028564453125, 0.025936126708984375, 0.0298919677734375, 0.033847808837890625, 0.03780364990234375, 0.041759490966796875, 0.04571533203125, 0.049671173095703125, 0.05362701416015625, 0.057582855224609375, 0.0615386962890625, 0.06549453735351562, 0.06945037841796875, 0.07340621948242188, 0.077362060546875, 0.08131790161132812, 0.08527374267578125, 0.08922958374023438, 0.0931854248046875, 0.09714126586914062, 0.10109710693359375, 0.10505294799804688, 0.1090087890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 11.0, 10.0, 4.0, 13.0, 20.0, 20.0, 28.0, 22.0, 33.0, 38.0, 51.0, 44.0, 42.0, 41.0, 47.0, 46.0, 66.0, 49.0, 60.0, 54.0, 41.0, 31.0, 35.0, 36.0, 30.0, 27.0, 22.0, 12.0, 14.0, 6.0, 9.0, 9.0, 4.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.681121826171875, -0.65325927734375, -0.625396728515625, -0.5975341796875, -0.569671630859375, -0.54180908203125, -0.513946533203125, -0.486083984375, -0.458221435546875, -0.43035888671875, -0.402496337890625, -0.3746337890625, -0.346771240234375, -0.31890869140625, -0.291046142578125, -0.26318359375, -0.235321044921875, -0.20745849609375, -0.179595947265625, -0.1517333984375, -0.123870849609375, -0.09600830078125, -0.068145751953125, -0.040283203125, -0.012420654296875, 0.01544189453125, 0.043304443359375, 0.0711669921875, 0.099029541015625, 0.12689208984375, 0.154754638671875, 0.1826171875, 0.210479736328125, 0.23834228515625, 0.266204833984375, 0.2940673828125, 0.321929931640625, 0.34979248046875, 0.377655029296875, 0.405517578125, 0.433380126953125, 0.46124267578125, 0.489105224609375, 0.5169677734375, 0.544830322265625, 0.57269287109375, 0.600555419921875, 0.62841796875, 0.656280517578125, 0.68414306640625, 0.712005615234375, 0.7398681640625, 0.767730712890625, 0.79559326171875, 0.823455810546875, 0.851318359375, 0.879180908203125, 0.90704345703125, 0.934906005859375, 0.9627685546875, 0.990631103515625, 1.01849365234375, 1.046356201171875, 1.07421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 14.0, 9.0, 10.0, 25.0, 41.0, 53.0, 102.0, 176.0, 309.0, 642.0, 1189.0, 2715.0, 6290.0, 17421.0, 58963.0, 238408.0, 471000.0, 181741.0, 45613.0, 14021.0, 5189.0, 2342.0, 1074.0, 502.0, 287.0, 163.0, 91.0, 64.0, 32.0, 19.0, 14.0, 12.0, 11.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05316162109375, -0.05152082443237305, -0.049880027770996094, -0.04823923110961914, -0.04659843444824219, -0.044957637786865234, -0.04331684112548828, -0.04167604446411133, -0.040035247802734375, -0.03839445114135742, -0.03675365447998047, -0.035112857818603516, -0.03347206115722656, -0.03183126449584961, -0.030190467834472656, -0.028549671173095703, -0.02690887451171875, -0.025268077850341797, -0.023627281188964844, -0.02198648452758789, -0.020345687866210938, -0.018704891204833984, -0.01706409454345703, -0.015423297882080078, -0.013782501220703125, -0.012141704559326172, -0.010500907897949219, -0.008860111236572266, -0.0072193145751953125, -0.005578517913818359, -0.003937721252441406, -0.002296924591064453, -0.0006561279296875, 0.0009846687316894531, 0.0026254653930664062, 0.004266262054443359, 0.0059070587158203125, 0.007547855377197266, 0.009188652038574219, 0.010829448699951172, 0.012470245361328125, 0.014111042022705078, 0.01575183868408203, 0.017392635345458984, 0.019033432006835938, 0.02067422866821289, 0.022315025329589844, 0.023955821990966797, 0.02559661865234375, 0.027237415313720703, 0.028878211975097656, 0.03051900863647461, 0.03215980529785156, 0.033800601959228516, 0.03544139862060547, 0.03708219528198242, 0.038722991943359375, 0.04036378860473633, 0.04200458526611328, 0.043645381927490234, 0.04528617858886719, 0.04692697525024414, 0.048567771911621094, 0.05020856857299805, 0.051849365234375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 3.0, 16.0, 12.0, 24.0, 43.0, 55.0, 77.0, 99.0, 126.0, 134.0, 115.0, 88.0, 58.0, 45.0, 21.0, 17.0, 17.0, 17.0, 7.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0517578125e-05, -2.9309652745723724e-05, -2.810172736644745e-05, -2.6893801987171173e-05, -2.5685876607894897e-05, -2.4477951228618622e-05, -2.3270025849342346e-05, -2.206210047006607e-05, -2.0854175090789795e-05, -1.964624971151352e-05, -1.8438324332237244e-05, -1.7230398952960968e-05, -1.6022473573684692e-05, -1.4814548194408417e-05, -1.3606622815132141e-05, -1.2398697435855865e-05, -1.119077205657959e-05, -9.982846677303314e-06, -8.774921298027039e-06, -7.566995918750763e-06, -6.359070539474487e-06, -5.151145160198212e-06, -3.943219780921936e-06, -2.7352944016456604e-06, -1.5273690223693848e-06, -3.1944364309310913e-07, 8.884817361831665e-07, 2.096407115459442e-06, 3.3043324947357178e-06, 4.512257874011993e-06, 5.720183253288269e-06, 6.928108632564545e-06, 8.13603401184082e-06, 9.343959391117096e-06, 1.0551884770393372e-05, 1.1759810149669647e-05, 1.2967735528945923e-05, 1.4175660908222198e-05, 1.5383586287498474e-05, 1.659151166677475e-05, 1.7799437046051025e-05, 1.90073624253273e-05, 2.0215287804603577e-05, 2.1423213183879852e-05, 2.2631138563156128e-05, 2.3839063942432404e-05, 2.504698932170868e-05, 2.6254914700984955e-05, 2.746284008026123e-05, 2.8670765459537506e-05, 2.9878690838813782e-05, 3.108661621809006e-05, 3.229454159736633e-05, 3.350246697664261e-05, 3.4710392355918884e-05, 3.591831773519516e-05, 3.7126243114471436e-05, 3.833416849374771e-05, 3.954209387302399e-05, 4.075001925230026e-05, 4.195794463157654e-05, 4.3165870010852814e-05, 4.437379539012909e-05, 4.5581720769405365e-05, 4.678964614868164e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 5.0, 8.0, 9.0, 17.0, 22.0, 22.0, 36.0, 65.0, 100.0, 180.0, 266.0, 539.0, 1133.0, 2775.0, 7354.0, 22518.0, 83909.0, 295614.0, 414596.0, 158020.0, 41004.0, 12470.0, 4509.0, 1681.0, 759.0, 389.0, 196.0, 124.0, 70.0, 52.0, 31.0, 23.0, 17.0, 13.0, 11.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.049591064453125, -0.048142433166503906, -0.04669380187988281, -0.04524517059326172, -0.043796539306640625, -0.04234790802001953, -0.04089927673339844, -0.039450645446777344, -0.03800201416015625, -0.036553382873535156, -0.03510475158691406, -0.03365612030029297, -0.032207489013671875, -0.03075885772705078, -0.029310226440429688, -0.027861595153808594, -0.0264129638671875, -0.024964332580566406, -0.023515701293945312, -0.02206707000732422, -0.020618438720703125, -0.01916980743408203, -0.017721176147460938, -0.016272544860839844, -0.01482391357421875, -0.013375282287597656, -0.011926651000976562, -0.010478019714355469, -0.009029388427734375, -0.007580757141113281, -0.0061321258544921875, -0.004683494567871094, -0.00323486328125, -0.0017862319946289062, -0.0003376007080078125, 0.0011110305786132812, 0.002559661865234375, 0.004008293151855469, 0.0054569244384765625, 0.006905555725097656, 0.00835418701171875, 0.009802818298339844, 0.011251449584960938, 0.012700080871582031, 0.014148712158203125, 0.015597343444824219, 0.017045974731445312, 0.018494606018066406, 0.0199432373046875, 0.021391868591308594, 0.022840499877929688, 0.02428913116455078, 0.025737762451171875, 0.02718639373779297, 0.028635025024414062, 0.030083656311035156, 0.03153228759765625, 0.032980918884277344, 0.03442955017089844, 0.03587818145751953, 0.037326812744140625, 0.03877544403076172, 0.04022407531738281, 0.041672706604003906, 0.043121337890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 6.0, 10.0, 7.0, 10.0, 9.0, 21.0, 19.0, 31.0, 32.0, 37.0, 38.0, 45.0, 55.0, 62.0, 57.0, 64.0, 57.0, 57.0, 38.0, 58.0, 58.0, 28.0, 41.0, 28.0, 24.0, 19.0, 12.0, 12.0, 12.0, 9.0, 9.0, 5.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0112457275390625, -0.010927438735961914, -0.010609149932861328, -0.010290861129760742, -0.009972572326660156, -0.00965428352355957, -0.009335994720458984, -0.009017705917358398, -0.008699417114257812, -0.008381128311157227, -0.00806283950805664, -0.007744550704956055, -0.007426261901855469, -0.007107973098754883, -0.006789684295654297, -0.006471395492553711, -0.006153106689453125, -0.005834817886352539, -0.005516529083251953, -0.005198240280151367, -0.004879951477050781, -0.004561662673950195, -0.004243373870849609, -0.0039250850677490234, -0.0036067962646484375, -0.0032885074615478516, -0.0029702186584472656, -0.0026519298553466797, -0.0023336410522460938, -0.002015352249145508, -0.0016970634460449219, -0.001378774642944336, -0.00106048583984375, -0.0007421970367431641, -0.0004239082336425781, -0.00010561943054199219, 0.00021266937255859375, 0.0005309581756591797, 0.0008492469787597656, 0.0011675357818603516, 0.0014858245849609375, 0.0018041133880615234, 0.0021224021911621094, 0.0024406909942626953, 0.0027589797973632812, 0.003077268600463867, 0.003395557403564453, 0.003713846206665039, 0.004032135009765625, 0.004350423812866211, 0.004668712615966797, 0.004987001419067383, 0.005305290222167969, 0.005623579025268555, 0.005941867828369141, 0.0062601566314697266, 0.0065784454345703125, 0.0068967342376708984, 0.007215023040771484, 0.00753331184387207, 0.007851600646972656, 0.008169889450073242, 0.008488178253173828, 0.008806467056274414, 0.009124755859375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 12.0, 53.0, 245.0, 410.0, 221.0, 51.0, 16.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.242868900299072, -4.16200065612793, -4.081132411956787, -4.000264644622803, -3.91939640045166, -3.8385281562805176, -3.757659912109375, -3.6767919063568115, -3.595923662185669, -3.5150554180145264, -3.434187412261963, -3.3533191680908203, -3.272451162338257, -3.1915829181671143, -3.110714912414551, -3.029846668243408, -2.9489784240722656, -2.868110179901123, -2.7872421741485596, -2.706373929977417, -2.6255059242248535, -2.544637680053711, -2.4637694358825684, -2.382901430130005, -2.3020334243774414, -2.221165180206299, -2.1402971744537354, -2.0594289302825928, -1.9785608053207397, -1.8976926803588867, -1.8168245553970337, -1.7359564304351807, -1.655088186264038, -1.574220061302185, -1.493351936340332, -1.4124836921691895, -1.3316155672073364, -1.2507474422454834, -1.1698793172836304, -1.0890111923217773, -1.0081429481506348, -0.9272748231887817, -0.8464066386222839, -0.7655385136604309, -0.6846703290939331, -0.6038022041320801, -0.522934079170227, -0.44206589460372925, -0.3611977696418762, -0.2803296148777008, -0.19946147501468658, -0.11859333515167236, -0.03772518038749695, 0.04314297437667847, 0.1240110993385315, 0.2048792839050293, 0.2857474088668823, 0.36661556363105774, 0.44748371839523315, 0.5283518433570862, 0.609220027923584, 0.690088152885437, 0.77095627784729, 0.8518244624137878, 0.9326925873756409]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 6.0, 6.0, 9.0, 12.0, 9.0, 13.0, 20.0, 32.0, 34.0, 26.0, 40.0, 47.0, 63.0, 54.0, 48.0, 44.0, 59.0, 55.0, 48.0, 58.0, 45.0, 36.0, 30.0, 36.0, 26.0, 22.0, 26.0, 22.0, 17.0, 14.0, 6.0, 8.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.461410790681839, -0.4476940631866455, -0.43397730588912964, -0.42026054859161377, -0.4065438210964203, -0.3928270936012268, -0.37911033630371094, -0.36539357900619507, -0.3516768515110016, -0.3379601240158081, -0.32424336671829224, -0.31052660942077637, -0.2968098819255829, -0.2830931544303894, -0.26937639713287354, -0.25565963983535767, -0.24194291234016418, -0.2282261699438095, -0.21450942754745483, -0.20079268515110016, -0.18707594275474548, -0.1733592003583908, -0.15964245796203613, -0.14592571556568146, -0.13220897316932678, -0.1184922307729721, -0.10477548837661743, -0.09105874598026276, -0.07734200358390808, -0.0636252611875534, -0.04990851879119873, -0.036191776394844055, -0.022475063800811768, -0.008758321404457092, 0.004958420991897583, 0.01867516338825226, 0.032391905784606934, 0.04610864818096161, 0.059825390577316284, 0.07354213297367096, 0.08725887537002563, 0.10097561776638031, 0.11469236016273499, 0.12840910255908966, 0.14212584495544434, 0.155842587351799, 0.1695593297481537, 0.18327607214450836, 0.19699281454086304, 0.2107095569372177, 0.2244262993335724, 0.23814304172992706, 0.25185978412628174, 0.2655765414237976, 0.2792932689189911, 0.29300999641418457, 0.30672675371170044, 0.3204435110092163, 0.3341602385044098, 0.34787696599960327, 0.36159372329711914, 0.375310480594635, 0.3890272080898285, 0.402743935585022, 0.41646069288253784]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 7.0, 11.0, 9.0, 8.0, 21.0, 31.0, 32.0, 69.0, 226.0, 1107.0, 9429.0, 235972.0, 766225.0, 32117.0, 2619.0, 426.0, 121.0, 46.0, 22.0, 16.0, 4.0, 11.0, 7.0, 9.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6484375, -1.6029205322265625, -1.557403564453125, -1.5118865966796875, -1.46636962890625, -1.4208526611328125, -1.375335693359375, -1.3298187255859375, -1.2843017578125, -1.2387847900390625, -1.193267822265625, -1.1477508544921875, -1.10223388671875, -1.0567169189453125, -1.011199951171875, -0.9656829833984375, -0.920166015625, -0.8746490478515625, -0.829132080078125, -0.7836151123046875, -0.73809814453125, -0.6925811767578125, -0.647064208984375, -0.6015472412109375, -0.5560302734375, -0.5105133056640625, -0.464996337890625, -0.4194793701171875, -0.37396240234375, -0.3284454345703125, -0.282928466796875, -0.2374114990234375, -0.19189453125, -0.1463775634765625, -0.100860595703125, -0.0553436279296875, -0.00982666015625, 0.0356903076171875, 0.081207275390625, 0.1267242431640625, 0.1722412109375, 0.2177581787109375, 0.263275146484375, 0.3087921142578125, 0.35430908203125, 0.3998260498046875, 0.445343017578125, 0.4908599853515625, 0.536376953125, 0.5818939208984375, 0.627410888671875, 0.6729278564453125, 0.71844482421875, 0.7639617919921875, 0.809478759765625, 0.8549957275390625, 0.9005126953125, 0.9460296630859375, 0.991546630859375, 1.0370635986328125, 1.08258056640625, 1.1280975341796875, 1.173614501953125, 1.2191314697265625, 1.2646484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 8.0, 13.0, 19.0, 28.0, 25.0, 43.0, 48.0, 65.0, 72.0, 87.0, 78.0, 80.0, 80.0, 70.0, 62.0, 49.0, 41.0, 26.0, 34.0, 19.0, 18.0, 7.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.796875, -0.7592010498046875, -0.721527099609375, -0.6838531494140625, -0.64617919921875, -0.6085052490234375, -0.570831298828125, -0.5331573486328125, -0.4954833984375, -0.4578094482421875, -0.420135498046875, -0.3824615478515625, -0.34478759765625, -0.3071136474609375, -0.269439697265625, -0.2317657470703125, -0.194091796875, -0.1564178466796875, -0.118743896484375, -0.0810699462890625, -0.04339599609375, -0.0057220458984375, 0.031951904296875, 0.0696258544921875, 0.1072998046875, 0.1449737548828125, 0.182647705078125, 0.2203216552734375, 0.25799560546875, 0.2956695556640625, 0.333343505859375, 0.3710174560546875, 0.40869140625, 0.4463653564453125, 0.484039306640625, 0.5217132568359375, 0.55938720703125, 0.5970611572265625, 0.634735107421875, 0.6724090576171875, 0.7100830078125, 0.7477569580078125, 0.785430908203125, 0.8231048583984375, 0.86077880859375, 0.8984527587890625, 0.936126708984375, 0.9738006591796875, 1.011474609375, 1.0491485595703125, 1.086822509765625, 1.1244964599609375, 1.16217041015625, 1.1998443603515625, 1.237518310546875, 1.2751922607421875, 1.3128662109375, 1.3505401611328125, 1.388214111328125, 1.4258880615234375, 1.46356201171875, 1.5012359619140625, 1.538909912109375, 1.5765838623046875, 1.6142578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 8.0, 6.0, 8.0, 6.0, 13.0, 13.0, 19.0, 32.0, 36.0, 45.0, 56.0, 72.0, 106.0, 129.0, 191.0, 242.0, 454.0, 1298.0, 7104.0, 123252.0, 838155.0, 69758.0, 5184.0, 1063.0, 389.0, 226.0, 156.0, 115.0, 88.0, 59.0, 54.0, 43.0, 32.0, 32.0, 25.0, 18.0, 25.0, 9.0, 9.0, 6.0, 2.0, 4.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.068359375, -1.033233642578125, -0.99810791015625, -0.962982177734375, -0.9278564453125, -0.892730712890625, -0.85760498046875, -0.822479248046875, -0.787353515625, -0.752227783203125, -0.71710205078125, -0.681976318359375, -0.6468505859375, -0.611724853515625, -0.57659912109375, -0.541473388671875, -0.50634765625, -0.471221923828125, -0.43609619140625, -0.400970458984375, -0.3658447265625, -0.330718994140625, -0.29559326171875, -0.260467529296875, -0.225341796875, -0.190216064453125, -0.15509033203125, -0.119964599609375, -0.0848388671875, -0.049713134765625, -0.01458740234375, 0.020538330078125, 0.0556640625, 0.090789794921875, 0.12591552734375, 0.161041259765625, 0.1961669921875, 0.231292724609375, 0.26641845703125, 0.301544189453125, 0.336669921875, 0.371795654296875, 0.40692138671875, 0.442047119140625, 0.4771728515625, 0.512298583984375, 0.54742431640625, 0.582550048828125, 0.61767578125, 0.652801513671875, 0.68792724609375, 0.723052978515625, 0.7581787109375, 0.793304443359375, 0.82843017578125, 0.863555908203125, 0.898681640625, 0.933807373046875, 0.96893310546875, 1.004058837890625, 1.0391845703125, 1.074310302734375, 1.10943603515625, 1.144561767578125, 1.1796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 9.0, 17.0, 9.0, 16.0, 14.0, 25.0, 21.0, 22.0, 34.0, 41.0, 42.0, 34.0, 41.0, 50.0, 55.0, 52.0, 32.0, 44.0, 53.0, 36.0, 41.0, 30.0, 38.0, 24.0, 26.0, 33.0, 22.0, 21.0, 21.0, 13.0, 18.0, 10.0, 13.0, 4.0, 10.0, 7.0, 1.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6279296875, -0.605072021484375, -0.58221435546875, -0.559356689453125, -0.5364990234375, -0.513641357421875, -0.49078369140625, -0.467926025390625, -0.445068359375, -0.422210693359375, -0.39935302734375, -0.376495361328125, -0.3536376953125, -0.330780029296875, -0.30792236328125, -0.285064697265625, -0.26220703125, -0.239349365234375, -0.21649169921875, -0.193634033203125, -0.1707763671875, -0.147918701171875, -0.12506103515625, -0.102203369140625, -0.079345703125, -0.056488037109375, -0.03363037109375, -0.010772705078125, 0.0120849609375, 0.034942626953125, 0.05780029296875, 0.080657958984375, 0.103515625, 0.126373291015625, 0.14923095703125, 0.172088623046875, 0.1949462890625, 0.217803955078125, 0.24066162109375, 0.263519287109375, 0.286376953125, 0.309234619140625, 0.33209228515625, 0.354949951171875, 0.3778076171875, 0.400665283203125, 0.42352294921875, 0.446380615234375, 0.46923828125, 0.492095947265625, 0.51495361328125, 0.537811279296875, 0.5606689453125, 0.583526611328125, 0.60638427734375, 0.629241943359375, 0.652099609375, 0.674957275390625, 0.69781494140625, 0.720672607421875, 0.7435302734375, 0.766387939453125, 0.78924560546875, 0.812103271484375, 0.8349609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 7.0, 13.0, 22.0, 25.0, 70.0, 130.0, 324.0, 1009.0, 4993.0, 70778.0, 922826.0, 43090.0, 3884.0, 843.0, 275.0, 116.0, 55.0, 29.0, 20.0, 13.0, 14.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740234375, -0.358062744140625, -0.34210205078125, -0.326141357421875, -0.3101806640625, -0.294219970703125, -0.27825927734375, -0.262298583984375, -0.246337890625, -0.230377197265625, -0.21441650390625, -0.198455810546875, -0.1824951171875, -0.166534423828125, -0.15057373046875, -0.134613037109375, -0.11865234375, -0.102691650390625, -0.08673095703125, -0.070770263671875, -0.0548095703125, -0.038848876953125, -0.02288818359375, -0.006927490234375, 0.009033203125, 0.024993896484375, 0.04095458984375, 0.056915283203125, 0.0728759765625, 0.088836669921875, 0.10479736328125, 0.120758056640625, 0.13671875, 0.152679443359375, 0.16864013671875, 0.184600830078125, 0.2005615234375, 0.216522216796875, 0.23248291015625, 0.248443603515625, 0.264404296875, 0.280364990234375, 0.29632568359375, 0.312286376953125, 0.3282470703125, 0.344207763671875, 0.36016845703125, 0.376129150390625, 0.39208984375, 0.408050537109375, 0.42401123046875, 0.439971923828125, 0.4559326171875, 0.471893310546875, 0.48785400390625, 0.503814697265625, 0.519775390625, 0.535736083984375, 0.55169677734375, 0.567657470703125, 0.5836181640625, 0.599578857421875, 0.61553955078125, 0.631500244140625, 0.6474609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 4.0, 2.0, 12.0, 14.0, 23.0, 31.0, 59.0, 66.0, 96.0, 120.0, 110.0, 119.0, 83.0, 81.0, 47.0, 36.0, 22.0, 12.0, 19.0, 12.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.017353057861328e-05, -3.9013102650642395e-05, -3.785267472267151e-05, -3.669224679470062e-05, -3.5531818866729736e-05, -3.437139093875885e-05, -3.3210963010787964e-05, -3.205053508281708e-05, -3.089010715484619e-05, -2.9729679226875305e-05, -2.856925129890442e-05, -2.7408823370933533e-05, -2.6248395442962646e-05, -2.508796751499176e-05, -2.3927539587020874e-05, -2.2767111659049988e-05, -2.16066837310791e-05, -2.0446255803108215e-05, -1.928582787513733e-05, -1.8125399947166443e-05, -1.6964972019195557e-05, -1.580454409122467e-05, -1.4644116163253784e-05, -1.3483688235282898e-05, -1.2323260307312012e-05, -1.1162832379341125e-05, -1.000240445137024e-05, -8.841976523399353e-06, -7.681548595428467e-06, -6.5211206674575806e-06, -5.360692739486694e-06, -4.200264811515808e-06, -3.039836883544922e-06, -1.8794089555740356e-06, -7.189810276031494e-07, 4.414469003677368e-07, 1.601874828338623e-06, 2.7623027563095093e-06, 3.9227306842803955e-06, 5.083158612251282e-06, 6.243586540222168e-06, 7.404014468193054e-06, 8.56444239616394e-06, 9.724870324134827e-06, 1.0885298252105713e-05, 1.2045726180076599e-05, 1.3206154108047485e-05, 1.4366582036018372e-05, 1.5527009963989258e-05, 1.6687437891960144e-05, 1.784786581993103e-05, 1.9008293747901917e-05, 2.0168721675872803e-05, 2.132914960384369e-05, 2.2489577531814575e-05, 2.365000545978546e-05, 2.4810433387756348e-05, 2.5970861315727234e-05, 2.713128924369812e-05, 2.8291717171669006e-05, 2.9452145099639893e-05, 3.061257302761078e-05, 3.1773000955581665e-05, 3.293342888355255e-05, 3.409385681152344e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 11.0, 17.0, 22.0, 28.0, 59.0, 96.0, 182.0, 450.0, 1599.0, 9436.0, 234707.0, 775117.0, 22754.0, 2836.0, 682.0, 255.0, 115.0, 62.0, 36.0, 31.0, 14.0, 7.0, 7.0, 4.0, 3.0, 8.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46630859375, -0.45085906982421875, -0.4354095458984375, -0.41996002197265625, -0.404510498046875, -0.38906097412109375, -0.3736114501953125, -0.35816192626953125, -0.34271240234375, -0.32726287841796875, -0.3118133544921875, -0.29636383056640625, -0.280914306640625, -0.26546478271484375, -0.2500152587890625, -0.23456573486328125, -0.2191162109375, -0.20366668701171875, -0.1882171630859375, -0.17276763916015625, -0.157318115234375, -0.14186859130859375, -0.1264190673828125, -0.11096954345703125, -0.09552001953125, -0.08007049560546875, -0.0646209716796875, -0.04917144775390625, -0.033721923828125, -0.01827239990234375, -0.0028228759765625, 0.01262664794921875, 0.028076171875, 0.04352569580078125, 0.0589752197265625, 0.07442474365234375, 0.089874267578125, 0.10532379150390625, 0.1207733154296875, 0.13622283935546875, 0.15167236328125, 0.16712188720703125, 0.1825714111328125, 0.19802093505859375, 0.213470458984375, 0.22891998291015625, 0.2443695068359375, 0.25981903076171875, 0.2752685546875, 0.29071807861328125, 0.3061676025390625, 0.32161712646484375, 0.337066650390625, 0.35251617431640625, 0.3679656982421875, 0.38341522216796875, 0.39886474609375, 0.41431427001953125, 0.4297637939453125, 0.44521331787109375, 0.460662841796875, 0.47611236572265625, 0.4915618896484375, 0.5070114135742188, 0.5224609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 15.0, 12.0, 21.0, 49.0, 51.0, 63.0, 91.0, 113.0, 134.0, 112.0, 90.0, 62.0, 56.0, 27.0, 24.0, 20.0, 13.0, 5.0, 6.0, 4.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12237548828125, -0.11870670318603516, -0.11503791809082031, -0.11136913299560547, -0.10770034790039062, -0.10403156280517578, -0.10036277770996094, -0.0966939926147461, -0.09302520751953125, -0.0893564224243164, -0.08568763732910156, -0.08201885223388672, -0.07835006713867188, -0.07468128204345703, -0.07101249694824219, -0.06734371185302734, -0.0636749267578125, -0.060006141662597656, -0.05633735656738281, -0.05266857147216797, -0.048999786376953125, -0.04533100128173828, -0.04166221618652344, -0.037993431091308594, -0.03432464599609375, -0.030655860900878906, -0.026987075805664062, -0.02331829071044922, -0.019649505615234375, -0.01598072052001953, -0.012311935424804688, -0.008643150329589844, -0.004974365234375, -0.0013055801391601562, 0.0023632049560546875, 0.006031990051269531, 0.009700775146484375, 0.013369560241699219, 0.017038345336914062, 0.020707130432128906, 0.02437591552734375, 0.028044700622558594, 0.03171348571777344, 0.03538227081298828, 0.039051055908203125, 0.04271984100341797, 0.04638862609863281, 0.050057411193847656, 0.0537261962890625, 0.057394981384277344, 0.06106376647949219, 0.06473255157470703, 0.06840133666992188, 0.07207012176513672, 0.07573890686035156, 0.0794076919555664, 0.08307647705078125, 0.0867452621459961, 0.09041404724121094, 0.09408283233642578, 0.09775161743164062, 0.10142040252685547, 0.10508918762207031, 0.10875797271728516, 0.1124267578125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 15.0, 44.0, 114.0, 256.0, 293.0, 176.0, 69.0, 25.0, 11.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1168487071990967, -2.006702184677124, -1.8965555429458618, -1.7864090204238892, -1.676262378692627, -1.5661158561706543, -1.4559693336486816, -1.345822811126709, -1.2356761693954468, -1.1255296468734741, -1.015383005142212, -0.9052364826202393, -0.7950899004936218, -0.6849433183670044, -0.5747967958450317, -0.4646502137184143, -0.3545036315917969, -0.24435706436634064, -0.1342104971408844, -0.024063944816589355, 0.08608263731002808, 0.1962292194366455, 0.30637574195861816, 0.4165223240852356, 0.526668906211853, 0.6368154883384705, 0.7469620704650879, 0.8571085929870605, 0.967255175113678, 1.0774017572402954, 1.187548279762268, 1.2976949214935303, 1.407841682434082, 1.5179882049560547, 1.628134846687317, 1.7382813692092896, 1.8484280109405518, 1.9585745334625244, 2.068721055984497, 2.1788675785064697, 2.2890143394470215, 2.399160861968994, 2.509307384490967, 2.6194539070129395, 2.729600667953491, 2.839747190475464, 2.9498937129974365, 3.060040235519409, 3.170186758041382, 3.2803332805633545, 3.390479803085327, 3.500626564025879, 3.6107730865478516, 3.720919609069824, 3.831066131591797, 3.9412126541137695, 4.051359176635742, 4.161505699157715, 4.2716522216796875, 4.38179874420166, 4.491945266723633, 4.6020917892456055, 4.712238311767578, 4.822385311126709, 4.932531833648682]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 3.0, 5.0, 6.0, 8.0, 4.0, 10.0, 7.0, 7.0, 17.0, 24.0, 16.0, 20.0, 28.0, 38.0, 38.0, 33.0, 41.0, 45.0, 41.0, 53.0, 54.0, 44.0, 55.0, 47.0, 47.0, 41.0, 30.0, 35.0, 37.0, 26.0, 25.0, 24.0, 14.0, 15.0, 12.0, 13.0, 10.0, 8.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.356858491897583, -1.3146865367889404, -1.2725145816802979, -1.2303426265716553, -1.1881706714630127, -1.1459985971450806, -1.103826642036438, -1.0616546869277954, -1.0194827318191528, -0.9773107767105103, -0.9351388216018677, -0.8929668068885803, -0.8507948517799377, -0.8086228966712952, -0.7664508819580078, -0.7242789268493652, -0.6821069717407227, -0.6399350166320801, -0.5977630615234375, -0.5555910468101501, -0.5134190917015076, -0.471247136592865, -0.4290751516819, -0.38690316677093506, -0.3447312116622925, -0.3025592565536499, -0.26038727164268494, -0.21821530163288116, -0.1760433316230774, -0.13387136161327362, -0.09169939160346985, -0.04952740669250488, -0.007355451583862305, 0.03481651842594147, 0.07698848843574524, 0.11916045844554901, 0.16133242845535278, 0.20350439846515656, 0.24567636847496033, 0.2878483533859253, 0.33002030849456787, 0.37219226360321045, 0.4143642485141754, 0.4565362334251404, 0.49870818853378296, 0.5408801436424255, 0.5830521583557129, 0.6252241134643555, 0.667396068572998, 0.7095680236816406, 0.7517399787902832, 0.7939119935035706, 0.8360839486122131, 0.8782559037208557, 0.9204279184341431, 0.9625998735427856, 1.0047718286514282, 1.0469437837600708, 1.0891157388687134, 1.131287693977356, 1.173459768295288, 1.2156317234039307, 1.2578036785125732, 1.2999756336212158, 1.3421475887298584]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 7.0, 6.0, 7.0, 16.0, 20.0, 28.0, 40.0, 62.0, 91.0, 152.0, 315.0, 727.0, 1863.0, 8247.0, 159653.0, 3612587.0, 394327.0, 12885.0, 2035.0, 641.0, 249.0, 121.0, 70.0, 49.0, 28.0, 22.0, 8.0, 10.0, 8.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.900390625, -1.851165771484375, -1.80194091796875, -1.752716064453125, -1.7034912109375, -1.654266357421875, -1.60504150390625, -1.555816650390625, -1.506591796875, -1.457366943359375, -1.40814208984375, -1.358917236328125, -1.3096923828125, -1.260467529296875, -1.21124267578125, -1.162017822265625, -1.11279296875, -1.063568115234375, -1.01434326171875, -0.965118408203125, -0.9158935546875, -0.866668701171875, -0.81744384765625, -0.768218994140625, -0.718994140625, -0.669769287109375, -0.62054443359375, -0.571319580078125, -0.5220947265625, -0.472869873046875, -0.42364501953125, -0.374420166015625, -0.3251953125, -0.275970458984375, -0.22674560546875, -0.177520751953125, -0.1282958984375, -0.079071044921875, -0.02984619140625, 0.019378662109375, 0.068603515625, 0.117828369140625, 0.16705322265625, 0.216278076171875, 0.2655029296875, 0.314727783203125, 0.36395263671875, 0.413177490234375, 0.46240234375, 0.511627197265625, 0.56085205078125, 0.610076904296875, 0.6593017578125, 0.708526611328125, 0.75775146484375, 0.806976318359375, 0.856201171875, 0.905426025390625, 0.95465087890625, 1.003875732421875, 1.0531005859375, 1.102325439453125, 1.15155029296875, 1.200775146484375, 1.25]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 3.0, 10.0, 14.0, 16.0, 17.0, 36.0, 36.0, 48.0, 56.0, 76.0, 72.0, 76.0, 77.0, 80.0, 57.0, 57.0, 50.0, 58.0, 36.0, 32.0, 19.0, 19.0, 17.0, 13.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.603515625, -0.57781982421875, -0.5521240234375, -0.52642822265625, -0.500732421875, -0.47503662109375, -0.4493408203125, -0.42364501953125, -0.39794921875, -0.37225341796875, -0.3465576171875, -0.32086181640625, -0.295166015625, -0.26947021484375, -0.2437744140625, -0.21807861328125, -0.1923828125, -0.16668701171875, -0.1409912109375, -0.11529541015625, -0.089599609375, -0.06390380859375, -0.0382080078125, -0.01251220703125, 0.01318359375, 0.03887939453125, 0.0645751953125, 0.09027099609375, 0.115966796875, 0.14166259765625, 0.1673583984375, 0.19305419921875, 0.21875, 0.24444580078125, 0.2701416015625, 0.29583740234375, 0.321533203125, 0.34722900390625, 0.3729248046875, 0.39862060546875, 0.42431640625, 0.45001220703125, 0.4757080078125, 0.50140380859375, 0.527099609375, 0.55279541015625, 0.5784912109375, 0.60418701171875, 0.6298828125, 0.65557861328125, 0.6812744140625, 0.70697021484375, 0.732666015625, 0.75836181640625, 0.7840576171875, 0.80975341796875, 0.83544921875, 0.86114501953125, 0.8868408203125, 0.91253662109375, 0.938232421875, 0.96392822265625, 0.9896240234375, 1.01531982421875, 1.041015625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 10.0, 18.0, 20.0, 44.0, 97.0, 179.0, 500.0, 1722.0, 11692.0, 1633841.0, 2529406.0, 13904.0, 1873.0, 553.0, 203.0, 99.0, 40.0, 26.0, 22.0, 13.0, 4.0, 7.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.6484375, -2.588287353515625, -2.52813720703125, -2.467987060546875, -2.4078369140625, -2.347686767578125, -2.28753662109375, -2.227386474609375, -2.167236328125, -2.107086181640625, -2.04693603515625, -1.986785888671875, -1.9266357421875, -1.866485595703125, -1.80633544921875, -1.746185302734375, -1.68603515625, -1.625885009765625, -1.56573486328125, -1.505584716796875, -1.4454345703125, -1.385284423828125, -1.32513427734375, -1.264984130859375, -1.204833984375, -1.144683837890625, -1.08453369140625, -1.024383544921875, -0.9642333984375, -0.904083251953125, -0.84393310546875, -0.783782958984375, -0.7236328125, -0.663482666015625, -0.60333251953125, -0.543182373046875, -0.4830322265625, -0.422882080078125, -0.36273193359375, -0.302581787109375, -0.242431640625, -0.182281494140625, -0.12213134765625, -0.061981201171875, -0.0018310546875, 0.058319091796875, 0.11846923828125, 0.178619384765625, 0.23876953125, 0.298919677734375, 0.35906982421875, 0.419219970703125, 0.4793701171875, 0.539520263671875, 0.59967041015625, 0.659820556640625, 0.719970703125, 0.780120849609375, 0.84027099609375, 0.900421142578125, 0.9605712890625, 1.020721435546875, 1.08087158203125, 1.141021728515625, 1.201171875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 14.0, 10.0, 14.0, 15.0, 23.0, 39.0, 57.0, 88.0, 102.0, 171.0, 294.0, 442.0, 656.0, 683.0, 509.0, 357.0, 219.0, 122.0, 77.0, 58.0, 38.0, 22.0, 17.0, 15.0, 12.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.22607421875, -0.21882057189941406, -0.21156692504882812, -0.2043132781982422, -0.19705963134765625, -0.1898059844970703, -0.18255233764648438, -0.17529869079589844, -0.1680450439453125, -0.16079139709472656, -0.15353775024414062, -0.1462841033935547, -0.13903045654296875, -0.1317768096923828, -0.12452316284179688, -0.11726951599121094, -0.110015869140625, -0.10276222229003906, -0.09550857543945312, -0.08825492858886719, -0.08100128173828125, -0.07374763488769531, -0.06649398803710938, -0.05924034118652344, -0.0519866943359375, -0.04473304748535156, -0.037479400634765625, -0.030225753784179688, -0.02297210693359375, -0.015718460083007812, -0.008464813232421875, -0.0012111663818359375, 0.00604248046875, 0.013296127319335938, 0.020549774169921875, 0.027803421020507812, 0.03505706787109375, 0.04231071472167969, 0.049564361572265625, 0.05681800842285156, 0.0640716552734375, 0.07132530212402344, 0.07857894897460938, 0.08583259582519531, 0.09308624267578125, 0.10033988952636719, 0.10759353637695312, 0.11484718322753906, 0.122100830078125, 0.12935447692871094, 0.13660812377929688, 0.1438617706298828, 0.15111541748046875, 0.1583690643310547, 0.16562271118164062, 0.17287635803222656, 0.1801300048828125, 0.18738365173339844, 0.19463729858398438, 0.2018909454345703, 0.20914459228515625, 0.2163982391357422, 0.22365188598632812, 0.23090553283691406, 0.2381591796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 30.0, 40.0, 72.0, 143.0, 198.0, 222.0, 151.0, 66.0, 42.0, 25.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8788716793060303, -2.8188812732696533, -2.7588911056518555, -2.6989006996154785, -2.6389105319976807, -2.5789201259613037, -2.518929958343506, -2.458939552307129, -2.398949384689331, -2.338958978652954, -2.2789688110351562, -2.2189784049987793, -2.1589882373809814, -2.0989978313446045, -2.0390076637268066, -1.9790172576904297, -1.9190269708633423, -1.8590366840362549, -1.7990463972091675, -1.73905611038208, -1.6790658235549927, -1.6190755367279053, -1.5590851306915283, -1.4990949630737305, -1.4391045570373535, -1.3791142702102661, -1.3191239833831787, -1.2591336965560913, -1.199143409729004, -1.1391531229019165, -1.079162836074829, -1.0191724300384521, -0.9591822028160095, -0.8991919159889221, -0.8392016291618347, -0.7792112827301025, -0.7192209959030151, -0.6592307090759277, -0.5992404222488403, -0.5392501354217529, -0.4792598485946655, -0.4192695617675781, -0.3592792749404907, -0.29928895831108093, -0.23929867148399353, -0.17930838465690613, -0.11931806802749634, -0.059327781200408936, 0.0006625056266784668, 0.060652799904346466, 0.12064309418201447, 0.18063339591026306, 0.24062368273735046, 0.30061396956443787, 0.36060428619384766, 0.42059457302093506, 0.48058485984802246, 0.5405751466751099, 0.6005654335021973, 0.6605557203292847, 0.7205460071563721, 0.7805362939834595, 0.8405266404151917, 0.900516927242279, 0.9605072140693665]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 8.0, 11.0, 11.0, 19.0, 26.0, 24.0, 22.0, 25.0, 47.0, 41.0, 40.0, 48.0, 52.0, 54.0, 46.0, 49.0, 59.0, 47.0, 49.0, 46.0, 38.0, 35.0, 38.0, 27.0, 24.0, 20.0, 18.0, 13.0, 12.0, 9.0, 9.0, 2.0, 2.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6236315369606018, -0.6038021445274353, -0.5839727520942688, -0.5641433596611023, -0.5443139672279358, -0.5244845747947693, -0.5046551823616028, -0.48482581973075867, -0.46499642729759216, -0.44516703486442566, -0.42533764243125916, -0.40550824999809265, -0.38567888736724854, -0.36584949493408203, -0.3460201025009155, -0.326190710067749, -0.3063613176345825, -0.286531925201416, -0.2667025327682495, -0.2468731552362442, -0.2270437628030777, -0.2072143703699112, -0.18738499283790588, -0.16755560040473938, -0.14772620797157288, -0.12789681553840637, -0.10806743055582047, -0.08823804557323456, -0.06840865314006805, -0.04857926070690155, -0.028749875724315643, -0.008920490741729736, 0.010908961296081543, 0.03073835000395775, 0.050567738711833954, 0.07039712369441986, 0.09022651612758636, 0.11005590856075287, 0.12988528609275818, 0.14971467852592468, 0.1695440709590912, 0.1893734633922577, 0.2092028558254242, 0.2290322333574295, 0.248861625790596, 0.2686910033226013, 0.2885203957557678, 0.3083497881889343, 0.32817918062210083, 0.34800857305526733, 0.36783796548843384, 0.38766735792160034, 0.40749675035476685, 0.42732614278793335, 0.44715550541877747, 0.46698489785194397, 0.4868142902851105, 0.5066436529159546, 0.5264730453491211, 0.5463024377822876, 0.5661318302154541, 0.5859612226486206, 0.6057906150817871, 0.6256200075149536, 0.6454493999481201]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 11.0, 15.0, 15.0, 39.0, 77.0, 229.0, 511.0, 1365.0, 3847.0, 14853.0, 138325.0, 762772.0, 107699.0, 13169.0, 3612.0, 1214.0, 426.0, 193.0, 72.0, 30.0, 20.0, 14.0, 5.0, 9.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.33837890625, -0.3279533386230469, -0.31752777099609375, -0.3071022033691406, -0.2966766357421875, -0.2862510681152344, -0.27582550048828125, -0.2653999328613281, -0.254974365234375, -0.24454879760742188, -0.23412322998046875, -0.22369766235351562, -0.2132720947265625, -0.20284652709960938, -0.19242095947265625, -0.18199539184570312, -0.17156982421875, -0.16114425659179688, -0.15071868896484375, -0.14029312133789062, -0.1298675537109375, -0.11944198608398438, -0.10901641845703125, -0.09859085083007812, -0.088165283203125, -0.07773971557617188, -0.06731414794921875, -0.056888580322265625, -0.0464630126953125, -0.036037445068359375, -0.02561187744140625, -0.015186309814453125, -0.0047607421875, 0.005664825439453125, 0.01609039306640625, 0.026515960693359375, 0.0369415283203125, 0.047367095947265625, 0.05779266357421875, 0.06821823120117188, 0.078643798828125, 0.08906936645507812, 0.09949493408203125, 0.10992050170898438, 0.1203460693359375, 0.13077163696289062, 0.14119720458984375, 0.15162277221679688, 0.16204833984375, 0.17247390747070312, 0.18289947509765625, 0.19332504272460938, 0.2037506103515625, 0.21417617797851562, 0.22460174560546875, 0.23502731323242188, 0.245452880859375, 0.2558784484863281, 0.26630401611328125, 0.2767295837402344, 0.2871551513671875, 0.2975807189941406, 0.30800628662109375, 0.3184318542480469, 0.328857421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 1.0, 4.0, 9.0, 7.0, 7.0, 14.0, 18.0, 15.0, 24.0, 22.0, 26.0, 35.0, 44.0, 46.0, 40.0, 46.0, 50.0, 46.0, 60.0, 53.0, 56.0, 53.0, 50.0, 41.0, 39.0, 30.0, 33.0, 25.0, 16.0, 21.0, 14.0, 8.0, 8.0, 9.0, 8.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.420166015625, -0.406402587890625, -0.39263916015625, -0.378875732421875, -0.3651123046875, -0.351348876953125, -0.33758544921875, -0.323822021484375, -0.31005859375, -0.296295166015625, -0.28253173828125, -0.268768310546875, -0.2550048828125, -0.241241455078125, -0.22747802734375, -0.213714599609375, -0.199951171875, -0.186187744140625, -0.17242431640625, -0.158660888671875, -0.1448974609375, -0.131134033203125, -0.11737060546875, -0.103607177734375, -0.08984375, -0.076080322265625, -0.06231689453125, -0.048553466796875, -0.0347900390625, -0.021026611328125, -0.00726318359375, 0.006500244140625, 0.020263671875, 0.034027099609375, 0.04779052734375, 0.061553955078125, 0.0753173828125, 0.089080810546875, 0.10284423828125, 0.116607666015625, 0.13037109375, 0.144134521484375, 0.15789794921875, 0.171661376953125, 0.1854248046875, 0.199188232421875, 0.21295166015625, 0.226715087890625, 0.240478515625, 0.254241943359375, 0.26800537109375, 0.281768798828125, 0.2955322265625, 0.309295654296875, 0.32305908203125, 0.336822509765625, 0.3505859375, 0.364349365234375, 0.37811279296875, 0.391876220703125, 0.4056396484375, 0.419403076171875, 0.43316650390625, 0.446929931640625, 0.460693359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 7.0, 4.0, 11.0, 11.0, 13.0, 16.0, 22.0, 40.0, 34.0, 67.0, 93.0, 141.0, 174.0, 261.0, 383.0, 566.0, 935.0, 1511.0, 2565.0, 4546.0, 9082.0, 21226.0, 59936.0, 180448.0, 359296.0, 257055.0, 92497.0, 31163.0, 12191.0, 5821.0, 3139.0, 1842.0, 1175.0, 752.0, 492.0, 321.0, 191.0, 138.0, 95.0, 86.0, 52.0, 34.0, 21.0, 24.0, 16.0, 9.0, 13.0, 10.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.11712646484375, -0.11354351043701172, -0.10996055603027344, -0.10637760162353516, -0.10279464721679688, -0.0992116928100586, -0.09562873840332031, -0.09204578399658203, -0.08846282958984375, -0.08487987518310547, -0.08129692077636719, -0.0777139663696289, -0.07413101196289062, -0.07054805755615234, -0.06696510314941406, -0.06338214874267578, -0.0597991943359375, -0.05621623992919922, -0.05263328552246094, -0.049050331115722656, -0.045467376708984375, -0.041884422302246094, -0.03830146789550781, -0.03471851348876953, -0.03113555908203125, -0.02755260467529297, -0.023969650268554688, -0.020386695861816406, -0.016803741455078125, -0.013220787048339844, -0.009637832641601562, -0.006054878234863281, -0.002471923828125, 0.0011110305786132812, 0.0046939849853515625, 0.008276939392089844, 0.011859893798828125, 0.015442848205566406, 0.019025802612304688, 0.02260875701904297, 0.02619171142578125, 0.02977466583251953, 0.03335762023925781, 0.036940574645996094, 0.040523529052734375, 0.044106483459472656, 0.04768943786621094, 0.05127239227294922, 0.0548553466796875, 0.05843830108642578, 0.06202125549316406, 0.06560420989990234, 0.06918716430664062, 0.0727701187133789, 0.07635307312011719, 0.07993602752685547, 0.08351898193359375, 0.08710193634033203, 0.09068489074707031, 0.0942678451538086, 0.09785079956054688, 0.10143375396728516, 0.10501670837402344, 0.10859966278076172, 0.1121826171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 0.0, 7.0, 4.0, 3.0, 9.0, 10.0, 14.0, 19.0, 15.0, 8.0, 15.0, 19.0, 26.0, 36.0, 23.0, 33.0, 32.0, 36.0, 53.0, 43.0, 47.0, 38.0, 50.0, 47.0, 50.0, 49.0, 36.0, 36.0, 31.0, 25.0, 40.0, 21.0, 17.0, 20.0, 13.0, 14.0, 8.0, 3.0, 14.0, 5.0, 6.0, 7.0, 2.0, 2.0, 6.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.728515625, -0.7064666748046875, -0.684417724609375, -0.6623687744140625, -0.64031982421875, -0.6182708740234375, -0.596221923828125, -0.5741729736328125, -0.5521240234375, -0.5300750732421875, -0.508026123046875, -0.4859771728515625, -0.46392822265625, -0.4418792724609375, -0.419830322265625, -0.3977813720703125, -0.375732421875, -0.3536834716796875, -0.331634521484375, -0.3095855712890625, -0.28753662109375, -0.2654876708984375, -0.243438720703125, -0.2213897705078125, -0.1993408203125, -0.1772918701171875, -0.155242919921875, -0.1331939697265625, -0.11114501953125, -0.0890960693359375, -0.067047119140625, -0.0449981689453125, -0.02294921875, -0.0009002685546875, 0.021148681640625, 0.0431976318359375, 0.06524658203125, 0.0872955322265625, 0.109344482421875, 0.1313934326171875, 0.1534423828125, 0.1754913330078125, 0.197540283203125, 0.2195892333984375, 0.24163818359375, 0.2636871337890625, 0.285736083984375, 0.3077850341796875, 0.329833984375, 0.3518829345703125, 0.373931884765625, 0.3959808349609375, 0.41802978515625, 0.4400787353515625, 0.462127685546875, 0.4841766357421875, 0.5062255859375, 0.5282745361328125, 0.550323486328125, 0.5723724365234375, 0.59442138671875, 0.6164703369140625, 0.638519287109375, 0.6605682373046875, 0.6826171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 16.0, 21.0, 37.0, 45.0, 95.0, 162.0, 241.0, 496.0, 849.0, 1796.0, 4156.0, 10679.0, 35453.0, 163746.0, 504383.0, 249867.0, 52398.0, 14398.0, 5289.0, 2146.0, 1067.0, 500.0, 291.0, 137.0, 96.0, 81.0, 36.0, 25.0, 13.0, 8.0, 9.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057281494140625, -0.05562782287597656, -0.053974151611328125, -0.05232048034667969, -0.05066680908203125, -0.04901313781738281, -0.047359466552734375, -0.04570579528808594, -0.0440521240234375, -0.04239845275878906, -0.040744781494140625, -0.03909111022949219, -0.03743743896484375, -0.03578376770019531, -0.034130096435546875, -0.03247642517089844, -0.03082275390625, -0.029169082641601562, -0.027515411376953125, -0.025861740112304688, -0.02420806884765625, -0.022554397583007812, -0.020900726318359375, -0.019247055053710938, -0.0175933837890625, -0.015939712524414062, -0.014286041259765625, -0.012632369995117188, -0.01097869873046875, -0.009325027465820312, -0.007671356201171875, -0.0060176849365234375, -0.004364013671875, -0.0027103424072265625, -0.001056671142578125, 0.0005970001220703125, 0.00225067138671875, 0.0039043426513671875, 0.005558013916015625, 0.0072116851806640625, 0.0088653564453125, 0.010519027709960938, 0.012172698974609375, 0.013826370239257812, 0.01548004150390625, 0.017133712768554688, 0.018787384033203125, 0.020441055297851562, 0.0220947265625, 0.023748397827148438, 0.025402069091796875, 0.027055740356445312, 0.02870941162109375, 0.030363082885742188, 0.032016754150390625, 0.03367042541503906, 0.0353240966796875, 0.03697776794433594, 0.038631439208984375, 0.04028511047363281, 0.04193878173828125, 0.04359245300292969, 0.045246124267578125, 0.04689979553222656, 0.048553466796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 14.0, 19.0, 36.0, 119.0, 186.0, 256.0, 174.0, 95.0, 59.0, 14.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.82012939453125e-05, -7.626786828041077e-05, -7.433444261550903e-05, -7.24010169506073e-05, -7.046759128570557e-05, -6.853416562080383e-05, -6.66007399559021e-05, -6.466731429100037e-05, -6.273388862609863e-05, -6.08004629611969e-05, -5.8867037296295166e-05, -5.693361163139343e-05, -5.50001859664917e-05, -5.3066760301589966e-05, -5.113333463668823e-05, -4.91999089717865e-05, -4.7266483306884766e-05, -4.533305764198303e-05, -4.33996319770813e-05, -4.1466206312179565e-05, -3.953278064727783e-05, -3.75993549823761e-05, -3.5665929317474365e-05, -3.373250365257263e-05, -3.17990779876709e-05, -2.9865652322769165e-05, -2.793222665786743e-05, -2.5998800992965698e-05, -2.4065375328063965e-05, -2.213194966316223e-05, -2.0198523998260498e-05, -1.8265098333358765e-05, -1.633167266845703e-05, -1.4398247003555298e-05, -1.2464821338653564e-05, -1.0531395673751831e-05, -8.597970008850098e-06, -6.664544343948364e-06, -4.731118679046631e-06, -2.7976930141448975e-06, -8.642673492431641e-07, 1.0691583156585693e-06, 3.0025839805603027e-06, 4.936009645462036e-06, 6.8694353103637695e-06, 8.802860975265503e-06, 1.0736286640167236e-05, 1.266971230506897e-05, 1.4603137969970703e-05, 1.6536563634872437e-05, 1.846998929977417e-05, 2.0403414964675903e-05, 2.2336840629577637e-05, 2.427026629447937e-05, 2.6203691959381104e-05, 2.8137117624282837e-05, 3.007054328918457e-05, 3.2003968954086304e-05, 3.393739461898804e-05, 3.587082028388977e-05, 3.7804245948791504e-05, 3.973767161369324e-05, 4.167109727859497e-05, 4.3604522943496704e-05, 4.553794860839844e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 2.0, 6.0, 2.0, 11.0, 11.0, 24.0, 43.0, 35.0, 76.0, 113.0, 189.0, 302.0, 581.0, 1062.0, 2305.0, 5574.0, 17349.0, 71619.0, 296072.0, 447114.0, 154209.0, 34965.0, 9753.0, 3705.0, 1606.0, 767.0, 412.0, 224.0, 139.0, 83.0, 55.0, 36.0, 26.0, 29.0, 13.0, 10.0, 8.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04486083984375, -0.043425559997558594, -0.04199028015136719, -0.04055500030517578, -0.039119720458984375, -0.03768444061279297, -0.03624916076660156, -0.034813880920410156, -0.03337860107421875, -0.031943321228027344, -0.030508041381835938, -0.02907276153564453, -0.027637481689453125, -0.02620220184326172, -0.024766921997070312, -0.023331642150878906, -0.0218963623046875, -0.020461082458496094, -0.019025802612304688, -0.01759052276611328, -0.016155242919921875, -0.014719963073730469, -0.013284683227539062, -0.011849403381347656, -0.01041412353515625, -0.008978843688964844, -0.0075435638427734375, -0.006108283996582031, -0.004673004150390625, -0.0032377243041992188, -0.0018024444580078125, -0.00036716461181640625, 0.001068115234375, 0.0025033950805664062, 0.0039386749267578125, 0.005373954772949219, 0.006809234619140625, 0.008244514465332031, 0.009679794311523438, 0.011115074157714844, 0.01255035400390625, 0.013985633850097656, 0.015420913696289062, 0.01685619354248047, 0.018291473388671875, 0.01972675323486328, 0.021162033081054688, 0.022597312927246094, 0.0240325927734375, 0.025467872619628906, 0.026903152465820312, 0.02833843231201172, 0.029773712158203125, 0.03120899200439453, 0.03264427185058594, 0.034079551696777344, 0.03551483154296875, 0.036950111389160156, 0.03838539123535156, 0.03982067108154297, 0.041255950927734375, 0.04269123077392578, 0.04412651062011719, 0.045561790466308594, 0.0469970703125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 10.0, 4.0, 10.0, 14.0, 13.0, 22.0, 28.0, 35.0, 58.0, 60.0, 84.0, 79.0, 84.0, 76.0, 77.0, 80.0, 60.0, 53.0, 41.0, 26.0, 16.0, 18.0, 17.0, 8.0, 3.0, 6.0, 4.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01544952392578125, -0.015019059181213379, -0.014588594436645508, -0.014158129692077637, -0.013727664947509766, -0.013297200202941895, -0.012866735458374023, -0.012436270713806152, -0.012005805969238281, -0.01157534122467041, -0.011144876480102539, -0.010714411735534668, -0.010283946990966797, -0.009853482246398926, -0.009423017501831055, -0.008992552757263184, -0.008562088012695312, -0.008131623268127441, -0.00770115852355957, -0.007270693778991699, -0.006840229034423828, -0.006409764289855957, -0.005979299545288086, -0.005548834800720215, -0.005118370056152344, -0.004687905311584473, -0.0042574405670166016, -0.0038269758224487305, -0.0033965110778808594, -0.0029660463333129883, -0.002535581588745117, -0.002105116844177246, -0.001674652099609375, -0.001244187355041504, -0.0008137226104736328, -0.0003832578659057617, 4.7206878662109375e-05, 0.00047767162322998047, 0.0009081363677978516, 0.0013386011123657227, 0.0017690658569335938, 0.002199530601501465, 0.002629995346069336, 0.003060460090637207, 0.003490924835205078, 0.003921389579772949, 0.00435185432434082, 0.004782319068908691, 0.0052127838134765625, 0.005643248558044434, 0.006073713302612305, 0.006504178047180176, 0.006934642791748047, 0.007365107536315918, 0.007795572280883789, 0.00822603702545166, 0.008656501770019531, 0.009086966514587402, 0.009517431259155273, 0.009947896003723145, 0.010378360748291016, 0.010808825492858887, 0.011239290237426758, 0.011669754981994629, 0.0121002197265625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 56.0, 556.0, 378.0, 25.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.198397636413574, -8.048991203308105, -7.899584770202637, -7.750178337097168, -7.600771903991699, -7.4513654708862305, -7.301959037780762, -7.152552604675293, -7.003146171569824, -6.8537397384643555, -6.704333305358887, -6.554926872253418, -6.405520439147949, -6.2561140060424805, -6.106707572937012, -5.957301139831543, -5.807894706726074, -5.6584882736206055, -5.509081840515137, -5.359675407409668, -5.210268974304199, -5.0608625411987305, -4.911456108093262, -4.762049674987793, -4.612643718719482, -4.463237285614014, -4.313830852508545, -4.164424419403076, -4.015017986297607, -3.8656115531921387, -3.71620512008667, -3.566798686981201, -3.4173922538757324, -3.2679858207702637, -3.118579387664795, -2.969172954559326, -2.8197665214538574, -2.6703600883483887, -2.52095365524292, -2.371547222137451, -2.2221407890319824, -2.0727343559265137, -1.923327922821045, -1.7739214897155762, -1.6245150566101074, -1.4751086235046387, -1.3257023096084595, -1.1762958765029907, -1.0268895626068115, -0.8774831295013428, -0.728076696395874, -0.57867032289505, -0.4292638897895813, -0.27985745668411255, -0.13045108318328857, 0.018955349922180176, 0.16836178302764893, 0.3177682161331177, 0.46717461943626404, 0.6165810227394104, 0.7659874558448792, 0.9153938889503479, 1.0648002624511719, 1.2142066955566406, 1.3636131286621094]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 3.0, 10.0, 8.0, 8.0, 19.0, 18.0, 29.0, 20.0, 33.0, 34.0, 45.0, 44.0, 47.0, 61.0, 61.0, 54.0, 49.0, 61.0, 50.0, 49.0, 43.0, 50.0, 39.0, 29.0, 23.0, 25.0, 17.0, 14.0, 13.0, 9.0, 3.0, 7.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4294917583465576, -0.4152313470840454, -0.4009709656238556, -0.38671058416366577, -0.37245017290115356, -0.35818976163864136, -0.34392938017845154, -0.3296689987182617, -0.3154085874557495, -0.3011481761932373, -0.2868877947330475, -0.27262741327285767, -0.25836700201034546, -0.24410660564899445, -0.22984620928764343, -0.21558581292629242, -0.2013254165649414, -0.1870650202035904, -0.17280462384223938, -0.15854422748088837, -0.14428383111953735, -0.13002343475818634, -0.11576303839683533, -0.10150264203548431, -0.0872422456741333, -0.07298184931278229, -0.058721452951431274, -0.04446105659008026, -0.030200660228729248, -0.015940263867378235, -0.0016798675060272217, 0.012580528855323792, 0.026840955018997192, 0.041101351380348206, 0.05536174774169922, 0.06962214410305023, 0.08388254046440125, 0.09814293682575226, 0.11240333318710327, 0.12666372954845428, 0.1409241259098053, 0.1551845222711563, 0.16944491863250732, 0.18370531499385834, 0.19796571135520935, 0.21222610771656036, 0.22648650407791138, 0.2407469004392624, 0.2550072968006134, 0.2692676782608032, 0.28352808952331543, 0.29778850078582764, 0.31204888224601746, 0.3263092637062073, 0.3405696749687195, 0.3548300862312317, 0.3690904676914215, 0.38335084915161133, 0.39761126041412354, 0.41187167167663574, 0.42613205313682556, 0.4403924345970154, 0.4546528458595276, 0.4689132571220398, 0.4831736385822296]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 1.0, 6.0, 4.0, 10.0, 16.0, 17.0, 36.0, 67.0, 93.0, 161.0, 306.0, 693.0, 1616.0, 4225.0, 14127.0, 86981.0, 700633.0, 205871.0, 23509.0, 6178.0, 2228.0, 892.0, 399.0, 210.0, 92.0, 64.0, 35.0, 24.0, 18.0, 16.0, 7.0, 5.0, 9.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.861328125, -0.8357467651367188, -0.8101654052734375, -0.7845840454101562, -0.759002685546875, -0.7334213256835938, -0.7078399658203125, -0.6822586059570312, -0.65667724609375, -0.6310958862304688, -0.6055145263671875, -0.5799331665039062, -0.554351806640625, -0.5287704467773438, -0.5031890869140625, -0.47760772705078125, -0.4520263671875, -0.42644500732421875, -0.4008636474609375, -0.37528228759765625, -0.349700927734375, -0.32411956787109375, -0.2985382080078125, -0.27295684814453125, -0.24737548828125, -0.22179412841796875, -0.1962127685546875, -0.17063140869140625, -0.145050048828125, -0.11946868896484375, -0.0938873291015625, -0.06830596923828125, -0.042724609375, -0.01714324951171875, 0.0084381103515625, 0.03401947021484375, 0.059600830078125, 0.08518218994140625, 0.1107635498046875, 0.13634490966796875, 0.16192626953125, 0.18750762939453125, 0.2130889892578125, 0.23867034912109375, 0.264251708984375, 0.28983306884765625, 0.3154144287109375, 0.34099578857421875, 0.3665771484375, 0.39215850830078125, 0.4177398681640625, 0.44332122802734375, 0.468902587890625, 0.49448394775390625, 0.5200653076171875, 0.5456466674804688, 0.57122802734375, 0.5968093872070312, 0.6223907470703125, 0.6479721069335938, 0.673553466796875, 0.6991348266601562, 0.7247161865234375, 0.7502975463867188, 0.77587890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 15.0, 13.0, 20.0, 36.0, 32.0, 59.0, 70.0, 79.0, 84.0, 88.0, 96.0, 81.0, 72.0, 74.0, 46.0, 36.0, 25.0, 18.0, 13.0, 9.0, 6.0, 9.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78369140625, -0.7421798706054688, -0.7006683349609375, -0.6591567993164062, -0.617645263671875, -0.5761337280273438, -0.5346221923828125, -0.49311065673828125, -0.45159912109375, -0.41008758544921875, -0.3685760498046875, -0.32706451416015625, -0.285552978515625, -0.24404144287109375, -0.2025299072265625, -0.16101837158203125, -0.1195068359375, -0.07799530029296875, -0.0364837646484375, 0.00502777099609375, 0.046539306640625, 0.08805084228515625, 0.1295623779296875, 0.17107391357421875, 0.21258544921875, 0.25409698486328125, 0.2956085205078125, 0.33712005615234375, 0.378631591796875, 0.42014312744140625, 0.4616546630859375, 0.5031661987304688, 0.544677734375, 0.5861892700195312, 0.6277008056640625, 0.6692123413085938, 0.710723876953125, 0.7522354125976562, 0.7937469482421875, 0.8352584838867188, 0.87677001953125, 0.9182815551757812, 0.9597930908203125, 1.0013046264648438, 1.042816162109375, 1.0843276977539062, 1.1258392333984375, 1.1673507690429688, 1.2088623046875, 1.2503738403320312, 1.2918853759765625, 1.3333969116210938, 1.374908447265625, 1.4164199829101562, 1.4579315185546875, 1.4994430541992188, 1.54095458984375, 1.5824661254882812, 1.6239776611328125, 1.6654891967773438, 1.707000732421875, 1.7485122680664062, 1.7900238037109375, 1.8315353393554688, 1.873046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 5.0, 1.0, 8.0, 5.0, 14.0, 10.0, 23.0, 31.0, 52.0, 78.0, 162.0, 263.0, 486.0, 1058.0, 4007.0, 30004.0, 839672.0, 159977.0, 9153.0, 1969.0, 710.0, 322.0, 198.0, 110.0, 61.0, 48.0, 38.0, 16.0, 19.0, 14.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1107635498046875, -1.072113037109375, -1.0334625244140625, -0.99481201171875, -0.9561614990234375, -0.917510986328125, -0.8788604736328125, -0.8402099609375, -0.8015594482421875, -0.762908935546875, -0.7242584228515625, -0.68560791015625, -0.6469573974609375, -0.608306884765625, -0.5696563720703125, -0.531005859375, -0.4923553466796875, -0.453704833984375, -0.4150543212890625, -0.37640380859375, -0.3377532958984375, -0.299102783203125, -0.2604522705078125, -0.2218017578125, -0.1831512451171875, -0.144500732421875, -0.1058502197265625, -0.06719970703125, -0.0285491943359375, 0.010101318359375, 0.0487518310546875, 0.08740234375, 0.1260528564453125, 0.164703369140625, 0.2033538818359375, 0.24200439453125, 0.2806549072265625, 0.319305419921875, 0.3579559326171875, 0.3966064453125, 0.4352569580078125, 0.473907470703125, 0.5125579833984375, 0.55120849609375, 0.5898590087890625, 0.628509521484375, 0.6671600341796875, 0.705810546875, 0.7444610595703125, 0.783111572265625, 0.8217620849609375, 0.86041259765625, 0.8990631103515625, 0.937713623046875, 0.9763641357421875, 1.0150146484375, 1.0536651611328125, 1.092315673828125, 1.1309661865234375, 1.16961669921875, 1.2082672119140625, 1.246917724609375, 1.2855682373046875, 1.32421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 7.0, 13.0, 11.0, 11.0, 11.0, 13.0, 19.0, 25.0, 13.0, 26.0, 32.0, 31.0, 40.0, 43.0, 46.0, 48.0, 47.0, 41.0, 49.0, 42.0, 43.0, 43.0, 37.0, 47.0, 30.0, 46.0, 26.0, 21.0, 26.0, 14.0, 17.0, 13.0, 11.0, 23.0, 3.0, 8.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.796875, -0.7696533203125, -0.742431640625, -0.7152099609375, -0.68798828125, -0.6607666015625, -0.633544921875, -0.6063232421875, -0.5791015625, -0.5518798828125, -0.524658203125, -0.4974365234375, -0.47021484375, -0.4429931640625, -0.415771484375, -0.3885498046875, -0.361328125, -0.3341064453125, -0.306884765625, -0.2796630859375, -0.25244140625, -0.2252197265625, -0.197998046875, -0.1707763671875, -0.1435546875, -0.1163330078125, -0.089111328125, -0.0618896484375, -0.03466796875, -0.0074462890625, 0.019775390625, 0.0469970703125, 0.07421875, 0.1014404296875, 0.128662109375, 0.1558837890625, 0.18310546875, 0.2103271484375, 0.237548828125, 0.2647705078125, 0.2919921875, 0.3192138671875, 0.346435546875, 0.3736572265625, 0.40087890625, 0.4281005859375, 0.455322265625, 0.4825439453125, 0.509765625, 0.5369873046875, 0.564208984375, 0.5914306640625, 0.61865234375, 0.6458740234375, 0.673095703125, 0.7003173828125, 0.7275390625, 0.7547607421875, 0.781982421875, 0.8092041015625, 0.83642578125, 0.8636474609375, 0.890869140625, 0.9180908203125, 0.9453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 9.0, 10.0, 22.0, 19.0, 68.0, 100.0, 255.0, 785.0, 2964.0, 23569.0, 943674.0, 70468.0, 4832.0, 1123.0, 339.0, 140.0, 60.0, 40.0, 16.0, 10.0, 11.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.515625, -0.4998321533203125, -0.484039306640625, -0.4682464599609375, -0.45245361328125, -0.4366607666015625, -0.420867919921875, -0.4050750732421875, -0.3892822265625, -0.3734893798828125, -0.357696533203125, -0.3419036865234375, -0.32611083984375, -0.3103179931640625, -0.294525146484375, -0.2787322998046875, -0.262939453125, -0.2471466064453125, -0.231353759765625, -0.2155609130859375, -0.19976806640625, -0.1839752197265625, -0.168182373046875, -0.1523895263671875, -0.1365966796875, -0.1208038330078125, -0.105010986328125, -0.0892181396484375, -0.07342529296875, -0.0576324462890625, -0.041839599609375, -0.0260467529296875, -0.01025390625, 0.0055389404296875, 0.021331787109375, 0.0371246337890625, 0.05291748046875, 0.0687103271484375, 0.084503173828125, 0.1002960205078125, 0.1160888671875, 0.1318817138671875, 0.147674560546875, 0.1634674072265625, 0.17926025390625, 0.1950531005859375, 0.210845947265625, 0.2266387939453125, 0.242431640625, 0.2582244873046875, 0.274017333984375, 0.2898101806640625, 0.30560302734375, 0.3213958740234375, 0.337188720703125, 0.3529815673828125, 0.3687744140625, 0.3845672607421875, 0.400360107421875, 0.4161529541015625, 0.43194580078125, 0.4477386474609375, 0.463531494140625, 0.4793243408203125, 0.4951171875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 9.0, 7.0, 14.0, 17.0, 14.0, 41.0, 67.0, 90.0, 139.0, 168.0, 128.0, 97.0, 71.0, 38.0, 25.0, 17.0, 17.0, 10.0, 2.0, 5.0, 3.0, 2.0, 3.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.236532211303711e-05, -3.114994615316391e-05, -2.993457019329071e-05, -2.871919423341751e-05, -2.750381827354431e-05, -2.6288442313671112e-05, -2.5073066353797913e-05, -2.3857690393924713e-05, -2.2642314434051514e-05, -2.1426938474178314e-05, -2.0211562514305115e-05, -1.8996186554431915e-05, -1.7780810594558716e-05, -1.6565434634685516e-05, -1.5350058674812317e-05, -1.4134682714939117e-05, -1.2919306755065918e-05, -1.1703930795192719e-05, -1.0488554835319519e-05, -9.27317887544632e-06, -8.05780291557312e-06, -6.842426955699921e-06, -5.627050995826721e-06, -4.411675035953522e-06, -3.1962990760803223e-06, -1.980923116207123e-06, -7.655471563339233e-07, 4.498288035392761e-07, 1.6652047634124756e-06, 2.880580723285675e-06, 4.0959566831588745e-06, 5.311332643032074e-06, 6.5267086029052734e-06, 7.742084562778473e-06, 8.957460522651672e-06, 1.0172836482524872e-05, 1.1388212442398071e-05, 1.260358840227127e-05, 1.381896436214447e-05, 1.503434032201767e-05, 1.624971628189087e-05, 1.746509224176407e-05, 1.8680468201637268e-05, 1.9895844161510468e-05, 2.1111220121383667e-05, 2.2326596081256866e-05, 2.3541972041130066e-05, 2.4757348001003265e-05, 2.5972723960876465e-05, 2.7188099920749664e-05, 2.8403475880622864e-05, 2.9618851840496063e-05, 3.083422780036926e-05, 3.204960376024246e-05, 3.326497972011566e-05, 3.448035567998886e-05, 3.569573163986206e-05, 3.691110759973526e-05, 3.812648355960846e-05, 3.934185951948166e-05, 4.055723547935486e-05, 4.177261143922806e-05, 4.298798739910126e-05, 4.420336335897446e-05, 4.5418739318847656e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 9.0, 5.0, 12.0, 20.0, 32.0, 50.0, 111.0, 202.0, 550.0, 1877.0, 12146.0, 764591.0, 259361.0, 7357.0, 1432.0, 407.0, 160.0, 72.0, 50.0, 32.0, 20.0, 15.0, 9.0, 7.0, 7.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5498046875, -0.5335807800292969, -0.5173568725585938, -0.5011329650878906, -0.4849090576171875, -0.4686851501464844, -0.45246124267578125, -0.4362373352050781, -0.420013427734375, -0.4037895202636719, -0.38756561279296875, -0.3713417053222656, -0.3551177978515625, -0.3388938903808594, -0.32266998291015625, -0.3064460754394531, -0.29022216796875, -0.2739982604980469, -0.25777435302734375, -0.24155044555664062, -0.2253265380859375, -0.20910263061523438, -0.19287872314453125, -0.17665481567382812, -0.160430908203125, -0.14420700073242188, -0.12798309326171875, -0.11175918579101562, -0.0955352783203125, -0.07931137084960938, -0.06308746337890625, -0.046863555908203125, -0.0306396484375, -0.014415740966796875, 0.00180816650390625, 0.018032073974609375, 0.0342559814453125, 0.050479888916015625, 0.06670379638671875, 0.08292770385742188, 0.099151611328125, 0.11537551879882812, 0.13159942626953125, 0.14782333374023438, 0.1640472412109375, 0.18027114868164062, 0.19649505615234375, 0.21271896362304688, 0.22894287109375, 0.24516677856445312, 0.26139068603515625, 0.2776145935058594, 0.2938385009765625, 0.3100624084472656, 0.32628631591796875, 0.3425102233886719, 0.358734130859375, 0.3749580383300781, 0.39118194580078125, 0.4074058532714844, 0.4236297607421875, 0.4398536682128906, 0.45607757568359375, 0.4723014831542969, 0.488525390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 8.0, 4.0, 10.0, 13.0, 14.0, 22.0, 27.0, 43.0, 46.0, 71.0, 97.0, 131.0, 117.0, 103.0, 78.0, 58.0, 37.0, 32.0, 16.0, 17.0, 8.0, 9.0, 7.0, 9.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08319091796875, -0.08021831512451172, -0.07724571228027344, -0.07427310943603516, -0.07130050659179688, -0.0683279037475586, -0.06535530090332031, -0.06238269805908203, -0.05941009521484375, -0.05643749237060547, -0.05346488952636719, -0.050492286682128906, -0.047519683837890625, -0.044547080993652344, -0.04157447814941406, -0.03860187530517578, -0.0356292724609375, -0.03265666961669922, -0.029684066772460938, -0.026711463928222656, -0.023738861083984375, -0.020766258239746094, -0.017793655395507812, -0.014821052551269531, -0.01184844970703125, -0.008875846862792969, -0.0059032440185546875, -0.0029306411743164062, 4.1961669921875e-05, 0.0030145645141601562, 0.0059871673583984375, 0.008959770202636719, 0.011932373046875, 0.014904975891113281, 0.017877578735351562, 0.020850181579589844, 0.023822784423828125, 0.026795387268066406, 0.029767990112304688, 0.03274059295654297, 0.03571319580078125, 0.03868579864501953, 0.04165840148925781, 0.044631004333496094, 0.047603607177734375, 0.050576210021972656, 0.05354881286621094, 0.05652141571044922, 0.0594940185546875, 0.06246662139892578, 0.06543922424316406, 0.06841182708740234, 0.07138442993164062, 0.0743570327758789, 0.07732963562011719, 0.08030223846435547, 0.08327484130859375, 0.08624744415283203, 0.08922004699707031, 0.0921926498413086, 0.09516525268554688, 0.09813785552978516, 0.10111045837402344, 0.10408306121826172, 0.1070556640625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 17.0, 44.0, 110.0, 274.0, 291.0, 169.0, 57.0, 32.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.430222511291504, -4.327600002288818, -4.224977493286133, -4.122354984283447, -4.019732475280762, -3.917109966278076, -3.8144874572753906, -3.711864948272705, -3.6092424392700195, -3.506619930267334, -3.4039974212646484, -3.301374912261963, -3.1987524032592773, -3.096129894256592, -2.9935073852539062, -2.8908848762512207, -2.788262367248535, -2.6856398582458496, -2.583017349243164, -2.4803948402404785, -2.377772331237793, -2.2751498222351074, -2.172527313232422, -2.0699048042297363, -1.9672820568084717, -1.8646595478057861, -1.7620370388031006, -1.659414529800415, -1.5567920207977295, -1.454169511795044, -1.3515470027923584, -1.2489244937896729, -1.1463019847869873, -1.0436794757843018, -0.9410569667816162, -0.8384344577789307, -0.7358119487762451, -0.6331893801689148, -0.5305668711662292, -0.4279443621635437, -0.32532185316085815, -0.2226993441581726, -0.12007682025432587, -0.017454296350479126, 0.08516821265220642, 0.18779075145721436, 0.2904132604598999, 0.39303576946258545, 0.495658278465271, 0.5982807874679565, 0.7009032964706421, 0.8035258054733276, 0.9061483144760132, 1.0087709426879883, 1.1113934516906738, 1.2140159606933594, 1.316638469696045, 1.4192609786987305, 1.521883487701416, 1.6245059967041016, 1.727128505706787, 1.8297510147094727, 1.9323735237121582, 2.0349960327148438, 2.1376185417175293]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 9.0, 7.0, 14.0, 9.0, 13.0, 12.0, 18.0, 18.0, 21.0, 34.0, 30.0, 42.0, 41.0, 43.0, 53.0, 46.0, 41.0, 45.0, 40.0, 44.0, 54.0, 38.0, 47.0, 32.0, 41.0, 30.0, 27.0, 19.0, 18.0, 25.0, 12.0, 15.0, 17.0, 8.0, 7.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.7526599168777466, -1.7049481868743896, -1.6572365760803223, -1.6095249652862549, -1.561813235282898, -1.514101505279541, -1.4663898944854736, -1.4186782836914062, -1.3709665536880493, -1.3232548236846924, -1.275543212890625, -1.2278316020965576, -1.1801198720932007, -1.1324081420898438, -1.0846965312957764, -1.036984920501709, -0.989273190498352, -0.9415615200996399, -0.8938498497009277, -0.8461381793022156, -0.7984265089035034, -0.7507148385047913, -0.7030031681060791, -0.6552914977073669, -0.6075798273086548, -0.5598681569099426, -0.5121564865112305, -0.4644448161125183, -0.41673314571380615, -0.369021475315094, -0.32130980491638184, -0.2735981345176697, -0.22588646411895752, -0.17817479372024536, -0.1304631233215332, -0.08275145292282104, -0.03503978252410889, 0.012671887874603271, 0.06038355827331543, 0.10809522867202759, 0.15580689907073975, 0.2035185694694519, 0.25123023986816406, 0.2989419102668762, 0.3466535806655884, 0.39436525106430054, 0.4420769214630127, 0.48978859186172485, 0.537500262260437, 0.5852119326591492, 0.6329236030578613, 0.6806352734565735, 0.7283469438552856, 0.7760586142539978, 0.82377028465271, 0.8714819550514221, 0.9191936254501343, 0.9669052958488464, 1.0146169662475586, 1.062328577041626, 1.110040307044983, 1.1577520370483398, 1.2054636478424072, 1.2531752586364746, 1.3008869886398315]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 12.0, 13.0, 18.0, 37.0, 50.0, 93.0, 183.0, 298.0, 594.0, 1428.0, 4946.0, 43075.0, 2128690.0, 1965655.0, 41991.0, 4565.0, 1374.0, 587.0, 284.0, 160.0, 89.0, 45.0, 30.0, 24.0, 11.0, 8.0, 5.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.25390625, -1.2106475830078125, -1.167388916015625, -1.1241302490234375, -1.08087158203125, -1.0376129150390625, -0.994354248046875, -0.9510955810546875, -0.9078369140625, -0.8645782470703125, -0.821319580078125, -0.7780609130859375, -0.73480224609375, -0.6915435791015625, -0.648284912109375, -0.6050262451171875, -0.561767578125, -0.5185089111328125, -0.475250244140625, -0.4319915771484375, -0.38873291015625, -0.3454742431640625, -0.302215576171875, -0.2589569091796875, -0.2156982421875, -0.1724395751953125, -0.129180908203125, -0.0859222412109375, -0.04266357421875, 0.0005950927734375, 0.043853759765625, 0.0871124267578125, 0.13037109375, 0.1736297607421875, 0.216888427734375, 0.2601470947265625, 0.30340576171875, 0.3466644287109375, 0.389923095703125, 0.4331817626953125, 0.4764404296875, 0.5196990966796875, 0.562957763671875, 0.6062164306640625, 0.64947509765625, 0.6927337646484375, 0.735992431640625, 0.7792510986328125, 0.822509765625, 0.8657684326171875, 0.909027099609375, 0.9522857666015625, 0.99554443359375, 1.0388031005859375, 1.082061767578125, 1.1253204345703125, 1.1685791015625, 1.2118377685546875, 1.255096435546875, 1.2983551025390625, 1.34161376953125, 1.3848724365234375, 1.428131103515625, 1.4713897705078125, 1.5146484375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 5.0, 5.0, 14.0, 19.0, 9.0, 11.0, 20.0, 25.0, 25.0, 36.0, 38.0, 44.0, 56.0, 50.0, 60.0, 55.0, 71.0, 56.0, 57.0, 48.0, 43.0, 34.0, 46.0, 30.0, 29.0, 23.0, 17.0, 16.0, 8.0, 9.0, 12.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5176239013671875, -0.501068115234375, -0.4845123291015625, -0.46795654296875, -0.4514007568359375, -0.434844970703125, -0.4182891845703125, -0.4017333984375, -0.3851776123046875, -0.368621826171875, -0.3520660400390625, -0.33551025390625, -0.3189544677734375, -0.302398681640625, -0.2858428955078125, -0.269287109375, -0.2527313232421875, -0.236175537109375, -0.2196197509765625, -0.20306396484375, -0.1865081787109375, -0.169952392578125, -0.1533966064453125, -0.1368408203125, -0.1202850341796875, -0.103729248046875, -0.0871734619140625, -0.07061767578125, -0.0540618896484375, -0.037506103515625, -0.0209503173828125, -0.00439453125, 0.0121612548828125, 0.028717041015625, 0.0452728271484375, 0.06182861328125, 0.0783843994140625, 0.094940185546875, 0.1114959716796875, 0.1280517578125, 0.1446075439453125, 0.161163330078125, 0.1777191162109375, 0.19427490234375, 0.2108306884765625, 0.227386474609375, 0.2439422607421875, 0.260498046875, 0.2770538330078125, 0.293609619140625, 0.3101654052734375, 0.32672119140625, 0.3432769775390625, 0.359832763671875, 0.3763885498046875, 0.3929443359375, 0.4095001220703125, 0.426055908203125, 0.4426116943359375, 0.45916748046875, 0.4757232666015625, 0.492279052734375, 0.5088348388671875, 0.525390625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 11.0, 5.0, 5.0, 8.0, 13.0, 11.0, 17.0, 18.0, 23.0, 42.0, 61.0, 109.0, 124.0, 222.0, 354.0, 593.0, 1047.0, 1981.0, 5218.0, 16489.0, 81871.0, 1030515.0, 2821920.0, 190676.0, 29363.0, 7644.0, 2808.0, 1323.0, 676.0, 372.0, 239.0, 158.0, 109.0, 75.0, 55.0, 38.0, 26.0, 25.0, 12.0, 4.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.68115234375, -0.6606369018554688, -0.6401214599609375, -0.6196060180664062, -0.599090576171875, -0.5785751342773438, -0.5580596923828125, -0.5375442504882812, -0.51702880859375, -0.49651336669921875, -0.4759979248046875, -0.45548248291015625, -0.434967041015625, -0.41445159912109375, -0.3939361572265625, -0.37342071533203125, -0.3529052734375, -0.33238983154296875, -0.3118743896484375, -0.29135894775390625, -0.270843505859375, -0.25032806396484375, -0.2298126220703125, -0.20929718017578125, -0.18878173828125, -0.16826629638671875, -0.1477508544921875, -0.12723541259765625, -0.106719970703125, -0.08620452880859375, -0.0656890869140625, -0.04517364501953125, -0.024658203125, -0.00414276123046875, 0.0163726806640625, 0.03688812255859375, 0.057403564453125, 0.07791900634765625, 0.0984344482421875, 0.11894989013671875, 0.13946533203125, 0.15998077392578125, 0.1804962158203125, 0.20101165771484375, 0.221527099609375, 0.24204254150390625, 0.2625579833984375, 0.28307342529296875, 0.3035888671875, 0.32410430908203125, 0.3446197509765625, 0.36513519287109375, 0.385650634765625, 0.40616607666015625, 0.4266815185546875, 0.44719696044921875, 0.46771240234375, 0.48822784423828125, 0.5087432861328125, 0.5292587280273438, 0.549774169921875, 0.5702896118164062, 0.5908050537109375, 0.6113204956054688, 0.6318359375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 13.0, 5.0, 8.0, 14.0, 18.0, 19.0, 23.0, 24.0, 62.0, 69.0, 93.0, 140.0, 203.0, 324.0, 472.0, 510.0, 531.0, 446.0, 315.0, 224.0, 159.0, 98.0, 74.0, 64.0, 41.0, 18.0, 33.0, 15.0, 17.0, 9.0, 5.0, 8.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1910400390625, -0.18543243408203125, -0.1798248291015625, -0.17421722412109375, -0.168609619140625, -0.16300201416015625, -0.1573944091796875, -0.15178680419921875, -0.14617919921875, -0.14057159423828125, -0.1349639892578125, -0.12935638427734375, -0.123748779296875, -0.11814117431640625, -0.1125335693359375, -0.10692596435546875, -0.101318359375, -0.09571075439453125, -0.0901031494140625, -0.08449554443359375, -0.078887939453125, -0.07328033447265625, -0.0676727294921875, -0.06206512451171875, -0.05645751953125, -0.05084991455078125, -0.0452423095703125, -0.03963470458984375, -0.034027099609375, -0.02841949462890625, -0.0228118896484375, -0.01720428466796875, -0.0115966796875, -0.00598907470703125, -0.0003814697265625, 0.00522613525390625, 0.010833740234375, 0.01644134521484375, 0.0220489501953125, 0.02765655517578125, 0.03326416015625, 0.03887176513671875, 0.0444793701171875, 0.05008697509765625, 0.055694580078125, 0.06130218505859375, 0.0669097900390625, 0.07251739501953125, 0.078125, 0.08373260498046875, 0.0893402099609375, 0.09494781494140625, 0.100555419921875, 0.10616302490234375, 0.1117706298828125, 0.11737823486328125, 0.12298583984375, 0.12859344482421875, 0.1342010498046875, 0.13980865478515625, 0.145416259765625, 0.15102386474609375, 0.1566314697265625, 0.16223907470703125, 0.1678466796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 12.0, 27.0, 59.0, 123.0, 233.0, 260.0, 137.0, 93.0, 28.0, 17.0, 9.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.063856840133667, -3.0026767253875732, -2.9414968490600586, -2.880316734313965, -2.81913685798645, -2.7579567432403564, -2.6967766284942627, -2.635596752166748, -2.5744166374206543, -2.5132365226745605, -2.452056646347046, -2.390876531600952, -2.3296966552734375, -2.2685165405273438, -2.20733642578125, -2.1461565494537354, -2.0849764347076416, -2.023796319961548, -1.9626164436340332, -1.9014363288879395, -1.8402563333511353, -1.779076337814331, -1.7178963422775269, -1.6567163467407227, -1.5955363512039185, -1.5343563556671143, -1.47317636013031, -1.4119962453842163, -1.350816249847412, -1.289636254310608, -1.2284562587738037, -1.16727614402771, -1.1060962677001953, -1.0449162721633911, -0.9837362170219421, -0.9225562214851379, -0.861376166343689, -0.8001961708068848, -0.7390161752700806, -0.6778361201286316, -0.6166560649871826, -0.5554760694503784, -0.49429601430892944, -0.43311601877212524, -0.37193596363067627, -0.31075596809387207, -0.24957594275474548, -0.1883959174156189, -0.12721586227416992, -0.06603583693504333, -0.004855819046497345, 0.056324198842048645, 0.11750422418117523, 0.17868423461914062, 0.2398642599582672, 0.3010442852973938, 0.3622243106365204, 0.423404335975647, 0.48458436131477356, 0.5457643866539001, 0.6069443821907043, 0.6681244373321533, 0.7293044328689575, 0.7904844284057617, 0.8516644835472107]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 4.0, 6.0, 8.0, 12.0, 12.0, 16.0, 9.0, 25.0, 20.0, 18.0, 27.0, 52.0, 34.0, 47.0, 54.0, 50.0, 70.0, 56.0, 59.0, 46.0, 58.0, 44.0, 43.0, 49.0, 35.0, 24.0, 26.0, 17.0, 16.0, 12.0, 11.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6152368783950806, -0.5964518785476685, -0.5776668787002563, -0.5588818788528442, -0.5400968790054321, -0.5213118195533752, -0.5025268197059631, -0.483741819858551, -0.4649568200111389, -0.4461718201637268, -0.4273868203163147, -0.4086017906665802, -0.3898167908191681, -0.371031790971756, -0.3522467613220215, -0.3334617614746094, -0.31467676162719727, -0.29589176177978516, -0.27710676193237305, -0.25832173228263855, -0.23953673243522644, -0.22075173258781433, -0.20196671783924103, -0.18318170309066772, -0.16439670324325562, -0.1456117033958435, -0.1268266886472702, -0.1080416813492775, -0.08925667405128479, -0.07047166675329208, -0.05168665945529938, -0.032901644706726074, -0.01411658525466919, 0.004668422043323517, 0.023453429341316223, 0.04223843663930893, 0.061023443937301636, 0.07980845123529434, 0.09859345853328705, 0.11737847328186035, 0.13616347312927246, 0.15494847297668457, 0.17373348772525787, 0.19251850247383118, 0.2113035023212433, 0.2300885021686554, 0.2488735169172287, 0.267658531665802, 0.2864435315132141, 0.3052285313606262, 0.32401353120803833, 0.3427985608577728, 0.36158356070518494, 0.38036856055259705, 0.39915359020233154, 0.41793859004974365, 0.43672358989715576, 0.45550858974456787, 0.47429358959198, 0.4930786192417145, 0.5118635892868042, 0.5306486487388611, 0.5494336485862732, 0.5682186484336853, 0.5870036482810974]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 12.0, 26.0, 46.0, 50.0, 80.0, 177.0, 389.0, 1126.0, 4230.0, 20761.0, 124859.0, 510649.0, 318027.0, 54632.0, 9896.0, 2284.0, 665.0, 278.0, 130.0, 79.0, 50.0, 28.0, 17.0, 15.0, 14.0, 10.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1705322265625, -0.16562843322753906, -0.16072463989257812, -0.1558208465576172, -0.15091705322265625, -0.1460132598876953, -0.14110946655273438, -0.13620567321777344, -0.1313018798828125, -0.12639808654785156, -0.12149429321289062, -0.11659049987792969, -0.11168670654296875, -0.10678291320800781, -0.10187911987304688, -0.09697532653808594, -0.092071533203125, -0.08716773986816406, -0.08226394653320312, -0.07736015319824219, -0.07245635986328125, -0.06755256652832031, -0.06264877319335938, -0.05774497985839844, -0.0528411865234375, -0.04793739318847656, -0.043033599853515625, -0.03812980651855469, -0.03322601318359375, -0.028322219848632812, -0.023418426513671875, -0.018514633178710938, -0.01361083984375, -0.008707046508789062, -0.003803253173828125, 0.0011005401611328125, 0.00600433349609375, 0.010908126831054688, 0.015811920166015625, 0.020715713500976562, 0.0256195068359375, 0.030523300170898438, 0.035427093505859375, 0.04033088684082031, 0.04523468017578125, 0.05013847351074219, 0.055042266845703125, 0.05994606018066406, 0.064849853515625, 0.06975364685058594, 0.07465744018554688, 0.07956123352050781, 0.08446502685546875, 0.08936882019042969, 0.09427261352539062, 0.09917640686035156, 0.1040802001953125, 0.10898399353027344, 0.11388778686523438, 0.11879158020019531, 0.12369537353515625, 0.1285991668701172, 0.13350296020507812, 0.13840675354003906, 0.143310546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 15.0, 11.0, 16.0, 17.0, 23.0, 33.0, 48.0, 46.0, 72.0, 79.0, 87.0, 99.0, 87.0, 58.0, 69.0, 56.0, 49.0, 25.0, 27.0, 17.0, 21.0, 13.0, 12.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.458740234375, -0.4406242370605469, -0.42250823974609375, -0.4043922424316406, -0.3862762451171875, -0.3681602478027344, -0.35004425048828125, -0.3319282531738281, -0.313812255859375, -0.2956962585449219, -0.27758026123046875, -0.2594642639160156, -0.2413482666015625, -0.22323226928710938, -0.20511627197265625, -0.18700027465820312, -0.16888427734375, -0.15076828002929688, -0.13265228271484375, -0.11453628540039062, -0.0964202880859375, -0.07830429077148438, -0.06018829345703125, -0.042072296142578125, -0.023956298828125, -0.005840301513671875, 0.01227569580078125, 0.030391693115234375, 0.0485076904296875, 0.06662368774414062, 0.08473968505859375, 0.10285568237304688, 0.1209716796875, 0.13908767700195312, 0.15720367431640625, 0.17531967163085938, 0.1934356689453125, 0.21155166625976562, 0.22966766357421875, 0.24778366088867188, 0.265899658203125, 0.2840156555175781, 0.30213165283203125, 0.3202476501464844, 0.3383636474609375, 0.3564796447753906, 0.37459564208984375, 0.3927116394042969, 0.41082763671875, 0.4289436340332031, 0.44705963134765625, 0.4651756286621094, 0.4832916259765625, 0.5014076232910156, 0.5195236206054688, 0.5376396179199219, 0.555755615234375, 0.5738716125488281, 0.5919876098632812, 0.6101036071777344, 0.6282196044921875, 0.6463356018066406, 0.6644515991210938, 0.6825675964355469, 0.70068359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 4.0, 9.0, 13.0, 16.0, 20.0, 28.0, 47.0, 49.0, 87.0, 115.0, 149.0, 264.0, 381.0, 590.0, 1065.0, 1773.0, 3590.0, 6652.0, 13870.0, 29026.0, 62380.0, 128140.0, 221112.0, 247492.0, 167976.0, 84936.0, 40279.0, 18861.0, 9196.0, 4590.0, 2359.0, 1354.0, 763.0, 425.0, 274.0, 180.0, 130.0, 96.0, 76.0, 48.0, 30.0, 28.0, 18.0, 21.0, 5.0, 9.0, 11.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06072998046875, -0.05878448486328125, -0.0568389892578125, -0.05489349365234375, -0.052947998046875, -0.05100250244140625, -0.0490570068359375, -0.04711151123046875, -0.045166015625, -0.04322052001953125, -0.0412750244140625, -0.03932952880859375, -0.037384033203125, -0.03543853759765625, -0.0334930419921875, -0.03154754638671875, -0.02960205078125, -0.02765655517578125, -0.0257110595703125, -0.02376556396484375, -0.021820068359375, -0.01987457275390625, -0.0179290771484375, -0.01598358154296875, -0.0140380859375, -0.01209259033203125, -0.0101470947265625, -0.00820159912109375, -0.006256103515625, -0.00431060791015625, -0.0023651123046875, -0.00041961669921875, 0.00152587890625, 0.00347137451171875, 0.0054168701171875, 0.00736236572265625, 0.009307861328125, 0.01125335693359375, 0.0131988525390625, 0.01514434814453125, 0.01708984375, 0.01903533935546875, 0.0209808349609375, 0.02292633056640625, 0.024871826171875, 0.02681732177734375, 0.0287628173828125, 0.03070831298828125, 0.03265380859375, 0.03459930419921875, 0.0365447998046875, 0.03849029541015625, 0.040435791015625, 0.04238128662109375, 0.0443267822265625, 0.04627227783203125, 0.0482177734375, 0.05016326904296875, 0.0521087646484375, 0.05405426025390625, 0.055999755859375, 0.05794525146484375, 0.0598907470703125, 0.06183624267578125, 0.06378173828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 2.0, 3.0, 7.0, 4.0, 9.0, 10.0, 18.0, 10.0, 21.0, 11.0, 21.0, 27.0, 24.0, 31.0, 41.0, 47.0, 37.0, 52.0, 52.0, 48.0, 63.0, 44.0, 38.0, 49.0, 35.0, 45.0, 43.0, 23.0, 33.0, 14.0, 25.0, 20.0, 19.0, 8.0, 7.0, 14.0, 6.0, 8.0, 5.0, 2.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.69921875, -0.6778106689453125, -0.656402587890625, -0.6349945068359375, -0.61358642578125, -0.5921783447265625, -0.570770263671875, -0.5493621826171875, -0.5279541015625, -0.5065460205078125, -0.485137939453125, -0.4637298583984375, -0.44232177734375, -0.4209136962890625, -0.399505615234375, -0.3780975341796875, -0.356689453125, -0.3352813720703125, -0.313873291015625, -0.2924652099609375, -0.27105712890625, -0.2496490478515625, -0.228240966796875, -0.2068328857421875, -0.1854248046875, -0.1640167236328125, -0.142608642578125, -0.1212005615234375, -0.09979248046875, -0.0783843994140625, -0.056976318359375, -0.0355682373046875, -0.01416015625, 0.0072479248046875, 0.028656005859375, 0.0500640869140625, 0.07147216796875, 0.0928802490234375, 0.114288330078125, 0.1356964111328125, 0.1571044921875, 0.1785125732421875, 0.199920654296875, 0.2213287353515625, 0.24273681640625, 0.2641448974609375, 0.285552978515625, 0.3069610595703125, 0.328369140625, 0.3497772216796875, 0.371185302734375, 0.3925933837890625, 0.41400146484375, 0.4354095458984375, 0.456817626953125, 0.4782257080078125, 0.4996337890625, 0.5210418701171875, 0.542449951171875, 0.5638580322265625, 0.58526611328125, 0.6066741943359375, 0.628082275390625, 0.6494903564453125, 0.6708984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 5.0, 9.0, 24.0, 33.0, 56.0, 55.0, 92.0, 122.0, 208.0, 363.0, 650.0, 1044.0, 2137.0, 4728.0, 12165.0, 39406.0, 156823.0, 449738.0, 277935.0, 69672.0, 19766.0, 7049.0, 2997.0, 1528.0, 792.0, 432.0, 235.0, 173.0, 114.0, 67.0, 34.0, 29.0, 17.0, 12.0, 9.0, 4.0, 7.0, 1.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.032379150390625, -0.03135824203491211, -0.03033733367919922, -0.029316425323486328, -0.028295516967773438, -0.027274608612060547, -0.026253700256347656, -0.025232791900634766, -0.024211883544921875, -0.023190975189208984, -0.022170066833496094, -0.021149158477783203, -0.020128250122070312, -0.019107341766357422, -0.01808643341064453, -0.01706552505493164, -0.01604461669921875, -0.01502370834350586, -0.014002799987792969, -0.012981891632080078, -0.011960983276367188, -0.010940074920654297, -0.009919166564941406, -0.008898258209228516, -0.007877349853515625, -0.006856441497802734, -0.005835533142089844, -0.004814624786376953, -0.0037937164306640625, -0.002772808074951172, -0.0017518997192382812, -0.0007309913635253906, 0.0002899169921875, 0.0013108253479003906, 0.0023317337036132812, 0.003352642059326172, 0.0043735504150390625, 0.005394458770751953, 0.006415367126464844, 0.007436275482177734, 0.008457183837890625, 0.009478092193603516, 0.010499000549316406, 0.011519908905029297, 0.012540817260742188, 0.013561725616455078, 0.014582633972167969, 0.01560354232788086, 0.01662445068359375, 0.01764535903930664, 0.01866626739501953, 0.019687175750732422, 0.020708084106445312, 0.021728992462158203, 0.022749900817871094, 0.023770809173583984, 0.024791717529296875, 0.025812625885009766, 0.026833534240722656, 0.027854442596435547, 0.028875350952148438, 0.029896259307861328, 0.03091716766357422, 0.03193807601928711, 0.032958984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 12.0, 16.0, 17.0, 30.0, 40.0, 70.0, 70.0, 85.0, 88.0, 99.0, 97.0, 99.0, 67.0, 62.0, 44.0, 38.0, 22.0, 11.0, 3.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71661376953125e-05, -1.6568228602409363e-05, -1.5970319509506226e-05, -1.537241041660309e-05, -1.4774501323699951e-05, -1.4176592230796814e-05, -1.3578683137893677e-05, -1.298077404499054e-05, -1.2382864952087402e-05, -1.1784955859184265e-05, -1.1187046766281128e-05, -1.058913767337799e-05, -9.991228580474854e-06, -9.393319487571716e-06, -8.795410394668579e-06, -8.197501301765442e-06, -7.599592208862305e-06, -7.0016831159591675e-06, -6.40377402305603e-06, -5.805864930152893e-06, -5.207955837249756e-06, -4.610046744346619e-06, -4.0121376514434814e-06, -3.4142285585403442e-06, -2.816319465637207e-06, -2.21841037273407e-06, -1.6205012798309326e-06, -1.0225921869277954e-06, -4.246830940246582e-07, 1.73225998878479e-07, 7.711350917816162e-07, 1.3690441846847534e-06, 1.9669532775878906e-06, 2.564862370491028e-06, 3.162771463394165e-06, 3.7606805562973022e-06, 4.3585896492004395e-06, 4.956498742103577e-06, 5.554407835006714e-06, 6.152316927909851e-06, 6.750226020812988e-06, 7.3481351137161255e-06, 7.946044206619263e-06, 8.5439532995224e-06, 9.141862392425537e-06, 9.739771485328674e-06, 1.0337680578231812e-05, 1.0935589671134949e-05, 1.1533498764038086e-05, 1.2131407856941223e-05, 1.272931694984436e-05, 1.3327226042747498e-05, 1.3925135135650635e-05, 1.4523044228553772e-05, 1.512095332145691e-05, 1.5718862414360046e-05, 1.6316771507263184e-05, 1.691468060016632e-05, 1.7512589693069458e-05, 1.8110498785972595e-05, 1.8708407878875732e-05, 1.930631697177887e-05, 1.9904226064682007e-05, 2.0502135157585144e-05, 2.110004425048828e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 5.0, 20.0, 18.0, 24.0, 43.0, 61.0, 64.0, 108.0, 189.0, 316.0, 570.0, 1202.0, 2655.0, 7204.0, 22753.0, 79725.0, 257296.0, 393055.0, 198391.0, 58016.0, 16840.0, 5666.0, 2142.0, 945.0, 468.0, 291.0, 154.0, 102.0, 59.0, 43.0, 40.0, 20.0, 12.0, 14.0, 14.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.031524658203125, -0.03058004379272461, -0.02963542938232422, -0.028690814971923828, -0.027746200561523438, -0.026801586151123047, -0.025856971740722656, -0.024912357330322266, -0.023967742919921875, -0.023023128509521484, -0.022078514099121094, -0.021133899688720703, -0.020189285278320312, -0.019244670867919922, -0.01830005645751953, -0.01735544204711914, -0.01641082763671875, -0.01546621322631836, -0.014521598815917969, -0.013576984405517578, -0.012632369995117188, -0.011687755584716797, -0.010743141174316406, -0.009798526763916016, -0.008853912353515625, -0.007909297943115234, -0.006964683532714844, -0.006020069122314453, -0.0050754547119140625, -0.004130840301513672, -0.0031862258911132812, -0.0022416114807128906, -0.0012969970703125, -0.0003523826599121094, 0.0005922317504882812, 0.0015368461608886719, 0.0024814605712890625, 0.003426074981689453, 0.004370689392089844, 0.005315303802490234, 0.006259918212890625, 0.007204532623291016, 0.008149147033691406, 0.009093761444091797, 0.010038375854492188, 0.010982990264892578, 0.011927604675292969, 0.01287221908569336, 0.01381683349609375, 0.01476144790649414, 0.01570606231689453, 0.016650676727294922, 0.017595291137695312, 0.018539905548095703, 0.019484519958496094, 0.020429134368896484, 0.021373748779296875, 0.022318363189697266, 0.023262977600097656, 0.024207592010498047, 0.025152206420898438, 0.026096820831298828, 0.02704143524169922, 0.02798604965209961, 0.0289306640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 1.0, 8.0, 11.0, 6.0, 12.0, 15.0, 9.0, 20.0, 29.0, 32.0, 40.0, 40.0, 33.0, 59.0, 59.0, 63.0, 52.0, 52.0, 51.0, 45.0, 64.0, 34.0, 39.0, 36.0, 36.0, 31.0, 12.0, 19.0, 18.0, 23.0, 12.0, 7.0, 3.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.008056640625, -0.007813096046447754, -0.007569551467895508, -0.007326006889343262, -0.007082462310791016, -0.0068389177322387695, -0.0065953731536865234, -0.006351828575134277, -0.006108283996582031, -0.005864739418029785, -0.005621194839477539, -0.005377650260925293, -0.005134105682373047, -0.004890561103820801, -0.004647016525268555, -0.004403471946716309, -0.0041599273681640625, -0.003916382789611816, -0.0036728382110595703, -0.0034292936325073242, -0.003185749053955078, -0.002942204475402832, -0.002698659896850586, -0.00245511531829834, -0.0022115707397460938, -0.0019680261611938477, -0.0017244815826416016, -0.0014809370040893555, -0.0012373924255371094, -0.0009938478469848633, -0.0007503032684326172, -0.0005067586898803711, -0.000263214111328125, -1.9669532775878906e-05, 0.0002238750457763672, 0.0004674196243286133, 0.0007109642028808594, 0.0009545087814331055, 0.0011980533599853516, 0.0014415979385375977, 0.0016851425170898438, 0.0019286870956420898, 0.002172231674194336, 0.002415776252746582, 0.002659320831298828, 0.0029028654098510742, 0.0031464099884033203, 0.0033899545669555664, 0.0036334991455078125, 0.0038770437240600586, 0.004120588302612305, 0.004364132881164551, 0.004607677459716797, 0.004851222038269043, 0.005094766616821289, 0.005338311195373535, 0.005581855773925781, 0.005825400352478027, 0.0060689449310302734, 0.0063124895095825195, 0.006556034088134766, 0.006799578666687012, 0.007043123245239258, 0.007286667823791504, 0.00753021240234375]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 167.0, 753.0, 77.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.984787940979004, -7.8405842781066895, -7.696380615234375, -7.5521769523620605, -7.407973289489746, -7.263769626617432, -7.119565963745117, -6.975362300872803, -6.831158638000488, -6.686954975128174, -6.542751312255859, -6.398547649383545, -6.2543439865112305, -6.110140323638916, -5.965936660766602, -5.821732997894287, -5.677529335021973, -5.533325672149658, -5.389122009277344, -5.244918346405029, -5.100714683532715, -4.9565110206604, -4.812307357788086, -4.6681036949157715, -4.523899555206299, -4.379695892333984, -4.23549222946167, -4.0912885665893555, -3.947084903717041, -3.8028812408447266, -3.658677577972412, -3.5144739151000977, -3.3702704906463623, -3.226066827774048, -3.0818631649017334, -2.937659502029419, -2.7934558391571045, -2.64925217628479, -2.5050482749938965, -2.360844612121582, -2.2166409492492676, -2.072437286376953, -1.9282336235046387, -1.7840299606323242, -1.6398262977600098, -1.4956226348876953, -1.3514188528060913, -1.2072151899337769, -1.063011646270752, -0.9188079833984375, -0.774604320526123, -0.6304005980491638, -0.48619693517684937, -0.3419932723045349, -0.19778954982757568, -0.05358588695526123, 0.09061777591705322, 0.23482145369052887, 0.3790251314640045, 0.5232288241386414, 0.6674324870109558, 0.8116361498832703, 0.9558398723602295, 1.100043535232544, 1.2442471981048584]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 7.0, 5.0, 7.0, 13.0, 15.0, 17.0, 17.0, 23.0, 21.0, 37.0, 51.0, 42.0, 75.0, 81.0, 71.0, 79.0, 71.0, 70.0, 54.0, 57.0, 40.0, 38.0, 26.0, 20.0, 16.0, 20.0, 7.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4294459819793701, -0.4136611819267273, -0.3978763818740845, -0.38209158182144165, -0.36630678176879883, -0.350521981716156, -0.3347371518611908, -0.318952351808548, -0.30316755175590515, -0.28738275170326233, -0.2715979516506195, -0.2558131515979767, -0.24002833664417267, -0.22424353659152985, -0.20845872163772583, -0.192673921585083, -0.17688912153244019, -0.16110432147979736, -0.14531952142715454, -0.12953470647335052, -0.1137499064207077, -0.09796510636806488, -0.08218029886484146, -0.06639549136161804, -0.05061069130897522, -0.0348258875310421, -0.01904108375310898, -0.0032562799751758575, 0.012528523802757263, 0.028313323855400085, 0.044098131358623505, 0.059882938861846924, 0.07566767930984497, 0.09145247936248779, 0.10723728686571121, 0.12302209436893463, 0.13880689442157745, 0.15459169447422028, 0.1703765094280243, 0.18616130948066711, 0.20194610953330994, 0.21773090958595276, 0.23351570963859558, 0.2493005245923996, 0.2650853395462036, 0.28087013959884644, 0.29665493965148926, 0.3124397397041321, 0.3282245397567749, 0.3440093398094177, 0.35979413986206055, 0.37557893991470337, 0.3913637399673462, 0.407148540019989, 0.4229333698749542, 0.43871816992759705, 0.45450296998023987, 0.4702877700328827, 0.4860725700855255, 0.5018573999404907, 0.5176421999931335, 0.5334270000457764, 0.5492118000984192, 0.564996600151062, 0.5807814002037048]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 12.0, 15.0, 9.0, 24.0, 30.0, 41.0, 72.0, 105.0, 190.0, 268.0, 428.0, 668.0, 1114.0, 2057.0, 4166.0, 8619.0, 19970.0, 53038.0, 169025.0, 415145.0, 247196.0, 76592.0, 26991.0, 11199.0, 5232.0, 2665.0, 1466.0, 840.0, 505.0, 318.0, 170.0, 97.0, 85.0, 59.0, 26.0, 29.0, 21.0, 13.0, 11.0, 11.0, 3.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.335693359375, -0.32572174072265625, -0.3157501220703125, -0.30577850341796875, -0.295806884765625, -0.28583526611328125, -0.2758636474609375, -0.26589202880859375, -0.25592041015625, -0.24594879150390625, -0.2359771728515625, -0.22600555419921875, -0.216033935546875, -0.20606231689453125, -0.1960906982421875, -0.18611907958984375, -0.1761474609375, -0.16617584228515625, -0.1562042236328125, -0.14623260498046875, -0.136260986328125, -0.12628936767578125, -0.1163177490234375, -0.10634613037109375, -0.09637451171875, -0.08640289306640625, -0.0764312744140625, -0.06645965576171875, -0.056488037109375, -0.04651641845703125, -0.0365447998046875, -0.02657318115234375, -0.0166015625, -0.00662994384765625, 0.0033416748046875, 0.01331329345703125, 0.023284912109375, 0.03325653076171875, 0.0432281494140625, 0.05319976806640625, 0.06317138671875, 0.07314300537109375, 0.0831146240234375, 0.09308624267578125, 0.103057861328125, 0.11302947998046875, 0.1230010986328125, 0.13297271728515625, 0.1429443359375, 0.15291595458984375, 0.1628875732421875, 0.17285919189453125, 0.182830810546875, 0.19280242919921875, 0.2027740478515625, 0.21274566650390625, 0.22271728515625, 0.23268890380859375, 0.2426605224609375, 0.25263214111328125, 0.262603759765625, 0.27257537841796875, 0.2825469970703125, 0.29251861572265625, 0.302490234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 4.0, 5.0, 8.0, 3.0, 14.0, 13.0, 13.0, 15.0, 21.0, 17.0, 22.0, 27.0, 33.0, 43.0, 49.0, 40.0, 57.0, 65.0, 55.0, 55.0, 66.0, 45.0, 55.0, 41.0, 25.0, 37.0, 32.0, 24.0, 22.0, 15.0, 17.0, 16.0, 13.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8583984375, -0.8349456787109375, -0.811492919921875, -0.7880401611328125, -0.76458740234375, -0.7411346435546875, -0.717681884765625, -0.6942291259765625, -0.6707763671875, -0.6473236083984375, -0.623870849609375, -0.6004180908203125, -0.57696533203125, -0.5535125732421875, -0.530059814453125, -0.5066070556640625, -0.483154296875, -0.4597015380859375, -0.436248779296875, -0.4127960205078125, -0.38934326171875, -0.3658905029296875, -0.342437744140625, -0.3189849853515625, -0.2955322265625, -0.2720794677734375, -0.248626708984375, -0.2251739501953125, -0.20172119140625, -0.1782684326171875, -0.154815673828125, -0.1313629150390625, -0.10791015625, -0.0844573974609375, -0.061004638671875, -0.0375518798828125, -0.01409912109375, 0.0093536376953125, 0.032806396484375, 0.0562591552734375, 0.0797119140625, 0.1031646728515625, 0.126617431640625, 0.1500701904296875, 0.17352294921875, 0.1969757080078125, 0.220428466796875, 0.2438812255859375, 0.267333984375, 0.2907867431640625, 0.314239501953125, 0.3376922607421875, 0.36114501953125, 0.3845977783203125, 0.408050537109375, 0.4315032958984375, 0.4549560546875, 0.4784088134765625, 0.501861572265625, 0.5253143310546875, 0.54876708984375, 0.5722198486328125, 0.595672607421875, 0.6191253662109375, 0.642578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 4.0, 13.0, 14.0, 18.0, 16.0, 39.0, 63.0, 123.0, 197.0, 494.0, 2044.0, 39623.0, 952473.0, 50160.0, 2231.0, 540.0, 209.0, 92.0, 57.0, 40.0, 32.0, 19.0, 16.0, 8.0, 6.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.042724609375, -1.00341796875, -0.964111328125, -0.9248046875, -0.885498046875, -0.84619140625, -0.806884765625, -0.767578125, -0.728271484375, -0.68896484375, -0.649658203125, -0.6103515625, -0.571044921875, -0.53173828125, -0.492431640625, -0.453125, -0.413818359375, -0.37451171875, -0.335205078125, -0.2958984375, -0.256591796875, -0.21728515625, -0.177978515625, -0.138671875, -0.099365234375, -0.06005859375, -0.020751953125, 0.0185546875, 0.057861328125, 0.09716796875, 0.136474609375, 0.17578125, 0.215087890625, 0.25439453125, 0.293701171875, 0.3330078125, 0.372314453125, 0.41162109375, 0.450927734375, 0.490234375, 0.529541015625, 0.56884765625, 0.608154296875, 0.6474609375, 0.686767578125, 0.72607421875, 0.765380859375, 0.8046875, 0.843994140625, 0.88330078125, 0.922607421875, 0.9619140625, 1.001220703125, 1.04052734375, 1.079833984375, 1.119140625, 1.158447265625, 1.19775390625, 1.237060546875, 1.2763671875, 1.315673828125, 1.35498046875, 1.394287109375, 1.43359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 1.0, 2.0, 6.0, 7.0, 11.0, 11.0, 17.0, 16.0, 19.0, 27.0, 25.0, 22.0, 27.0, 35.0, 44.0, 42.0, 24.0, 42.0, 57.0, 36.0, 46.0, 47.0, 49.0, 48.0, 37.0, 36.0, 35.0, 28.0, 31.0, 33.0, 19.0, 25.0, 17.0, 11.0, 15.0, 14.0, 10.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.81640625, -0.7922134399414062, -0.7680206298828125, -0.7438278198242188, -0.719635009765625, -0.6954421997070312, -0.6712493896484375, -0.6470565795898438, -0.62286376953125, -0.5986709594726562, -0.5744781494140625, -0.5502853393554688, -0.526092529296875, -0.5018997192382812, -0.4777069091796875, -0.45351409912109375, -0.4293212890625, -0.40512847900390625, -0.3809356689453125, -0.35674285888671875, -0.332550048828125, -0.30835723876953125, -0.2841644287109375, -0.25997161865234375, -0.23577880859375, -0.21158599853515625, -0.1873931884765625, -0.16320037841796875, -0.139007568359375, -0.11481475830078125, -0.0906219482421875, -0.06642913818359375, -0.042236328125, -0.01804351806640625, 0.0061492919921875, 0.03034210205078125, 0.054534912109375, 0.07872772216796875, 0.1029205322265625, 0.12711334228515625, 0.15130615234375, 0.17549896240234375, 0.1996917724609375, 0.22388458251953125, 0.248077392578125, 0.27227020263671875, 0.2964630126953125, 0.32065582275390625, 0.3448486328125, 0.36904144287109375, 0.3932342529296875, 0.41742706298828125, 0.441619873046875, 0.46581268310546875, 0.4900054931640625, 0.5141983032226562, 0.53839111328125, 0.5625839233398438, 0.5867767333984375, 0.6109695434570312, 0.635162353515625, 0.6593551635742188, 0.6835479736328125, 0.7077407836914062, 0.73193359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 7.0, 9.0, 19.0, 34.0, 84.0, 158.0, 458.0, 1627.0, 10430.0, 895634.0, 134281.0, 4337.0, 892.0, 317.0, 117.0, 54.0, 29.0, 14.0, 9.0, 5.0, 8.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.494384765625, -0.4766044616699219, -0.45882415771484375, -0.4410438537597656, -0.4232635498046875, -0.4054832458496094, -0.38770294189453125, -0.3699226379394531, -0.352142333984375, -0.3343620300292969, -0.31658172607421875, -0.2988014221191406, -0.2810211181640625, -0.2632408142089844, -0.24546051025390625, -0.22768020629882812, -0.20989990234375, -0.19211959838867188, -0.17433929443359375, -0.15655899047851562, -0.1387786865234375, -0.12099838256835938, -0.10321807861328125, -0.08543777465820312, -0.067657470703125, -0.049877166748046875, -0.03209686279296875, -0.014316558837890625, 0.0034637451171875, 0.021244049072265625, 0.03902435302734375, 0.056804656982421875, 0.0745849609375, 0.09236526489257812, 0.11014556884765625, 0.12792587280273438, 0.1457061767578125, 0.16348648071289062, 0.18126678466796875, 0.19904708862304688, 0.216827392578125, 0.23460769653320312, 0.25238800048828125, 0.2701683044433594, 0.2879486083984375, 0.3057289123535156, 0.32350921630859375, 0.3412895202636719, 0.35906982421875, 0.3768501281738281, 0.39463043212890625, 0.4124107360839844, 0.4301910400390625, 0.4479713439941406, 0.46575164794921875, 0.4835319519042969, 0.501312255859375, 0.5190925598144531, 0.5368728637695312, 0.5546531677246094, 0.5724334716796875, 0.5902137756347656, 0.6079940795898438, 0.6257743835449219, 0.6435546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 9.0, 10.0, 10.0, 25.0, 33.0, 58.0, 95.0, 153.0, 182.0, 167.0, 100.0, 63.0, 30.0, 18.0, 19.0, 9.0, 11.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.863739013671875e-05, -4.7147274017333984e-05, -4.565715789794922e-05, -4.416704177856445e-05, -4.267692565917969e-05, -4.118680953979492e-05, -3.9696693420410156e-05, -3.820657730102539e-05, -3.6716461181640625e-05, -3.522634506225586e-05, -3.3736228942871094e-05, -3.224611282348633e-05, -3.075599670410156e-05, -2.9265880584716797e-05, -2.777576446533203e-05, -2.6285648345947266e-05, -2.47955322265625e-05, -2.3305416107177734e-05, -2.181529998779297e-05, -2.0325183868408203e-05, -1.8835067749023438e-05, -1.7344951629638672e-05, -1.5854835510253906e-05, -1.436471939086914e-05, -1.2874603271484375e-05, -1.138448715209961e-05, -9.894371032714844e-06, -8.404254913330078e-06, -6.9141387939453125e-06, -5.424022674560547e-06, -3.933906555175781e-06, -2.4437904357910156e-06, -9.5367431640625e-07, 5.364418029785156e-07, 2.0265579223632812e-06, 3.516674041748047e-06, 5.0067901611328125e-06, 6.496906280517578e-06, 7.987022399902344e-06, 9.47713851928711e-06, 1.0967254638671875e-05, 1.245737075805664e-05, 1.3947486877441406e-05, 1.5437602996826172e-05, 1.6927719116210938e-05, 1.8417835235595703e-05, 1.990795135498047e-05, 2.1398067474365234e-05, 2.288818359375e-05, 2.4378299713134766e-05, 2.586841583251953e-05, 2.7358531951904297e-05, 2.8848648071289062e-05, 3.0338764190673828e-05, 3.1828880310058594e-05, 3.331899642944336e-05, 3.4809112548828125e-05, 3.629922866821289e-05, 3.7789344787597656e-05, 3.927946090698242e-05, 4.076957702636719e-05, 4.225969314575195e-05, 4.374980926513672e-05, 4.5239925384521484e-05, 4.673004150390625e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 10.0, 4.0, 11.0, 17.0, 22.0, 35.0, 69.0, 109.0, 218.0, 532.0, 1424.0, 6051.0, 95980.0, 909639.0, 28870.0, 3649.0, 1049.0, 409.0, 182.0, 93.0, 55.0, 30.0, 27.0, 17.0, 9.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4462890625, -0.4329032897949219, -0.41951751708984375, -0.4061317443847656, -0.3927459716796875, -0.3793601989746094, -0.36597442626953125, -0.3525886535644531, -0.339202880859375, -0.3258171081542969, -0.31243133544921875, -0.2990455627441406, -0.2856597900390625, -0.2722740173339844, -0.25888824462890625, -0.24550247192382812, -0.23211669921875, -0.21873092651367188, -0.20534515380859375, -0.19195938110351562, -0.1785736083984375, -0.16518783569335938, -0.15180206298828125, -0.13841629028320312, -0.125030517578125, -0.11164474487304688, -0.09825897216796875, -0.08487319946289062, -0.0714874267578125, -0.058101654052734375, -0.04471588134765625, -0.031330108642578125, -0.0179443359375, -0.004558563232421875, 0.00882720947265625, 0.022212982177734375, 0.0355987548828125, 0.048984527587890625, 0.06237030029296875, 0.07575607299804688, 0.089141845703125, 0.10252761840820312, 0.11591339111328125, 0.12929916381835938, 0.1426849365234375, 0.15607070922851562, 0.16945648193359375, 0.18284225463867188, 0.19622802734375, 0.20961380004882812, 0.22299957275390625, 0.23638534545898438, 0.2497711181640625, 0.2631568908691406, 0.27654266357421875, 0.2899284362792969, 0.303314208984375, 0.3166999816894531, 0.33008575439453125, 0.3434715270996094, 0.3568572998046875, 0.3702430725097656, 0.38362884521484375, 0.3970146179199219, 0.410400390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 13.0, 16.0, 9.0, 23.0, 35.0, 48.0, 59.0, 106.0, 132.0, 119.0, 113.0, 112.0, 46.0, 49.0, 31.0, 24.0, 13.0, 9.0, 12.0, 5.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08697509765625, -0.08391666412353516, -0.08085823059082031, -0.07779979705810547, -0.07474136352539062, -0.07168292999267578, -0.06862449645996094, -0.0655660629272461, -0.06250762939453125, -0.059449195861816406, -0.05639076232910156, -0.05333232879638672, -0.050273895263671875, -0.04721546173095703, -0.04415702819824219, -0.041098594665527344, -0.0380401611328125, -0.034981727600097656, -0.03192329406738281, -0.02886486053466797, -0.025806427001953125, -0.02274799346923828, -0.019689559936523438, -0.016631126403808594, -0.01357269287109375, -0.010514259338378906, -0.0074558258056640625, -0.004397392272949219, -0.001338958740234375, 0.0017194747924804688, 0.0047779083251953125, 0.007836341857910156, 0.010894775390625, 0.013953208923339844, 0.017011642456054688, 0.02007007598876953, 0.023128509521484375, 0.02618694305419922, 0.029245376586914062, 0.032303810119628906, 0.03536224365234375, 0.038420677185058594, 0.04147911071777344, 0.04453754425048828, 0.047595977783203125, 0.05065441131591797, 0.05371284484863281, 0.056771278381347656, 0.0598297119140625, 0.06288814544677734, 0.06594657897949219, 0.06900501251220703, 0.07206344604492188, 0.07512187957763672, 0.07818031311035156, 0.0812387466430664, 0.08429718017578125, 0.0873556137084961, 0.09041404724121094, 0.09347248077392578, 0.09653091430664062, 0.09958934783935547, 0.10264778137207031, 0.10570621490478516, 0.1087646484375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 13.0, 49.0, 112.0, 210.0, 264.0, 198.0, 92.0, 30.0, 11.0, 14.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.367982864379883, -2.284615993499756, -2.201249122619629, -2.117882251739502, -2.034515380859375, -1.951148509979248, -1.867781639099121, -1.7844147682189941, -1.7010478973388672, -1.6176810264587402, -1.5343141555786133, -1.4509472846984863, -1.3675804138183594, -1.2842135429382324, -1.2008466720581055, -1.1174798011779785, -1.0341129302978516, -0.9507460594177246, -0.8673791885375977, -0.7840123176574707, -0.7006454467773438, -0.6172785758972168, -0.5339117050170898, -0.4505448341369629, -0.36717796325683594, -0.283811092376709, -0.20044422149658203, -0.11707735061645508, -0.033710479736328125, 0.04965639114379883, 0.13302326202392578, 0.21639013290405273, 0.2997572422027588, 0.38312411308288574, 0.4664909839630127, 0.5498578548431396, 0.6332247257232666, 0.7165915966033936, 0.7999584674835205, 0.8833253383636475, 0.9666922092437744, 1.0500590801239014, 1.1334259510040283, 1.2167928218841553, 1.3001596927642822, 1.3835265636444092, 1.4668934345245361, 1.550260305404663, 1.63362717628479, 1.716994047164917, 1.800360918045044, 1.883727788925171, 1.9670946598052979, 2.050461530685425, 2.1338284015655518, 2.2171952724456787, 2.3005621433258057, 2.3839290142059326, 2.4672958850860596, 2.5506627559661865, 2.6340296268463135, 2.7173964977264404, 2.8007633686065674, 2.8841302394866943, 2.9674971103668213]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 15.0, 9.0, 13.0, 22.0, 21.0, 23.0, 32.0, 30.0, 34.0, 36.0, 31.0, 43.0, 46.0, 48.0, 51.0, 49.0, 48.0, 45.0, 42.0, 38.0, 34.0, 32.0, 31.0, 20.0, 15.0, 25.0, 21.0, 20.0, 18.0, 16.0, 16.0, 9.0, 13.0, 8.0, 3.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.428632140159607, -1.3868021965026855, -1.3449722528457642, -1.3031423091888428, -1.2613122463226318, -1.2194823026657104, -1.177652359008789, -1.1358224153518677, -1.0939924716949463, -1.052162528038025, -1.0103325843811035, -0.9685025811195374, -0.926672637462616, -0.8848426938056946, -0.8430126905441284, -0.801182746887207, -0.7593528032302856, -0.7175228595733643, -0.6756929159164429, -0.6338629126548767, -0.5920329689979553, -0.5502030253410339, -0.5083730220794678, -0.4665430784225464, -0.424713134765625, -0.3828831911087036, -0.34105321764945984, -0.29922324419021606, -0.2573933005332947, -0.2155633419752121, -0.17373338341712952, -0.13190340995788574, -0.0900733470916748, -0.048243388533592224, -0.0064134299755096436, 0.03541652858257294, 0.07724648714065552, 0.1190764456987381, 0.16090640425682068, 0.20273637771606445, 0.24456632137298584, 0.2863962650299072, 0.328226238489151, 0.3700562119483948, 0.41188615560531616, 0.45371609926223755, 0.4955460727214813, 0.5373760461807251, 0.5792059898376465, 0.6210359334945679, 0.6628658771514893, 0.7046958804130554, 0.7465258240699768, 0.7883557677268982, 0.8301857709884644, 0.8720157146453857, 0.9138456583023071, 0.9556756019592285, 0.9975055456161499, 1.0393354892730713, 1.0811655521392822, 1.1229954957962036, 1.164825439453125, 1.2066553831100464, 1.2484853267669678]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 2.0, 4.0, 10.0, 8.0, 13.0, 27.0, 30.0, 48.0, 84.0, 144.0, 240.0, 442.0, 1059.0, 2567.0, 8121.0, 52529.0, 1066541.0, 2839877.0, 197661.0, 18607.0, 3807.0, 1273.0, 542.0, 285.0, 118.0, 78.0, 63.0, 31.0, 24.0, 8.0, 10.0, 10.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86474609375, -0.8361358642578125, -0.807525634765625, -0.7789154052734375, -0.75030517578125, -0.7216949462890625, -0.693084716796875, -0.6644744873046875, -0.6358642578125, -0.6072540283203125, -0.578643798828125, -0.5500335693359375, -0.52142333984375, -0.4928131103515625, -0.464202880859375, -0.4355926513671875, -0.406982421875, -0.3783721923828125, -0.349761962890625, -0.3211517333984375, -0.29254150390625, -0.2639312744140625, -0.235321044921875, -0.2067108154296875, -0.1781005859375, -0.1494903564453125, -0.120880126953125, -0.0922698974609375, -0.06365966796875, -0.0350494384765625, -0.006439208984375, 0.0221710205078125, 0.05078125, 0.0793914794921875, 0.108001708984375, 0.1366119384765625, 0.16522216796875, 0.1938323974609375, 0.222442626953125, 0.2510528564453125, 0.2796630859375, 0.3082733154296875, 0.336883544921875, 0.3654937744140625, 0.39410400390625, 0.4227142333984375, 0.451324462890625, 0.4799346923828125, 0.508544921875, 0.5371551513671875, 0.565765380859375, 0.5943756103515625, 0.62298583984375, 0.6515960693359375, 0.680206298828125, 0.7088165283203125, 0.7374267578125, 0.7660369873046875, 0.794647216796875, 0.8232574462890625, 0.85186767578125, 0.8804779052734375, 0.909088134765625, 0.9376983642578125, 0.96630859375]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 8.0, 7.0, 9.0, 11.0, 26.0, 17.0, 31.0, 36.0, 54.0, 64.0, 75.0, 85.0, 95.0, 92.0, 80.0, 72.0, 60.0, 62.0, 27.0, 31.0, 18.0, 13.0, 8.0, 12.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.619140625, -0.5959548950195312, -0.5727691650390625, -0.5495834350585938, -0.526397705078125, -0.5032119750976562, -0.4800262451171875, -0.45684051513671875, -0.43365478515625, -0.41046905517578125, -0.3872833251953125, -0.36409759521484375, -0.340911865234375, -0.31772613525390625, -0.2945404052734375, -0.27135467529296875, -0.2481689453125, -0.22498321533203125, -0.2017974853515625, -0.17861175537109375, -0.155426025390625, -0.13224029541015625, -0.1090545654296875, -0.08586883544921875, -0.06268310546875, -0.03949737548828125, -0.0163116455078125, 0.00687408447265625, 0.030059814453125, 0.05324554443359375, 0.0764312744140625, 0.09961700439453125, 0.122802734375, 0.14598846435546875, 0.1691741943359375, 0.19235992431640625, 0.215545654296875, 0.23873138427734375, 0.2619171142578125, 0.28510284423828125, 0.30828857421875, 0.33147430419921875, 0.3546600341796875, 0.37784576416015625, 0.401031494140625, 0.42421722412109375, 0.4474029541015625, 0.47058868408203125, 0.4937744140625, 0.5169601440429688, 0.5401458740234375, 0.5633316040039062, 0.586517333984375, 0.6097030639648438, 0.6328887939453125, 0.6560745239257812, 0.67926025390625, 0.7024459838867188, 0.7256317138671875, 0.7488174438476562, 0.772003173828125, 0.7951889038085938, 0.8183746337890625, 0.8415603637695312, 0.86474609375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 7.0, 12.0, 6.0, 16.0, 30.0, 19.0, 39.0, 75.0, 67.0, 129.0, 206.0, 363.0, 640.0, 1336.0, 2971.0, 9119.0, 42094.0, 519509.0, 3339824.0, 239489.0, 27361.0, 6542.0, 2205.0, 888.0, 465.0, 286.0, 182.0, 118.0, 77.0, 61.0, 37.0, 31.0, 25.0, 15.0, 9.0, 11.0, 4.0, 3.0, 1.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6953125, -0.6738357543945312, -0.6523590087890625, -0.6308822631835938, -0.609405517578125, -0.5879287719726562, -0.5664520263671875, -0.5449752807617188, -0.52349853515625, -0.5020217895507812, -0.4805450439453125, -0.45906829833984375, -0.437591552734375, -0.41611480712890625, -0.3946380615234375, -0.37316131591796875, -0.3516845703125, -0.33020782470703125, -0.3087310791015625, -0.28725433349609375, -0.265777587890625, -0.24430084228515625, -0.2228240966796875, -0.20134735107421875, -0.17987060546875, -0.15839385986328125, -0.1369171142578125, -0.11544036865234375, -0.093963623046875, -0.07248687744140625, -0.0510101318359375, -0.02953338623046875, -0.008056640625, 0.01342010498046875, 0.0348968505859375, 0.05637359619140625, 0.077850341796875, 0.09932708740234375, 0.1208038330078125, 0.14228057861328125, 0.16375732421875, 0.18523406982421875, 0.2067108154296875, 0.22818756103515625, 0.249664306640625, 0.27114105224609375, 0.2926177978515625, 0.31409454345703125, 0.3355712890625, 0.35704803466796875, 0.3785247802734375, 0.40000152587890625, 0.421478271484375, 0.44295501708984375, 0.4644317626953125, 0.48590850830078125, 0.50738525390625, 0.5288619995117188, 0.5503387451171875, 0.5718154907226562, 0.593292236328125, 0.6147689819335938, 0.6362457275390625, 0.6577224731445312, 0.67919921875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 6.0, 4.0, 13.0, 5.0, 16.0, 16.0, 15.0, 31.0, 38.0, 42.0, 62.0, 108.0, 123.0, 161.0, 237.0, 358.0, 455.0, 498.0, 462.0, 361.0, 297.0, 193.0, 163.0, 128.0, 71.0, 47.0, 48.0, 25.0, 18.0, 18.0, 13.0, 15.0, 5.0, 1.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.14599609375, -0.141387939453125, -0.13677978515625, -0.132171630859375, -0.1275634765625, -0.122955322265625, -0.11834716796875, -0.113739013671875, -0.109130859375, -0.104522705078125, -0.09991455078125, -0.095306396484375, -0.0906982421875, -0.086090087890625, -0.08148193359375, -0.076873779296875, -0.072265625, -0.067657470703125, -0.06304931640625, -0.058441162109375, -0.0538330078125, -0.049224853515625, -0.04461669921875, -0.040008544921875, -0.035400390625, -0.030792236328125, -0.02618408203125, -0.021575927734375, -0.0169677734375, -0.012359619140625, -0.00775146484375, -0.003143310546875, 0.00146484375, 0.006072998046875, 0.01068115234375, 0.015289306640625, 0.0198974609375, 0.024505615234375, 0.02911376953125, 0.033721923828125, 0.038330078125, 0.042938232421875, 0.04754638671875, 0.052154541015625, 0.0567626953125, 0.061370849609375, 0.06597900390625, 0.070587158203125, 0.0751953125, 0.079803466796875, 0.08441162109375, 0.089019775390625, 0.0936279296875, 0.098236083984375, 0.10284423828125, 0.107452392578125, 0.112060546875, 0.116668701171875, 0.12127685546875, 0.125885009765625, 0.1304931640625, 0.135101318359375, 0.13970947265625, 0.144317626953125, 0.14892578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 15.0, 36.0, 74.0, 169.0, 254.0, 231.0, 129.0, 53.0, 26.0, 12.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5428178310394287, -2.4818809032440186, -2.4209437370300293, -2.360006809234619, -2.299069881439209, -2.238132953643799, -2.1771957874298096, -2.1162588596343994, -2.05532169342041, -1.9943846464157104, -1.9334477186203003, -1.8725106716156006, -1.8115737438201904, -1.7506366968154907, -1.689699649810791, -1.6287627220153809, -1.5678257942199707, -1.506888747215271, -1.4459518194198608, -1.3850147724151611, -1.324077844619751, -1.2631407976150513, -1.2022037506103516, -1.1412668228149414, -1.0803297758102417, -1.019392728805542, -0.9584558010101318, -0.8975187540054321, -0.8365817666053772, -0.7756447792053223, -0.7147077322006226, -0.6537707448005676, -0.5928338766098022, -0.5318968892097473, -0.47095987200737, -0.4100228548049927, -0.34908586740493774, -0.2881488800048828, -0.2272118628025055, -0.16627484560012817, -0.10533785820007324, -0.04440085589885712, 0.01653614640235901, 0.07747314870357513, 0.13841015100479126, 0.1993471384048462, 0.2602841556072235, 0.32122117280960083, 0.38215816020965576, 0.4430951476097107, 0.5040321350097656, 0.5649691820144653, 0.6259061694145203, 0.6868431568145752, 0.7477802038192749, 0.8087171912193298, 0.8696541786193848, 0.9305911660194397, 0.9915281534194946, 1.0524652004241943, 1.1134021282196045, 1.1743391752243042, 1.235276222229004, 1.296213150024414, 1.3571501970291138]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 2.0, 12.0, 5.0, 8.0, 11.0, 8.0, 11.0, 27.0, 18.0, 35.0, 42.0, 46.0, 44.0, 51.0, 69.0, 68.0, 57.0, 52.0, 71.0, 66.0, 34.0, 42.0, 45.0, 33.0, 33.0, 21.0, 26.0, 16.0, 17.0, 8.0, 10.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5787622928619385, -0.560859739780426, -0.5429572463035583, -0.5250546932220459, -0.5071521997451782, -0.48924964666366577, -0.4713471233844757, -0.45344460010528564, -0.4355420768260956, -0.4176395535469055, -0.39973703026771545, -0.3818345069885254, -0.36393195390701294, -0.34602946043014526, -0.3281269073486328, -0.31022438406944275, -0.2923218607902527, -0.2744193375110626, -0.25651681423187256, -0.2386142760515213, -0.22071175277233124, -0.20280922949314117, -0.18490669131278992, -0.16700416803359985, -0.1491016447544098, -0.13119912147521973, -0.11329659074544907, -0.0953940600156784, -0.07749153673648834, -0.05958901345729828, -0.04168648272752762, -0.023783951997756958, -0.005881369113922119, 0.012021157890558243, 0.029923684895038605, 0.04782621189951897, 0.06572873890399933, 0.08363126218318939, 0.10153379291296005, 0.11943632364273071, 0.13733884692192078, 0.15524137020111084, 0.1731438934803009, 0.19104643166065216, 0.20894895493984222, 0.2268514782190323, 0.24475401639938354, 0.2626565396785736, 0.28055906295776367, 0.29846158623695374, 0.3163641095161438, 0.33426663279533386, 0.3521691560745239, 0.3700717091560364, 0.38797423243522644, 0.4058767557144165, 0.42377927899360657, 0.44168180227279663, 0.4595843255519867, 0.47748684883117676, 0.4953894019126892, 0.5132918953895569, 0.5311944484710693, 0.549096941947937, 0.5669994950294495]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 4.0, 5.0, 4.0, 10.0, 14.0, 22.0, 24.0, 48.0, 70.0, 97.0, 206.0, 343.0, 636.0, 1356.0, 3449.0, 10597.0, 43657.0, 214361.0, 500400.0, 213078.0, 43099.0, 10714.0, 3439.0, 1428.0, 629.0, 328.0, 197.0, 119.0, 76.0, 42.0, 28.0, 15.0, 14.0, 11.0, 7.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1339111328125, -0.12965965270996094, -0.12540817260742188, -0.12115669250488281, -0.11690521240234375, -0.11265373229980469, -0.10840225219726562, -0.10415077209472656, -0.0998992919921875, -0.09564781188964844, -0.09139633178710938, -0.08714485168457031, -0.08289337158203125, -0.07864189147949219, -0.07439041137695312, -0.07013893127441406, -0.065887451171875, -0.06163597106933594, -0.057384490966796875, -0.05313301086425781, -0.04888153076171875, -0.04463005065917969, -0.040378570556640625, -0.03612709045410156, -0.0318756103515625, -0.027624130249023438, -0.023372650146484375, -0.019121170043945312, -0.01486968994140625, -0.010618209838867188, -0.006366729736328125, -0.0021152496337890625, 0.00213623046875, 0.0063877105712890625, 0.010639190673828125, 0.014890670776367188, 0.01914215087890625, 0.023393630981445312, 0.027645111083984375, 0.03189659118652344, 0.0361480712890625, 0.04039955139160156, 0.044651031494140625, 0.04890251159667969, 0.05315399169921875, 0.05740547180175781, 0.061656951904296875, 0.06590843200683594, 0.070159912109375, 0.07441139221191406, 0.07866287231445312, 0.08291435241699219, 0.08716583251953125, 0.09141731262207031, 0.09566879272460938, 0.09992027282714844, 0.1041717529296875, 0.10842323303222656, 0.11267471313476562, 0.11692619323730469, 0.12117767333984375, 0.1254291534423828, 0.12968063354492188, 0.13393211364746094, 0.13818359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 11.0, 9.0, 13.0, 15.0, 9.0, 21.0, 41.0, 57.0, 61.0, 79.0, 81.0, 94.0, 91.0, 67.0, 79.0, 64.0, 56.0, 34.0, 42.0, 19.0, 20.0, 10.0, 9.0, 7.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.517578125, -0.4997711181640625, -0.481964111328125, -0.4641571044921875, -0.44635009765625, -0.4285430908203125, -0.410736083984375, -0.3929290771484375, -0.3751220703125, -0.3573150634765625, -0.339508056640625, -0.3217010498046875, -0.30389404296875, -0.2860870361328125, -0.268280029296875, -0.2504730224609375, -0.232666015625, -0.2148590087890625, -0.197052001953125, -0.1792449951171875, -0.16143798828125, -0.1436309814453125, -0.125823974609375, -0.1080169677734375, -0.0902099609375, -0.0724029541015625, -0.054595947265625, -0.0367889404296875, -0.01898193359375, -0.0011749267578125, 0.016632080078125, 0.0344390869140625, 0.05224609375, 0.0700531005859375, 0.087860107421875, 0.1056671142578125, 0.12347412109375, 0.1412811279296875, 0.159088134765625, 0.1768951416015625, 0.1947021484375, 0.2125091552734375, 0.230316162109375, 0.2481231689453125, 0.26593017578125, 0.2837371826171875, 0.301544189453125, 0.3193511962890625, 0.337158203125, 0.3549652099609375, 0.372772216796875, 0.3905792236328125, 0.40838623046875, 0.4261932373046875, 0.444000244140625, 0.4618072509765625, 0.4796142578125, 0.4974212646484375, 0.515228271484375, 0.5330352783203125, 0.55084228515625, 0.5686492919921875, 0.586456298828125, 0.6042633056640625, 0.6220703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 10.0, 25.0, 25.0, 36.0, 40.0, 69.0, 104.0, 181.0, 228.0, 448.0, 800.0, 1497.0, 3080.0, 7404.0, 19631.0, 57645.0, 176319.0, 360270.0, 270348.0, 98368.0, 31649.0, 11263.0, 4570.0, 2058.0, 986.0, 569.0, 326.0, 215.0, 115.0, 89.0, 58.0, 38.0, 30.0, 25.0, 12.0, 5.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08819580078125, -0.0853261947631836, -0.08245658874511719, -0.07958698272705078, -0.07671737670898438, -0.07384777069091797, -0.07097816467285156, -0.06810855865478516, -0.06523895263671875, -0.062369346618652344, -0.05949974060058594, -0.05663013458251953, -0.053760528564453125, -0.05089092254638672, -0.04802131652832031, -0.045151710510253906, -0.0422821044921875, -0.039412498474121094, -0.03654289245605469, -0.03367328643798828, -0.030803680419921875, -0.02793407440185547, -0.025064468383789062, -0.022194862365722656, -0.01932525634765625, -0.016455650329589844, -0.013586044311523438, -0.010716438293457031, -0.007846832275390625, -0.004977226257324219, -0.0021076202392578125, 0.0007619857788085938, 0.003631591796875, 0.006501197814941406, 0.009370803833007812, 0.012240409851074219, 0.015110015869140625, 0.01797962188720703, 0.020849227905273438, 0.023718833923339844, 0.02658843994140625, 0.029458045959472656, 0.03232765197753906, 0.03519725799560547, 0.038066864013671875, 0.04093647003173828, 0.04380607604980469, 0.046675682067871094, 0.0495452880859375, 0.052414894104003906, 0.05528450012207031, 0.05815410614013672, 0.061023712158203125, 0.06389331817626953, 0.06676292419433594, 0.06963253021240234, 0.07250213623046875, 0.07537174224853516, 0.07824134826660156, 0.08111095428466797, 0.08398056030273438, 0.08685016632080078, 0.08971977233886719, 0.0925893783569336, 0.095458984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 6.0, 8.0, 2.0, 10.0, 14.0, 11.0, 11.0, 12.0, 25.0, 24.0, 22.0, 32.0, 22.0, 46.0, 41.0, 31.0, 42.0, 37.0, 46.0, 43.0, 43.0, 44.0, 40.0, 44.0, 44.0, 33.0, 40.0, 40.0, 29.0, 18.0, 23.0, 19.0, 20.0, 11.0, 10.0, 14.0, 7.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.64599609375, -0.6275711059570312, -0.6091461181640625, -0.5907211303710938, -0.572296142578125, -0.5538711547851562, -0.5354461669921875, -0.5170211791992188, -0.49859619140625, -0.48017120361328125, -0.4617462158203125, -0.44332122802734375, -0.424896240234375, -0.40647125244140625, -0.3880462646484375, -0.36962127685546875, -0.3511962890625, -0.33277130126953125, -0.3143463134765625, -0.29592132568359375, -0.277496337890625, -0.25907135009765625, -0.2406463623046875, -0.22222137451171875, -0.20379638671875, -0.18537139892578125, -0.1669464111328125, -0.14852142333984375, -0.130096435546875, -0.11167144775390625, -0.0932464599609375, -0.07482147216796875, -0.056396484375, -0.03797149658203125, -0.0195465087890625, -0.00112152099609375, 0.017303466796875, 0.03572845458984375, 0.0541534423828125, 0.07257843017578125, 0.09100341796875, 0.10942840576171875, 0.1278533935546875, 0.14627838134765625, 0.164703369140625, 0.18312835693359375, 0.2015533447265625, 0.21997833251953125, 0.2384033203125, 0.25682830810546875, 0.2752532958984375, 0.29367828369140625, 0.312103271484375, 0.33052825927734375, 0.3489532470703125, 0.36737823486328125, 0.38580322265625, 0.40422821044921875, 0.4226531982421875, 0.44107818603515625, 0.459503173828125, 0.47792816162109375, 0.4963531494140625, 0.5147781372070312, 0.533203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 4.0, 14.0, 26.0, 37.0, 61.0, 79.0, 131.0, 228.0, 411.0, 740.0, 1732.0, 4352.0, 14771.0, 75856.0, 383523.0, 441120.0, 97870.0, 18405.0, 5121.0, 2052.0, 914.0, 421.0, 281.0, 139.0, 83.0, 53.0, 36.0, 22.0, 14.0, 10.0, 10.0, 7.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034454345703125, -0.033226966857910156, -0.03199958801269531, -0.03077220916748047, -0.029544830322265625, -0.02831745147705078, -0.027090072631835938, -0.025862693786621094, -0.02463531494140625, -0.023407936096191406, -0.022180557250976562, -0.02095317840576172, -0.019725799560546875, -0.01849842071533203, -0.017271041870117188, -0.016043663024902344, -0.0148162841796875, -0.013588905334472656, -0.012361526489257812, -0.011134147644042969, -0.009906768798828125, -0.008679389953613281, -0.0074520111083984375, -0.006224632263183594, -0.00499725341796875, -0.0037698745727539062, -0.0025424957275390625, -0.0013151168823242188, -8.7738037109375e-05, 0.0011396408081054688, 0.0023670196533203125, 0.0035943984985351562, 0.00482177734375, 0.006049156188964844, 0.0072765350341796875, 0.008503913879394531, 0.009731292724609375, 0.010958671569824219, 0.012186050415039062, 0.013413429260253906, 0.01464080810546875, 0.015868186950683594, 0.017095565795898438, 0.01832294464111328, 0.019550323486328125, 0.02077770233154297, 0.022005081176757812, 0.023232460021972656, 0.0244598388671875, 0.025687217712402344, 0.026914596557617188, 0.02814197540283203, 0.029369354248046875, 0.03059673309326172, 0.03182411193847656, 0.033051490783691406, 0.03427886962890625, 0.035506248474121094, 0.03673362731933594, 0.03796100616455078, 0.039188385009765625, 0.04041576385498047, 0.04164314270019531, 0.042870521545410156, 0.044097900390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 0.0, 4.0, 7.0, 7.0, 12.0, 13.0, 13.0, 19.0, 30.0, 33.0, 62.0, 44.0, 54.0, 83.0, 103.0, 84.0, 86.0, 71.0, 74.0, 50.0, 37.0, 22.0, 22.0, 21.0, 16.0, 8.0, 5.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4662742614746094e-05, -1.4194287359714508e-05, -1.3725832104682922e-05, -1.3257376849651337e-05, -1.2788921594619751e-05, -1.2320466339588165e-05, -1.185201108455658e-05, -1.1383555829524994e-05, -1.0915100574493408e-05, -1.0446645319461823e-05, -9.978190064430237e-06, -9.509734809398651e-06, -9.041279554367065e-06, -8.57282429933548e-06, -8.104369044303894e-06, -7.635913789272308e-06, -7.167458534240723e-06, -6.699003279209137e-06, -6.230548024177551e-06, -5.7620927691459656e-06, -5.29363751411438e-06, -4.825182259082794e-06, -4.3567270040512085e-06, -3.888271749019623e-06, -3.419816493988037e-06, -2.9513612389564514e-06, -2.4829059839248657e-06, -2.01445072889328e-06, -1.5459954738616943e-06, -1.0775402188301086e-06, -6.09084963798523e-07, -1.4062970876693726e-07, 3.2782554626464844e-07, 7.962808012962341e-07, 1.2647360563278198e-06, 1.7331913113594055e-06, 2.201646566390991e-06, 2.670101821422577e-06, 3.1385570764541626e-06, 3.6070123314857483e-06, 4.075467586517334e-06, 4.54392284154892e-06, 5.012378096580505e-06, 5.480833351612091e-06, 5.949288606643677e-06, 6.4177438616752625e-06, 6.886199116706848e-06, 7.354654371738434e-06, 7.82310962677002e-06, 8.291564881801605e-06, 8.760020136833191e-06, 9.228475391864777e-06, 9.696930646896362e-06, 1.0165385901927948e-05, 1.0633841156959534e-05, 1.110229641199112e-05, 1.1570751667022705e-05, 1.203920692205429e-05, 1.2507662177085876e-05, 1.2976117432117462e-05, 1.3444572687149048e-05, 1.3913027942180634e-05, 1.438148319721222e-05, 1.4849938452243805e-05, 1.531839370727539e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 1.0, 7.0, 11.0, 7.0, 11.0, 13.0, 19.0, 26.0, 26.0, 38.0, 60.0, 116.0, 160.0, 270.0, 462.0, 842.0, 1974.0, 5439.0, 17122.0, 58764.0, 189612.0, 371358.0, 268750.0, 92770.0, 26813.0, 8316.0, 2893.0, 1153.0, 603.0, 310.0, 191.0, 121.0, 90.0, 60.0, 42.0, 30.0, 27.0, 12.0, 16.0, 7.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0235595703125, -0.022708654403686523, -0.021857738494873047, -0.02100682258605957, -0.020155906677246094, -0.019304990768432617, -0.01845407485961914, -0.017603158950805664, -0.016752243041992188, -0.01590132713317871, -0.015050411224365234, -0.014199495315551758, -0.013348579406738281, -0.012497663497924805, -0.011646747589111328, -0.010795831680297852, -0.009944915771484375, -0.009093999862670898, -0.008243083953857422, -0.007392168045043945, -0.006541252136230469, -0.005690336227416992, -0.004839420318603516, -0.003988504409790039, -0.0031375885009765625, -0.002286672592163086, -0.0014357566833496094, -0.0005848407745361328, 0.00026607513427734375, 0.0011169910430908203, 0.001967906951904297, 0.0028188228607177734, 0.00366973876953125, 0.0045206546783447266, 0.005371570587158203, 0.00622248649597168, 0.007073402404785156, 0.007924318313598633, 0.00877523422241211, 0.009626150131225586, 0.010477066040039062, 0.011327981948852539, 0.012178897857666016, 0.013029813766479492, 0.013880729675292969, 0.014731645584106445, 0.015582561492919922, 0.0164334774017334, 0.017284393310546875, 0.01813530921936035, 0.018986225128173828, 0.019837141036987305, 0.02068805694580078, 0.021538972854614258, 0.022389888763427734, 0.02324080467224121, 0.024091720581054688, 0.024942636489868164, 0.02579355239868164, 0.026644468307495117, 0.027495384216308594, 0.02834630012512207, 0.029197216033935547, 0.030048131942749023, 0.0308990478515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 4.0, 6.0, 15.0, 9.0, 18.0, 14.0, 15.0, 19.0, 27.0, 27.0, 34.0, 40.0, 40.0, 35.0, 44.0, 55.0, 46.0, 51.0, 32.0, 43.0, 49.0, 43.0, 52.0, 39.0, 38.0, 30.0, 36.0, 14.0, 22.0, 11.0, 11.0, 15.0, 13.0, 5.0, 10.0, 8.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.00684356689453125, -0.006635427474975586, -0.006427288055419922, -0.006219148635864258, -0.006011009216308594, -0.00580286979675293, -0.005594730377197266, -0.0053865909576416016, -0.0051784515380859375, -0.0049703121185302734, -0.004762172698974609, -0.004554033279418945, -0.004345893859863281, -0.004137754440307617, -0.003929615020751953, -0.003721475601196289, -0.003513336181640625, -0.003305196762084961, -0.003097057342529297, -0.002888917922973633, -0.0026807785034179688, -0.0024726390838623047, -0.0022644996643066406, -0.0020563602447509766, -0.0018482208251953125, -0.0016400814056396484, -0.0014319419860839844, -0.0012238025665283203, -0.0010156631469726562, -0.0008075237274169922, -0.0005993843078613281, -0.00039124488830566406, -0.00018310546875, 2.5033950805664062e-05, 0.00023317337036132812, 0.0004413127899169922, 0.0006494522094726562, 0.0008575916290283203, 0.0010657310485839844, 0.0012738704681396484, 0.0014820098876953125, 0.0016901493072509766, 0.0018982887268066406, 0.0021064281463623047, 0.0023145675659179688, 0.002522706985473633, 0.002730846405029297, 0.002938985824584961, 0.003147125244140625, 0.003355264663696289, 0.003563404083251953, 0.003771543502807617, 0.003979682922363281, 0.004187822341918945, 0.004395961761474609, 0.0046041011810302734, 0.0048122406005859375, 0.0050203800201416016, 0.005228519439697266, 0.00543665885925293, 0.005644798278808594, 0.005852937698364258, 0.006061077117919922, 0.006269216537475586, 0.00647735595703125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 106.0, 719.0, 169.0, 15.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54862117767334, -6.416533470153809, -6.284445762634277, -6.152358531951904, -6.020270824432373, -5.888183116912842, -5.7560954093933105, -5.6240081787109375, -5.491920471191406, -5.359832763671875, -5.227745056152344, -5.095657825469971, -4.9635701179504395, -4.831482410430908, -4.699394702911377, -4.567307472229004, -4.435219764709473, -4.303132057189941, -4.17104434967041, -4.038957118988037, -3.906869411468506, -3.7747817039489746, -3.6426939964294434, -3.510606527328491, -3.378518581390381, -3.2464308738708496, -3.1143434047698975, -2.982255697250366, -2.850168228149414, -2.718080520629883, -2.5859928131103516, -2.4539053440093994, -2.321817398071289, -2.189729690551758, -2.0576422214508057, -1.9255545139312744, -1.7934670448303223, -1.661379337310791, -1.5292917490005493, -1.3972041606903076, -1.2651166915893555, -1.1330291032791138, -1.000941514968872, -0.8688538670539856, -0.7367662787437439, -0.6046786904335022, -0.4725910425186157, -0.340503454208374, -0.20841586589813232, -0.07632826268672943, 0.05575934052467346, 0.18784695863723755, 0.31993454694747925, 0.45202213525772095, 0.5841097831726074, 0.7161973714828491, 0.8482849597930908, 0.9803725481033325, 1.1124601364135742, 1.2445478439331055, 1.3766353130340576, 1.5087230205535889, 1.6408106088638306, 1.7728981971740723, 1.904985785484314]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 12.0, 6.0, 16.0, 9.0, 15.0, 20.0, 31.0, 44.0, 65.0, 59.0, 73.0, 95.0, 77.0, 76.0, 77.0, 65.0, 51.0, 57.0, 32.0, 35.0, 31.0, 17.0, 15.0, 10.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4810790717601776, -0.4649052023887634, -0.44873133301734924, -0.43255746364593506, -0.4163835644721985, -0.4002097249031067, -0.3840358257293701, -0.36786195635795593, -0.35168808698654175, -0.33551421761512756, -0.3193403482437134, -0.3031664788722992, -0.286992609500885, -0.27081871032714844, -0.25464484095573425, -0.23847097158432007, -0.22229710221290588, -0.2061232328414917, -0.18994936347007751, -0.17377547919750214, -0.15760160982608795, -0.14142774045467377, -0.1252538561820984, -0.1090799868106842, -0.09290611743927002, -0.07673224806785583, -0.06055837124586105, -0.04438449814915657, -0.028210625052452087, -0.012036755681037903, 0.004137121140956879, 0.02031099796295166, 0.03648489713668823, 0.052658770233392715, 0.0688326433300972, 0.08500652015209198, 0.10118038952350616, 0.11735425889492035, 0.13352814316749573, 0.1497020125389099, 0.1658758819103241, 0.18204975128173828, 0.19822362065315247, 0.21439750492572784, 0.23057137429714203, 0.2467452436685562, 0.2629191279411316, 0.2790929973125458, 0.29526686668395996, 0.31144073605537415, 0.32761460542678833, 0.3437884747982025, 0.3599623441696167, 0.37613624334335327, 0.39231011271476746, 0.40848398208618164, 0.4246578514575958, 0.44083172082901, 0.4570055902004242, 0.4731794595718384, 0.48935335874557495, 0.5055271983146667, 0.5217010974884033, 0.5378749370574951, 0.5540488362312317]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 6.0, 12.0, 17.0, 11.0, 39.0, 39.0, 45.0, 83.0, 124.0, 193.0, 335.0, 493.0, 907.0, 1525.0, 2758.0, 5138.0, 10086.0, 21885.0, 52350.0, 137776.0, 382266.0, 267578.0, 94268.0, 37244.0, 16279.0, 7647.0, 4067.0, 2168.0, 1267.0, 738.0, 422.0, 305.0, 156.0, 122.0, 64.0, 54.0, 20.0, 24.0, 14.0, 8.0, 5.0, 11.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.18994140625, -0.18377685546875, -0.1776123046875, -0.17144775390625, -0.165283203125, -0.15911865234375, -0.1529541015625, -0.14678955078125, -0.140625, -0.13446044921875, -0.1282958984375, -0.12213134765625, -0.115966796875, -0.10980224609375, -0.1036376953125, -0.09747314453125, -0.09130859375, -0.08514404296875, -0.0789794921875, -0.07281494140625, -0.066650390625, -0.06048583984375, -0.0543212890625, -0.04815673828125, -0.0419921875, -0.03582763671875, -0.0296630859375, -0.02349853515625, -0.017333984375, -0.01116943359375, -0.0050048828125, 0.00115966796875, 0.00732421875, 0.01348876953125, 0.0196533203125, 0.02581787109375, 0.031982421875, 0.03814697265625, 0.0443115234375, 0.05047607421875, 0.056640625, 0.06280517578125, 0.0689697265625, 0.07513427734375, 0.081298828125, 0.08746337890625, 0.0936279296875, 0.09979248046875, 0.10595703125, 0.11212158203125, 0.1182861328125, 0.12445068359375, 0.130615234375, 0.13677978515625, 0.1429443359375, 0.14910888671875, 0.1552734375, 0.16143798828125, 0.1676025390625, 0.17376708984375, 0.179931640625, 0.18609619140625, 0.1922607421875, 0.19842529296875, 0.20458984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 3.0, 14.0, 3.0, 8.0, 14.0, 11.0, 16.0, 20.0, 32.0, 52.0, 45.0, 63.0, 43.0, 61.0, 71.0, 75.0, 69.0, 65.0, 52.0, 57.0, 34.0, 41.0, 31.0, 33.0, 13.0, 19.0, 11.0, 19.0, 5.0, 9.0, 0.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96044921875, -0.9340896606445312, -0.9077301025390625, -0.8813705444335938, -0.855010986328125, -0.8286514282226562, -0.8022918701171875, -0.7759323120117188, -0.74957275390625, -0.7232131958007812, -0.6968536376953125, -0.6704940795898438, -0.644134521484375, -0.6177749633789062, -0.5914154052734375, -0.5650558471679688, -0.5386962890625, -0.5123367309570312, -0.4859771728515625, -0.45961761474609375, -0.433258056640625, -0.40689849853515625, -0.3805389404296875, -0.35417938232421875, -0.32781982421875, -0.30146026611328125, -0.2751007080078125, -0.24874114990234375, -0.222381591796875, -0.19602203369140625, -0.1696624755859375, -0.14330291748046875, -0.116943359375, -0.09058380126953125, -0.0642242431640625, -0.03786468505859375, -0.011505126953125, 0.01485443115234375, 0.0412139892578125, 0.06757354736328125, 0.09393310546875, 0.12029266357421875, 0.1466522216796875, 0.17301177978515625, 0.199371337890625, 0.22573089599609375, 0.2520904541015625, 0.27845001220703125, 0.3048095703125, 0.33116912841796875, 0.3575286865234375, 0.38388824462890625, 0.410247802734375, 0.43660736083984375, 0.4629669189453125, 0.48932647705078125, 0.51568603515625, 0.5420455932617188, 0.5684051513671875, 0.5947647094726562, 0.621124267578125, 0.6474838256835938, 0.6738433837890625, 0.7002029418945312, 0.7265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 9.0, 4.0, 9.0, 10.0, 22.0, 29.0, 30.0, 64.0, 100.0, 142.0, 257.0, 532.0, 1692.0, 11559.0, 394254.0, 621080.0, 15446.0, 1968.0, 578.0, 304.0, 154.0, 95.0, 62.0, 42.0, 26.0, 27.0, 9.0, 10.0, 10.0, 8.0, 5.0, 3.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.671875, -0.6487503051757812, -0.6256256103515625, -0.6025009155273438, -0.579376220703125, -0.5562515258789062, -0.5331268310546875, -0.5100021362304688, -0.48687744140625, -0.46375274658203125, -0.4406280517578125, -0.41750335693359375, -0.394378662109375, -0.37125396728515625, -0.3481292724609375, -0.32500457763671875, -0.3018798828125, -0.27875518798828125, -0.2556304931640625, -0.23250579833984375, -0.209381103515625, -0.18625640869140625, -0.1631317138671875, -0.14000701904296875, -0.11688232421875, -0.09375762939453125, -0.0706329345703125, -0.04750823974609375, -0.024383544921875, -0.00125885009765625, 0.0218658447265625, 0.04499053955078125, 0.068115234375, 0.09123992919921875, 0.1143646240234375, 0.13748931884765625, 0.160614013671875, 0.18373870849609375, 0.2068634033203125, 0.22998809814453125, 0.25311279296875, 0.27623748779296875, 0.2993621826171875, 0.32248687744140625, 0.345611572265625, 0.36873626708984375, 0.3918609619140625, 0.41498565673828125, 0.4381103515625, 0.46123504638671875, 0.4843597412109375, 0.5074844360351562, 0.530609130859375, 0.5537338256835938, 0.5768585205078125, 0.5999832153320312, 0.62310791015625, 0.6462326049804688, 0.6693572998046875, 0.6924819946289062, 0.715606689453125, 0.7387313842773438, 0.7618560791015625, 0.7849807739257812, 0.80810546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 4.0, 5.0, 6.0, 16.0, 15.0, 17.0, 19.0, 17.0, 34.0, 26.0, 33.0, 47.0, 31.0, 41.0, 56.0, 56.0, 48.0, 63.0, 55.0, 54.0, 56.0, 45.0, 47.0, 33.0, 34.0, 24.0, 22.0, 19.0, 23.0, 15.0, 11.0, 10.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8916015625, -0.8628463745117188, -0.8340911865234375, -0.8053359985351562, -0.776580810546875, -0.7478256225585938, -0.7190704345703125, -0.6903152465820312, -0.66156005859375, -0.6328048706054688, -0.6040496826171875, -0.5752944946289062, -0.546539306640625, -0.5177841186523438, -0.4890289306640625, -0.46027374267578125, -0.4315185546875, -0.40276336669921875, -0.3740081787109375, -0.34525299072265625, -0.316497802734375, -0.28774261474609375, -0.2589874267578125, -0.23023223876953125, -0.20147705078125, -0.17272186279296875, -0.1439666748046875, -0.11521148681640625, -0.086456298828125, -0.05770111083984375, -0.0289459228515625, -0.00019073486328125, 0.028564453125, 0.05731964111328125, 0.0860748291015625, 0.11483001708984375, 0.143585205078125, 0.17234039306640625, 0.2010955810546875, 0.22985076904296875, 0.25860595703125, 0.28736114501953125, 0.3161163330078125, 0.34487152099609375, 0.373626708984375, 0.40238189697265625, 0.4311370849609375, 0.45989227294921875, 0.4886474609375, 0.5174026489257812, 0.5461578369140625, 0.5749130249023438, 0.603668212890625, 0.6324234008789062, 0.6611785888671875, 0.6899337768554688, 0.71868896484375, 0.7474441528320312, 0.7761993408203125, 0.8049545288085938, 0.833709716796875, 0.8624649047851562, 0.8912200927734375, 0.9199752807617188, 0.94873046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 8.0, 18.0, 12.0, 37.0, 61.0, 117.0, 280.0, 808.0, 3246.0, 32019.0, 965345.0, 41529.0, 3597.0, 867.0, 285.0, 146.0, 59.0, 36.0, 24.0, 21.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326416015625, -0.3145599365234375, -0.302703857421875, -0.2908477783203125, -0.27899169921875, -0.2671356201171875, -0.255279541015625, -0.2434234619140625, -0.2315673828125, -0.2197113037109375, -0.207855224609375, -0.1959991455078125, -0.18414306640625, -0.1722869873046875, -0.160430908203125, -0.1485748291015625, -0.13671875, -0.1248626708984375, -0.113006591796875, -0.1011505126953125, -0.08929443359375, -0.0774383544921875, -0.065582275390625, -0.0537261962890625, -0.0418701171875, -0.0300140380859375, -0.018157958984375, -0.0063018798828125, 0.00555419921875, 0.0174102783203125, 0.029266357421875, 0.0411224365234375, 0.052978515625, 0.0648345947265625, 0.076690673828125, 0.0885467529296875, 0.10040283203125, 0.1122589111328125, 0.124114990234375, 0.1359710693359375, 0.1478271484375, 0.1596832275390625, 0.171539306640625, 0.1833953857421875, 0.19525146484375, 0.2071075439453125, 0.218963623046875, 0.2308197021484375, 0.24267578125, 0.2545318603515625, 0.266387939453125, 0.2782440185546875, 0.29010009765625, 0.3019561767578125, 0.313812255859375, 0.3256683349609375, 0.3375244140625, 0.3493804931640625, 0.361236572265625, 0.3730926513671875, 0.38494873046875, 0.3968048095703125, 0.408660888671875, 0.4205169677734375, 0.432373046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 1.0, 1.0, 7.0, 11.0, 11.0, 20.0, 39.0, 46.0, 67.0, 83.0, 152.0, 182.0, 114.0, 80.0, 60.0, 37.0, 42.0, 18.0, 8.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.641843795776367e-05, -3.54154035449028e-05, -3.441236913204193e-05, -3.340933471918106e-05, -3.240630030632019e-05, -3.140326589345932e-05, -3.040023148059845e-05, -2.939719706773758e-05, -2.839416265487671e-05, -2.739112824201584e-05, -2.6388093829154968e-05, -2.5385059416294098e-05, -2.4382025003433228e-05, -2.3378990590572357e-05, -2.2375956177711487e-05, -2.1372921764850616e-05, -2.0369887351989746e-05, -1.9366852939128876e-05, -1.8363818526268005e-05, -1.7360784113407135e-05, -1.6357749700546265e-05, -1.5354715287685394e-05, -1.4351680874824524e-05, -1.3348646461963654e-05, -1.2345612049102783e-05, -1.1342577636241913e-05, -1.0339543223381042e-05, -9.336508810520172e-06, -8.333474397659302e-06, -7.330439984798431e-06, -6.327405571937561e-06, -5.324371159076691e-06, -4.32133674621582e-06, -3.31830233335495e-06, -2.3152679204940796e-06, -1.3122335076332092e-06, -3.0919909477233887e-07, 6.938353180885315e-07, 1.6968697309494019e-06, 2.6999041438102722e-06, 3.7029385566711426e-06, 4.705972969532013e-06, 5.709007382392883e-06, 6.712041795253754e-06, 7.715076208114624e-06, 8.718110620975494e-06, 9.721145033836365e-06, 1.0724179446697235e-05, 1.1727213859558105e-05, 1.2730248272418976e-05, 1.3733282685279846e-05, 1.4736317098140717e-05, 1.5739351511001587e-05, 1.6742385923862457e-05, 1.7745420336723328e-05, 1.8748454749584198e-05, 1.975148916244507e-05, 2.075452357530594e-05, 2.175755798816681e-05, 2.276059240102768e-05, 2.376362681388855e-05, 2.476666122674942e-05, 2.576969563961029e-05, 2.677273005247116e-05, 2.777576446533203e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 8.0, 13.0, 15.0, 37.0, 46.0, 86.0, 199.0, 539.0, 1769.0, 9284.0, 318171.0, 701829.0, 13194.0, 2270.0, 579.0, 238.0, 102.0, 50.0, 37.0, 18.0, 23.0, 8.0, 10.0, 7.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.311767578125, -0.30025482177734375, -0.2887420654296875, -0.27722930908203125, -0.265716552734375, -0.25420379638671875, -0.2426910400390625, -0.23117828369140625, -0.21966552734375, -0.20815277099609375, -0.1966400146484375, -0.18512725830078125, -0.173614501953125, -0.16210174560546875, -0.1505889892578125, -0.13907623291015625, -0.1275634765625, -0.11605072021484375, -0.1045379638671875, -0.09302520751953125, -0.081512451171875, -0.06999969482421875, -0.0584869384765625, -0.04697418212890625, -0.03546142578125, -0.02394866943359375, -0.0124359130859375, -0.00092315673828125, 0.010589599609375, 0.02210235595703125, 0.0336151123046875, 0.04512786865234375, 0.056640625, 0.06815338134765625, 0.0796661376953125, 0.09117889404296875, 0.102691650390625, 0.11420440673828125, 0.1257171630859375, 0.13722991943359375, 0.14874267578125, 0.16025543212890625, 0.1717681884765625, 0.18328094482421875, 0.194793701171875, 0.20630645751953125, 0.2178192138671875, 0.22933197021484375, 0.2408447265625, 0.25235748291015625, 0.2638702392578125, 0.27538299560546875, 0.286895751953125, 0.29840850830078125, 0.3099212646484375, 0.32143402099609375, 0.33294677734375, 0.34445953369140625, 0.3559722900390625, 0.36748504638671875, 0.378997802734375, 0.39051055908203125, 0.4020233154296875, 0.41353607177734375, 0.425048828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 0.0, 7.0, 6.0, 7.0, 10.0, 19.0, 20.0, 37.0, 49.0, 84.0, 101.0, 153.0, 145.0, 97.0, 78.0, 51.0, 29.0, 30.0, 13.0, 14.0, 12.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.08868408203125, -0.08635950088500977, -0.08403491973876953, -0.0817103385925293, -0.07938575744628906, -0.07706117630004883, -0.0747365951538086, -0.07241201400756836, -0.07008743286132812, -0.06776285171508789, -0.06543827056884766, -0.06311368942260742, -0.06078910827636719, -0.05846452713012695, -0.05613994598388672, -0.053815364837646484, -0.05149078369140625, -0.049166202545166016, -0.04684162139892578, -0.04451704025268555, -0.04219245910644531, -0.03986787796020508, -0.037543296813964844, -0.03521871566772461, -0.032894134521484375, -0.03056955337524414, -0.028244972229003906, -0.025920391082763672, -0.023595809936523438, -0.021271228790283203, -0.01894664764404297, -0.016622066497802734, -0.0142974853515625, -0.011972904205322266, -0.009648323059082031, -0.007323741912841797, -0.0049991607666015625, -0.002674579620361328, -0.00034999847412109375, 0.0019745826721191406, 0.004299163818359375, 0.006623744964599609, 0.008948326110839844, 0.011272907257080078, 0.013597488403320312, 0.015922069549560547, 0.01824665069580078, 0.020571231842041016, 0.02289581298828125, 0.025220394134521484, 0.02754497528076172, 0.029869556427001953, 0.03219413757324219, 0.03451871871948242, 0.036843299865722656, 0.03916788101196289, 0.041492462158203125, 0.04381704330444336, 0.046141624450683594, 0.04846620559692383, 0.05079078674316406, 0.0531153678894043, 0.05543994903564453, 0.057764530181884766, 0.060089111328125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 42.0, 87.0, 214.0, 291.0, 213.0, 77.0, 34.0, 16.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.911703586578369, -2.8270459175109863, -2.7423884868621826, -2.6577308177948, -2.573073387145996, -2.4884157180786133, -2.4037580490112305, -2.3191003799438477, -2.234442949295044, -2.149785280227661, -2.0651278495788574, -1.9804701805114746, -1.8958126306533813, -1.811155080795288, -1.7264974117279053, -1.641839861869812, -1.5571823120117188, -1.4725247621536255, -1.3878672122955322, -1.3032095432281494, -1.2185519933700562, -1.133894443511963, -1.04923677444458, -0.9645792245864868, -0.8799216747283936, -0.7952641248703003, -0.7106065154075623, -0.6259489059448242, -0.541291356086731, -0.4566337764263153, -0.37197619676589966, -0.2873185873031616, -0.20266127586364746, -0.11800369620323181, -0.03334611654281616, 0.05131146311759949, 0.13596904277801514, 0.2206266224384308, 0.30528420209884644, 0.3899418115615845, 0.47459936141967773, 0.559256911277771, 0.643914520740509, 0.7285721302032471, 0.8132296800613403, 0.8978872299194336, 0.9825448393821716, 1.0672024488449097, 1.151859998703003, 1.2365175485610962, 1.3211750984191895, 1.4058327674865723, 1.4904903173446655, 1.5751478672027588, 1.6598055362701416, 1.7444630861282349, 1.8291206359863281, 1.9137781858444214, 1.9984357357025146, 2.0830934047698975, 2.167750835418701, 2.252408504486084, 2.337066173553467, 2.4217238426208496, 2.5063812732696533]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 5.0, 8.0, 10.0, 15.0, 12.0, 15.0, 21.0, 16.0, 23.0, 29.0, 27.0, 28.0, 33.0, 38.0, 45.0, 44.0, 45.0, 60.0, 42.0, 43.0, 45.0, 36.0, 42.0, 37.0, 38.0, 36.0, 35.0, 28.0, 24.0, 27.0, 24.0, 15.0, 8.0, 8.0, 6.0, 13.0, 12.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.16165292263031, -1.122979760169983, -1.0843065977096558, -1.0456334352493286, -1.0069602727890015, -0.9682871103286743, -0.9296139478683472, -0.89094078540802, -0.8522676229476929, -0.8135944604873657, -0.7749212980270386, -0.7362481355667114, -0.6975749731063843, -0.6589018106460571, -0.62022864818573, -0.5815554857254028, -0.5428823232650757, -0.5042091608047485, -0.4655359983444214, -0.42686283588409424, -0.3881896734237671, -0.34951651096343994, -0.3108433485031128, -0.27217018604278564, -0.2334970235824585, -0.19482386112213135, -0.1561506986618042, -0.11747753620147705, -0.0788043737411499, -0.040131211280822754, -0.0014580488204956055, 0.03721511363983154, 0.07588815689086914, 0.11456131935119629, 0.15323448181152344, 0.19190764427185059, 0.23058080673217773, 0.2692539691925049, 0.30792713165283203, 0.3466002941131592, 0.38527345657348633, 0.4239466190338135, 0.4626197814941406, 0.5012929439544678, 0.5399661064147949, 0.5786392688751221, 0.6173124313354492, 0.6559855937957764, 0.6946587562561035, 0.7333319187164307, 0.7720050811767578, 0.810678243637085, 0.8493514060974121, 0.8880245685577393, 0.9266977310180664, 0.9653708934783936, 1.0040440559387207, 1.0427172183990479, 1.081390380859375, 1.1200635433197021, 1.1587367057800293, 1.1974098682403564, 1.2360830307006836, 1.2747561931610107, 1.313429355621338]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 1.0, 4.0, 7.0, 12.0, 13.0, 24.0, 31.0, 46.0, 69.0, 114.0, 245.0, 548.0, 1382.0, 4678.0, 36943.0, 2250496.0, 1856220.0, 36526.0, 4608.0, 1228.0, 544.0, 250.0, 128.0, 59.0, 37.0, 24.0, 15.0, 18.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.724609375, -1.6862640380859375, -1.647918701171875, -1.6095733642578125, -1.57122802734375, -1.5328826904296875, -1.494537353515625, -1.4561920166015625, -1.4178466796875, -1.3795013427734375, -1.341156005859375, -1.3028106689453125, -1.26446533203125, -1.2261199951171875, -1.187774658203125, -1.1494293212890625, -1.111083984375, -1.0727386474609375, -1.034393310546875, -0.9960479736328125, -0.95770263671875, -0.9193572998046875, -0.881011962890625, -0.8426666259765625, -0.8043212890625, -0.7659759521484375, -0.727630615234375, -0.6892852783203125, -0.65093994140625, -0.6125946044921875, -0.574249267578125, -0.5359039306640625, -0.49755859375, -0.4592132568359375, -0.420867919921875, -0.3825225830078125, -0.34417724609375, -0.3058319091796875, -0.267486572265625, -0.2291412353515625, -0.1907958984375, -0.1524505615234375, -0.114105224609375, -0.0757598876953125, -0.03741455078125, 0.0009307861328125, 0.039276123046875, 0.0776214599609375, 0.115966796875, 0.1543121337890625, 0.192657470703125, 0.2310028076171875, 0.26934814453125, 0.3076934814453125, 0.346038818359375, 0.3843841552734375, 0.4227294921875, 0.4610748291015625, 0.499420166015625, 0.5377655029296875, 0.57611083984375, 0.6144561767578125, 0.652801513671875, 0.6911468505859375, 0.7294921875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 8.0, 19.0, 19.0, 26.0, 24.0, 48.0, 46.0, 58.0, 57.0, 72.0, 77.0, 67.0, 77.0, 64.0, 72.0, 46.0, 43.0, 48.0, 23.0, 22.0, 16.0, 17.0, 17.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56884765625, -0.5518035888671875, -0.534759521484375, -0.5177154541015625, -0.50067138671875, -0.4836273193359375, -0.466583251953125, -0.4495391845703125, -0.4324951171875, -0.4154510498046875, -0.398406982421875, -0.3813629150390625, -0.36431884765625, -0.3472747802734375, -0.330230712890625, -0.3131866455078125, -0.296142578125, -0.2790985107421875, -0.262054443359375, -0.2450103759765625, -0.22796630859375, -0.2109222412109375, -0.193878173828125, -0.1768341064453125, -0.1597900390625, -0.1427459716796875, -0.125701904296875, -0.1086578369140625, -0.09161376953125, -0.0745697021484375, -0.057525634765625, -0.0404815673828125, -0.0234375, -0.0063934326171875, 0.010650634765625, 0.0276947021484375, 0.04473876953125, 0.0617828369140625, 0.078826904296875, 0.0958709716796875, 0.1129150390625, 0.1299591064453125, 0.147003173828125, 0.1640472412109375, 0.18109130859375, 0.1981353759765625, 0.215179443359375, 0.2322235107421875, 0.249267578125, 0.2663116455078125, 0.283355712890625, 0.3003997802734375, 0.31744384765625, 0.3344879150390625, 0.351531982421875, 0.3685760498046875, 0.3856201171875, 0.4026641845703125, 0.419708251953125, 0.4367523193359375, 0.45379638671875, 0.4708404541015625, 0.487884521484375, 0.5049285888671875, 0.52197265625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 5.0, 7.0, 11.0, 19.0, 36.0, 61.0, 98.0, 202.0, 545.0, 1821.0, 10438.0, 397189.0, 3740012.0, 38715.0, 3584.0, 891.0, 336.0, 128.0, 80.0, 38.0, 20.0, 18.0, 7.0, 8.0, 6.0, 0.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.158203125, -1.1171875, -1.076171875, -1.03515625, -0.994140625, -0.953125, -0.912109375, -0.87109375, -0.830078125, -0.7890625, -0.748046875, -0.70703125, -0.666015625, -0.625, -0.583984375, -0.54296875, -0.501953125, -0.4609375, -0.419921875, -0.37890625, -0.337890625, -0.296875, -0.255859375, -0.21484375, -0.173828125, -0.1328125, -0.091796875, -0.05078125, -0.009765625, 0.03125, 0.072265625, 0.11328125, 0.154296875, 0.1953125, 0.236328125, 0.27734375, 0.318359375, 0.359375, 0.400390625, 0.44140625, 0.482421875, 0.5234375, 0.564453125, 0.60546875, 0.646484375, 0.6875, 0.728515625, 0.76953125, 0.810546875, 0.8515625, 0.892578125, 0.93359375, 0.974609375, 1.015625, 1.056640625, 1.09765625, 1.138671875, 1.1796875, 1.220703125, 1.26171875, 1.302734375, 1.34375, 1.384765625, 1.42578125, 1.466796875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 10.0, 7.0, 9.0, 19.0, 35.0, 56.0, 69.0, 130.0, 185.0, 307.0, 524.0, 686.0, 696.0, 491.0, 300.0, 209.0, 96.0, 68.0, 56.0, 34.0, 23.0, 17.0, 17.0, 4.0, 11.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2154541015625, -0.20891380310058594, -0.20237350463867188, -0.1958332061767578, -0.18929290771484375, -0.1827526092529297, -0.17621231079101562, -0.16967201232910156, -0.1631317138671875, -0.15659141540527344, -0.15005111694335938, -0.1435108184814453, -0.13697052001953125, -0.1304302215576172, -0.12388992309570312, -0.11734962463378906, -0.110809326171875, -0.10426902770996094, -0.09772872924804688, -0.09118843078613281, -0.08464813232421875, -0.07810783386230469, -0.07156753540039062, -0.06502723693847656, -0.0584869384765625, -0.05194664001464844, -0.045406341552734375, -0.03886604309082031, -0.03232574462890625, -0.025785446166992188, -0.019245147705078125, -0.012704849243164062, -0.00616455078125, 0.0003757476806640625, 0.006916046142578125, 0.013456344604492188, 0.01999664306640625, 0.026536941528320312, 0.033077239990234375, 0.03961753845214844, 0.0461578369140625, 0.05269813537597656, 0.059238433837890625, 0.06577873229980469, 0.07231903076171875, 0.07885932922363281, 0.08539962768554688, 0.09193992614746094, 0.098480224609375, 0.10502052307128906, 0.11156082153320312, 0.11810111999511719, 0.12464141845703125, 0.1311817169189453, 0.13772201538085938, 0.14426231384277344, 0.1508026123046875, 0.15734291076660156, 0.16388320922851562, 0.1704235076904297, 0.17696380615234375, 0.1835041046142578, 0.19004440307617188, 0.19658470153808594, 0.203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 17.0, 54.0, 100.0, 158.0, 239.0, 200.0, 118.0, 68.0, 24.0, 12.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4945473670959473, -2.4410018920898438, -2.3874564170837402, -2.3339109420776367, -2.280365467071533, -2.2268199920654297, -2.173274517059326, -2.1197290420532227, -2.06618332862854, -2.0126378536224365, -1.959092378616333, -1.9055469036102295, -1.8520013093948364, -1.798455834388733, -1.7449103593826294, -1.6913648843765259, -1.637819528579712, -1.5842740535736084, -1.5307285785675049, -1.4771831035614014, -1.4236375093460083, -1.3700920343399048, -1.3165465593338013, -1.2630010843276978, -1.2094554901123047, -1.1559100151062012, -1.1023645401000977, -1.0488190650939941, -0.9952735304832458, -0.9417279958724976, -0.888182520866394, -0.8346370458602905, -0.7810916304588318, -0.7275461554527283, -0.67400062084198, -0.6204551458358765, -0.566909670829773, -0.5133641958236694, -0.45981866121292114, -0.4062731862068176, -0.3527276813983917, -0.2991821765899658, -0.2456367015838623, -0.1920911967754364, -0.1385457068681717, -0.08500021696090698, -0.03145471215248108, 0.022090762853622437, 0.07563626766204834, 0.12918175756931305, 0.18272724747657776, 0.23627275228500366, 0.2898182272911072, 0.3433637320995331, 0.396909236907959, 0.4504547119140625, 0.504000186920166, 0.5575456619262695, 0.6110911965370178, 0.6646366715431213, 0.7181821465492249, 0.7717276811599731, 0.8252731561660767, 0.8788186311721802, 0.9323641657829285]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 4.0, 5.0, 5.0, 10.0, 13.0, 13.0, 20.0, 25.0, 37.0, 48.0, 51.0, 56.0, 64.0, 73.0, 69.0, 64.0, 53.0, 68.0, 51.0, 54.0, 56.0, 31.0, 31.0, 29.0, 23.0, 13.0, 15.0, 5.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4739203155040741, -0.45512574911117554, -0.4363311529159546, -0.41753658652305603, -0.39874202013015747, -0.3799474537372589, -0.36115288734436035, -0.3423582911491394, -0.32356372475624084, -0.3047691583633423, -0.28597456216812134, -0.2671799957752228, -0.24838542938232422, -0.22959086298942566, -0.2107962816953659, -0.19200170040130615, -0.1732071340084076, -0.15441256761550903, -0.13561798632144928, -0.11682341247797012, -0.09802883863449097, -0.07923426479101181, -0.060439690947532654, -0.0416451096534729, -0.02285054326057434, -0.004055969417095184, 0.014738604426383972, 0.03353317826986313, 0.052327752113342285, 0.07112232595682144, 0.0899168998003006, 0.10871148109436035, 0.1275060772895813, 0.14630064368247986, 0.1650952249765396, 0.18388980627059937, 0.20268437266349792, 0.22147893905639648, 0.24027352035045624, 0.259068101644516, 0.27786266803741455, 0.2966572344303131, 0.31545180082321167, 0.3342463970184326, 0.3530409634113312, 0.37183552980422974, 0.3906301259994507, 0.40942469239234924, 0.4282192587852478, 0.44701382517814636, 0.4658083915710449, 0.48460298776626587, 0.5033975839614868, 0.522192120552063, 0.5409867167472839, 0.5597813129425049, 0.578575849533081, 0.597370445728302, 0.6161649823188782, 0.6349595785140991, 0.6537541151046753, 0.6725487112998962, 0.6913433074951172, 0.7101378440856934, 0.7289324402809143]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 15.0, 20.0, 83.0, 246.0, 1053.0, 5538.0, 96439.0, 913103.0, 27928.0, 3246.0, 667.0, 129.0, 41.0, 11.0, 9.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53369140625, -0.5201263427734375, -0.506561279296875, -0.4929962158203125, -0.47943115234375, -0.4658660888671875, -0.452301025390625, -0.4387359619140625, -0.4251708984375, -0.4116058349609375, -0.398040771484375, -0.3844757080078125, -0.37091064453125, -0.3573455810546875, -0.343780517578125, -0.3302154541015625, -0.316650390625, -0.3030853271484375, -0.289520263671875, -0.2759552001953125, -0.26239013671875, -0.2488250732421875, -0.235260009765625, -0.2216949462890625, -0.2081298828125, -0.1945648193359375, -0.180999755859375, -0.1674346923828125, -0.15386962890625, -0.1403045654296875, -0.126739501953125, -0.1131744384765625, -0.099609375, -0.0860443115234375, -0.072479248046875, -0.0589141845703125, -0.04534912109375, -0.0317840576171875, -0.018218994140625, -0.0046539306640625, 0.0089111328125, 0.0224761962890625, 0.036041259765625, 0.0496063232421875, 0.06317138671875, 0.0767364501953125, 0.090301513671875, 0.1038665771484375, 0.117431640625, 0.1309967041015625, 0.144561767578125, 0.1581268310546875, 0.17169189453125, 0.1852569580078125, 0.198822021484375, 0.2123870849609375, 0.2259521484375, 0.2395172119140625, 0.253082275390625, 0.2666473388671875, 0.28021240234375, 0.2937774658203125, 0.307342529296875, 0.3209075927734375, 0.33447265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 8.0, 6.0, 13.0, 22.0, 24.0, 37.0, 35.0, 46.0, 67.0, 82.0, 85.0, 87.0, 62.0, 56.0, 73.0, 68.0, 54.0, 41.0, 34.0, 31.0, 17.0, 17.0, 9.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.392578125, -0.378570556640625, -0.36456298828125, -0.350555419921875, -0.3365478515625, -0.322540283203125, -0.30853271484375, -0.294525146484375, -0.280517578125, -0.266510009765625, -0.25250244140625, -0.238494873046875, -0.2244873046875, -0.210479736328125, -0.19647216796875, -0.182464599609375, -0.16845703125, -0.154449462890625, -0.14044189453125, -0.126434326171875, -0.1124267578125, -0.098419189453125, -0.08441162109375, -0.070404052734375, -0.056396484375, -0.042388916015625, -0.02838134765625, -0.014373779296875, -0.0003662109375, 0.013641357421875, 0.02764892578125, 0.041656494140625, 0.0556640625, 0.069671630859375, 0.08367919921875, 0.097686767578125, 0.1116943359375, 0.125701904296875, 0.13970947265625, 0.153717041015625, 0.167724609375, 0.181732177734375, 0.19573974609375, 0.209747314453125, 0.2237548828125, 0.237762451171875, 0.25177001953125, 0.265777587890625, 0.27978515625, 0.293792724609375, 0.30780029296875, 0.321807861328125, 0.3358154296875, 0.349822998046875, 0.36383056640625, 0.377838134765625, 0.391845703125, 0.405853271484375, 0.41986083984375, 0.433868408203125, 0.4478759765625, 0.461883544921875, 0.47589111328125, 0.489898681640625, 0.50390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 8.0, 5.0, 8.0, 17.0, 24.0, 38.0, 32.0, 68.0, 84.0, 150.0, 234.0, 344.0, 604.0, 935.0, 1664.0, 2983.0, 5873.0, 14535.0, 54841.0, 258164.0, 481972.0, 168240.0, 35921.0, 11022.0, 4687.0, 2510.0, 1400.0, 807.0, 512.0, 307.0, 197.0, 109.0, 70.0, 52.0, 37.0, 23.0, 25.0, 8.0, 9.0, 7.0, 8.0, 6.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09942626953125, -0.096038818359375, -0.0926513671875, -0.089263916015625, -0.08587646484375, -0.082489013671875, -0.0791015625, -0.075714111328125, -0.07232666015625, -0.068939208984375, -0.0655517578125, -0.062164306640625, -0.05877685546875, -0.055389404296875, -0.052001953125, -0.048614501953125, -0.04522705078125, -0.041839599609375, -0.0384521484375, -0.035064697265625, -0.03167724609375, -0.028289794921875, -0.02490234375, -0.021514892578125, -0.01812744140625, -0.014739990234375, -0.0113525390625, -0.007965087890625, -0.00457763671875, -0.001190185546875, 0.002197265625, 0.005584716796875, 0.00897216796875, 0.012359619140625, 0.0157470703125, 0.019134521484375, 0.02252197265625, 0.025909423828125, 0.029296875, 0.032684326171875, 0.03607177734375, 0.039459228515625, 0.0428466796875, 0.046234130859375, 0.04962158203125, 0.053009033203125, 0.056396484375, 0.059783935546875, 0.06317138671875, 0.066558837890625, 0.0699462890625, 0.073333740234375, 0.07672119140625, 0.080108642578125, 0.08349609375, 0.086883544921875, 0.09027099609375, 0.093658447265625, 0.0970458984375, 0.100433349609375, 0.10382080078125, 0.107208251953125, 0.110595703125, 0.113983154296875, 0.11737060546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 4.0, 10.0, 11.0, 20.0, 19.0, 15.0, 16.0, 20.0, 29.0, 29.0, 25.0, 37.0, 30.0, 43.0, 38.0, 45.0, 50.0, 47.0, 41.0, 53.0, 54.0, 32.0, 50.0, 31.0, 32.0, 35.0, 26.0, 24.0, 10.0, 14.0, 15.0, 18.0, 14.0, 12.0, 5.0, 7.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.515625, -0.49910736083984375, -0.4825897216796875, -0.46607208251953125, -0.449554443359375, -0.43303680419921875, -0.4165191650390625, -0.40000152587890625, -0.38348388671875, -0.36696624755859375, -0.3504486083984375, -0.33393096923828125, -0.317413330078125, -0.30089569091796875, -0.2843780517578125, -0.26786041259765625, -0.2513427734375, -0.23482513427734375, -0.2183074951171875, -0.20178985595703125, -0.185272216796875, -0.16875457763671875, -0.1522369384765625, -0.13571929931640625, -0.11920166015625, -0.10268402099609375, -0.0861663818359375, -0.06964874267578125, -0.053131103515625, -0.03661346435546875, -0.0200958251953125, -0.00357818603515625, 0.012939453125, 0.02945709228515625, 0.0459747314453125, 0.06249237060546875, 0.079010009765625, 0.09552764892578125, 0.1120452880859375, 0.12856292724609375, 0.14508056640625, 0.16159820556640625, 0.1781158447265625, 0.19463348388671875, 0.211151123046875, 0.22766876220703125, 0.2441864013671875, 0.26070404052734375, 0.2772216796875, 0.29373931884765625, 0.3102569580078125, 0.32677459716796875, 0.343292236328125, 0.35980987548828125, 0.3763275146484375, 0.39284515380859375, 0.40936279296875, 0.42588043212890625, 0.4423980712890625, 0.45891571044921875, 0.475433349609375, 0.49195098876953125, 0.5084686279296875, 0.5249862670898438, 0.54150390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 8.0, 15.0, 13.0, 15.0, 21.0, 37.0, 66.0, 92.0, 179.0, 271.0, 464.0, 853.0, 1620.0, 3412.0, 7745.0, 21429.0, 69332.0, 238705.0, 416689.0, 199057.0, 57618.0, 18164.0, 6615.0, 2797.0, 1446.0, 769.0, 427.0, 229.0, 157.0, 92.0, 63.0, 59.0, 24.0, 17.0, 15.0, 7.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0312347412109375, -0.030327320098876953, -0.029419898986816406, -0.02851247787475586, -0.027605056762695312, -0.026697635650634766, -0.02579021453857422, -0.024882793426513672, -0.023975372314453125, -0.023067951202392578, -0.02216053009033203, -0.021253108978271484, -0.020345687866210938, -0.01943826675415039, -0.018530845642089844, -0.017623424530029297, -0.01671600341796875, -0.015808582305908203, -0.014901161193847656, -0.01399374008178711, -0.013086318969726562, -0.012178897857666016, -0.011271476745605469, -0.010364055633544922, -0.009456634521484375, -0.008549213409423828, -0.007641792297363281, -0.006734371185302734, -0.0058269500732421875, -0.004919528961181641, -0.004012107849121094, -0.003104686737060547, -0.002197265625, -0.0012898445129394531, -0.00038242340087890625, 0.0005249977111816406, 0.0014324188232421875, 0.0023398399353027344, 0.0032472610473632812, 0.004154682159423828, 0.005062103271484375, 0.005969524383544922, 0.006876945495605469, 0.007784366607666016, 0.008691787719726562, 0.00959920883178711, 0.010506629943847656, 0.011414051055908203, 0.01232147216796875, 0.013228893280029297, 0.014136314392089844, 0.01504373550415039, 0.015951156616210938, 0.016858577728271484, 0.01776599884033203, 0.018673419952392578, 0.019580841064453125, 0.020488262176513672, 0.02139568328857422, 0.022303104400634766, 0.023210525512695312, 0.02411794662475586, 0.025025367736816406, 0.025932788848876953, 0.0268402099609375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 12.0, 10.0, 11.0, 15.0, 20.0, 21.0, 27.0, 35.0, 50.0, 64.0, 88.0, 73.0, 121.0, 104.0, 65.0, 74.0, 57.0, 41.0, 30.0, 21.0, 10.0, 15.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.621246337890625e-05, -1.569557934999466e-05, -1.5178695321083069e-05, -1.4661811292171478e-05, -1.4144927263259888e-05, -1.3628043234348297e-05, -1.3111159205436707e-05, -1.2594275176525116e-05, -1.2077391147613525e-05, -1.1560507118701935e-05, -1.1043623089790344e-05, -1.0526739060878754e-05, -1.0009855031967163e-05, -9.492971003055573e-06, -8.976086974143982e-06, -8.459202945232391e-06, -7.9423189163208e-06, -7.42543488740921e-06, -6.90855085849762e-06, -6.391666829586029e-06, -5.8747828006744385e-06, -5.357898771762848e-06, -4.841014742851257e-06, -4.324130713939667e-06, -3.807246685028076e-06, -3.2903626561164856e-06, -2.773478627204895e-06, -2.2565945982933044e-06, -1.7397105693817139e-06, -1.2228265404701233e-06, -7.059425115585327e-07, -1.8905848264694214e-07, 3.2782554626464844e-07, 8.44709575176239e-07, 1.3615936040878296e-06, 1.8784776329994202e-06, 2.3953616619110107e-06, 2.9122456908226013e-06, 3.429129719734192e-06, 3.9460137486457825e-06, 4.462897777557373e-06, 4.979781806468964e-06, 5.496665835380554e-06, 6.013549864292145e-06, 6.530433893203735e-06, 7.047317922115326e-06, 7.5642019510269165e-06, 8.081085979938507e-06, 8.597970008850098e-06, 9.114854037761688e-06, 9.631738066673279e-06, 1.014862209558487e-05, 1.066550612449646e-05, 1.118239015340805e-05, 1.1699274182319641e-05, 1.2216158211231232e-05, 1.2733042240142822e-05, 1.3249926269054413e-05, 1.3766810297966003e-05, 1.4283694326877594e-05, 1.4800578355789185e-05, 1.5317462384700775e-05, 1.5834346413612366e-05, 1.6351230442523956e-05, 1.6868114471435547e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 5.0, 5.0, 10.0, 18.0, 15.0, 24.0, 35.0, 48.0, 67.0, 90.0, 139.0, 267.0, 437.0, 938.0, 2127.0, 5692.0, 17192.0, 60601.0, 219329.0, 417200.0, 230748.0, 64740.0, 18171.0, 6132.0, 2287.0, 1029.0, 471.0, 286.0, 151.0, 89.0, 83.0, 46.0, 19.0, 14.0, 11.0, 12.0, 9.0, 2.0, 5.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0308074951171875, -0.029830217361450195, -0.02885293960571289, -0.027875661849975586, -0.02689838409423828, -0.025921106338500977, -0.024943828582763672, -0.023966550827026367, -0.022989273071289062, -0.022011995315551758, -0.021034717559814453, -0.02005743980407715, -0.019080162048339844, -0.01810288429260254, -0.017125606536865234, -0.01614832878112793, -0.015171051025390625, -0.01419377326965332, -0.013216495513916016, -0.012239217758178711, -0.011261940002441406, -0.010284662246704102, -0.009307384490966797, -0.008330106735229492, -0.0073528289794921875, -0.006375551223754883, -0.005398273468017578, -0.0044209957122802734, -0.0034437179565429688, -0.002466440200805664, -0.0014891624450683594, -0.0005118846893310547, 0.00046539306640625, 0.0014426708221435547, 0.0024199485778808594, 0.003397226333618164, 0.004374504089355469, 0.0053517818450927734, 0.006329059600830078, 0.007306337356567383, 0.008283615112304688, 0.009260892868041992, 0.010238170623779297, 0.011215448379516602, 0.012192726135253906, 0.013170003890991211, 0.014147281646728516, 0.01512455940246582, 0.016101837158203125, 0.01707911491394043, 0.018056392669677734, 0.01903367042541504, 0.020010948181152344, 0.02098822593688965, 0.021965503692626953, 0.022942781448364258, 0.023920059204101562, 0.024897336959838867, 0.025874614715576172, 0.026851892471313477, 0.02782917022705078, 0.028806447982788086, 0.02978372573852539, 0.030761003494262695, 0.03173828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 8.0, 10.0, 9.0, 7.0, 14.0, 20.0, 9.0, 21.0, 29.0, 34.0, 37.0, 37.0, 58.0, 50.0, 57.0, 46.0, 55.0, 50.0, 59.0, 33.0, 51.0, 45.0, 41.0, 38.0, 32.0, 20.0, 25.0, 24.0, 22.0, 12.0, 6.0, 9.0, 4.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.007419586181640625, -0.007188856601715088, -0.006958127021789551, -0.006727397441864014, -0.0064966678619384766, -0.0062659382820129395, -0.006035208702087402, -0.005804479122161865, -0.005573749542236328, -0.005343019962310791, -0.005112290382385254, -0.004881560802459717, -0.00465083122253418, -0.004420101642608643, -0.0041893720626831055, -0.003958642482757568, -0.0037279129028320312, -0.003497183322906494, -0.003266453742980957, -0.00303572416305542, -0.002804994583129883, -0.0025742650032043457, -0.0023435354232788086, -0.0021128058433532715, -0.0018820762634277344, -0.0016513466835021973, -0.0014206171035766602, -0.001189887523651123, -0.0009591579437255859, -0.0007284283638000488, -0.0004976987838745117, -0.0002669692039489746, -3.62396240234375e-05, 0.0001944899559020996, 0.0004252195358276367, 0.0006559491157531738, 0.0008866786956787109, 0.001117408275604248, 0.0013481378555297852, 0.0015788674354553223, 0.0018095970153808594, 0.0020403265953063965, 0.0022710561752319336, 0.0025017857551574707, 0.002732515335083008, 0.002963244915008545, 0.003193974494934082, 0.003424704074859619, 0.0036554336547851562, 0.0038861632347106934, 0.0041168928146362305, 0.004347622394561768, 0.004578351974487305, 0.004809081554412842, 0.005039811134338379, 0.005270540714263916, 0.005501270294189453, 0.00573199987411499, 0.005962729454040527, 0.0061934590339660645, 0.0064241886138916016, 0.006654918193817139, 0.006885647773742676, 0.007116377353668213, 0.00734710693359375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 11.0, 80.0, 377.0, 440.0, 82.0, 19.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4104955196380615, -3.3347394466400146, -3.258983612060547, -3.1832275390625, -3.107471466064453, -3.0317153930664062, -2.9559593200683594, -2.8802034854888916, -2.8044474124908447, -2.728691339492798, -2.65293550491333, -2.577179431915283, -2.5014233589172363, -2.4256672859191895, -2.3499112129211426, -2.274155378341675, -2.198399305343628, -2.122643232345581, -2.0468873977661133, -1.9711313247680664, -1.8953752517700195, -1.8196191787719727, -1.7438632249832153, -1.668107271194458, -1.5923511981964111, -1.5165951251983643, -1.440839171409607, -1.3650832176208496, -1.2893271446228027, -1.2135710716247559, -1.1378151178359985, -1.0620591640472412, -0.9863032102584839, -0.9105471968650818, -0.8347911834716797, -0.7590351700782776, -0.6832791566848755, -0.6075231432914734, -0.5317671298980713, -0.4560111165046692, -0.3802551031112671, -0.304499089717865, -0.2287430763244629, -0.1529870629310608, -0.07723104953765869, -0.0014750361442565918, 0.07428097724914551, 0.1500369906425476, 0.2257930040359497, 0.3015490174293518, 0.3773050308227539, 0.453061044216156, 0.5288170576095581, 0.6045730710029602, 0.6803290843963623, 0.7560850977897644, 0.8318411111831665, 0.9075971245765686, 0.9833531379699707, 1.0591092109680176, 1.134865164756775, 1.2106211185455322, 1.286377191543579, 1.362133264541626, 1.4378892183303833]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 7.0, 7.0, 18.0, 24.0, 34.0, 55.0, 56.0, 77.0, 98.0, 83.0, 98.0, 77.0, 86.0, 64.0, 65.0, 48.0, 31.0, 29.0, 14.0, 8.0, 5.0, 9.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34692132472991943, -0.33067426085472107, -0.3144271969795227, -0.29818010330200195, -0.2819330394268036, -0.2656859755516052, -0.24943889677524567, -0.2331918179988861, -0.21694475412368774, -0.20069769024848938, -0.18445061147212982, -0.16820353269577026, -0.1519564688205719, -0.13570940494537354, -0.11946232616901398, -0.10321525484323502, -0.08696818351745605, -0.0707211121916771, -0.05447404086589813, -0.03822696954011917, -0.02197989821434021, -0.005732826888561249, 0.010514244437217712, 0.026761315762996674, 0.043008387088775635, 0.059255458414554596, 0.07550252974033356, 0.09174960106611252, 0.10799667239189148, 0.12424374371767044, 0.1404908150434494, 0.15673789381980896, 0.1729850172996521, 0.18923208117485046, 0.20547915995121002, 0.22172623872756958, 0.23797330260276794, 0.2542203664779663, 0.27046746015548706, 0.2867145240306854, 0.3029615879058838, 0.31920865178108215, 0.3354557156562805, 0.35170280933380127, 0.36794987320899963, 0.384196937084198, 0.40044403076171875, 0.4166910946369171, 0.4329381585121155, 0.44918522238731384, 0.4654322862625122, 0.48167937994003296, 0.4979264438152313, 0.5141735076904297, 0.5304206013679504, 0.5466676354408264, 0.5629147291183472, 0.5791618227958679, 0.5954088568687439, 0.6116559505462646, 0.6279029846191406, 0.6441500782966614, 0.6603971719741821, 0.6766442060470581, 0.6928912997245789]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 5.0, 4.0, 7.0, 11.0, 22.0, 14.0, 33.0, 48.0, 62.0, 99.0, 178.0, 291.0, 562.0, 1106.0, 2207.0, 5366.0, 15084.0, 48032.0, 325398.0, 553947.0, 64402.0, 19312.0, 6896.0, 2703.0, 1247.0, 661.0, 304.0, 174.0, 132.0, 92.0, 48.0, 39.0, 19.0, 12.0, 9.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.362060546875, -0.35003662109375, -0.3380126953125, -0.32598876953125, -0.31396484375, -0.30194091796875, -0.2899169921875, -0.27789306640625, -0.265869140625, -0.25384521484375, -0.2418212890625, -0.22979736328125, -0.2177734375, -0.20574951171875, -0.1937255859375, -0.18170166015625, -0.169677734375, -0.15765380859375, -0.1456298828125, -0.13360595703125, -0.12158203125, -0.10955810546875, -0.0975341796875, -0.08551025390625, -0.073486328125, -0.06146240234375, -0.0494384765625, -0.03741455078125, -0.025390625, -0.01336669921875, -0.0013427734375, 0.01068115234375, 0.022705078125, 0.03472900390625, 0.0467529296875, 0.05877685546875, 0.07080078125, 0.08282470703125, 0.0948486328125, 0.10687255859375, 0.118896484375, 0.13092041015625, 0.1429443359375, 0.15496826171875, 0.1669921875, 0.17901611328125, 0.1910400390625, 0.20306396484375, 0.215087890625, 0.22711181640625, 0.2391357421875, 0.25115966796875, 0.26318359375, 0.27520751953125, 0.2872314453125, 0.29925537109375, 0.311279296875, 0.32330322265625, 0.3353271484375, 0.34735107421875, 0.359375, 0.37139892578125, 0.3834228515625, 0.39544677734375, 0.407470703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 8.0, 10.0, 21.0, 36.0, 32.0, 56.0, 63.0, 74.0, 90.0, 94.0, 81.0, 76.0, 72.0, 67.0, 54.0, 43.0, 31.0, 38.0, 14.0, 11.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7587890625, -0.7298431396484375, -0.700897216796875, -0.6719512939453125, -0.64300537109375, -0.6140594482421875, -0.585113525390625, -0.5561676025390625, -0.5272216796875, -0.4982757568359375, -0.469329833984375, -0.4403839111328125, -0.41143798828125, -0.3824920654296875, -0.353546142578125, -0.3246002197265625, -0.295654296875, -0.2667083740234375, -0.237762451171875, -0.2088165283203125, -0.17987060546875, -0.1509246826171875, -0.121978759765625, -0.0930328369140625, -0.0640869140625, -0.0351409912109375, -0.006195068359375, 0.0227508544921875, 0.05169677734375, 0.0806427001953125, 0.109588623046875, 0.1385345458984375, 0.16748046875, 0.1964263916015625, 0.225372314453125, 0.2543182373046875, 0.28326416015625, 0.3122100830078125, 0.341156005859375, 0.3701019287109375, 0.3990478515625, 0.4279937744140625, 0.456939697265625, 0.4858856201171875, 0.51483154296875, 0.5437774658203125, 0.572723388671875, 0.6016693115234375, 0.630615234375, 0.6595611572265625, 0.688507080078125, 0.7174530029296875, 0.74639892578125, 0.7753448486328125, 0.804290771484375, 0.8332366943359375, 0.8621826171875, 0.8911285400390625, 0.920074462890625, 0.9490203857421875, 0.97796630859375, 1.0069122314453125, 1.035858154296875, 1.0648040771484375, 1.09375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 10.0, 12.0, 16.0, 8.0, 24.0, 25.0, 33.0, 39.0, 49.0, 76.0, 86.0, 93.0, 144.0, 190.0, 264.0, 401.0, 831.0, 2680.0, 18356.0, 399937.0, 597362.0, 22287.0, 3113.0, 880.0, 447.0, 300.0, 193.0, 151.0, 112.0, 95.0, 68.0, 53.0, 42.0, 34.0, 37.0, 18.0, 8.0, 14.0, 18.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6474609375, -0.6251678466796875, -0.602874755859375, -0.5805816650390625, -0.55828857421875, -0.5359954833984375, -0.513702392578125, -0.4914093017578125, -0.4691162109375, -0.4468231201171875, -0.424530029296875, -0.4022369384765625, -0.37994384765625, -0.3576507568359375, -0.335357666015625, -0.3130645751953125, -0.290771484375, -0.2684783935546875, -0.246185302734375, -0.2238922119140625, -0.20159912109375, -0.1793060302734375, -0.157012939453125, -0.1347198486328125, -0.1124267578125, -0.0901336669921875, -0.067840576171875, -0.0455474853515625, -0.02325439453125, -0.0009613037109375, 0.021331787109375, 0.0436248779296875, 0.06591796875, 0.0882110595703125, 0.110504150390625, 0.1327972412109375, 0.15509033203125, 0.1773834228515625, 0.199676513671875, 0.2219696044921875, 0.2442626953125, 0.2665557861328125, 0.288848876953125, 0.3111419677734375, 0.33343505859375, 0.3557281494140625, 0.378021240234375, 0.4003143310546875, 0.422607421875, 0.4449005126953125, 0.467193603515625, 0.4894866943359375, 0.51177978515625, 0.5340728759765625, 0.556365966796875, 0.5786590576171875, 0.6009521484375, 0.6232452392578125, 0.645538330078125, 0.6678314208984375, 0.69012451171875, 0.7124176025390625, 0.734710693359375, 0.7570037841796875, 0.779296875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 9.0, 5.0, 5.0, 10.0, 7.0, 17.0, 15.0, 14.0, 27.0, 22.0, 34.0, 49.0, 48.0, 47.0, 58.0, 63.0, 62.0, 55.0, 61.0, 64.0, 35.0, 34.0, 52.0, 25.0, 27.0, 27.0, 20.0, 15.0, 20.0, 13.0, 6.0, 11.0, 13.0, 8.0, 10.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.79833984375, -0.7741470336914062, -0.7499542236328125, -0.7257614135742188, -0.701568603515625, -0.6773757934570312, -0.6531829833984375, -0.6289901733398438, -0.60479736328125, -0.5806045532226562, -0.5564117431640625, -0.5322189331054688, -0.508026123046875, -0.48383331298828125, -0.4596405029296875, -0.43544769287109375, -0.4112548828125, -0.38706207275390625, -0.3628692626953125, -0.33867645263671875, -0.314483642578125, -0.29029083251953125, -0.2660980224609375, -0.24190521240234375, -0.21771240234375, -0.19351959228515625, -0.1693267822265625, -0.14513397216796875, -0.120941162109375, -0.09674835205078125, -0.0725555419921875, -0.04836273193359375, -0.024169921875, 2.288818359375e-05, 0.0242156982421875, 0.04840850830078125, 0.072601318359375, 0.09679412841796875, 0.1209869384765625, 0.14517974853515625, 0.16937255859375, 0.19356536865234375, 0.2177581787109375, 0.24195098876953125, 0.266143798828125, 0.29033660888671875, 0.3145294189453125, 0.33872222900390625, 0.3629150390625, 0.38710784912109375, 0.4113006591796875, 0.43549346923828125, 0.459686279296875, 0.48387908935546875, 0.5080718994140625, 0.5322647094726562, 0.55645751953125, 0.5806503295898438, 0.6048431396484375, 0.6290359497070312, 0.653228759765625, 0.6774215698242188, 0.7016143798828125, 0.7258071899414062, 0.75]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 11.0, 10.0, 27.0, 24.0, 52.0, 82.0, 112.0, 169.0, 294.0, 490.0, 1359.0, 7062.0, 808364.0, 223268.0, 4811.0, 1141.0, 492.0, 286.0, 146.0, 122.0, 76.0, 45.0, 44.0, 17.0, 19.0, 4.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.5712890625, -0.5576591491699219, -0.5440292358398438, -0.5303993225097656, -0.5167694091796875, -0.5031394958496094, -0.48950958251953125, -0.4758796691894531, -0.462249755859375, -0.4486198425292969, -0.43498992919921875, -0.4213600158691406, -0.4077301025390625, -0.3941001892089844, -0.38047027587890625, -0.3668403625488281, -0.35321044921875, -0.3395805358886719, -0.32595062255859375, -0.3123207092285156, -0.2986907958984375, -0.2850608825683594, -0.27143096923828125, -0.2578010559082031, -0.244171142578125, -0.23054122924804688, -0.21691131591796875, -0.20328140258789062, -0.1896514892578125, -0.17602157592773438, -0.16239166259765625, -0.14876174926757812, -0.1351318359375, -0.12150192260742188, -0.10787200927734375, -0.09424209594726562, -0.0806121826171875, -0.06698226928710938, -0.05335235595703125, -0.039722442626953125, -0.026092529296875, -0.012462615966796875, 0.00116729736328125, 0.014797210693359375, 0.0284271240234375, 0.042057037353515625, 0.05568695068359375, 0.06931686401367188, 0.08294677734375, 0.09657669067382812, 0.11020660400390625, 0.12383651733398438, 0.1374664306640625, 0.15109634399414062, 0.16472625732421875, 0.17835617065429688, 0.191986083984375, 0.20561599731445312, 0.21924591064453125, 0.23287582397460938, 0.2465057373046875, 0.2601356506347656, 0.27376556396484375, 0.2873954772949219, 0.301025390625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 18.0, 50.0, 153.0, 559.0, 129.0, 46.0, 17.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6193599700927734e-05, -4.337821155786514e-05, -4.056282341480255e-05, -3.774743527173996e-05, -3.493204712867737e-05, -3.2116658985614777e-05, -2.9301270842552185e-05, -2.6485882699489594e-05, -2.3670494556427002e-05, -2.085510641336441e-05, -1.803971827030182e-05, -1.5224330127239227e-05, -1.2408941984176636e-05, -9.593553841114044e-06, -6.778165698051453e-06, -3.962777554988861e-06, -1.1473894119262695e-06, 1.667998731136322e-06, 4.4833868741989136e-06, 7.298775017261505e-06, 1.0114163160324097e-05, 1.2929551303386688e-05, 1.574493944644928e-05, 1.856032758951187e-05, 2.1375715732574463e-05, 2.4191103875637054e-05, 2.7006492018699646e-05, 2.9821880161762238e-05, 3.263726830482483e-05, 3.545265644788742e-05, 3.826804459095001e-05, 4.1083432734012604e-05, 4.3898820877075195e-05, 4.671420902013779e-05, 4.952959716320038e-05, 5.234498530626297e-05, 5.516037344932556e-05, 5.797576159238815e-05, 6.0791149735450745e-05, 6.360653787851334e-05, 6.642192602157593e-05, 6.923731416463852e-05, 7.205270230770111e-05, 7.48680904507637e-05, 7.76834785938263e-05, 8.049886673688889e-05, 8.331425487995148e-05, 8.612964302301407e-05, 8.894503116607666e-05, 9.176041930913925e-05, 9.457580745220184e-05, 9.739119559526443e-05, 0.00010020658373832703, 0.00010302197188138962, 0.00010583736002445221, 0.0001086527481675148, 0.00011146813631057739, 0.00011428352445363998, 0.00011709891259670258, 0.00011991430073976517, 0.00012272968888282776, 0.00012554507702589035, 0.00012836046516895294, 0.00013117585331201553, 0.00013399124145507812]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 3.0, 9.0, 5.0, 8.0, 21.0, 20.0, 29.0, 43.0, 48.0, 69.0, 106.0, 189.0, 231.0, 391.0, 745.0, 2246.0, 20026.0, 951936.0, 66099.0, 3951.0, 986.0, 497.0, 276.0, 216.0, 124.0, 83.0, 53.0, 41.0, 21.0, 21.0, 14.0, 14.0, 10.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3447265625, -0.33074951171875, -0.3167724609375, -0.30279541015625, -0.288818359375, -0.27484130859375, -0.2608642578125, -0.24688720703125, -0.23291015625, -0.21893310546875, -0.2049560546875, -0.19097900390625, -0.177001953125, -0.16302490234375, -0.1490478515625, -0.13507080078125, -0.12109375, -0.10711669921875, -0.0931396484375, -0.07916259765625, -0.065185546875, -0.05120849609375, -0.0372314453125, -0.02325439453125, -0.00927734375, 0.00469970703125, 0.0186767578125, 0.03265380859375, 0.046630859375, 0.06060791015625, 0.0745849609375, 0.08856201171875, 0.1025390625, 0.11651611328125, 0.1304931640625, 0.14447021484375, 0.158447265625, 0.17242431640625, 0.1864013671875, 0.20037841796875, 0.21435546875, 0.22833251953125, 0.2423095703125, 0.25628662109375, 0.270263671875, 0.28424072265625, 0.2982177734375, 0.31219482421875, 0.326171875, 0.34014892578125, 0.3541259765625, 0.36810302734375, 0.382080078125, 0.39605712890625, 0.4100341796875, 0.42401123046875, 0.43798828125, 0.45196533203125, 0.4659423828125, 0.47991943359375, 0.493896484375, 0.50787353515625, 0.5218505859375, 0.53582763671875, 0.5498046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 10.0, 10.0, 15.0, 40.0, 44.0, 89.0, 194.0, 282.0, 137.0, 58.0, 41.0, 29.0, 14.0, 7.0, 10.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10825538635253906, -0.10469436645507812, -0.10113334655761719, -0.09757232666015625, -0.09401130676269531, -0.09045028686523438, -0.08688926696777344, -0.0833282470703125, -0.07976722717285156, -0.07620620727539062, -0.07264518737792969, -0.06908416748046875, -0.06552314758300781, -0.061962127685546875, -0.05840110778808594, -0.054840087890625, -0.05127906799316406, -0.047718048095703125, -0.04415702819824219, -0.04059600830078125, -0.03703498840332031, -0.033473968505859375, -0.029912948608398438, -0.0263519287109375, -0.022790908813476562, -0.019229888916015625, -0.015668869018554688, -0.01210784912109375, -0.008546829223632812, -0.004985809326171875, -0.0014247894287109375, 0.00213623046875, 0.0056972503662109375, 0.009258270263671875, 0.012819290161132812, 0.01638031005859375, 0.019941329956054688, 0.023502349853515625, 0.027063369750976562, 0.0306243896484375, 0.03418540954589844, 0.037746429443359375, 0.04130744934082031, 0.04486846923828125, 0.04842948913574219, 0.051990509033203125, 0.05555152893066406, 0.059112548828125, 0.06267356872558594, 0.06623458862304688, 0.06979560852050781, 0.07335662841796875, 0.07691764831542969, 0.08047866821289062, 0.08403968811035156, 0.0876007080078125, 0.09116172790527344, 0.09472274780273438, 0.09828376770019531, 0.10184478759765625, 0.10540580749511719, 0.10896682739257812, 0.11252784729003906, 0.1160888671875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 23.0, 46.0, 114.0, 200.0, 239.0, 197.0, 99.0, 43.0, 24.0, 9.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.612043857574463, -2.543992519378662, -2.4759409427642822, -2.4078896045684814, -2.3398382663726807, -2.271786689758301, -2.2037353515625, -2.135684013366699, -2.0676324367523193, -1.999580979347229, -1.9315296411514282, -1.863478183746338, -1.7954267263412476, -1.7273752689361572, -1.6593239307403564, -1.5912724733352661, -1.5232211351394653, -1.455169677734375, -1.3871183395385742, -1.3190668821334839, -1.2510154247283936, -1.1829640865325928, -1.1149126291275024, -1.046861171722412, -0.9788097739219666, -0.910758376121521, -0.8427069187164307, -0.7746555209159851, -0.7066041231155396, -0.6385526657104492, -0.5705012679100037, -0.5024498701095581, -0.4343982934951782, -0.3663468658924103, -0.29829543828964233, -0.23024404048919678, -0.16219261288642883, -0.09414118528366089, -0.026089787483215332, 0.04196164011955261, 0.11001306772232056, 0.1780644953250885, 0.24611590802669525, 0.314167320728302, 0.38221874833106995, 0.4502701759338379, 0.5183215737342834, 0.586372971534729, 0.6544244289398193, 0.7224758267402649, 0.7905272841453552, 0.8585786819458008, 0.9266301393508911, 0.9946815371513367, 1.0627329349517822, 1.1307843923568726, 1.198835849761963, 1.2668873071670532, 1.334938645362854, 1.4029901027679443, 1.4710415601730347, 1.539093017578125, 1.6071443557739258, 1.6751958131790161, 1.743247151374817]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 9.0, 6.0, 5.0, 7.0, 7.0, 9.0, 10.0, 18.0, 26.0, 28.0, 23.0, 25.0, 37.0, 26.0, 45.0, 34.0, 41.0, 47.0, 37.0, 47.0, 42.0, 34.0, 44.0, 48.0, 41.0, 39.0, 46.0, 30.0, 27.0, 28.0, 23.0, 15.0, 22.0, 15.0, 13.0, 5.0, 12.0, 7.0, 6.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0844839811325073, -1.0528457164764404, -1.0212074518203735, -0.9895691275596619, -0.9579308032989502, -0.9262925386428833, -0.8946542739868164, -0.8630160093307495, -0.8313776850700378, -0.799739420413971, -0.7681010961532593, -0.7364628314971924, -0.7048245668411255, -0.6731862425804138, -0.6415479779243469, -0.6099096536636353, -0.5782713890075684, -0.5466331243515015, -0.5149948000907898, -0.4833565354347229, -0.4517182409763336, -0.42007994651794434, -0.38844168186187744, -0.35680338740348816, -0.3251650929450989, -0.2935267984867096, -0.2618885040283203, -0.23025023937225342, -0.19861194491386414, -0.16697365045547485, -0.13533537089824677, -0.10369709134101868, -0.0720587968826294, -0.04042050987482071, -0.008782222867012024, 0.02285606414079666, 0.05449435114860535, 0.08613264560699463, 0.11777092516422272, 0.1494092047214508, 0.1810474991798401, 0.21268579363822937, 0.24432407319545746, 0.27596235275268555, 0.30760064721107483, 0.3392389416694641, 0.370877206325531, 0.4025155007839203, 0.43415379524230957, 0.46579208970069885, 0.49743038415908813, 0.529068648815155, 0.5607069730758667, 0.5923452377319336, 0.6239835023880005, 0.6556217670440674, 0.687260091304779, 0.718898355960846, 0.7505366802215576, 0.7821749448776245, 0.8138132095336914, 0.8454515337944031, 0.87708979845047, 0.9087281227111816, 0.9403663873672485]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 9.0, 4.0, 5.0, 10.0, 15.0, 7.0, 10.0, 8.0, 20.0, 22.0, 25.0, 28.0, 39.0, 47.0, 59.0, 105.0, 199.0, 606.0, 2646.0, 63580.0, 4069588.0, 53486.0, 2598.0, 559.0, 191.0, 86.0, 61.0, 46.0, 32.0, 24.0, 23.0, 19.0, 12.0, 24.0, 18.0, 11.0, 12.0, 6.0, 10.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.785186767578125, -1.72662353515625, -1.668060302734375, -1.6094970703125, -1.550933837890625, -1.49237060546875, -1.433807373046875, -1.375244140625, -1.316680908203125, -1.25811767578125, -1.199554443359375, -1.1409912109375, -1.082427978515625, -1.02386474609375, -0.965301513671875, -0.90673828125, -0.848175048828125, -0.78961181640625, -0.731048583984375, -0.6724853515625, -0.613922119140625, -0.55535888671875, -0.496795654296875, -0.438232421875, -0.379669189453125, -0.32110595703125, -0.262542724609375, -0.2039794921875, -0.145416259765625, -0.08685302734375, -0.028289794921875, 0.0302734375, 0.088836669921875, 0.14739990234375, 0.205963134765625, 0.2645263671875, 0.323089599609375, 0.38165283203125, 0.440216064453125, 0.498779296875, 0.557342529296875, 0.61590576171875, 0.674468994140625, 0.7330322265625, 0.791595458984375, 0.85015869140625, 0.908721923828125, 0.96728515625, 1.025848388671875, 1.08441162109375, 1.142974853515625, 1.2015380859375, 1.260101318359375, 1.31866455078125, 1.377227783203125, 1.435791015625, 1.494354248046875, 1.55291748046875, 1.611480712890625, 1.6700439453125, 1.728607177734375, 1.78717041015625, 1.845733642578125, 1.904296875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 0.0, 1.0, 4.0, 8.0, 7.0, 12.0, 16.0, 15.0, 21.0, 27.0, 34.0, 32.0, 44.0, 54.0, 67.0, 56.0, 64.0, 59.0, 63.0, 70.0, 51.0, 59.0, 46.0, 26.0, 38.0, 27.0, 21.0, 16.0, 11.0, 16.0, 9.0, 8.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429931640625, -0.4167518615722656, -0.40357208251953125, -0.3903923034667969, -0.3772125244140625, -0.3640327453613281, -0.35085296630859375, -0.3376731872558594, -0.324493408203125, -0.3113136291503906, -0.29813385009765625, -0.2849540710449219, -0.2717742919921875, -0.2585945129394531, -0.24541473388671875, -0.23223495483398438, -0.21905517578125, -0.20587539672851562, -0.19269561767578125, -0.17951583862304688, -0.1663360595703125, -0.15315628051757812, -0.13997650146484375, -0.12679672241210938, -0.113616943359375, -0.10043716430664062, -0.08725738525390625, -0.07407760620117188, -0.0608978271484375, -0.047718048095703125, -0.03453826904296875, -0.021358489990234375, -0.0081787109375, 0.005001068115234375, 0.01818084716796875, 0.031360626220703125, 0.0445404052734375, 0.057720184326171875, 0.07089996337890625, 0.08407974243164062, 0.097259521484375, 0.11043930053710938, 0.12361907958984375, 0.13679885864257812, 0.1499786376953125, 0.16315841674804688, 0.17633819580078125, 0.18951797485351562, 0.20269775390625, 0.21587753295898438, 0.22905731201171875, 0.24223709106445312, 0.2554168701171875, 0.2685966491699219, 0.28177642822265625, 0.2949562072753906, 0.308135986328125, 0.3213157653808594, 0.33449554443359375, 0.3476753234863281, 0.3608551025390625, 0.3740348815917969, 0.38721466064453125, 0.4003944396972656, 0.41357421875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 13.0, 10.0, 24.0, 70.0, 131.0, 410.0, 2034.0, 50873.0, 4095458.0, 42518.0, 2070.0, 394.0, 141.0, 64.0, 30.0, 19.0, 12.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1416015625, -1.0858612060546875, -1.030120849609375, -0.9743804931640625, -0.91864013671875, -0.8628997802734375, -0.807159423828125, -0.7514190673828125, -0.6956787109375, -0.6399383544921875, -0.584197998046875, -0.5284576416015625, -0.47271728515625, -0.4169769287109375, -0.361236572265625, -0.3054962158203125, -0.249755859375, -0.1940155029296875, -0.138275146484375, -0.0825347900390625, -0.02679443359375, 0.0289459228515625, 0.084686279296875, 0.1404266357421875, 0.1961669921875, 0.2519073486328125, 0.307647705078125, 0.3633880615234375, 0.41912841796875, 0.4748687744140625, 0.530609130859375, 0.5863494873046875, 0.64208984375, 0.6978302001953125, 0.753570556640625, 0.8093109130859375, 0.86505126953125, 0.9207916259765625, 0.976531982421875, 1.0322723388671875, 1.0880126953125, 1.1437530517578125, 1.199493408203125, 1.2552337646484375, 1.31097412109375, 1.3667144775390625, 1.422454833984375, 1.4781951904296875, 1.533935546875, 1.5896759033203125, 1.645416259765625, 1.7011566162109375, 1.75689697265625, 1.8126373291015625, 1.868377685546875, 1.9241180419921875, 1.9798583984375, 2.0355987548828125, 2.091339111328125, 2.1470794677734375, 2.20281982421875, 2.2585601806640625, 2.314300537109375, 2.3700408935546875, 2.42578125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 8.0, 9.0, 8.0, 20.0, 29.0, 66.0, 154.0, 287.0, 630.0, 1154.0, 896.0, 439.0, 186.0, 102.0, 46.0, 19.0, 13.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.48681640625, -0.47702980041503906, -0.4672431945800781, -0.4574565887451172, -0.44766998291015625, -0.4378833770751953, -0.4280967712402344, -0.41831016540527344, -0.4085235595703125, -0.39873695373535156, -0.3889503479003906, -0.3791637420654297, -0.36937713623046875, -0.3595905303955078, -0.3498039245605469, -0.34001731872558594, -0.330230712890625, -0.32044410705566406, -0.3106575012207031, -0.3008708953857422, -0.29108428955078125, -0.2812976837158203, -0.2715110778808594, -0.26172447204589844, -0.2519378662109375, -0.24215126037597656, -0.23236465454101562, -0.2225780487060547, -0.21279144287109375, -0.2030048370361328, -0.19321823120117188, -0.18343162536621094, -0.17364501953125, -0.16385841369628906, -0.15407180786132812, -0.1442852020263672, -0.13449859619140625, -0.12471199035644531, -0.11492538452148438, -0.10513877868652344, -0.0953521728515625, -0.08556556701660156, -0.07577896118164062, -0.06599235534667969, -0.05620574951171875, -0.04641914367675781, -0.036632537841796875, -0.026845932006835938, -0.017059326171875, -0.0072727203369140625, 0.002513885498046875, 0.012300491333007812, 0.02208709716796875, 0.03187370300292969, 0.041660308837890625, 0.05144691467285156, 0.0612335205078125, 0.07102012634277344, 0.08080673217773438, 0.09059333801269531, 0.10037994384765625, 0.11016654968261719, 0.11995315551757812, 0.12973976135253906, 0.1395263671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 12.0, 27.0, 47.0, 68.0, 84.0, 127.0, 147.0, 161.0, 102.0, 96.0, 51.0, 29.0, 19.0, 12.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.293984293937683, -1.2637734413146973, -1.2335625886917114, -1.2033517360687256, -1.1731407642364502, -1.1429299116134644, -1.1127190589904785, -1.0825082063674927, -1.0522973537445068, -1.022086501121521, -0.9918756484985352, -0.9616647362709045, -0.9314538836479187, -0.9012430310249329, -0.8710321187973022, -0.8408212661743164, -0.8106104135513306, -0.7803995609283447, -0.7501887083053589, -0.7199777960777283, -0.6897669434547424, -0.6595560908317566, -0.629345178604126, -0.5991343259811401, -0.5689234733581543, -0.5387126207351685, -0.5085017681121826, -0.478290855884552, -0.44808000326156616, -0.4178691506385803, -0.3876582682132721, -0.35744738578796387, -0.32723647356033325, -0.2970256209373474, -0.2668147385120392, -0.23660387098789215, -0.20639300346374512, -0.17618213593959808, -0.14597126841545105, -0.11576040089130402, -0.08554953336715698, -0.05533866584300995, -0.025127798318862915, 0.005083069205284119, 0.03529393672943115, 0.06550480425357819, 0.09571567177772522, 0.12592653930187225, 0.1561374068260193, 0.18634827435016632, 0.21655914187431335, 0.2467700093984604, 0.2769808769226074, 0.30719172954559326, 0.3374026119709015, 0.3676134943962097, 0.39782434701919556, 0.4280351996421814, 0.4582460820674896, 0.48845696449279785, 0.5186678171157837, 0.5488786697387695, 0.5790895223617554, 0.609300434589386, 0.6395112872123718]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 8.0, 4.0, 14.0, 12.0, 18.0, 22.0, 28.0, 33.0, 29.0, 32.0, 32.0, 40.0, 42.0, 54.0, 66.0, 46.0, 52.0, 56.0, 43.0, 46.0, 53.0, 36.0, 36.0, 42.0, 26.0, 19.0, 24.0, 16.0, 17.0, 13.0, 5.0, 6.0, 8.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38227951526641846, -0.368903249502182, -0.35552698373794556, -0.3421507179737091, -0.32877445220947266, -0.3153982162475586, -0.30202195048332214, -0.2886456847190857, -0.27526941895484924, -0.2618931531906128, -0.24851688742637634, -0.2351406365633011, -0.22176437079906464, -0.20838810503482819, -0.19501185417175293, -0.18163558840751648, -0.16825932264328003, -0.15488305687904358, -0.14150679111480713, -0.12813054025173187, -0.11475427448749542, -0.10137800872325897, -0.08800175040960312, -0.07462549209594727, -0.061249226331710815, -0.047872964292764664, -0.03449670225381851, -0.02112044021487236, -0.0077441781759262085, 0.005632087588310242, 0.019008345901966095, 0.03238460421562195, 0.045760899782180786, 0.05913716182112694, 0.07251342386007309, 0.08588968217372894, 0.0992659479379654, 0.11264221370220184, 0.1260184645652771, 0.13939473032951355, 0.15277099609375, 0.16614726185798645, 0.1795235276222229, 0.19289977848529816, 0.2062760442495346, 0.21965231001377106, 0.2330285608768463, 0.24640482664108276, 0.2597810924053192, 0.27315735816955566, 0.2865336239337921, 0.29990988969802856, 0.3132861256599426, 0.32666242122650146, 0.3400386571884155, 0.353414922952652, 0.3667911887168884, 0.3801674544811249, 0.39354372024536133, 0.4069199860095978, 0.42029625177383423, 0.4336724877357483, 0.44704875349998474, 0.4604250192642212, 0.47380128502845764]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 0.0, 5.0, 4.0, 6.0, 7.0, 11.0, 26.0, 54.0, 125.0, 416.0, 2088.0, 11373.0, 162061.0, 835448.0, 30825.0, 4753.0, 948.0, 223.0, 68.0, 41.0, 15.0, 13.0, 8.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5966796875, -0.5806617736816406, -0.5646438598632812, -0.5486259460449219, -0.5326080322265625, -0.5165901184082031, -0.5005722045898438, -0.4845542907714844, -0.468536376953125, -0.4525184631347656, -0.43650054931640625, -0.4204826354980469, -0.4044647216796875, -0.3884468078613281, -0.37242889404296875, -0.3564109802246094, -0.34039306640625, -0.3243751525878906, -0.30835723876953125, -0.2923393249511719, -0.2763214111328125, -0.2603034973144531, -0.24428558349609375, -0.22826766967773438, -0.212249755859375, -0.19623184204101562, -0.18021392822265625, -0.16419601440429688, -0.1481781005859375, -0.13216018676757812, -0.11614227294921875, -0.10012435913085938, -0.0841064453125, -0.06808853149414062, -0.05207061767578125, -0.036052703857421875, -0.0200347900390625, -0.004016876220703125, 0.01200103759765625, 0.028018951416015625, 0.044036865234375, 0.060054779052734375, 0.07607269287109375, 0.09209060668945312, 0.1081085205078125, 0.12412643432617188, 0.14014434814453125, 0.15616226196289062, 0.17218017578125, 0.18819808959960938, 0.20421600341796875, 0.22023391723632812, 0.2362518310546875, 0.2522697448730469, 0.26828765869140625, 0.2843055725097656, 0.300323486328125, 0.3163414001464844, 0.33235931396484375, 0.3483772277832031, 0.3643951416015625, 0.3804130554199219, 0.39643096923828125, 0.4124488830566406, 0.428466796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 10.0, 7.0, 21.0, 18.0, 18.0, 24.0, 24.0, 30.0, 31.0, 38.0, 37.0, 28.0, 47.0, 48.0, 61.0, 36.0, 56.0, 57.0, 53.0, 42.0, 45.0, 37.0, 37.0, 34.0, 17.0, 27.0, 22.0, 20.0, 16.0, 13.0, 6.0, 3.0, 6.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.265380859375, -0.25646209716796875, -0.2475433349609375, -0.23862457275390625, -0.229705810546875, -0.22078704833984375, -0.2118682861328125, -0.20294952392578125, -0.19403076171875, -0.18511199951171875, -0.1761932373046875, -0.16727447509765625, -0.158355712890625, -0.14943695068359375, -0.1405181884765625, -0.13159942626953125, -0.1226806640625, -0.11376190185546875, -0.1048431396484375, -0.09592437744140625, -0.087005615234375, -0.07808685302734375, -0.0691680908203125, -0.06024932861328125, -0.05133056640625, -0.04241180419921875, -0.0334930419921875, -0.02457427978515625, -0.015655517578125, -0.00673675537109375, 0.0021820068359375, 0.01110076904296875, 0.02001953125, 0.02893829345703125, 0.0378570556640625, 0.04677581787109375, 0.055694580078125, 0.06461334228515625, 0.0735321044921875, 0.08245086669921875, 0.09136962890625, 0.10028839111328125, 0.1092071533203125, 0.11812591552734375, 0.127044677734375, 0.13596343994140625, 0.1448822021484375, 0.15380096435546875, 0.1627197265625, 0.17163848876953125, 0.1805572509765625, 0.18947601318359375, 0.198394775390625, 0.20731353759765625, 0.2162322998046875, 0.22515106201171875, 0.23406982421875, 0.24298858642578125, 0.2519073486328125, 0.26082611083984375, 0.269744873046875, 0.27866363525390625, 0.2875823974609375, 0.29650115966796875, 0.305419921875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 6.0, 10.0, 9.0, 16.0, 7.0, 24.0, 29.0, 56.0, 77.0, 102.0, 157.0, 257.0, 363.0, 566.0, 994.0, 1598.0, 2863.0, 5377.0, 11250.0, 26975.0, 80310.0, 253380.0, 394274.0, 176427.0, 54745.0, 19895.0, 8494.0, 4363.0, 2291.0, 1336.0, 791.0, 507.0, 321.0, 219.0, 128.0, 103.0, 65.0, 45.0, 38.0, 24.0, 17.0, 11.0, 11.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.11004638671875, -0.1068410873413086, -0.10363578796386719, -0.10043048858642578, -0.09722518920898438, -0.09401988983154297, -0.09081459045410156, -0.08760929107666016, -0.08440399169921875, -0.08119869232177734, -0.07799339294433594, -0.07478809356689453, -0.07158279418945312, -0.06837749481201172, -0.06517219543457031, -0.061966896057128906, -0.0587615966796875, -0.055556297302246094, -0.05235099792480469, -0.04914569854736328, -0.045940399169921875, -0.04273509979248047, -0.03952980041503906, -0.036324501037597656, -0.03311920166015625, -0.029913902282714844, -0.026708602905273438, -0.02350330352783203, -0.020298004150390625, -0.01709270477294922, -0.013887405395507812, -0.010682106018066406, -0.007476806640625, -0.004271507263183594, -0.0010662078857421875, 0.0021390914916992188, 0.005344390869140625, 0.008549690246582031, 0.011754989624023438, 0.014960289001464844, 0.01816558837890625, 0.021370887756347656, 0.024576187133789062, 0.02778148651123047, 0.030986785888671875, 0.03419208526611328, 0.03739738464355469, 0.040602684020996094, 0.0438079833984375, 0.047013282775878906, 0.05021858215332031, 0.05342388153076172, 0.056629180908203125, 0.05983448028564453, 0.06303977966308594, 0.06624507904052734, 0.06945037841796875, 0.07265567779541016, 0.07586097717285156, 0.07906627655029297, 0.08227157592773438, 0.08547687530517578, 0.08868217468261719, 0.0918874740600586, 0.0950927734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 15.0, 7.0, 9.0, 13.0, 20.0, 18.0, 24.0, 22.0, 22.0, 17.0, 22.0, 40.0, 30.0, 36.0, 42.0, 40.0, 36.0, 50.0, 41.0, 50.0, 52.0, 54.0, 34.0, 36.0, 35.0, 34.0, 29.0, 22.0, 23.0, 27.0, 15.0, 17.0, 11.0, 9.0, 11.0, 14.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.5498046875, -0.532958984375, -0.51611328125, -0.499267578125, -0.482421875, -0.465576171875, -0.44873046875, -0.431884765625, -0.4150390625, -0.398193359375, -0.38134765625, -0.364501953125, -0.34765625, -0.330810546875, -0.31396484375, -0.297119140625, -0.2802734375, -0.263427734375, -0.24658203125, -0.229736328125, -0.212890625, -0.196044921875, -0.17919921875, -0.162353515625, -0.1455078125, -0.128662109375, -0.11181640625, -0.094970703125, -0.078125, -0.061279296875, -0.04443359375, -0.027587890625, -0.0107421875, 0.006103515625, 0.02294921875, 0.039794921875, 0.056640625, 0.073486328125, 0.09033203125, 0.107177734375, 0.1240234375, 0.140869140625, 0.15771484375, 0.174560546875, 0.19140625, 0.208251953125, 0.22509765625, 0.241943359375, 0.2587890625, 0.275634765625, 0.29248046875, 0.309326171875, 0.326171875, 0.343017578125, 0.35986328125, 0.376708984375, 0.3935546875, 0.410400390625, 0.42724609375, 0.444091796875, 0.4609375, 0.477783203125, 0.49462890625, 0.511474609375, 0.5283203125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 17.0, 23.0, 21.0, 27.0, 50.0, 83.0, 126.0, 180.0, 273.0, 444.0, 796.0, 1364.0, 2761.0, 5833.0, 14721.0, 45572.0, 152918.0, 365298.0, 302149.0, 104139.0, 31286.0, 10771.0, 4553.0, 2175.0, 1151.0, 652.0, 387.0, 251.0, 180.0, 114.0, 64.0, 49.0, 28.0, 27.0, 10.0, 14.0, 13.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0316162109375, -0.030708789825439453, -0.029801368713378906, -0.02889394760131836, -0.027986526489257812, -0.027079105377197266, -0.02617168426513672, -0.025264263153076172, -0.024356842041015625, -0.023449420928955078, -0.02254199981689453, -0.021634578704833984, -0.020727157592773438, -0.01981973648071289, -0.018912315368652344, -0.018004894256591797, -0.01709747314453125, -0.016190052032470703, -0.015282630920410156, -0.01437520980834961, -0.013467788696289062, -0.012560367584228516, -0.011652946472167969, -0.010745525360107422, -0.009838104248046875, -0.008930683135986328, -0.008023262023925781, -0.007115840911865234, -0.0062084197998046875, -0.005300998687744141, -0.004393577575683594, -0.003486156463623047, -0.0025787353515625, -0.0016713142395019531, -0.0007638931274414062, 0.00014352798461914062, 0.0010509490966796875, 0.0019583702087402344, 0.0028657913208007812, 0.003773212432861328, 0.004680633544921875, 0.005588054656982422, 0.006495475769042969, 0.007402896881103516, 0.008310317993164062, 0.00921773910522461, 0.010125160217285156, 0.011032581329345703, 0.01194000244140625, 0.012847423553466797, 0.013754844665527344, 0.01466226577758789, 0.015569686889648438, 0.016477108001708984, 0.01738452911376953, 0.018291950225830078, 0.019199371337890625, 0.020106792449951172, 0.02101421356201172, 0.021921634674072266, 0.022829055786132812, 0.02373647689819336, 0.024643898010253906, 0.025551319122314453, 0.026458740234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 14.0, 12.0, 34.0, 28.0, 34.0, 42.0, 61.0, 89.0, 95.0, 80.0, 95.0, 80.0, 92.0, 54.0, 46.0, 39.0, 31.0, 18.0, 18.0, 12.0, 2.0, 6.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5616416931152344e-05, -1.5077181160449982e-05, -1.453794538974762e-05, -1.3998709619045258e-05, -1.3459473848342896e-05, -1.2920238077640533e-05, -1.2381002306938171e-05, -1.184176653623581e-05, -1.1302530765533447e-05, -1.0763294994831085e-05, -1.0224059224128723e-05, -9.684823453426361e-06, -9.145587682723999e-06, -8.606351912021637e-06, -8.067116141319275e-06, -7.527880370616913e-06, -6.988644599914551e-06, -6.449408829212189e-06, -5.910173058509827e-06, -5.370937287807465e-06, -4.8317015171051025e-06, -4.2924657464027405e-06, -3.7532299757003784e-06, -3.2139942049980164e-06, -2.6747584342956543e-06, -2.1355226635932922e-06, -1.5962868928909302e-06, -1.0570511221885681e-06, -5.178153514862061e-07, 2.1420419216156006e-08, 5.606561899185181e-07, 1.0998919606208801e-06, 1.6391277313232422e-06, 2.1783635020256042e-06, 2.7175992727279663e-06, 3.2568350434303284e-06, 3.7960708141326904e-06, 4.3353065848350525e-06, 4.8745423555374146e-06, 5.413778126239777e-06, 5.953013896942139e-06, 6.492249667644501e-06, 7.031485438346863e-06, 7.570721209049225e-06, 8.109956979751587e-06, 8.649192750453949e-06, 9.188428521156311e-06, 9.727664291858673e-06, 1.0266900062561035e-05, 1.0806135833263397e-05, 1.134537160396576e-05, 1.1884607374668121e-05, 1.2423843145370483e-05, 1.2963078916072845e-05, 1.3502314686775208e-05, 1.404155045747757e-05, 1.4580786228179932e-05, 1.5120021998882294e-05, 1.5659257769584656e-05, 1.6198493540287018e-05, 1.673772931098938e-05, 1.7276965081691742e-05, 1.7816200852394104e-05, 1.8355436623096466e-05, 1.8894672393798828e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 19.0, 21.0, 27.0, 40.0, 86.0, 128.0, 209.0, 388.0, 919.0, 2420.0, 8791.0, 37122.0, 172863.0, 468487.0, 274720.0, 62444.0, 13849.0, 3670.0, 1191.0, 495.0, 235.0, 132.0, 98.0, 65.0, 38.0, 21.0, 27.0, 10.0, 12.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.042266845703125, -0.04093217849731445, -0.039597511291503906, -0.03826284408569336, -0.03692817687988281, -0.035593509674072266, -0.03425884246826172, -0.03292417526245117, -0.031589508056640625, -0.030254840850830078, -0.02892017364501953, -0.027585506439208984, -0.026250839233398438, -0.02491617202758789, -0.023581504821777344, -0.022246837615966797, -0.02091217041015625, -0.019577503204345703, -0.018242835998535156, -0.01690816879272461, -0.015573501586914062, -0.014238834381103516, -0.012904167175292969, -0.011569499969482422, -0.010234832763671875, -0.008900165557861328, -0.007565498352050781, -0.006230831146240234, -0.0048961639404296875, -0.0035614967346191406, -0.0022268295288085938, -0.0008921623229980469, 0.0004425048828125, 0.0017771720886230469, 0.0031118392944335938, 0.004446506500244141, 0.0057811737060546875, 0.007115840911865234, 0.008450508117675781, 0.009785175323486328, 0.011119842529296875, 0.012454509735107422, 0.013789176940917969, 0.015123844146728516, 0.016458511352539062, 0.01779317855834961, 0.019127845764160156, 0.020462512969970703, 0.02179718017578125, 0.023131847381591797, 0.024466514587402344, 0.02580118179321289, 0.027135848999023438, 0.028470516204833984, 0.02980518341064453, 0.031139850616455078, 0.032474517822265625, 0.03380918502807617, 0.03514385223388672, 0.036478519439697266, 0.03781318664550781, 0.03914785385131836, 0.040482521057128906, 0.04181718826293945, 0.04315185546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 7.0, 7.0, 11.0, 6.0, 14.0, 12.0, 19.0, 22.0, 41.0, 46.0, 43.0, 59.0, 76.0, 84.0, 73.0, 78.0, 77.0, 64.0, 56.0, 41.0, 27.0, 39.0, 40.0, 17.0, 13.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.016693115234375, -0.01629197597503662, -0.015890836715698242, -0.015489697456359863, -0.015088558197021484, -0.014687418937683105, -0.014286279678344727, -0.013885140419006348, -0.013484001159667969, -0.01308286190032959, -0.012681722640991211, -0.012280583381652832, -0.011879444122314453, -0.011478304862976074, -0.011077165603637695, -0.010676026344299316, -0.010274887084960938, -0.009873747825622559, -0.00947260856628418, -0.0090714693069458, -0.008670330047607422, -0.008269190788269043, -0.007868051528930664, -0.007466912269592285, -0.007065773010253906, -0.006664633750915527, -0.0062634944915771484, -0.0058623552322387695, -0.005461215972900391, -0.005060076713562012, -0.004658937454223633, -0.004257798194885254, -0.003856658935546875, -0.003455519676208496, -0.003054380416870117, -0.0026532411575317383, -0.0022521018981933594, -0.0018509626388549805, -0.0014498233795166016, -0.0010486841201782227, -0.0006475448608398438, -0.00024640560150146484, 0.00015473365783691406, 0.000555872917175293, 0.0009570121765136719, 0.0013581514358520508, 0.0017592906951904297, 0.0021604299545288086, 0.0025615692138671875, 0.0029627084732055664, 0.0033638477325439453, 0.0037649869918823242, 0.004166126251220703, 0.004567265510559082, 0.004968404769897461, 0.00536954402923584, 0.005770683288574219, 0.006171822547912598, 0.0065729618072509766, 0.0069741010665893555, 0.007375240325927734, 0.007776379585266113, 0.008177518844604492, 0.008578658103942871, 0.00897979736328125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 23.0, 69.0, 167.0, 245.0, 260.0, 150.0, 64.0, 13.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9459316730499268, -1.9085006713867188, -1.8710697889328003, -1.8336387872695923, -1.7962079048156738, -1.7587769031524658, -1.7213460206985474, -1.6839150190353394, -1.646484136581421, -1.609053134918213, -1.5716222524642944, -1.5341912508010864, -1.496760368347168, -1.45932936668396, -1.4218984842300415, -1.3844674825668335, -1.347036600112915, -1.309605598449707, -1.2721747159957886, -1.2347437143325806, -1.197312831878662, -1.159881830215454, -1.1224509477615356, -1.0850199460983276, -1.0475889444351196, -1.0101579427719116, -0.9727270603179932, -0.9352961182594299, -0.8978651762008667, -0.8604342341423035, -0.8230032920837402, -0.7855722904205322, -0.7481414079666138, -0.7107104659080505, -0.6732795238494873, -0.6358485817909241, -0.5984176397323608, -0.5609866976737976, -0.5235557556152344, -0.48612478375434875, -0.4486938714981079, -0.4112629294395447, -0.37383198738098145, -0.3364010453224182, -0.298970103263855, -0.26153916120529175, -0.22410818934440613, -0.1866772472858429, -0.14924630522727966, -0.11181536316871643, -0.0743844136595726, -0.03695346415042877, 0.00047747790813446045, 0.03790841996669769, 0.07533937692642212, 0.11277031898498535, 0.15020126104354858, 0.18763220310211182, 0.22506314516067505, 0.2624940872192383, 0.2999250292778015, 0.33735597133636475, 0.37478694319725037, 0.4122178852558136, 0.44964882731437683]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 10.0, 16.0, 18.0, 19.0, 20.0, 25.0, 37.0, 33.0, 41.0, 39.0, 49.0, 63.0, 62.0, 58.0, 63.0, 47.0, 61.0, 53.0, 45.0, 47.0, 38.0, 30.0, 21.0, 22.0, 21.0, 10.0, 8.0, 9.0, 9.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2811904847621918, -0.27113327383995056, -0.26107603311538696, -0.25101882219314575, -0.24096161127090454, -0.23090438544750214, -0.22084715962409973, -0.21078994870185852, -0.20073272287845612, -0.1906754970550537, -0.1806182861328125, -0.1705610603094101, -0.1605038344860077, -0.15044662356376648, -0.14038939774036407, -0.13033217191696167, -0.12027496099472046, -0.11021774262189865, -0.10016052424907684, -0.09010329842567444, -0.08004608005285263, -0.06998886168003082, -0.059931639581918716, -0.04987441748380661, -0.0398171991109848, -0.029759978875517845, -0.019702758640050888, -0.009645538404583931, 0.0004116818308830261, 0.010468900203704834, 0.02052612230181694, 0.030583344399929047, 0.04064059257507324, 0.05069781094789505, 0.060755033046007156, 0.07081225514411926, 0.08086947351694107, 0.09092669188976288, 0.10098391771316528, 0.11104113608598709, 0.1210983544588089, 0.1311555802822113, 0.14121279120445251, 0.15127001702785492, 0.16132724285125732, 0.17138445377349854, 0.18144167959690094, 0.19149890542030334, 0.20155611634254456, 0.21161334216594696, 0.22167055308818817, 0.23172777891159058, 0.2417849898338318, 0.251842200756073, 0.2618994414806366, 0.2719566524028778, 0.2820138931274414, 0.2920711040496826, 0.3021283447742462, 0.3121855556964874, 0.32224276661872864, 0.33230000734329224, 0.34235721826553345, 0.35241442918777466, 0.36247164011001587]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 17.0, 15.0, 23.0, 21.0, 59.0, 95.0, 189.0, 415.0, 895.0, 2384.0, 8274.0, 35391.0, 235661.0, 658402.0, 83655.0, 16326.0, 4209.0, 1398.0, 543.0, 237.0, 128.0, 64.0, 43.0, 29.0, 21.0, 16.0, 10.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.458984375, -0.442138671875, -0.42529296875, -0.408447265625, -0.3916015625, -0.374755859375, -0.35791015625, -0.341064453125, -0.32421875, -0.307373046875, -0.29052734375, -0.273681640625, -0.2568359375, -0.239990234375, -0.22314453125, -0.206298828125, -0.189453125, -0.172607421875, -0.15576171875, -0.138916015625, -0.1220703125, -0.105224609375, -0.08837890625, -0.071533203125, -0.0546875, -0.037841796875, -0.02099609375, -0.004150390625, 0.0126953125, 0.029541015625, 0.04638671875, 0.063232421875, 0.080078125, 0.096923828125, 0.11376953125, 0.130615234375, 0.1474609375, 0.164306640625, 0.18115234375, 0.197998046875, 0.21484375, 0.231689453125, 0.24853515625, 0.265380859375, 0.2822265625, 0.299072265625, 0.31591796875, 0.332763671875, 0.349609375, 0.366455078125, 0.38330078125, 0.400146484375, 0.4169921875, 0.433837890625, 0.45068359375, 0.467529296875, 0.484375, 0.501220703125, 0.51806640625, 0.534912109375, 0.5517578125, 0.568603515625, 0.58544921875, 0.602294921875, 0.619140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 12.0, 12.0, 15.0, 21.0, 42.0, 40.0, 53.0, 70.0, 63.0, 90.0, 78.0, 100.0, 79.0, 79.0, 66.0, 55.0, 41.0, 30.0, 17.0, 16.0, 10.0, 6.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.497314453125, -0.4694633483886719, -0.44161224365234375, -0.4137611389160156, -0.3859100341796875, -0.3580589294433594, -0.33020782470703125, -0.3023567199707031, -0.274505615234375, -0.24665451049804688, -0.21880340576171875, -0.19095230102539062, -0.1631011962890625, -0.13525009155273438, -0.10739898681640625, -0.07954788208007812, -0.05169677734375, -0.023845672607421875, 0.00400543212890625, 0.031856536865234375, 0.0597076416015625, 0.08755874633789062, 0.11540985107421875, 0.14326095581054688, 0.171112060546875, 0.19896316528320312, 0.22681427001953125, 0.2546653747558594, 0.2825164794921875, 0.3103675842285156, 0.33821868896484375, 0.3660697937011719, 0.3939208984375, 0.4217720031738281, 0.44962310791015625, 0.4774742126464844, 0.5053253173828125, 0.5331764221191406, 0.5610275268554688, 0.5888786315917969, 0.616729736328125, 0.6445808410644531, 0.6724319458007812, 0.7002830505371094, 0.7281341552734375, 0.7559852600097656, 0.7838363647460938, 0.8116874694824219, 0.83953857421875, 0.8673896789550781, 0.8952407836914062, 0.9230918884277344, 0.9509429931640625, 0.9787940979003906, 1.0066452026367188, 1.0344963073730469, 1.062347412109375, 1.0901985168457031, 1.1180496215820312, 1.1459007263183594, 1.1737518310546875, 1.2016029357910156, 1.2294540405273438, 1.2573051452636719, 1.28515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 5.0, 6.0, 8.0, 10.0, 10.0, 7.0, 16.0, 12.0, 24.0, 29.0, 32.0, 54.0, 79.0, 105.0, 159.0, 290.0, 749.0, 4131.0, 75865.0, 914204.0, 48111.0, 3132.0, 707.0, 289.0, 128.0, 78.0, 69.0, 59.0, 33.0, 29.0, 32.0, 23.0, 15.0, 13.0, 12.0, 5.0, 7.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95458984375, -0.9232254028320312, -0.8918609619140625, -0.8604965209960938, -0.829132080078125, -0.7977676391601562, -0.7664031982421875, -0.7350387573242188, -0.70367431640625, -0.6723098754882812, -0.6409454345703125, -0.6095809936523438, -0.578216552734375, -0.5468521118164062, -0.5154876708984375, -0.48412322998046875, -0.4527587890625, -0.42139434814453125, -0.3900299072265625, -0.35866546630859375, -0.327301025390625, -0.29593658447265625, -0.2645721435546875, -0.23320770263671875, -0.20184326171875, -0.17047882080078125, -0.1391143798828125, -0.10774993896484375, -0.076385498046875, -0.04502105712890625, -0.0136566162109375, 0.01770782470703125, 0.049072265625, 0.08043670654296875, 0.1118011474609375, 0.14316558837890625, 0.174530029296875, 0.20589447021484375, 0.2372589111328125, 0.26862335205078125, 0.29998779296875, 0.33135223388671875, 0.3627166748046875, 0.39408111572265625, 0.425445556640625, 0.45680999755859375, 0.4881744384765625, 0.5195388793945312, 0.5509033203125, 0.5822677612304688, 0.6136322021484375, 0.6449966430664062, 0.676361083984375, 0.7077255249023438, 0.7390899658203125, 0.7704544067382812, 0.80181884765625, 0.8331832885742188, 0.8645477294921875, 0.8959121704101562, 0.927276611328125, 0.9586410522460938, 0.9900054931640625, 1.0213699340820312, 1.052734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 5.0, 8.0, 9.0, 3.0, 3.0, 12.0, 12.0, 14.0, 17.0, 19.0, 24.0, 19.0, 27.0, 27.0, 30.0, 36.0, 47.0, 43.0, 48.0, 36.0, 46.0, 40.0, 39.0, 43.0, 47.0, 34.0, 38.0, 41.0, 37.0, 26.0, 18.0, 23.0, 25.0, 20.0, 11.0, 10.0, 10.0, 10.0, 11.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5166015625, -0.49932098388671875, -0.4820404052734375, -0.46475982666015625, -0.447479248046875, -0.43019866943359375, -0.4129180908203125, -0.39563751220703125, -0.37835693359375, -0.36107635498046875, -0.3437957763671875, -0.32651519775390625, -0.309234619140625, -0.29195404052734375, -0.2746734619140625, -0.25739288330078125, -0.2401123046875, -0.22283172607421875, -0.2055511474609375, -0.18827056884765625, -0.170989990234375, -0.15370941162109375, -0.1364288330078125, -0.11914825439453125, -0.10186767578125, -0.08458709716796875, -0.0673065185546875, -0.05002593994140625, -0.032745361328125, -0.01546478271484375, 0.0018157958984375, 0.01909637451171875, 0.036376953125, 0.05365753173828125, 0.0709381103515625, 0.08821868896484375, 0.105499267578125, 0.12277984619140625, 0.1400604248046875, 0.15734100341796875, 0.17462158203125, 0.19190216064453125, 0.2091827392578125, 0.22646331787109375, 0.243743896484375, 0.26102447509765625, 0.2783050537109375, 0.29558563232421875, 0.3128662109375, 0.33014678955078125, 0.3474273681640625, 0.36470794677734375, 0.381988525390625, 0.39926910400390625, 0.4165496826171875, 0.43383026123046875, 0.45111083984375, 0.46839141845703125, 0.4856719970703125, 0.5029525756835938, 0.520233154296875, 0.5375137329101562, 0.5547943115234375, 0.5720748901367188, 0.58935546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 10.0, 9.0, 13.0, 25.0, 28.0, 42.0, 60.0, 104.0, 136.0, 271.0, 625.0, 1924.0, 9704.0, 246145.0, 762704.0, 22083.0, 3021.0, 857.0, 306.0, 159.0, 84.0, 67.0, 50.0, 38.0, 24.0, 17.0, 10.0, 9.0, 9.0, 8.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3076171875, -0.298614501953125, -0.28961181640625, -0.280609130859375, -0.2716064453125, -0.262603759765625, -0.25360107421875, -0.244598388671875, -0.235595703125, -0.226593017578125, -0.21759033203125, -0.208587646484375, -0.1995849609375, -0.190582275390625, -0.18157958984375, -0.172576904296875, -0.16357421875, -0.154571533203125, -0.14556884765625, -0.136566162109375, -0.1275634765625, -0.118560791015625, -0.10955810546875, -0.100555419921875, -0.091552734375, -0.082550048828125, -0.07354736328125, -0.064544677734375, -0.0555419921875, -0.046539306640625, -0.03753662109375, -0.028533935546875, -0.01953125, -0.010528564453125, -0.00152587890625, 0.007476806640625, 0.0164794921875, 0.025482177734375, 0.03448486328125, 0.043487548828125, 0.052490234375, 0.061492919921875, 0.07049560546875, 0.079498291015625, 0.0885009765625, 0.097503662109375, 0.10650634765625, 0.115509033203125, 0.12451171875, 0.133514404296875, 0.14251708984375, 0.151519775390625, 0.1605224609375, 0.169525146484375, 0.17852783203125, 0.187530517578125, 0.196533203125, 0.205535888671875, 0.21453857421875, 0.223541259765625, 0.2325439453125, 0.241546630859375, 0.25054931640625, 0.259552001953125, 0.2685546875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 12.0, 5.0, 12.0, 8.0, 21.0, 20.0, 20.0, 47.0, 76.0, 118.0, 127.0, 162.0, 117.0, 76.0, 59.0, 47.0, 20.0, 16.0, 9.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.236532211303711e-05, -3.14200296998024e-05, -3.0474737286567688e-05, -2.9529444873332977e-05, -2.8584152460098267e-05, -2.7638860046863556e-05, -2.6693567633628845e-05, -2.5748275220394135e-05, -2.4802982807159424e-05, -2.3857690393924713e-05, -2.2912397980690002e-05, -2.1967105567455292e-05, -2.102181315422058e-05, -2.007652074098587e-05, -1.913122832775116e-05, -1.818593591451645e-05, -1.7240643501281738e-05, -1.6295351088047028e-05, -1.5350058674812317e-05, -1.4404766261577606e-05, -1.3459473848342896e-05, -1.2514181435108185e-05, -1.1568889021873474e-05, -1.0623596608638763e-05, -9.678304195404053e-06, -8.733011782169342e-06, -7.787719368934631e-06, -6.842426955699921e-06, -5.89713454246521e-06, -4.951842129230499e-06, -4.0065497159957886e-06, -3.061257302761078e-06, -2.115964889526367e-06, -1.1706724762916565e-06, -2.253800630569458e-07, 7.199123501777649e-07, 1.6652047634124756e-06, 2.6104971766471863e-06, 3.555789589881897e-06, 4.501082003116608e-06, 5.446374416351318e-06, 6.391666829586029e-06, 7.33695924282074e-06, 8.28225165605545e-06, 9.227544069290161e-06, 1.0172836482524872e-05, 1.1118128895759583e-05, 1.2063421308994293e-05, 1.3008713722229004e-05, 1.3954006135463715e-05, 1.4899298548698425e-05, 1.5844590961933136e-05, 1.6789883375167847e-05, 1.7735175788402557e-05, 1.8680468201637268e-05, 1.962576061487198e-05, 2.057105302810669e-05, 2.15163454413414e-05, 2.246163785457611e-05, 2.340693026781082e-05, 2.4352222681045532e-05, 2.5297515094280243e-05, 2.6242807507514954e-05, 2.7188099920749664e-05, 2.8133392333984375e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 2.0, 5.0, 8.0, 11.0, 10.0, 10.0, 25.0, 21.0, 20.0, 38.0, 60.0, 73.0, 108.0, 142.0, 285.0, 490.0, 931.0, 1762.0, 4075.0, 12458.0, 84273.0, 729050.0, 184527.0, 19702.0, 5495.0, 2241.0, 1154.0, 553.0, 339.0, 206.0, 131.0, 84.0, 61.0, 53.0, 35.0, 30.0, 22.0, 15.0, 11.0, 5.0, 6.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2076416015625, -0.20147132873535156, -0.19530105590820312, -0.1891307830810547, -0.18296051025390625, -0.1767902374267578, -0.17061996459960938, -0.16444969177246094, -0.1582794189453125, -0.15210914611816406, -0.14593887329101562, -0.1397686004638672, -0.13359832763671875, -0.1274280548095703, -0.12125778198242188, -0.11508750915527344, -0.108917236328125, -0.10274696350097656, -0.09657669067382812, -0.09040641784667969, -0.08423614501953125, -0.07806587219238281, -0.07189559936523438, -0.06572532653808594, -0.0595550537109375, -0.05338478088378906, -0.047214508056640625, -0.04104423522949219, -0.03487396240234375, -0.028703689575195312, -0.022533416748046875, -0.016363143920898438, -0.01019287109375, -0.0040225982666015625, 0.002147674560546875, 0.008317947387695312, 0.01448822021484375, 0.020658493041992188, 0.026828765869140625, 0.03299903869628906, 0.0391693115234375, 0.04533958435058594, 0.051509857177734375, 0.05768013000488281, 0.06385040283203125, 0.07002067565917969, 0.07619094848632812, 0.08236122131347656, 0.088531494140625, 0.09470176696777344, 0.10087203979492188, 0.10704231262207031, 0.11321258544921875, 0.11938285827636719, 0.12555313110351562, 0.13172340393066406, 0.1378936767578125, 0.14406394958496094, 0.15023422241210938, 0.1564044952392578, 0.16257476806640625, 0.1687450408935547, 0.17491531372070312, 0.18108558654785156, 0.187255859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 4.0, 10.0, 9.0, 10.0, 18.0, 15.0, 18.0, 42.0, 53.0, 62.0, 73.0, 103.0, 114.0, 120.0, 84.0, 76.0, 39.0, 37.0, 30.0, 25.0, 8.0, 10.0, 6.0, 9.0, 4.0, 4.0, 1.0, 0.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07684326171875, -0.07448101043701172, -0.07211875915527344, -0.06975650787353516, -0.06739425659179688, -0.0650320053100586, -0.06266975402832031, -0.06030750274658203, -0.05794525146484375, -0.05558300018310547, -0.05322074890136719, -0.050858497619628906, -0.048496246337890625, -0.046133995056152344, -0.04377174377441406, -0.04140949249267578, -0.0390472412109375, -0.03668498992919922, -0.03432273864746094, -0.031960487365722656, -0.029598236083984375, -0.027235984802246094, -0.024873733520507812, -0.02251148223876953, -0.02014923095703125, -0.01778697967529297, -0.015424728393554688, -0.013062477111816406, -0.010700225830078125, -0.008337974548339844, -0.0059757232666015625, -0.0036134719848632812, -0.001251220703125, 0.0011110305786132812, 0.0034732818603515625, 0.005835533142089844, 0.008197784423828125, 0.010560035705566406, 0.012922286987304688, 0.015284538269042969, 0.01764678955078125, 0.02000904083251953, 0.022371292114257812, 0.024733543395996094, 0.027095794677734375, 0.029458045959472656, 0.03182029724121094, 0.03418254852294922, 0.0365447998046875, 0.03890705108642578, 0.04126930236816406, 0.043631553649902344, 0.045993804931640625, 0.048356056213378906, 0.05071830749511719, 0.05308055877685547, 0.05544281005859375, 0.05780506134033203, 0.06016731262207031, 0.0625295639038086, 0.06489181518554688, 0.06725406646728516, 0.06961631774902344, 0.07197856903076172, 0.0743408203125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 199.0, 682.0, 112.0, 12.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.27834701538086, -12.064332008361816, -11.850317001342773, -11.63630199432373, -11.422286987304688, -11.208271980285645, -10.994256973266602, -10.780241012573242, -10.5662260055542, -10.352210998535156, -10.138195991516113, -9.92418098449707, -9.710165977478027, -9.496150970458984, -9.282135009765625, -9.068120956420898, -8.854105949401855, -8.640090942382812, -8.42607593536377, -8.212060928344727, -7.998045444488525, -7.784030437469482, -7.5700154304504395, -7.3560004234313965, -7.141984939575195, -6.927969932556152, -6.713954925537109, -6.499939918518066, -6.285924434661865, -6.071909427642822, -5.857894420623779, -5.643879413604736, -5.429863929748535, -5.215848922729492, -5.001833915710449, -4.787818908691406, -4.573803424835205, -4.359788417816162, -4.145773410797119, -3.931758403778076, -3.717743396759033, -3.5037283897399902, -3.289713144302368, -3.075698137283325, -2.8616831302642822, -2.64766788482666, -2.433652877807617, -2.219637870788574, -2.0056228637695312, -1.7916077375411987, -1.5775927305221558, -1.3635776042938232, -1.1495625972747803, -0.9355474710464478, -0.7215323448181152, -0.5075173377990723, -0.2935020923614502, -0.07948701083660126, 0.13452807068824768, 0.3485431671142578, 0.5625582337379456, 0.7765733003616333, 0.9905884265899658, 1.2046034336090088, 1.4186185598373413]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 2.0, 8.0, 7.0, 7.0, 14.0, 16.0, 15.0, 16.0, 20.0, 23.0, 30.0, 34.0, 22.0, 46.0, 45.0, 61.0, 52.0, 61.0, 41.0, 63.0, 60.0, 42.0, 35.0, 31.0, 45.0, 36.0, 21.0, 31.0, 17.0, 24.0, 13.0, 19.0, 5.0, 6.0, 7.0, 11.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9674336314201355, -0.9344180822372437, -0.901402473449707, -0.8683869242668152, -0.8353713154792786, -0.8023557662963867, -0.7693401575088501, -0.7363246083259583, -0.7033090591430664, -0.6702935099601746, -0.6372779011726379, -0.6042623519897461, -0.5712467432022095, -0.5382311940193176, -0.5052156448364258, -0.47220003604888916, -0.43918442726135254, -0.4061688482761383, -0.3731532692909241, -0.3401377201080322, -0.3071221113204956, -0.27410656213760376, -0.24109098315238953, -0.2080754041671753, -0.17505982518196106, -0.14204424619674683, -0.10902867466211319, -0.07601310312747955, -0.04299752414226532, -0.009981945157051086, 0.023033618927001953, 0.056049197912216187, 0.0890648365020752, 0.12208041548728943, 0.15509599447250366, 0.1881115585565567, 0.22112713754177094, 0.254142701625824, 0.2871582806110382, 0.32017385959625244, 0.3531894385814667, 0.3862050175666809, 0.41922059655189514, 0.4522361755371094, 0.4852517247200012, 0.5182673335075378, 0.5512828826904297, 0.5842984914779663, 0.6173140406608582, 0.65032958984375, 0.6833451986312866, 0.7163607478141785, 0.7493763566017151, 0.7823919057846069, 0.8154075145721436, 0.8484230637550354, 0.8814386129379272, 0.9144541621208191, 0.9474697709083557, 0.9804853200912476, 1.0135009288787842, 1.0465165376663208, 1.0795320272445679, 1.1125476360321045, 1.1455632448196411]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 27.0, 19.0, 50.0, 83.0, 147.0, 242.0, 447.0, 973.0, 2685.0, 10268.0, 71929.0, 1357954.0, 2572247.0, 153931.0, 16645.0, 3892.0, 1373.0, 630.0, 281.0, 177.0, 93.0, 66.0, 33.0, 26.0, 14.0, 13.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.88037109375, -0.8599662780761719, -0.8395614624023438, -0.8191566467285156, -0.7987518310546875, -0.7783470153808594, -0.7579421997070312, -0.7375373840332031, -0.717132568359375, -0.6967277526855469, -0.6763229370117188, -0.6559181213378906, -0.6355133056640625, -0.6151084899902344, -0.5947036743164062, -0.5742988586425781, -0.55389404296875, -0.5334892272949219, -0.5130844116210938, -0.4926795959472656, -0.4722747802734375, -0.4518699645996094, -0.43146514892578125, -0.4110603332519531, -0.390655517578125, -0.3702507019042969, -0.34984588623046875, -0.3294410705566406, -0.3090362548828125, -0.2886314392089844, -0.26822662353515625, -0.24782180786132812, -0.2274169921875, -0.20701217651367188, -0.18660736083984375, -0.16620254516601562, -0.1457977294921875, -0.12539291381835938, -0.10498809814453125, -0.08458328247070312, -0.064178466796875, -0.043773651123046875, -0.02336883544921875, -0.002964019775390625, 0.0174407958984375, 0.037845611572265625, 0.05825042724609375, 0.07865524291992188, 0.09906005859375, 0.11946487426757812, 0.13986968994140625, 0.16027450561523438, 0.1806793212890625, 0.20108413696289062, 0.22148895263671875, 0.24189376831054688, 0.262298583984375, 0.2827033996582031, 0.30310821533203125, 0.3235130310058594, 0.3439178466796875, 0.3643226623535156, 0.38472747802734375, 0.4051322937011719, 0.425537109375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 10.0, 9.0, 15.0, 19.0, 20.0, 22.0, 20.0, 30.0, 25.0, 46.0, 37.0, 55.0, 76.0, 68.0, 55.0, 55.0, 50.0, 58.0, 42.0, 52.0, 36.0, 47.0, 25.0, 30.0, 23.0, 19.0, 8.0, 11.0, 8.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303466796875, -0.2922096252441406, -0.28095245361328125, -0.2696952819824219, -0.2584381103515625, -0.24718093872070312, -0.23592376708984375, -0.22466659545898438, -0.213409423828125, -0.20215225219726562, -0.19089508056640625, -0.17963790893554688, -0.1683807373046875, -0.15712356567382812, -0.14586639404296875, -0.13460922241210938, -0.12335205078125, -0.11209487915039062, -0.10083770751953125, -0.08958053588867188, -0.0783233642578125, -0.06706619262695312, -0.05580902099609375, -0.044551849365234375, -0.033294677734375, -0.022037506103515625, -0.01078033447265625, 0.000476837158203125, 0.0117340087890625, 0.022991180419921875, 0.03424835205078125, 0.045505523681640625, 0.0567626953125, 0.06801986694335938, 0.07927703857421875, 0.09053421020507812, 0.1017913818359375, 0.11304855346679688, 0.12430572509765625, 0.13556289672851562, 0.146820068359375, 0.15807723999023438, 0.16933441162109375, 0.18059158325195312, 0.1918487548828125, 0.20310592651367188, 0.21436309814453125, 0.22562026977539062, 0.23687744140625, 0.24813461303710938, 0.25939178466796875, 0.2706489562988281, 0.2819061279296875, 0.2931632995605469, 0.30442047119140625, 0.3156776428222656, 0.326934814453125, 0.3381919860839844, 0.34944915771484375, 0.3607063293457031, 0.3719635009765625, 0.3832206726074219, 0.39447784423828125, 0.4057350158691406, 0.4169921875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 14.0, 14.0, 37.0, 50.0, 105.0, 269.0, 852.0, 4925.0, 146571.0, 3995825.0, 41634.0, 2864.0, 659.0, 207.0, 97.0, 54.0, 25.0, 26.0, 9.0, 8.0, 8.0, 4.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7158203125, -1.6710968017578125, -1.626373291015625, -1.5816497802734375, -1.53692626953125, -1.4922027587890625, -1.447479248046875, -1.4027557373046875, -1.3580322265625, -1.3133087158203125, -1.268585205078125, -1.2238616943359375, -1.17913818359375, -1.1344146728515625, -1.089691162109375, -1.0449676513671875, -1.000244140625, -0.9555206298828125, -0.910797119140625, -0.8660736083984375, -0.82135009765625, -0.7766265869140625, -0.731903076171875, -0.6871795654296875, -0.6424560546875, -0.5977325439453125, -0.553009033203125, -0.5082855224609375, -0.46356201171875, -0.4188385009765625, -0.374114990234375, -0.3293914794921875, -0.28466796875, -0.2399444580078125, -0.195220947265625, -0.1504974365234375, -0.10577392578125, -0.0610504150390625, -0.016326904296875, 0.0283966064453125, 0.0731201171875, 0.1178436279296875, 0.162567138671875, 0.2072906494140625, 0.25201416015625, 0.2967376708984375, 0.341461181640625, 0.3861846923828125, 0.430908203125, 0.4756317138671875, 0.520355224609375, 0.5650787353515625, 0.60980224609375, 0.6545257568359375, 0.699249267578125, 0.7439727783203125, 0.7886962890625, 0.8334197998046875, 0.878143310546875, 0.9228668212890625, 0.96759033203125, 1.0123138427734375, 1.057037353515625, 1.1017608642578125, 1.146484375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 8.0, 13.0, 13.0, 21.0, 37.0, 66.0, 73.0, 127.0, 216.0, 396.0, 605.0, 752.0, 636.0, 488.0, 245.0, 125.0, 100.0, 47.0, 27.0, 16.0, 6.0, 13.0, 3.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17041015625, -0.1642284393310547, -0.15804672241210938, -0.15186500549316406, -0.14568328857421875, -0.13950157165527344, -0.13331985473632812, -0.1271381378173828, -0.1209564208984375, -0.11477470397949219, -0.10859298706054688, -0.10241127014160156, -0.09622955322265625, -0.09004783630371094, -0.08386611938476562, -0.07768440246582031, -0.071502685546875, -0.06532096862792969, -0.059139251708984375, -0.05295753479003906, -0.04677581787109375, -0.04059410095214844, -0.034412384033203125, -0.028230667114257812, -0.0220489501953125, -0.015867233276367188, -0.009685516357421875, -0.0035037994384765625, 0.00267791748046875, 0.008859634399414062, 0.015041351318359375, 0.021223068237304688, 0.02740478515625, 0.03358650207519531, 0.039768218994140625, 0.04594993591308594, 0.05213165283203125, 0.05831336975097656, 0.06449508666992188, 0.07067680358886719, 0.0768585205078125, 0.08304023742675781, 0.08922195434570312, 0.09540367126464844, 0.10158538818359375, 0.10776710510253906, 0.11394882202148438, 0.12013053894042969, 0.126312255859375, 0.1324939727783203, 0.13867568969726562, 0.14485740661621094, 0.15103912353515625, 0.15722084045410156, 0.16340255737304688, 0.1695842742919922, 0.1757659912109375, 0.1819477081298828, 0.18812942504882812, 0.19431114196777344, 0.20049285888671875, 0.20667457580566406, 0.21285629272460938, 0.2190380096435547, 0.2252197265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 11.0, 13.0, 22.0, 24.0, 38.0, 52.0, 72.0, 78.0, 87.0, 97.0, 103.0, 89.0, 85.0, 65.0, 45.0, 36.0, 34.0, 22.0, 11.0, 7.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7341853380203247, -0.7143028974533081, -0.6944205164909363, -0.6745380759239197, -0.6546556949615479, -0.6347732543945312, -0.6148908138275146, -0.595008373260498, -0.5751259922981262, -0.5552435517311096, -0.5353611707687378, -0.5154787302017212, -0.495596319437027, -0.47571390867233276, -0.45583146810531616, -0.43594905734062195, -0.41606664657592773, -0.3961842358112335, -0.3763018250465393, -0.3564193844795227, -0.3365369737148285, -0.3166545629501343, -0.2967721223831177, -0.27688971161842346, -0.25700730085372925, -0.23712489008903503, -0.21724246442317963, -0.19736003875732422, -0.17747762799263, -0.1575952172279358, -0.13771279156208038, -0.11783036589622498, -0.09794789552688599, -0.07806547731161118, -0.058183059096336365, -0.038300640881061554, -0.018418222665786743, 0.0014641955494880676, 0.02134661376476288, 0.041229039430618286, 0.0611114501953125, 0.08099386841058731, 0.10087628662586212, 0.12075870484113693, 0.14064112305641174, 0.16052353382110596, 0.18040595948696136, 0.20028838515281677, 0.220170795917511, 0.2400532066822052, 0.2599356174468994, 0.279818058013916, 0.29970046877861023, 0.31958287954330444, 0.33946532011032104, 0.35934773087501526, 0.3792301416397095, 0.3991125524044037, 0.4189949631690979, 0.4388774037361145, 0.4587598145008087, 0.47864222526550293, 0.49852466583251953, 0.5184071063995361, 0.538289487361908]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 10.0, 6.0, 13.0, 17.0, 23.0, 17.0, 23.0, 16.0, 30.0, 26.0, 34.0, 52.0, 33.0, 29.0, 37.0, 32.0, 61.0, 32.0, 38.0, 54.0, 46.0, 37.0, 36.0, 31.0, 34.0, 41.0, 36.0, 21.0, 24.0, 20.0, 22.0, 13.0, 14.0, 9.0, 11.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3390185832977295, -0.32841241359710693, -0.317806214094162, -0.30720004439353943, -0.29659387469291687, -0.2859877049922943, -0.27538150548934937, -0.2647753357887268, -0.25416916608810425, -0.2435629814863205, -0.23295681178569794, -0.22235062718391418, -0.21174445748329163, -0.20113827288150787, -0.19053208827972412, -0.17992591857910156, -0.1693197339773178, -0.15871354937553406, -0.1481073796749115, -0.13750119507312775, -0.1268950253725052, -0.11628884077072144, -0.10568266361951828, -0.09507648646831512, -0.08447030931711197, -0.07386413216590881, -0.06325795501470566, -0.052651774138212204, -0.04204559698700905, -0.03143941983580589, -0.02083323895931244, -0.010227061808109283, 0.00037911534309387207, 0.010985293425619602, 0.021591471508145332, 0.03219765052199364, 0.04280382767319679, 0.05341000482439995, 0.0640161857008934, 0.07462236285209656, 0.08522854000329971, 0.09583471715450287, 0.10644089430570602, 0.11704707145690918, 0.12765325605869293, 0.1382594257593155, 0.14886561036109924, 0.1594717800617218, 0.17007796466350555, 0.1806841492652893, 0.19129031896591187, 0.20189650356769562, 0.21250267326831818, 0.22310885787010193, 0.2337150275707245, 0.24432121217250824, 0.254927396774292, 0.26553356647491455, 0.2761397659778595, 0.28674593567848206, 0.2973521053791046, 0.3079582750797272, 0.3185644745826721, 0.3291706442832947, 0.33977681398391724]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 23.0, 55.0, 128.0, 347.0, 1009.0, 2957.0, 9645.0, 47167.0, 676926.0, 277919.0, 23222.0, 6088.0, 1929.0, 690.0, 252.0, 97.0, 39.0, 17.0, 8.0, 3.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.26488494873046875, -0.2546234130859375, -0.24436187744140625, -0.234100341796875, -0.22383880615234375, -0.2135772705078125, -0.20331573486328125, -0.19305419921875, -0.18279266357421875, -0.1725311279296875, -0.16226959228515625, -0.152008056640625, -0.14174652099609375, -0.1314849853515625, -0.12122344970703125, -0.1109619140625, -0.10070037841796875, -0.0904388427734375, -0.08017730712890625, -0.069915771484375, -0.05965423583984375, -0.0493927001953125, -0.03913116455078125, -0.02886962890625, -0.01860809326171875, -0.0083465576171875, 0.00191497802734375, 0.012176513671875, 0.02243804931640625, 0.0326995849609375, 0.04296112060546875, 0.05322265625, 0.06348419189453125, 0.0737457275390625, 0.08400726318359375, 0.094268798828125, 0.10453033447265625, 0.1147918701171875, 0.12505340576171875, 0.13531494140625, 0.14557647705078125, 0.1558380126953125, 0.16609954833984375, 0.176361083984375, 0.18662261962890625, 0.1968841552734375, 0.20714569091796875, 0.2174072265625, 0.22766876220703125, 0.2379302978515625, 0.24819183349609375, 0.258453369140625, 0.26871490478515625, 0.2789764404296875, 0.28923797607421875, 0.29949951171875, 0.30976104736328125, 0.3200225830078125, 0.33028411865234375, 0.340545654296875, 0.35080718994140625, 0.3610687255859375, 0.37133026123046875, 0.381591796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 12.0, 11.0, 16.0, 17.0, 23.0, 38.0, 29.0, 36.0, 48.0, 48.0, 56.0, 63.0, 68.0, 52.0, 54.0, 64.0, 53.0, 60.0, 42.0, 35.0, 43.0, 32.0, 26.0, 24.0, 13.0, 8.0, 7.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2235107421875, -0.2151012420654297, -0.20669174194335938, -0.19828224182128906, -0.18987274169921875, -0.18146324157714844, -0.17305374145507812, -0.1646442413330078, -0.1562347412109375, -0.1478252410888672, -0.13941574096679688, -0.13100624084472656, -0.12259674072265625, -0.11418724060058594, -0.10577774047851562, -0.09736824035644531, -0.088958740234375, -0.08054924011230469, -0.07213973999023438, -0.06373023986816406, -0.05532073974609375, -0.04691123962402344, -0.038501739501953125, -0.030092239379882812, -0.0216827392578125, -0.013273239135742188, -0.004863739013671875, 0.0035457611083984375, 0.01195526123046875, 0.020364761352539062, 0.028774261474609375, 0.03718376159667969, 0.04559326171875, 0.05400276184082031, 0.062412261962890625, 0.07082176208496094, 0.07923126220703125, 0.08764076232910156, 0.09605026245117188, 0.10445976257324219, 0.1128692626953125, 0.12127876281738281, 0.12968826293945312, 0.13809776306152344, 0.14650726318359375, 0.15491676330566406, 0.16332626342773438, 0.1717357635498047, 0.180145263671875, 0.1885547637939453, 0.19696426391601562, 0.20537376403808594, 0.21378326416015625, 0.22219276428222656, 0.23060226440429688, 0.2390117645263672, 0.2474212646484375, 0.2558307647705078, 0.2642402648925781, 0.27264976501464844, 0.28105926513671875, 0.28946876525878906, 0.2978782653808594, 0.3062877655029297, 0.314697265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 11.0, 11.0, 19.0, 21.0, 38.0, 64.0, 98.0, 118.0, 200.0, 287.0, 457.0, 810.0, 1454.0, 2751.0, 5380.0, 11867.0, 29624.0, 88168.0, 262994.0, 377993.0, 173585.0, 55176.0, 19994.0, 8305.0, 4020.0, 2110.0, 1195.0, 689.0, 399.0, 247.0, 162.0, 93.0, 76.0, 43.0, 36.0, 15.0, 20.0, 7.0, 3.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0823974609375, -0.07967758178710938, -0.07695770263671875, -0.07423782348632812, -0.0715179443359375, -0.06879806518554688, -0.06607818603515625, -0.06335830688476562, -0.060638427734375, -0.057918548583984375, -0.05519866943359375, -0.052478790283203125, -0.0497589111328125, -0.047039031982421875, -0.04431915283203125, -0.041599273681640625, -0.03887939453125, -0.036159515380859375, -0.03343963623046875, -0.030719757080078125, -0.0279998779296875, -0.025279998779296875, -0.02256011962890625, -0.019840240478515625, -0.017120361328125, -0.014400482177734375, -0.01168060302734375, -0.008960723876953125, -0.0062408447265625, -0.003520965576171875, -0.00080108642578125, 0.001918792724609375, 0.004638671875, 0.007358551025390625, 0.01007843017578125, 0.012798309326171875, 0.0155181884765625, 0.018238067626953125, 0.02095794677734375, 0.023677825927734375, 0.026397705078125, 0.029117584228515625, 0.03183746337890625, 0.034557342529296875, 0.0372772216796875, 0.039997100830078125, 0.04271697998046875, 0.045436859130859375, 0.04815673828125, 0.050876617431640625, 0.05359649658203125, 0.056316375732421875, 0.0590362548828125, 0.061756134033203125, 0.06447601318359375, 0.06719589233398438, 0.069915771484375, 0.07263565063476562, 0.07535552978515625, 0.07807540893554688, 0.0807952880859375, 0.08351516723632812, 0.08623504638671875, 0.08895492553710938, 0.0916748046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 3.0, 3.0, 4.0, 7.0, 8.0, 6.0, 7.0, 11.0, 14.0, 13.0, 24.0, 19.0, 25.0, 31.0, 31.0, 29.0, 25.0, 31.0, 26.0, 39.0, 44.0, 43.0, 45.0, 44.0, 38.0, 29.0, 33.0, 36.0, 30.0, 36.0, 31.0, 26.0, 32.0, 12.0, 23.0, 20.0, 29.0, 18.0, 11.0, 13.0, 5.0, 4.0, 10.0, 5.0, 6.0, 3.0, 2.0, 1.0, 5.0, 5.0, 4.0, 2.0, 3.0], "bins": [-0.3837890625, -0.3726043701171875, -0.361419677734375, -0.3502349853515625, -0.33905029296875, -0.3278656005859375, -0.316680908203125, -0.3054962158203125, -0.2943115234375, -0.2831268310546875, -0.271942138671875, -0.2607574462890625, -0.24957275390625, -0.2383880615234375, -0.227203369140625, -0.2160186767578125, -0.204833984375, -0.1936492919921875, -0.182464599609375, -0.1712799072265625, -0.16009521484375, -0.1489105224609375, -0.137725830078125, -0.1265411376953125, -0.1153564453125, -0.1041717529296875, -0.092987060546875, -0.0818023681640625, -0.07061767578125, -0.0594329833984375, -0.048248291015625, -0.0370635986328125, -0.02587890625, -0.0146942138671875, -0.003509521484375, 0.0076751708984375, 0.01885986328125, 0.0300445556640625, 0.041229248046875, 0.0524139404296875, 0.0635986328125, 0.0747833251953125, 0.085968017578125, 0.0971527099609375, 0.10833740234375, 0.1195220947265625, 0.130706787109375, 0.1418914794921875, 0.153076171875, 0.1642608642578125, 0.175445556640625, 0.1866302490234375, 0.19781494140625, 0.2089996337890625, 0.220184326171875, 0.2313690185546875, 0.2425537109375, 0.2537384033203125, 0.264923095703125, 0.2761077880859375, 0.28729248046875, 0.2984771728515625, 0.309661865234375, 0.3208465576171875, 0.33203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 5.0, 8.0, 10.0, 15.0, 21.0, 44.0, 55.0, 82.0, 122.0, 190.0, 299.0, 549.0, 999.0, 2309.0, 5566.0, 17916.0, 78059.0, 369690.0, 436534.0, 102203.0, 22008.0, 6732.0, 2527.0, 1104.0, 638.0, 328.0, 171.0, 111.0, 77.0, 55.0, 36.0, 17.0, 11.0, 11.0, 8.0, 7.0, 3.0, 3.0, 2.0, 10.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.044830322265625, -0.04347515106201172, -0.04211997985839844, -0.040764808654785156, -0.039409637451171875, -0.038054466247558594, -0.03669929504394531, -0.03534412384033203, -0.03398895263671875, -0.03263378143310547, -0.03127861022949219, -0.029923439025878906, -0.028568267822265625, -0.027213096618652344, -0.025857925415039062, -0.02450275421142578, -0.0231475830078125, -0.02179241180419922, -0.020437240600585938, -0.019082069396972656, -0.017726898193359375, -0.016371726989746094, -0.015016555786132812, -0.013661384582519531, -0.01230621337890625, -0.010951042175292969, -0.009595870971679688, -0.008240699768066406, -0.006885528564453125, -0.005530357360839844, -0.0041751861572265625, -0.0028200149536132812, -0.00146484375, -0.00010967254638671875, 0.0012454986572265625, 0.0026006698608398438, 0.003955841064453125, 0.005311012268066406, 0.0066661834716796875, 0.008021354675292969, 0.00937652587890625, 0.010731697082519531, 0.012086868286132812, 0.013442039489746094, 0.014797210693359375, 0.016152381896972656, 0.017507553100585938, 0.01886272430419922, 0.0202178955078125, 0.02157306671142578, 0.022928237915039062, 0.024283409118652344, 0.025638580322265625, 0.026993751525878906, 0.028348922729492188, 0.02970409393310547, 0.03105926513671875, 0.03241443634033203, 0.03376960754394531, 0.035124778747558594, 0.036479949951171875, 0.037835121154785156, 0.03919029235839844, 0.04054546356201172, 0.041900634765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 2.0, 2.0, 7.0, 7.0, 4.0, 8.0, 22.0, 29.0, 39.0, 35.0, 48.0, 49.0, 76.0, 83.0, 101.0, 69.0, 88.0, 62.0, 64.0, 58.0, 35.0, 21.0, 25.0, 14.0, 9.0, 14.0, 6.0, 4.0, 4.0, 8.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.704692840576172e-05, -1.6460195183753967e-05, -1.5873461961746216e-05, -1.5286728739738464e-05, -1.4699995517730713e-05, -1.4113262295722961e-05, -1.352652907371521e-05, -1.2939795851707458e-05, -1.2353062629699707e-05, -1.1766329407691956e-05, -1.1179596185684204e-05, -1.0592862963676453e-05, -1.0006129741668701e-05, -9.41939651966095e-06, -8.832663297653198e-06, -8.245930075645447e-06, -7.659196853637695e-06, -7.072463631629944e-06, -6.485730409622192e-06, -5.898997187614441e-06, -5.3122639656066895e-06, -4.725530743598938e-06, -4.1387975215911865e-06, -3.552064299583435e-06, -2.9653310775756836e-06, -2.378597855567932e-06, -1.7918646335601807e-06, -1.2051314115524292e-06, -6.183981895446777e-07, -3.166496753692627e-08, 5.550682544708252e-07, 1.1418014764785767e-06, 1.7285346984863281e-06, 2.3152679204940796e-06, 2.902001142501831e-06, 3.4887343645095825e-06, 4.075467586517334e-06, 4.6622008085250854e-06, 5.248934030532837e-06, 5.835667252540588e-06, 6.42240047454834e-06, 7.009133696556091e-06, 7.595866918563843e-06, 8.182600140571594e-06, 8.769333362579346e-06, 9.356066584587097e-06, 9.942799806594849e-06, 1.05295330286026e-05, 1.1116266250610352e-05, 1.1702999472618103e-05, 1.2289732694625854e-05, 1.2876465916633606e-05, 1.3463199138641357e-05, 1.4049932360649109e-05, 1.463666558265686e-05, 1.5223398804664612e-05, 1.5810132026672363e-05, 1.6396865248680115e-05, 1.6983598470687866e-05, 1.7570331692695618e-05, 1.815706491470337e-05, 1.874379813671112e-05, 1.9330531358718872e-05, 1.9917264580726624e-05, 2.0503997802734375e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 11.0, 2.0, 13.0, 8.0, 25.0, 25.0, 50.0, 96.0, 173.0, 337.0, 866.0, 2598.0, 9546.0, 46565.0, 263821.0, 542250.0, 146783.0, 26511.0, 5916.0, 1659.0, 664.0, 282.0, 126.0, 75.0, 42.0, 47.0, 14.0, 14.0, 10.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054779052734375, -0.05291128158569336, -0.05104351043701172, -0.04917573928833008, -0.04730796813964844, -0.0454401969909668, -0.043572425842285156, -0.041704654693603516, -0.039836883544921875, -0.037969112396240234, -0.036101341247558594, -0.03423357009887695, -0.03236579895019531, -0.030498027801513672, -0.02863025665283203, -0.02676248550415039, -0.02489471435546875, -0.02302694320678711, -0.02115917205810547, -0.019291400909423828, -0.017423629760742188, -0.015555858612060547, -0.013688087463378906, -0.011820316314697266, -0.009952545166015625, -0.008084774017333984, -0.006217002868652344, -0.004349231719970703, -0.0024814605712890625, -0.0006136894226074219, 0.0012540817260742188, 0.0031218528747558594, 0.0049896240234375, 0.006857395172119141, 0.008725166320800781, 0.010592937469482422, 0.012460708618164062, 0.014328479766845703, 0.016196250915527344, 0.018064022064208984, 0.019931793212890625, 0.021799564361572266, 0.023667335510253906, 0.025535106658935547, 0.027402877807617188, 0.029270648956298828, 0.03113842010498047, 0.03300619125366211, 0.03487396240234375, 0.03674173355102539, 0.03860950469970703, 0.04047727584838867, 0.04234504699707031, 0.04421281814575195, 0.046080589294433594, 0.047948360443115234, 0.049816131591796875, 0.051683902740478516, 0.053551673889160156, 0.0554194450378418, 0.05728721618652344, 0.05915498733520508, 0.06102275848388672, 0.06289052963256836, 0.06475830078125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 14.0, 12.0, 19.0, 34.0, 37.0, 54.0, 78.0, 96.0, 112.0, 120.0, 120.0, 79.0, 67.0, 52.0, 34.0, 18.0, 18.0, 11.0, 9.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.018646240234375, -0.018119215965270996, -0.017592191696166992, -0.01706516742706299, -0.016538143157958984, -0.01601111888885498, -0.015484094619750977, -0.014957070350646973, -0.014430046081542969, -0.013903021812438965, -0.013375997543334961, -0.012848973274230957, -0.012321949005126953, -0.01179492473602295, -0.011267900466918945, -0.010740876197814941, -0.010213851928710938, -0.009686827659606934, -0.00915980339050293, -0.008632779121398926, -0.008105754852294922, -0.007578730583190918, -0.007051706314086914, -0.00652468204498291, -0.005997657775878906, -0.005470633506774902, -0.0049436092376708984, -0.0044165849685668945, -0.0038895606994628906, -0.0033625364303588867, -0.002835512161254883, -0.002308487892150879, -0.001781463623046875, -0.001254439353942871, -0.0007274150848388672, -0.00020039081573486328, 0.0003266334533691406, 0.0008536577224731445, 0.0013806819915771484, 0.0019077062606811523, 0.0024347305297851562, 0.00296175479888916, 0.003488779067993164, 0.004015803337097168, 0.004542827606201172, 0.005069851875305176, 0.00559687614440918, 0.006123900413513184, 0.0066509246826171875, 0.007177948951721191, 0.007704973220825195, 0.0082319974899292, 0.008759021759033203, 0.009286046028137207, 0.009813070297241211, 0.010340094566345215, 0.010867118835449219, 0.011394143104553223, 0.011921167373657227, 0.01244819164276123, 0.012975215911865234, 0.013502240180969238, 0.014029264450073242, 0.014556288719177246, 0.01508331298828125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 12.0, 17.0, 23.0, 28.0, 46.0, 78.0, 114.0, 122.0, 114.0, 121.0, 95.0, 80.0, 53.0, 47.0, 18.0, 16.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4926278293132782, -0.4795452356338501, -0.4664626121520996, -0.4533800184726715, -0.4402974247932434, -0.4272148013114929, -0.4141322076320648, -0.4010496139526367, -0.3879670202732086, -0.3748844265937805, -0.36180180311203003, -0.34871920943260193, -0.33563661575317383, -0.32255399227142334, -0.30947139859199524, -0.29638880491256714, -0.28330618143081665, -0.27022358775138855, -0.25714096426963806, -0.24405837059020996, -0.23097577691078186, -0.21789316833019257, -0.20481055974960327, -0.19172796607017517, -0.17864537239074707, -0.16556276381015778, -0.15248017013072968, -0.13939756155014038, -0.12631496787071228, -0.11323235929012299, -0.10014975816011429, -0.08706715703010559, -0.07398456335067749, -0.06090196222066879, -0.047819361090660095, -0.0347367562353611, -0.0216541551053524, -0.008571550250053406, 0.004511050879955292, 0.01759365200996399, 0.030676253139972687, 0.043758854269981384, 0.05684145539999008, 0.06992405652999878, 0.08300666511058807, 0.09608926624059677, 0.10917186737060547, 0.12225446850061417, 0.13533706963062286, 0.14841967821121216, 0.16150227189064026, 0.17458488047122955, 0.18766747415065765, 0.20075008273124695, 0.21383267641067505, 0.22691528499126434, 0.23999789357185364, 0.25308048725128174, 0.2661631107330322, 0.2792457044124603, 0.2923282980918884, 0.3054109215736389, 0.318493515253067, 0.3315761089324951, 0.3446587026119232]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 0.0, 7.0, 6.0, 9.0, 12.0, 16.0, 16.0, 28.0, 30.0, 33.0, 28.0, 41.0, 48.0, 49.0, 38.0, 51.0, 51.0, 48.0, 51.0, 51.0, 46.0, 48.0, 39.0, 46.0, 35.0, 37.0, 33.0, 20.0, 22.0, 18.0, 10.0, 6.0, 15.0, 3.0, 6.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1983073204755783, -0.19137267768383026, -0.18443803489208221, -0.17750339210033417, -0.17056876420974731, -0.16363412141799927, -0.15669947862625122, -0.14976483583450317, -0.14283019304275513, -0.13589555025100708, -0.12896090745925903, -0.12202627211809158, -0.11509162932634354, -0.10815698653459549, -0.10122235119342804, -0.09428770840167999, -0.08735306560993195, -0.0804184228181839, -0.07348378002643585, -0.0665491446852684, -0.059614501893520355, -0.05267985910177231, -0.04574522003531456, -0.03881058096885681, -0.031875938177108765, -0.024941297248005867, -0.01800665631890297, -0.011072015389800072, -0.004137374460697174, 0.002797268331050873, 0.009731907397508621, 0.01666654646396637, 0.023601189255714417, 0.030535830184817314, 0.03747047111392021, 0.04440511018037796, 0.05133975297212601, 0.058274395763874054, 0.0652090311050415, 0.07214367389678955, 0.0790783166885376, 0.08601295948028564, 0.09294760227203369, 0.09988223761320114, 0.10681688040494919, 0.11375152319669724, 0.12068615853786469, 0.12762080132961273, 0.13455544412136078, 0.14149008691310883, 0.14842472970485687, 0.15535937249660492, 0.16229400038719177, 0.16922864317893982, 0.17616328597068787, 0.1830979287624359, 0.19003257155418396, 0.196967214345932, 0.20390185713768005, 0.2108364999294281, 0.21777114272117615, 0.2247057855129242, 0.23164041340351105, 0.2385750561952591, 0.24550969898700714]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 8.0, 15.0, 20.0, 45.0, 76.0, 141.0, 302.0, 610.0, 1434.0, 3645.0, 10822.0, 35801.0, 152449.0, 578759.0, 200497.0, 43706.0, 13002.0, 4270.0, 1563.0, 680.0, 321.0, 154.0, 83.0, 64.0, 32.0, 14.0, 14.0, 8.0, 8.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33349609375, -0.32045745849609375, -0.3074188232421875, -0.29438018798828125, -0.281341552734375, -0.26830291748046875, -0.2552642822265625, -0.24222564697265625, -0.22918701171875, -0.21614837646484375, -0.2031097412109375, -0.19007110595703125, -0.177032470703125, -0.16399383544921875, -0.1509552001953125, -0.13791656494140625, -0.1248779296875, -0.11183929443359375, -0.0988006591796875, -0.08576202392578125, -0.072723388671875, -0.05968475341796875, -0.0466461181640625, -0.03360748291015625, -0.02056884765625, -0.00753021240234375, 0.0055084228515625, 0.01854705810546875, 0.031585693359375, 0.04462432861328125, 0.0576629638671875, 0.07070159912109375, 0.083740234375, 0.09677886962890625, 0.1098175048828125, 0.12285614013671875, 0.135894775390625, 0.14893341064453125, 0.1619720458984375, 0.17501068115234375, 0.18804931640625, 0.20108795166015625, 0.2141265869140625, 0.22716522216796875, 0.240203857421875, 0.25324249267578125, 0.2662811279296875, 0.27931976318359375, 0.2923583984375, 0.30539703369140625, 0.3184356689453125, 0.33147430419921875, 0.344512939453125, 0.35755157470703125, 0.3705902099609375, 0.38362884521484375, 0.39666748046875, 0.40970611572265625, 0.4227447509765625, 0.43578338623046875, 0.448822021484375, 0.46186065673828125, 0.4748992919921875, 0.48793792724609375, 0.5009765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 9.0, 12.0, 12.0, 8.0, 17.0, 20.0, 22.0, 26.0, 42.0, 33.0, 37.0, 39.0, 43.0, 44.0, 42.0, 50.0, 50.0, 36.0, 44.0, 42.0, 41.0, 42.0, 47.0, 42.0, 22.0, 29.0, 30.0, 20.0, 19.0, 16.0, 17.0, 8.0, 7.0, 8.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382568359375, -0.37010955810546875, -0.3576507568359375, -0.34519195556640625, -0.332733154296875, -0.32027435302734375, -0.3078155517578125, -0.29535675048828125, -0.28289794921875, -0.27043914794921875, -0.2579803466796875, -0.24552154541015625, -0.233062744140625, -0.22060394287109375, -0.2081451416015625, -0.19568634033203125, -0.1832275390625, -0.17076873779296875, -0.1583099365234375, -0.14585113525390625, -0.133392333984375, -0.12093353271484375, -0.1084747314453125, -0.09601593017578125, -0.08355712890625, -0.07109832763671875, -0.0586395263671875, -0.04618072509765625, -0.033721923828125, -0.02126312255859375, -0.0088043212890625, 0.00365447998046875, 0.01611328125, 0.02857208251953125, 0.0410308837890625, 0.05348968505859375, 0.065948486328125, 0.07840728759765625, 0.0908660888671875, 0.10332489013671875, 0.11578369140625, 0.12824249267578125, 0.1407012939453125, 0.15316009521484375, 0.165618896484375, 0.17807769775390625, 0.1905364990234375, 0.20299530029296875, 0.2154541015625, 0.22791290283203125, 0.2403717041015625, 0.25283050537109375, 0.265289306640625, 0.27774810791015625, 0.2902069091796875, 0.30266571044921875, 0.31512451171875, 0.32758331298828125, 0.3400421142578125, 0.35250091552734375, 0.364959716796875, 0.37741851806640625, 0.3898773193359375, 0.40233612060546875, 0.414794921875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 10.0, 14.0, 11.0, 22.0, 34.0, 33.0, 54.0, 94.0, 124.0, 244.0, 613.0, 1549.0, 5899.0, 27802.0, 199342.0, 686716.0, 102964.0, 16937.0, 3856.0, 1154.0, 448.0, 217.0, 122.0, 102.0, 61.0, 22.0, 27.0, 27.0, 16.0, 7.0, 5.0, 2.0, 5.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.59033203125, -0.5740928649902344, -0.5578536987304688, -0.5416145324707031, -0.5253753662109375, -0.5091361999511719, -0.49289703369140625, -0.4766578674316406, -0.460418701171875, -0.4441795349121094, -0.42794036865234375, -0.4117012023925781, -0.3954620361328125, -0.3792228698730469, -0.36298370361328125, -0.3467445373535156, -0.33050537109375, -0.3142662048339844, -0.29802703857421875, -0.2817878723144531, -0.2655487060546875, -0.24930953979492188, -0.23307037353515625, -0.21683120727539062, -0.200592041015625, -0.18435287475585938, -0.16811370849609375, -0.15187454223632812, -0.1356353759765625, -0.11939620971679688, -0.10315704345703125, -0.08691787719726562, -0.0706787109375, -0.054439544677734375, -0.03820037841796875, -0.021961212158203125, -0.0057220458984375, 0.010517120361328125, 0.02675628662109375, 0.042995452880859375, 0.059234619140625, 0.07547378540039062, 0.09171295166015625, 0.10795211791992188, 0.1241912841796875, 0.14043045043945312, 0.15666961669921875, 0.17290878295898438, 0.18914794921875, 0.20538711547851562, 0.22162628173828125, 0.23786544799804688, 0.2541046142578125, 0.2703437805175781, 0.28658294677734375, 0.3028221130371094, 0.319061279296875, 0.3353004455566406, 0.35153961181640625, 0.3677787780761719, 0.3840179443359375, 0.4002571105957031, 0.41649627685546875, 0.4327354431152344, 0.448974609375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 7.0, 4.0, 8.0, 7.0, 4.0, 11.0, 16.0, 13.0, 19.0, 14.0, 29.0, 23.0, 32.0, 26.0, 41.0, 47.0, 60.0, 37.0, 51.0, 50.0, 60.0, 50.0, 52.0, 53.0, 45.0, 36.0, 34.0, 27.0, 25.0, 17.0, 15.0, 17.0, 11.0, 6.0, 8.0, 10.0, 9.0, 6.0, 3.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379150390625, -0.3644981384277344, -0.34984588623046875, -0.3351936340332031, -0.3205413818359375, -0.3058891296386719, -0.29123687744140625, -0.2765846252441406, -0.261932373046875, -0.24728012084960938, -0.23262786865234375, -0.21797561645507812, -0.2033233642578125, -0.18867111206054688, -0.17401885986328125, -0.15936660766601562, -0.14471435546875, -0.13006210327148438, -0.11540985107421875, -0.10075759887695312, -0.0861053466796875, -0.07145309448242188, -0.05680084228515625, -0.042148590087890625, -0.027496337890625, -0.012844085693359375, 0.00180816650390625, 0.016460418701171875, 0.0311126708984375, 0.045764923095703125, 0.06041717529296875, 0.07506942749023438, 0.0897216796875, 0.10437393188476562, 0.11902618408203125, 0.13367843627929688, 0.1483306884765625, 0.16298294067382812, 0.17763519287109375, 0.19228744506835938, 0.206939697265625, 0.22159194946289062, 0.23624420166015625, 0.2508964538574219, 0.2655487060546875, 0.2802009582519531, 0.29485321044921875, 0.3095054626464844, 0.32415771484375, 0.3388099670410156, 0.35346221923828125, 0.3681144714355469, 0.3827667236328125, 0.3974189758300781, 0.41207122802734375, 0.4267234802246094, 0.441375732421875, 0.4560279846191406, 0.47068023681640625, 0.4853324890136719, 0.4999847412109375, 0.5146369934082031, 0.5292892456054688, 0.5439414978027344, 0.55859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 17.0, 12.0, 25.0, 53.0, 58.0, 133.0, 241.0, 524.0, 964.0, 2354.0, 6284.0, 21392.0, 113168.0, 608244.0, 240634.0, 38467.0, 9925.0, 3301.0, 1393.0, 619.0, 333.0, 155.0, 78.0, 49.0, 32.0, 19.0, 13.0, 15.0, 11.0, 6.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.128662109375, -0.12484359741210938, -0.12102508544921875, -0.11720657348632812, -0.1133880615234375, -0.10956954956054688, -0.10575103759765625, -0.10193252563476562, -0.098114013671875, -0.09429550170898438, -0.09047698974609375, -0.08665847778320312, -0.0828399658203125, -0.07902145385742188, -0.07520294189453125, -0.07138442993164062, -0.06756591796875, -0.06374740600585938, -0.05992889404296875, -0.056110382080078125, -0.0522918701171875, -0.048473358154296875, -0.04465484619140625, -0.040836334228515625, -0.037017822265625, -0.033199310302734375, -0.02938079833984375, -0.025562286376953125, -0.0217437744140625, -0.017925262451171875, -0.01410675048828125, -0.010288238525390625, -0.0064697265625, -0.002651214599609375, 0.00116729736328125, 0.004985809326171875, 0.0088043212890625, 0.012622833251953125, 0.01644134521484375, 0.020259857177734375, 0.024078369140625, 0.027896881103515625, 0.03171539306640625, 0.035533905029296875, 0.0393524169921875, 0.043170928955078125, 0.04698944091796875, 0.050807952880859375, 0.05462646484375, 0.058444976806640625, 0.06226348876953125, 0.06608200073242188, 0.0699005126953125, 0.07371902465820312, 0.07753753662109375, 0.08135604858398438, 0.085174560546875, 0.08899307250976562, 0.09281158447265625, 0.09663009643554688, 0.1004486083984375, 0.10426712036132812, 0.10808563232421875, 0.11190414428710938, 0.11572265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 9.0, 12.0, 8.0, 15.0, 25.0, 21.0, 42.0, 47.0, 81.0, 92.0, 149.0, 134.0, 106.0, 85.0, 49.0, 43.0, 30.0, 24.0, 11.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.676248550415039e-05, -2.5925226509571075e-05, -2.508796751499176e-05, -2.4250708520412445e-05, -2.341344952583313e-05, -2.2576190531253815e-05, -2.17389315366745e-05, -2.0901672542095184e-05, -2.006441354751587e-05, -1.9227154552936554e-05, -1.838989555835724e-05, -1.7552636563777924e-05, -1.671537756919861e-05, -1.5878118574619293e-05, -1.5040859580039978e-05, -1.4203600585460663e-05, -1.3366341590881348e-05, -1.2529082596302032e-05, -1.1691823601722717e-05, -1.0854564607143402e-05, -1.0017305612564087e-05, -9.180046617984772e-06, -8.342787623405457e-06, -7.505528628826141e-06, -6.668269634246826e-06, -5.831010639667511e-06, -4.993751645088196e-06, -4.156492650508881e-06, -3.3192336559295654e-06, -2.4819746613502502e-06, -1.644715666770935e-06, -8.074566721916199e-07, 2.9802322387695312e-08, 8.670613169670105e-07, 1.7043203115463257e-06, 2.541579306125641e-06, 3.378838300704956e-06, 4.216097295284271e-06, 5.0533562898635864e-06, 5.890615284442902e-06, 6.727874279022217e-06, 7.565133273601532e-06, 8.402392268180847e-06, 9.239651262760162e-06, 1.0076910257339478e-05, 1.0914169251918793e-05, 1.1751428246498108e-05, 1.2588687241077423e-05, 1.3425946235656738e-05, 1.4263205230236053e-05, 1.5100464224815369e-05, 1.5937723219394684e-05, 1.6774982213974e-05, 1.7612241208553314e-05, 1.844950020313263e-05, 1.9286759197711945e-05, 2.012401819229126e-05, 2.0961277186870575e-05, 2.179853618144989e-05, 2.2635795176029205e-05, 2.347305417060852e-05, 2.4310313165187836e-05, 2.514757215976715e-05, 2.5984831154346466e-05, 2.682209014892578e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 11.0, 15.0, 16.0, 33.0, 44.0, 101.0, 145.0, 305.0, 639.0, 1399.0, 3277.0, 9970.0, 43700.0, 353148.0, 544833.0, 69956.0, 13450.0, 4237.0, 1661.0, 756.0, 371.0, 205.0, 96.0, 66.0, 37.0, 20.0, 12.0, 9.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.181884765625, -0.176849365234375, -0.17181396484375, -0.166778564453125, -0.1617431640625, -0.156707763671875, -0.15167236328125, -0.146636962890625, -0.1416015625, -0.136566162109375, -0.13153076171875, -0.126495361328125, -0.1214599609375, -0.116424560546875, -0.11138916015625, -0.106353759765625, -0.101318359375, -0.096282958984375, -0.09124755859375, -0.086212158203125, -0.0811767578125, -0.076141357421875, -0.07110595703125, -0.066070556640625, -0.06103515625, -0.055999755859375, -0.05096435546875, -0.045928955078125, -0.0408935546875, -0.035858154296875, -0.03082275390625, -0.025787353515625, -0.020751953125, -0.015716552734375, -0.01068115234375, -0.005645751953125, -0.0006103515625, 0.004425048828125, 0.00946044921875, 0.014495849609375, 0.01953125, 0.024566650390625, 0.02960205078125, 0.034637451171875, 0.0396728515625, 0.044708251953125, 0.04974365234375, 0.054779052734375, 0.059814453125, 0.064849853515625, 0.06988525390625, 0.074920654296875, 0.0799560546875, 0.084991455078125, 0.09002685546875, 0.095062255859375, 0.10009765625, 0.105133056640625, 0.11016845703125, 0.115203857421875, 0.1202392578125, 0.125274658203125, 0.13031005859375, 0.135345458984375, 0.140380859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 9.0, 8.0, 10.0, 15.0, 14.0, 24.0, 43.0, 46.0, 54.0, 56.0, 67.0, 93.0, 129.0, 83.0, 72.0, 53.0, 32.0, 36.0, 22.0, 15.0, 19.0, 15.0, 12.0, 14.0, 6.0, 6.0, 10.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037689208984375, -0.035985469818115234, -0.03428173065185547, -0.0325779914855957, -0.030874252319335938, -0.029170513153076172, -0.027466773986816406, -0.02576303482055664, -0.024059295654296875, -0.02235555648803711, -0.020651817321777344, -0.018948078155517578, -0.017244338989257812, -0.015540599822998047, -0.013836860656738281, -0.012133121490478516, -0.01042938232421875, -0.008725643157958984, -0.007021903991699219, -0.005318164825439453, -0.0036144256591796875, -0.0019106864929199219, -0.00020694732666015625, 0.0014967918395996094, 0.003200531005859375, 0.004904270172119141, 0.006608009338378906, 0.008311748504638672, 0.010015487670898438, 0.011719226837158203, 0.013422966003417969, 0.015126705169677734, 0.0168304443359375, 0.018534183502197266, 0.02023792266845703, 0.021941661834716797, 0.023645401000976562, 0.025349140167236328, 0.027052879333496094, 0.02875661849975586, 0.030460357666015625, 0.03216409683227539, 0.033867835998535156, 0.03557157516479492, 0.03727531433105469, 0.03897905349731445, 0.04068279266357422, 0.042386531829833984, 0.04409027099609375, 0.045794010162353516, 0.04749774932861328, 0.04920148849487305, 0.05090522766113281, 0.05260896682739258, 0.054312705993652344, 0.05601644515991211, 0.057720184326171875, 0.05942392349243164, 0.061127662658691406, 0.06283140182495117, 0.06453514099121094, 0.0662388801574707, 0.06794261932373047, 0.06964635848999023, 0.07135009765625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 12.0, 31.0, 94.0, 153.0, 255.0, 230.0, 138.0, 64.0, 22.0, 11.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5363852977752686, -0.4763522744178772, -0.41631922125816345, -0.3562861979007721, -0.29625314474105835, -0.236220121383667, -0.17618709802627563, -0.11615404486656189, -0.05612102150917053, 0.003912013024091721, 0.06394504755735397, 0.12397807836532593, 0.18401111662387848, 0.24404415488243103, 0.3040771782398224, 0.36411023139953613, 0.4241432547569275, 0.48417627811431885, 0.5442093014717102, 0.6042423248291016, 0.6642754077911377, 0.724308431148529, 0.7843414545059204, 0.8443745374679565, 0.9044075012207031, 0.9644405245780945, 1.0244735479354858, 1.084506630897522, 1.1445395946502686, 1.2045726776123047, 1.2646057605743408, 1.3246387243270874, 1.3846718072891235, 1.4447048902511597, 1.5047378540039062, 1.5647709369659424, 1.624803900718689, 1.684836983680725, 1.7448699474334717, 1.8049030303955078, 1.864936113357544, 1.92496919631958, 1.9850021600723267, 2.0450351238250732, 2.1050682067871094, 2.1651012897491455, 2.2251343727111816, 2.2851674556732178, 2.345200300216675, 2.405233383178711, 2.465266466140747, 2.525299310684204, 2.5853323936462402, 2.6453654766082764, 2.7053985595703125, 2.7654316425323486, 2.8254647254943848, 2.885497808456421, 2.945530891418457, 3.005563735961914, 3.06559681892395, 3.1256299018859863, 3.1856629848480225, 3.2456960678100586, 3.3057289123535156]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 0.0, 3.0, 6.0, 6.0, 8.0, 5.0, 6.0, 5.0, 7.0, 10.0, 15.0, 16.0, 23.0, 21.0, 37.0, 41.0, 37.0, 28.0, 40.0, 31.0, 37.0, 47.0, 42.0, 38.0, 36.0, 31.0, 39.0, 40.0, 33.0, 33.0, 35.0, 33.0, 33.0, 31.0, 17.0, 21.0, 17.0, 18.0, 18.0, 11.0, 19.0, 6.0, 12.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7475723028182983, -0.7260862588882446, -0.7046001553535461, -0.6831140518188477, -0.661628007888794, -0.6401419639587402, -0.6186558604240417, -0.5971697568893433, -0.5756837129592896, -0.5541976690292358, -0.5327115654945374, -0.5112254619598389, -0.48973941802978516, -0.46825334429740906, -0.44676727056503296, -0.42528119683265686, -0.40379512310028076, -0.38230904936790466, -0.36082297563552856, -0.33933690190315247, -0.31785082817077637, -0.29636475443840027, -0.27487868070602417, -0.25339260697364807, -0.23190653324127197, -0.21042045950889587, -0.18893438577651978, -0.16744831204414368, -0.14596223831176758, -0.12447616457939148, -0.10299009084701538, -0.08150401711463928, -0.06001788377761841, -0.03853181004524231, -0.01704573631286621, 0.004440337419509888, 0.025926411151885986, 0.047412484884262085, 0.06889855861663818, 0.09038463234901428, 0.11187070608139038, 0.13335677981376648, 0.15484285354614258, 0.17632892727851868, 0.19781500101089478, 0.21930107474327087, 0.24078714847564697, 0.26227322220802307, 0.28375929594039917, 0.30524536967277527, 0.32673144340515137, 0.34821751713752747, 0.36970359086990356, 0.39118966460227966, 0.41267573833465576, 0.43416181206703186, 0.45564788579940796, 0.47713395953178406, 0.49862003326416016, 0.5201060771942139, 0.5415921807289124, 0.5630782842636108, 0.5845643281936646, 0.6060503721237183, 0.6275364756584167]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 6.0, 7.0, 12.0, 13.0, 11.0, 18.0, 28.0, 29.0, 42.0, 70.0, 107.0, 185.0, 428.0, 1104.0, 3181.0, 12363.0, 79582.0, 1215886.0, 2620087.0, 227272.0, 25352.0, 5595.0, 1673.0, 595.0, 245.0, 134.0, 66.0, 42.0, 33.0, 29.0, 13.0, 23.0, 18.0, 9.0, 8.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.65673828125, -0.6399879455566406, -0.6232376098632812, -0.6064872741699219, -0.5897369384765625, -0.5729866027832031, -0.5562362670898438, -0.5394859313964844, -0.522735595703125, -0.5059852600097656, -0.48923492431640625, -0.4724845886230469, -0.4557342529296875, -0.4389839172363281, -0.42223358154296875, -0.4054832458496094, -0.38873291015625, -0.3719825744628906, -0.35523223876953125, -0.3384819030761719, -0.3217315673828125, -0.3049812316894531, -0.28823089599609375, -0.2714805603027344, -0.254730224609375, -0.23797988891601562, -0.22122955322265625, -0.20447921752929688, -0.1877288818359375, -0.17097854614257812, -0.15422821044921875, -0.13747787475585938, -0.1207275390625, -0.10397720336914062, -0.08722686767578125, -0.07047653198242188, -0.0537261962890625, -0.036975860595703125, -0.02022552490234375, -0.003475189208984375, 0.013275146484375, 0.030025482177734375, 0.04677581787109375, 0.06352615356445312, 0.0802764892578125, 0.09702682495117188, 0.11377716064453125, 0.13052749633789062, 0.14727783203125, 0.16402816772460938, 0.18077850341796875, 0.19752883911132812, 0.2142791748046875, 0.23102951049804688, 0.24777984619140625, 0.2645301818847656, 0.281280517578125, 0.2980308532714844, 0.31478118896484375, 0.3315315246582031, 0.3482818603515625, 0.3650321960449219, 0.38178253173828125, 0.3985328674316406, 0.415283203125]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 7.0, 10.0, 11.0, 10.0, 17.0, 19.0, 9.0, 28.0, 21.0, 23.0, 28.0, 46.0, 34.0, 36.0, 41.0, 31.0, 54.0, 40.0, 45.0, 43.0, 33.0, 42.0, 28.0, 46.0, 27.0, 39.0, 34.0, 30.0, 35.0, 16.0, 16.0, 14.0, 16.0, 14.0, 10.0, 10.0, 13.0, 7.0, 6.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.22265625, -0.21603775024414062, -0.20941925048828125, -0.20280075073242188, -0.1961822509765625, -0.18956375122070312, -0.18294525146484375, -0.17632675170898438, -0.169708251953125, -0.16308975219726562, -0.15647125244140625, -0.14985275268554688, -0.1432342529296875, -0.13661575317382812, -0.12999725341796875, -0.12337875366210938, -0.11676025390625, -0.11014175415039062, -0.10352325439453125, -0.09690475463867188, -0.0902862548828125, -0.08366775512695312, -0.07704925537109375, -0.07043075561523438, -0.063812255859375, -0.057193756103515625, -0.05057525634765625, -0.043956756591796875, -0.0373382568359375, -0.030719757080078125, -0.02410125732421875, -0.017482757568359375, -0.0108642578125, -0.004245758056640625, 0.00237274169921875, 0.008991241455078125, 0.0156097412109375, 0.022228240966796875, 0.02884674072265625, 0.035465240478515625, 0.042083740234375, 0.048702239990234375, 0.05532073974609375, 0.061939239501953125, 0.0685577392578125, 0.07517623901367188, 0.08179473876953125, 0.08841323852539062, 0.09503173828125, 0.10165023803710938, 0.10826873779296875, 0.11488723754882812, 0.1215057373046875, 0.12812423706054688, 0.13474273681640625, 0.14136123657226562, 0.147979736328125, 0.15459823608398438, 0.16121673583984375, 0.16783523559570312, 0.1744537353515625, 0.18107223510742188, 0.18769073486328125, 0.19430923461914062, 0.200927734375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 18.0, 24.0, 36.0, 96.0, 246.0, 560.0, 1908.0, 11557.0, 690046.0, 3452386.0, 32813.0, 3128.0, 855.0, 315.0, 145.0, 52.0, 26.0, 26.0, 13.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.0227508544921875, -0.988861083984375, -0.9549713134765625, -0.92108154296875, -0.8871917724609375, -0.853302001953125, -0.8194122314453125, -0.7855224609375, -0.7516326904296875, -0.717742919921875, -0.6838531494140625, -0.64996337890625, -0.6160736083984375, -0.582183837890625, -0.5482940673828125, -0.514404296875, -0.4805145263671875, -0.446624755859375, -0.4127349853515625, -0.37884521484375, -0.3449554443359375, -0.311065673828125, -0.2771759033203125, -0.2432861328125, -0.2093963623046875, -0.175506591796875, -0.1416168212890625, -0.10772705078125, -0.0738372802734375, -0.039947509765625, -0.0060577392578125, 0.02783203125, 0.0617218017578125, 0.095611572265625, 0.1295013427734375, 0.16339111328125, 0.1972808837890625, 0.231170654296875, 0.2650604248046875, 0.2989501953125, 0.3328399658203125, 0.366729736328125, 0.4006195068359375, 0.43450927734375, 0.4683990478515625, 0.502288818359375, 0.5361785888671875, 0.570068359375, 0.6039581298828125, 0.637847900390625, 0.6717376708984375, 0.70562744140625, 0.7395172119140625, 0.773406982421875, 0.8072967529296875, 0.8411865234375, 0.8750762939453125, 0.908966064453125, 0.9428558349609375, 0.97674560546875, 1.0106353759765625, 1.044525146484375, 1.0784149169921875, 1.1123046875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 12.0, 3.0, 11.0, 18.0, 17.0, 50.0, 54.0, 69.0, 121.0, 207.0, 261.0, 368.0, 487.0, 559.0, 519.0, 411.0, 278.0, 227.0, 138.0, 87.0, 44.0, 45.0, 27.0, 20.0, 10.0, 8.0, 12.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1324462890625, -0.12764739990234375, -0.1228485107421875, -0.11804962158203125, -0.113250732421875, -0.10845184326171875, -0.1036529541015625, -0.09885406494140625, -0.09405517578125, -0.08925628662109375, -0.0844573974609375, -0.07965850830078125, -0.074859619140625, -0.07006072998046875, -0.0652618408203125, -0.06046295166015625, -0.0556640625, -0.05086517333984375, -0.0460662841796875, -0.04126739501953125, -0.036468505859375, -0.03166961669921875, -0.0268707275390625, -0.02207183837890625, -0.01727294921875, -0.01247406005859375, -0.0076751708984375, -0.00287628173828125, 0.001922607421875, 0.00672149658203125, 0.0115203857421875, 0.01631927490234375, 0.0211181640625, 0.02591705322265625, 0.0307159423828125, 0.03551483154296875, 0.040313720703125, 0.04511260986328125, 0.0499114990234375, 0.05471038818359375, 0.05950927734375, 0.06430816650390625, 0.0691070556640625, 0.07390594482421875, 0.078704833984375, 0.08350372314453125, 0.0883026123046875, 0.09310150146484375, 0.097900390625, 0.10269927978515625, 0.1074981689453125, 0.11229705810546875, 0.117095947265625, 0.12189483642578125, 0.1266937255859375, 0.13149261474609375, 0.13629150390625, 0.14109039306640625, 0.1458892822265625, 0.15068817138671875, 0.155487060546875, 0.16028594970703125, 0.1650848388671875, 0.16988372802734375, 0.1746826171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 6.0, 8.0, 11.0, 7.0, 10.0, 13.0, 15.0, 22.0, 28.0, 35.0, 31.0, 38.0, 47.0, 37.0, 35.0, 70.0, 50.0, 60.0, 48.0, 53.0, 45.0, 59.0, 51.0, 37.0, 26.0, 30.0, 19.0, 21.0, 18.0, 15.0, 16.0, 13.0, 7.0, 6.0, 5.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.3278948962688446, -0.3179178535938263, -0.3079407811164856, -0.2979637384414673, -0.287986695766449, -0.2780096232891083, -0.26803258061408997, -0.25805550813674927, -0.24807846546173096, -0.23810140788555145, -0.22812435030937195, -0.21814730763435364, -0.20817025005817413, -0.19819319248199463, -0.18821614980697632, -0.17823909223079681, -0.1682620346546173, -0.1582849770784378, -0.1483079195022583, -0.13833087682724, -0.12835381925106049, -0.11837676167488098, -0.10839971154928207, -0.09842266142368317, -0.08844560384750366, -0.07846854627132416, -0.06849149614572525, -0.058514442294836044, -0.04853738844394684, -0.03856033459305763, -0.028583280742168427, -0.01860623061656952, -0.008629143238067627, 0.001347910612821579, 0.011324964463710785, 0.02130201831459999, 0.0312790721654892, 0.0412561260163784, 0.05123317986726761, 0.061210229992866516, 0.07118728756904602, 0.08116434514522552, 0.09114139527082443, 0.10111844539642334, 0.11109550297260284, 0.12107256054878235, 0.13104960322380066, 0.14102666079998016, 0.15100371837615967, 0.16098077595233917, 0.17095783352851868, 0.180934876203537, 0.1909119337797165, 0.200888991355896, 0.2108660340309143, 0.2208430916070938, 0.23082014918327332, 0.24079720675945282, 0.2507742643356323, 0.26075130701065063, 0.27072834968566895, 0.28070542216300964, 0.29068246483802795, 0.30065953731536865, 0.31063657999038696]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 5.0, 6.0, 5.0, 17.0, 9.0, 6.0, 8.0, 12.0, 17.0, 17.0, 17.0, 25.0, 24.0, 27.0, 32.0, 39.0, 32.0, 39.0, 37.0, 29.0, 42.0, 33.0, 37.0, 44.0, 30.0, 40.0, 33.0, 35.0, 24.0, 24.0, 22.0, 26.0, 32.0, 31.0, 24.0, 17.0, 21.0, 17.0, 11.0, 15.0, 5.0, 4.0, 4.0, 7.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.26479968428611755, -0.25700971484184265, -0.24921973049640656, -0.24142974615097046, -0.23363977670669556, -0.22584979236125946, -0.21805980801582336, -0.21026983857154846, -0.20247985422611237, -0.19468986988067627, -0.18689990043640137, -0.17910991609096527, -0.17131993174552917, -0.16352996230125427, -0.15573997795581818, -0.14794999361038208, -0.14016002416610718, -0.13237003982067108, -0.12458007037639618, -0.11679008603096008, -0.10900010913610458, -0.10121013224124908, -0.09342014789581299, -0.08563017100095749, -0.07784019410610199, -0.07005021721124649, -0.06226023659110069, -0.054470255970954895, -0.046680279076099396, -0.038890302181243896, -0.0311003215610981, -0.0233103409409523, -0.015520364046096802, -0.007730385288596153, 5.959346890449524e-05, 0.007849572226405144, 0.015639550983905792, 0.02342952787876129, 0.03121950849890709, 0.03900948911905289, 0.046799466013908386, 0.054589442908763885, 0.06237942352890968, 0.07016940414905548, 0.07795938104391098, 0.08574935793876648, 0.09353934228420258, 0.10132931917905807, 0.10911929607391357, 0.11690927296876907, 0.12469924986362457, 0.13248923420906067, 0.14027920365333557, 0.14806918799877167, 0.15585917234420776, 0.16364914178848267, 0.17143912613391876, 0.17922911047935486, 0.18701907992362976, 0.19480906426906586, 0.20259904861450195, 0.21038901805877686, 0.21817900240421295, 0.22596898674964905, 0.23375895619392395]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 5.0, 16.0, 30.0, 31.0, 37.0, 48.0, 97.0, 127.0, 173.0, 297.0, 430.0, 623.0, 931.0, 1433.0, 2208.0, 3395.0, 5096.0, 7739.0, 11739.0, 21646.0, 59683.0, 207997.0, 394308.0, 212392.0, 61132.0, 21872.0, 11971.0, 7784.0, 5264.0, 3459.0, 2224.0, 1515.0, 958.0, 652.0, 388.0, 282.0, 173.0, 107.0, 82.0, 65.0, 35.0, 29.0, 25.0, 13.0, 16.0, 7.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.07598876953125, -0.07341384887695312, -0.07083892822265625, -0.06826400756835938, -0.0656890869140625, -0.06311416625976562, -0.06053924560546875, -0.057964324951171875, -0.055389404296875, -0.052814483642578125, -0.05023956298828125, -0.047664642333984375, -0.0450897216796875, -0.042514801025390625, -0.03993988037109375, -0.037364959716796875, -0.0347900390625, -0.032215118408203125, -0.02964019775390625, -0.027065277099609375, -0.0244903564453125, -0.021915435791015625, -0.01934051513671875, -0.016765594482421875, -0.014190673828125, -0.011615753173828125, -0.00904083251953125, -0.006465911865234375, -0.0038909912109375, -0.001316070556640625, 0.00125885009765625, 0.003833770751953125, 0.00640869140625, 0.008983612060546875, 0.01155853271484375, 0.014133453369140625, 0.0167083740234375, 0.019283294677734375, 0.02185821533203125, 0.024433135986328125, 0.027008056640625, 0.029582977294921875, 0.03215789794921875, 0.034732818603515625, 0.0373077392578125, 0.039882659912109375, 0.04245758056640625, 0.045032501220703125, 0.047607421875, 0.050182342529296875, 0.05275726318359375, 0.055332183837890625, 0.0579071044921875, 0.060482025146484375, 0.06305694580078125, 0.06563186645507812, 0.068206787109375, 0.07078170776367188, 0.07335662841796875, 0.07593154907226562, 0.0785064697265625, 0.08108139038085938, 0.08365631103515625, 0.08623123168945312, 0.08880615234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 4.0, 3.0, 5.0, 8.0, 11.0, 12.0, 8.0, 14.0, 12.0, 16.0, 12.0, 22.0, 24.0, 20.0, 33.0, 35.0, 33.0, 40.0, 32.0, 35.0, 36.0, 44.0, 34.0, 37.0, 47.0, 38.0, 36.0, 26.0, 39.0, 17.0, 30.0, 37.0, 16.0, 28.0, 19.0, 26.0, 14.0, 21.0, 18.0, 11.0, 10.0, 16.0, 5.0, 8.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.1614990234375, -0.15656661987304688, -0.15163421630859375, -0.14670181274414062, -0.1417694091796875, -0.13683700561523438, -0.13190460205078125, -0.12697219848632812, -0.122039794921875, -0.11710739135742188, -0.11217498779296875, -0.10724258422851562, -0.1023101806640625, -0.09737777709960938, -0.09244537353515625, -0.08751296997070312, -0.08258056640625, -0.07764816284179688, -0.07271575927734375, -0.06778335571289062, -0.0628509521484375, -0.057918548583984375, -0.05298614501953125, -0.048053741455078125, -0.043121337890625, -0.038188934326171875, -0.03325653076171875, -0.028324127197265625, -0.0233917236328125, -0.018459320068359375, -0.01352691650390625, -0.008594512939453125, -0.003662109375, 0.001270294189453125, 0.00620269775390625, 0.011135101318359375, 0.0160675048828125, 0.020999908447265625, 0.02593231201171875, 0.030864715576171875, 0.035797119140625, 0.040729522705078125, 0.04566192626953125, 0.050594329833984375, 0.0555267333984375, 0.060459136962890625, 0.06539154052734375, 0.07032394409179688, 0.07525634765625, 0.08018875122070312, 0.08512115478515625, 0.09005355834960938, 0.0949859619140625, 0.09991836547851562, 0.10485076904296875, 0.10978317260742188, 0.114715576171875, 0.11964797973632812, 0.12458038330078125, 0.12951278686523438, 0.1344451904296875, 0.13937759399414062, 0.14430999755859375, 0.14924240112304688, 0.1541748046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 4.0, 9.0, 13.0, 16.0, 22.0, 39.0, 42.0, 73.0, 99.0, 159.0, 241.0, 386.0, 633.0, 1140.0, 1982.0, 3690.0, 7371.0, 16338.0, 42353.0, 147229.0, 404680.0, 288805.0, 82929.0, 26900.0, 11408.0, 5374.0, 2841.0, 1505.0, 875.0, 482.0, 303.0, 204.0, 115.0, 94.0, 54.0, 39.0, 29.0, 19.0, 18.0, 6.0, 7.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07366943359375, -0.07119560241699219, -0.06872177124023438, -0.06624794006347656, -0.06377410888671875, -0.06130027770996094, -0.058826446533203125, -0.05635261535644531, -0.0538787841796875, -0.05140495300292969, -0.048931121826171875, -0.04645729064941406, -0.04398345947265625, -0.04150962829589844, -0.039035797119140625, -0.03656196594238281, -0.034088134765625, -0.03161430358886719, -0.029140472412109375, -0.026666641235351562, -0.02419281005859375, -0.021718978881835938, -0.019245147705078125, -0.016771316528320312, -0.0142974853515625, -0.011823654174804688, -0.009349822998046875, -0.0068759918212890625, -0.00440216064453125, -0.0019283294677734375, 0.000545501708984375, 0.0030193328857421875, 0.0054931640625, 0.007966995239257812, 0.010440826416015625, 0.012914657592773438, 0.01538848876953125, 0.017862319946289062, 0.020336151123046875, 0.022809982299804688, 0.0252838134765625, 0.027757644653320312, 0.030231475830078125, 0.03270530700683594, 0.03517913818359375, 0.03765296936035156, 0.040126800537109375, 0.04260063171386719, 0.045074462890625, 0.04754829406738281, 0.050022125244140625, 0.05249595642089844, 0.05496978759765625, 0.05744361877441406, 0.059917449951171875, 0.06239128112792969, 0.0648651123046875, 0.06733894348144531, 0.06981277465820312, 0.07228660583496094, 0.07476043701171875, 0.07723426818847656, 0.07970809936523438, 0.08218193054199219, 0.08465576171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 7.0, 7.0, 5.0, 6.0, 9.0, 8.0, 11.0, 17.0, 12.0, 7.0, 23.0, 28.0, 26.0, 26.0, 28.0, 44.0, 54.0, 31.0, 32.0, 47.0, 56.0, 35.0, 50.0, 52.0, 39.0, 47.0, 33.0, 43.0, 25.0, 36.0, 27.0, 26.0, 20.0, 19.0, 7.0, 12.0, 12.0, 6.0, 11.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.4284095764160156, -0.41516876220703125, -0.4019279479980469, -0.3886871337890625, -0.3754463195800781, -0.36220550537109375, -0.3489646911621094, -0.335723876953125, -0.3224830627441406, -0.30924224853515625, -0.2960014343261719, -0.2827606201171875, -0.2695198059082031, -0.25627899169921875, -0.24303817749023438, -0.22979736328125, -0.21655654907226562, -0.20331573486328125, -0.19007492065429688, -0.1768341064453125, -0.16359329223632812, -0.15035247802734375, -0.13711166381835938, -0.123870849609375, -0.11063003540039062, -0.09738922119140625, -0.08414840698242188, -0.0709075927734375, -0.057666778564453125, -0.04442596435546875, -0.031185150146484375, -0.0179443359375, -0.004703521728515625, 0.00853729248046875, 0.021778106689453125, 0.0350189208984375, 0.048259735107421875, 0.06150054931640625, 0.07474136352539062, 0.087982177734375, 0.10122299194335938, 0.11446380615234375, 0.12770462036132812, 0.1409454345703125, 0.15418624877929688, 0.16742706298828125, 0.18066787719726562, 0.19390869140625, 0.20714950561523438, 0.22039031982421875, 0.23363113403320312, 0.2468719482421875, 0.2601127624511719, 0.27335357666015625, 0.2865943908691406, 0.299835205078125, 0.3130760192871094, 0.32631683349609375, 0.3395576477050781, 0.3527984619140625, 0.3660392761230469, 0.37928009033203125, 0.3925209045410156, 0.40576171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 8.0, 7.0, 11.0, 7.0, 15.0, 25.0, 52.0, 61.0, 104.0, 171.0, 380.0, 621.0, 1297.0, 2608.0, 5886.0, 16039.0, 65488.0, 446853.0, 422027.0, 60863.0, 15243.0, 5822.0, 2385.0, 1221.0, 543.0, 330.0, 182.0, 111.0, 73.0, 42.0, 28.0, 20.0, 14.0, 9.0, 3.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05694580078125, -0.05531787872314453, -0.05368995666503906, -0.052062034606933594, -0.050434112548828125, -0.048806190490722656, -0.04717826843261719, -0.04555034637451172, -0.04392242431640625, -0.04229450225830078, -0.04066658020019531, -0.039038658142089844, -0.037410736083984375, -0.035782814025878906, -0.03415489196777344, -0.03252696990966797, -0.0308990478515625, -0.02927112579345703, -0.027643203735351562, -0.026015281677246094, -0.024387359619140625, -0.022759437561035156, -0.021131515502929688, -0.01950359344482422, -0.01787567138671875, -0.01624774932861328, -0.014619827270507812, -0.012991905212402344, -0.011363983154296875, -0.009736061096191406, -0.008108139038085938, -0.006480216979980469, -0.004852294921875, -0.0032243728637695312, -0.0015964508056640625, 3.147125244140625e-05, 0.001659393310546875, 0.0032873153686523438, 0.0049152374267578125, 0.006543159484863281, 0.00817108154296875, 0.009799003601074219, 0.011426925659179688, 0.013054847717285156, 0.014682769775390625, 0.016310691833496094, 0.017938613891601562, 0.01956653594970703, 0.0211944580078125, 0.02282238006591797, 0.024450302124023438, 0.026078224182128906, 0.027706146240234375, 0.029334068298339844, 0.030961990356445312, 0.03258991241455078, 0.03421783447265625, 0.03584575653076172, 0.03747367858886719, 0.039101600646972656, 0.040729522705078125, 0.042357444763183594, 0.04398536682128906, 0.04561328887939453, 0.0472412109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 13.0, 8.0, 37.0, 54.0, 89.0, 92.0, 131.0, 143.0, 139.0, 92.0, 51.0, 33.0, 26.0, 14.0, 9.0, 4.0, 7.0, 3.0, 6.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.063678741455078e-05, -2.978648990392685e-05, -2.8936192393302917e-05, -2.8085894882678986e-05, -2.7235597372055054e-05, -2.6385299861431122e-05, -2.553500235080719e-05, -2.4684704840183258e-05, -2.3834407329559326e-05, -2.2984109818935394e-05, -2.2133812308311462e-05, -2.128351479768753e-05, -2.04332172870636e-05, -1.9582919776439667e-05, -1.8732622265815735e-05, -1.7882324755191803e-05, -1.703202724456787e-05, -1.618172973394394e-05, -1.5331432223320007e-05, -1.4481134712696075e-05, -1.3630837202072144e-05, -1.2780539691448212e-05, -1.193024218082428e-05, -1.1079944670200348e-05, -1.0229647159576416e-05, -9.379349648952484e-06, -8.529052138328552e-06, -7.67875462770462e-06, -6.8284571170806885e-06, -5.978159606456757e-06, -5.127862095832825e-06, -4.277564585208893e-06, -3.427267074584961e-06, -2.576969563961029e-06, -1.7266720533370972e-06, -8.763745427131653e-07, -2.60770320892334e-08, 8.242204785346985e-07, 1.6745179891586304e-06, 2.5248154997825623e-06, 3.375113010406494e-06, 4.225410521030426e-06, 5.075708031654358e-06, 5.92600554227829e-06, 6.776303052902222e-06, 7.6266005635261536e-06, 8.476898074150085e-06, 9.327195584774017e-06, 1.017749309539795e-05, 1.1027790606021881e-05, 1.1878088116645813e-05, 1.2728385627269745e-05, 1.3578683137893677e-05, 1.4428980648517609e-05, 1.527927815914154e-05, 1.6129575669765472e-05, 1.6979873180389404e-05, 1.7830170691013336e-05, 1.8680468201637268e-05, 1.95307657122612e-05, 2.0381063222885132e-05, 2.1231360733509064e-05, 2.2081658244132996e-05, 2.2931955754756927e-05, 2.378225326538086e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 17.0, 18.0, 28.0, 35.0, 65.0, 112.0, 157.0, 292.0, 540.0, 883.0, 1534.0, 2859.0, 5364.0, 11616.0, 26500.0, 73937.0, 221073.0, 374496.0, 210661.0, 70244.0, 25643.0, 10862.0, 5357.0, 2662.0, 1516.0, 835.0, 459.0, 284.0, 184.0, 108.0, 68.0, 56.0, 41.0, 11.0, 8.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.036468505859375, -0.03537893295288086, -0.03428936004638672, -0.03319978713989258, -0.03211021423339844, -0.031020641326904297, -0.029931068420410156, -0.028841495513916016, -0.027751922607421875, -0.026662349700927734, -0.025572776794433594, -0.024483203887939453, -0.023393630981445312, -0.022304058074951172, -0.02121448516845703, -0.02012491226196289, -0.01903533935546875, -0.01794576644897461, -0.01685619354248047, -0.015766620635986328, -0.014677047729492188, -0.013587474822998047, -0.012497901916503906, -0.011408329010009766, -0.010318756103515625, -0.009229183197021484, -0.008139610290527344, -0.007050037384033203, -0.0059604644775390625, -0.004870891571044922, -0.0037813186645507812, -0.0026917457580566406, -0.0016021728515625, -0.0005125999450683594, 0.0005769729614257812, 0.0016665458679199219, 0.0027561187744140625, 0.003845691680908203, 0.004935264587402344, 0.006024837493896484, 0.007114410400390625, 0.008203983306884766, 0.009293556213378906, 0.010383129119873047, 0.011472702026367188, 0.012562274932861328, 0.013651847839355469, 0.01474142074584961, 0.01583099365234375, 0.01692056655883789, 0.01801013946533203, 0.019099712371826172, 0.020189285278320312, 0.021278858184814453, 0.022368431091308594, 0.023458003997802734, 0.024547576904296875, 0.025637149810791016, 0.026726722717285156, 0.027816295623779297, 0.028905868530273438, 0.029995441436767578, 0.03108501434326172, 0.03217458724975586, 0.03326416015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 9.0, 8.0, 6.0, 18.0, 14.0, 33.0, 54.0, 69.0, 95.0, 93.0, 138.0, 111.0, 99.0, 71.0, 58.0, 36.0, 26.0, 13.0, 13.0, 12.0, 12.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01428985595703125, -0.01380765438079834, -0.01332545280456543, -0.01284325122833252, -0.01236104965209961, -0.0118788480758667, -0.011396646499633789, -0.010914444923400879, -0.010432243347167969, -0.009950041770935059, -0.009467840194702148, -0.008985638618469238, -0.008503437042236328, -0.008021235466003418, -0.007539033889770508, -0.007056832313537598, -0.0065746307373046875, -0.006092429161071777, -0.005610227584838867, -0.005128026008605957, -0.004645824432373047, -0.004163622856140137, -0.0036814212799072266, -0.0031992197036743164, -0.0027170181274414062, -0.002234816551208496, -0.001752614974975586, -0.0012704133987426758, -0.0007882118225097656, -0.00030601024627685547, 0.0001761913299560547, 0.0006583929061889648, 0.001140594482421875, 0.0016227960586547852, 0.0021049976348876953, 0.0025871992111206055, 0.0030694007873535156, 0.0035516023635864258, 0.004033803939819336, 0.004516005516052246, 0.004998207092285156, 0.005480408668518066, 0.0059626102447509766, 0.006444811820983887, 0.006927013397216797, 0.007409214973449707, 0.007891416549682617, 0.008373618125915527, 0.008855819702148438, 0.009338021278381348, 0.009820222854614258, 0.010302424430847168, 0.010784626007080078, 0.011266827583312988, 0.011749029159545898, 0.012231230735778809, 0.012713432312011719, 0.013195633888244629, 0.013677835464477539, 0.01416003704071045, 0.01464223861694336, 0.01512444019317627, 0.01560664176940918, 0.01608884334564209, 0.016571044921875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 8.0, 17.0, 18.0, 23.0, 18.0, 23.0, 36.0, 43.0, 44.0, 61.0, 70.0, 67.0, 49.0, 61.0, 62.0, 58.0, 70.0, 43.0, 45.0, 26.0, 28.0, 20.0, 16.0, 19.0, 21.0, 13.0, 8.0, 11.0, 8.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23547668755054474, -0.22861741483211517, -0.2217581421136856, -0.21489888429641724, -0.20803961157798767, -0.2011803388595581, -0.19432106614112854, -0.18746179342269897, -0.1806025207042694, -0.17374324798583984, -0.16688397526741028, -0.1600247025489807, -0.15316544473171234, -0.14630617201328278, -0.1394468992948532, -0.13258762657642365, -0.12572836875915527, -0.11886909604072571, -0.11200983077287674, -0.10515055805444717, -0.0982912927865982, -0.09143202006816864, -0.08457274734973907, -0.07771347463130951, -0.07085420936346054, -0.06399493664503098, -0.05713567137718201, -0.05027639865875244, -0.043417129665613174, -0.03655786067247391, -0.029698587954044342, -0.022839318960905075, -0.015980035066604614, -0.009120765142142773, -0.002261495217680931, 0.004597775638103485, 0.011457044631242752, 0.01831631362438202, 0.025175586342811584, 0.03203485533595085, 0.03889412432909012, 0.045753393322229385, 0.05261266231536865, 0.05947193503379822, 0.06633120775222778, 0.07319047302007675, 0.08004974573850632, 0.08690901100635529, 0.09376828372478485, 0.10062755644321442, 0.10748682171106339, 0.11434609442949295, 0.12120535969734192, 0.12806463241577148, 0.13492390513420105, 0.14178317785263062, 0.14864245057106018, 0.15550172328948975, 0.1623609960079193, 0.16922026872634888, 0.17607952654361725, 0.18293879926204681, 0.18979807198047638, 0.19665734469890594, 0.20351660251617432]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 8.0, 2.0, 9.0, 9.0, 9.0, 10.0, 7.0, 7.0, 10.0, 10.0, 20.0, 19.0, 17.0, 22.0, 31.0, 27.0, 30.0, 33.0, 29.0, 35.0, 36.0, 40.0, 43.0, 35.0, 38.0, 33.0, 30.0, 26.0, 37.0, 30.0, 42.0, 30.0, 18.0, 23.0, 33.0, 16.0, 29.0, 24.0, 21.0, 12.0, 15.0, 8.0, 8.0, 8.0, 2.0, 2.0, 2.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.15810687839984894, -0.15346482396125793, -0.14882275462150574, -0.14418070018291473, -0.13953863084316254, -0.13489657640457153, -0.13025450706481934, -0.12561245262622833, -0.12097039818763733, -0.11632833629846573, -0.11168627440929413, -0.10704421997070312, -0.10240215808153152, -0.09776009619235992, -0.09311803430318832, -0.08847597241401672, -0.08383391052484512, -0.07919184863567352, -0.07454978674650192, -0.06990772485733032, -0.06526567041873932, -0.06062360852956772, -0.05598154664039612, -0.051339488476514816, -0.046697426587343216, -0.042055364698171616, -0.037413306534290314, -0.03277124464511871, -0.028129184618592262, -0.02348712459206581, -0.01884506270289421, -0.014203004539012909, -0.009560942649841309, -0.00491888215765357, -0.00027682166546583176, 0.004365239292383194, 0.009007299318909645, 0.013649359345436096, 0.018291421234607697, 0.022933479398489, 0.0275755412876606, 0.0322176031768322, 0.0368596613407135, 0.0415017232298851, 0.0461437851190567, 0.050785843282938004, 0.055427905172109604, 0.060069963335990906, 0.0647120252251625, 0.0693540871143341, 0.0739961490035057, 0.07863821089267731, 0.08328026533126831, 0.08792232722043991, 0.09256438910961151, 0.09720644354820251, 0.10184851288795471, 0.10649057477712631, 0.11113263666629791, 0.11577469110488892, 0.12041675299406052, 0.12505881488323212, 0.12970086932182312, 0.13434293866157532, 0.13898499310016632]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 11.0, 6.0, 8.0, 15.0, 24.0, 45.0, 39.0, 44.0, 87.0, 157.0, 244.0, 416.0, 764.0, 1369.0, 2934.0, 6321.0, 14511.0, 34374.0, 82336.0, 186127.0, 300789.0, 229708.0, 107689.0, 45503.0, 19071.0, 8335.0, 3694.0, 1700.0, 933.0, 485.0, 282.0, 180.0, 107.0, 88.0, 53.0, 31.0, 20.0, 15.0, 12.0, 13.0, 1.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2607421875, -0.2516441345214844, -0.24254608154296875, -0.23344802856445312, -0.2243499755859375, -0.21525192260742188, -0.20615386962890625, -0.19705581665039062, -0.187957763671875, -0.17885971069335938, -0.16976165771484375, -0.16066360473632812, -0.1515655517578125, -0.14246749877929688, -0.13336944580078125, -0.12427139282226562, -0.11517333984375, -0.10607528686523438, -0.09697723388671875, -0.08787918090820312, -0.0787811279296875, -0.06968307495117188, -0.06058502197265625, -0.051486968994140625, -0.042388916015625, -0.033290863037109375, -0.02419281005859375, -0.015094757080078125, -0.0059967041015625, 0.003101348876953125, 0.01219940185546875, 0.021297454833984375, 0.0303955078125, 0.039493560791015625, 0.04859161376953125, 0.057689666748046875, 0.0667877197265625, 0.07588577270507812, 0.08498382568359375, 0.09408187866210938, 0.103179931640625, 0.11227798461914062, 0.12137603759765625, 0.13047409057617188, 0.1395721435546875, 0.14867019653320312, 0.15776824951171875, 0.16686630249023438, 0.17596435546875, 0.18506240844726562, 0.19416046142578125, 0.20325851440429688, 0.2123565673828125, 0.22145462036132812, 0.23055267333984375, 0.23965072631835938, 0.248748779296875, 0.2578468322753906, 0.26694488525390625, 0.2760429382324219, 0.2851409912109375, 0.2942390441894531, 0.30333709716796875, 0.3124351501464844, 0.321533203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 11.0, 8.0, 10.0, 8.0, 4.0, 14.0, 16.0, 18.0, 27.0, 22.0, 24.0, 38.0, 44.0, 51.0, 35.0, 43.0, 47.0, 44.0, 52.0, 40.0, 58.0, 49.0, 46.0, 32.0, 27.0, 35.0, 37.0, 36.0, 25.0, 23.0, 17.0, 14.0, 13.0, 7.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28662109375, -0.27622222900390625, -0.2658233642578125, -0.25542449951171875, -0.245025634765625, -0.23462677001953125, -0.2242279052734375, -0.21382904052734375, -0.20343017578125, -0.19303131103515625, -0.1826324462890625, -0.17223358154296875, -0.161834716796875, -0.15143585205078125, -0.1410369873046875, -0.13063812255859375, -0.1202392578125, -0.10984039306640625, -0.0994415283203125, -0.08904266357421875, -0.078643798828125, -0.06824493408203125, -0.0578460693359375, -0.04744720458984375, -0.03704833984375, -0.02664947509765625, -0.0162506103515625, -0.00585174560546875, 0.004547119140625, 0.01494598388671875, 0.0253448486328125, 0.03574371337890625, 0.046142578125, 0.05654144287109375, 0.0669403076171875, 0.07733917236328125, 0.087738037109375, 0.09813690185546875, 0.1085357666015625, 0.11893463134765625, 0.12933349609375, 0.13973236083984375, 0.1501312255859375, 0.16053009033203125, 0.170928955078125, 0.18132781982421875, 0.1917266845703125, 0.20212554931640625, 0.2125244140625, 0.22292327880859375, 0.2333221435546875, 0.24372100830078125, 0.254119873046875, 0.26451873779296875, 0.2749176025390625, 0.28531646728515625, 0.29571533203125, 0.30611419677734375, 0.3165130615234375, 0.32691192626953125, 0.337310791015625, 0.34770965576171875, 0.3581085205078125, 0.36850738525390625, 0.37890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 15.0, 20.0, 16.0, 18.0, 26.0, 40.0, 50.0, 65.0, 90.0, 141.0, 163.0, 309.0, 451.0, 846.0, 1739.0, 4143.0, 10876.0, 30521.0, 88275.0, 238448.0, 366400.0, 195321.0, 70351.0, 24455.0, 8915.0, 3411.0, 1425.0, 758.0, 420.0, 250.0, 143.0, 111.0, 90.0, 67.0, 45.0, 34.0, 24.0, 23.0, 19.0, 13.0, 7.0, 7.0, 2.0, 5.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.429931640625, -0.4181175231933594, -0.40630340576171875, -0.3944892883300781, -0.3826751708984375, -0.3708610534667969, -0.35904693603515625, -0.3472328186035156, -0.335418701171875, -0.3236045837402344, -0.31179046630859375, -0.2999763488769531, -0.2881622314453125, -0.2763481140136719, -0.26453399658203125, -0.2527198791503906, -0.24090576171875, -0.22909164428710938, -0.21727752685546875, -0.20546340942382812, -0.1936492919921875, -0.18183517456054688, -0.17002105712890625, -0.15820693969726562, -0.146392822265625, -0.13457870483398438, -0.12276458740234375, -0.11095046997070312, -0.0991363525390625, -0.08732223510742188, -0.07550811767578125, -0.06369400024414062, -0.0518798828125, -0.040065765380859375, -0.02825164794921875, -0.016437530517578125, -0.0046234130859375, 0.007190704345703125, 0.01900482177734375, 0.030818939208984375, 0.042633056640625, 0.054447174072265625, 0.06626129150390625, 0.07807540893554688, 0.0898895263671875, 0.10170364379882812, 0.11351776123046875, 0.12533187866210938, 0.13714599609375, 0.14896011352539062, 0.16077423095703125, 0.17258834838867188, 0.1844024658203125, 0.19621658325195312, 0.20803070068359375, 0.21984481811523438, 0.231658935546875, 0.24347305297851562, 0.25528717041015625, 0.2671012878417969, 0.2789154052734375, 0.2907295227050781, 0.30254364013671875, 0.3143577575683594, 0.326171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 9.0, 5.0, 6.0, 8.0, 16.0, 14.0, 15.0, 19.0, 20.0, 31.0, 24.0, 37.0, 39.0, 36.0, 40.0, 45.0, 63.0, 63.0, 47.0, 64.0, 42.0, 52.0, 44.0, 25.0, 35.0, 32.0, 29.0, 28.0, 20.0, 19.0, 14.0, 4.0, 11.0, 6.0, 11.0, 6.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.40625, -0.3944587707519531, -0.38266754150390625, -0.3708763122558594, -0.3590850830078125, -0.3472938537597656, -0.33550262451171875, -0.3237113952636719, -0.311920166015625, -0.3001289367675781, -0.28833770751953125, -0.2765464782714844, -0.2647552490234375, -0.2529640197753906, -0.24117279052734375, -0.22938156127929688, -0.21759033203125, -0.20579910278320312, -0.19400787353515625, -0.18221664428710938, -0.1704254150390625, -0.15863418579101562, -0.14684295654296875, -0.13505172729492188, -0.123260498046875, -0.11146926879882812, -0.09967803955078125, -0.08788681030273438, -0.0760955810546875, -0.06430435180664062, -0.05251312255859375, -0.040721893310546875, -0.0289306640625, -0.017139434814453125, -0.00534820556640625, 0.006443023681640625, 0.0182342529296875, 0.030025482177734375, 0.04181671142578125, 0.053607940673828125, 0.065399169921875, 0.07719039916992188, 0.08898162841796875, 0.10077285766601562, 0.1125640869140625, 0.12435531616210938, 0.13614654541015625, 0.14793777465820312, 0.15972900390625, 0.17152023315429688, 0.18331146240234375, 0.19510269165039062, 0.2068939208984375, 0.21868515014648438, 0.23047637939453125, 0.24226760864257812, 0.254058837890625, 0.2658500671386719, 0.27764129638671875, 0.2894325256347656, 0.3012237548828125, 0.3130149841308594, 0.32480621337890625, 0.3365974426269531, 0.348388671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 12.0, 8.0, 17.0, 22.0, 40.0, 51.0, 93.0, 141.0, 255.0, 507.0, 975.0, 1999.0, 4392.0, 10123.0, 24216.0, 59692.0, 144641.0, 348966.0, 254012.0, 116330.0, 47639.0, 19250.0, 8111.0, 3571.0, 1680.0, 822.0, 430.0, 231.0, 135.0, 78.0, 42.0, 20.0, 16.0, 14.0, 7.0, 10.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06207275390625, -0.06012535095214844, -0.058177947998046875, -0.05623054504394531, -0.05428314208984375, -0.05233573913574219, -0.050388336181640625, -0.04844093322753906, -0.0464935302734375, -0.04454612731933594, -0.042598724365234375, -0.04065132141113281, -0.03870391845703125, -0.03675651550292969, -0.034809112548828125, -0.03286170959472656, -0.030914306640625, -0.028966903686523438, -0.027019500732421875, -0.025072097778320312, -0.02312469482421875, -0.021177291870117188, -0.019229888916015625, -0.017282485961914062, -0.0153350830078125, -0.013387680053710938, -0.011440277099609375, -0.009492874145507812, -0.00754547119140625, -0.0055980682373046875, -0.003650665283203125, -0.0017032623291015625, 0.000244140625, 0.0021915435791015625, 0.004138946533203125, 0.0060863494873046875, 0.00803375244140625, 0.009981155395507812, 0.011928558349609375, 0.013875961303710938, 0.0158233642578125, 0.017770767211914062, 0.019718170166015625, 0.021665573120117188, 0.02361297607421875, 0.025560379028320312, 0.027507781982421875, 0.029455184936523438, 0.031402587890625, 0.03334999084472656, 0.035297393798828125, 0.03724479675292969, 0.03919219970703125, 0.04113960266113281, 0.043087005615234375, 0.04503440856933594, 0.0469818115234375, 0.04892921447753906, 0.050876617431640625, 0.05282402038574219, 0.05477142333984375, 0.05671882629394531, 0.058666229248046875, 0.06061363220214844, 0.06256103515625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 2.0, 3.0, 11.0, 14.0, 13.0, 15.0, 18.0, 24.0, 18.0, 25.0, 24.0, 40.0, 43.0, 45.0, 51.0, 51.0, 83.0, 84.0, 62.0, 52.0, 64.0, 30.0, 34.0, 28.0, 22.0, 28.0, 19.0, 16.0, 15.0, 17.0, 4.0, 10.0, 2.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.808208465576172e-06, -7.482245564460754e-06, -7.156282663345337e-06, -6.8303197622299194e-06, -6.504356861114502e-06, -6.1783939599990845e-06, -5.852431058883667e-06, -5.5264681577682495e-06, -5.200505256652832e-06, -4.8745423555374146e-06, -4.548579454421997e-06, -4.22261655330658e-06, -3.896653652191162e-06, -3.5706907510757446e-06, -3.244727849960327e-06, -2.9187649488449097e-06, -2.592802047729492e-06, -2.2668391466140747e-06, -1.9408762454986572e-06, -1.6149133443832397e-06, -1.2889504432678223e-06, -9.629875421524048e-07, -6.370246410369873e-07, -3.110617399215698e-07, 1.4901161193847656e-08, 3.4086406230926514e-07, 6.668269634246826e-07, 9.927898645401e-07, 1.3187527656555176e-06, 1.644715666770935e-06, 1.9706785678863525e-06, 2.29664146900177e-06, 2.6226043701171875e-06, 2.948567271232605e-06, 3.2745301723480225e-06, 3.60049307346344e-06, 3.926455974578857e-06, 4.252418875694275e-06, 4.578381776809692e-06, 4.90434467792511e-06, 5.230307579040527e-06, 5.556270480155945e-06, 5.882233381271362e-06, 6.20819628238678e-06, 6.534159183502197e-06, 6.860122084617615e-06, 7.186084985733032e-06, 7.51204788684845e-06, 7.838010787963867e-06, 8.163973689079285e-06, 8.489936590194702e-06, 8.81589949131012e-06, 9.141862392425537e-06, 9.467825293540955e-06, 9.793788194656372e-06, 1.011975109577179e-05, 1.0445713996887207e-05, 1.0771676898002625e-05, 1.1097639799118042e-05, 1.142360270023346e-05, 1.1749565601348877e-05, 1.2075528502464294e-05, 1.2401491403579712e-05, 1.272745430469513e-05, 1.3053417205810547e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 9.0, 13.0, 19.0, 30.0, 36.0, 61.0, 92.0, 149.0, 209.0, 329.0, 501.0, 788.0, 1370.0, 2575.0, 5066.0, 11787.0, 33178.0, 101673.0, 277720.0, 398611.0, 139584.0, 45362.0, 15815.0, 6401.0, 3037.0, 1579.0, 965.0, 538.0, 367.0, 243.0, 154.0, 104.0, 71.0, 44.0, 27.0, 15.0, 16.0, 7.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08099365234375, -0.07839298248291016, -0.07579231262207031, -0.07319164276123047, -0.07059097290039062, -0.06799030303955078, -0.06538963317871094, -0.0627889633178711, -0.06018829345703125, -0.057587623596191406, -0.05498695373535156, -0.05238628387451172, -0.049785614013671875, -0.04718494415283203, -0.04458427429199219, -0.041983604431152344, -0.0393829345703125, -0.036782264709472656, -0.03418159484863281, -0.03158092498779297, -0.028980255126953125, -0.02637958526611328, -0.023778915405273438, -0.021178245544433594, -0.01857757568359375, -0.015976905822753906, -0.013376235961914062, -0.010775566101074219, -0.008174896240234375, -0.005574226379394531, -0.0029735565185546875, -0.00037288665771484375, 0.002227783203125, 0.004828453063964844, 0.0074291229248046875, 0.010029792785644531, 0.012630462646484375, 0.015231132507324219, 0.017831802368164062, 0.020432472229003906, 0.02303314208984375, 0.025633811950683594, 0.028234481811523438, 0.03083515167236328, 0.033435821533203125, 0.03603649139404297, 0.03863716125488281, 0.041237831115722656, 0.0438385009765625, 0.046439170837402344, 0.04903984069824219, 0.05164051055908203, 0.054241180419921875, 0.05684185028076172, 0.05944252014160156, 0.062043190002441406, 0.06464385986328125, 0.0672445297241211, 0.06984519958496094, 0.07244586944580078, 0.07504653930664062, 0.07764720916748047, 0.08024787902832031, 0.08284854888916016, 0.08544921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 4.0, 8.0, 7.0, 17.0, 22.0, 50.0, 64.0, 120.0, 136.0, 234.0, 102.0, 78.0, 49.0, 34.0, 19.0, 12.0, 14.0, 4.0, 5.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10595703125, -0.10302448272705078, -0.10009193420410156, -0.09715938568115234, -0.09422683715820312, -0.0912942886352539, -0.08836174011230469, -0.08542919158935547, -0.08249664306640625, -0.07956409454345703, -0.07663154602050781, -0.0736989974975586, -0.07076644897460938, -0.06783390045166016, -0.06490135192871094, -0.06196880340576172, -0.0590362548828125, -0.05610370635986328, -0.05317115783691406, -0.050238609313964844, -0.047306060791015625, -0.044373512268066406, -0.04144096374511719, -0.03850841522216797, -0.03557586669921875, -0.03264331817626953, -0.029710769653320312, -0.026778221130371094, -0.023845672607421875, -0.020913124084472656, -0.017980575561523438, -0.015048027038574219, -0.012115478515625, -0.009182929992675781, -0.0062503814697265625, -0.0033178329467773438, -0.000385284423828125, 0.0025472640991210938, 0.0054798126220703125, 0.008412361145019531, 0.01134490966796875, 0.014277458190917969, 0.017210006713867188, 0.020142555236816406, 0.023075103759765625, 0.026007652282714844, 0.028940200805664062, 0.03187274932861328, 0.0348052978515625, 0.03773784637451172, 0.04067039489746094, 0.043602943420410156, 0.046535491943359375, 0.049468040466308594, 0.05240058898925781, 0.05533313751220703, 0.05826568603515625, 0.06119823455810547, 0.06413078308105469, 0.0670633316040039, 0.06999588012695312, 0.07292842864990234, 0.07586097717285156, 0.07879352569580078, 0.08172607421875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 10.0, 12.0, 21.0, 29.0, 42.0, 46.0, 64.0, 75.0, 85.0, 107.0, 115.0, 83.0, 66.0, 64.0, 45.0, 41.0, 31.0, 26.0, 9.0, 9.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8088246583938599, -0.7880679368972778, -0.7673112154006958, -0.7465544939041138, -0.7257977724075317, -0.7050409913063049, -0.6842842698097229, -0.6635275483131409, -0.6427708268165588, -0.6220141053199768, -0.6012573838233948, -0.5805006623268127, -0.5597438812255859, -0.5389871597290039, -0.5182304382324219, -0.49747371673583984, -0.4767169952392578, -0.4559602737426758, -0.43520355224609375, -0.41444680094718933, -0.3936900794506073, -0.37293335795402527, -0.35217660665512085, -0.3314198851585388, -0.3106631636619568, -0.28990644216537476, -0.2691497206687927, -0.2483929693698883, -0.22763624787330627, -0.20687952637672424, -0.18612278997898102, -0.1653660535812378, -0.14460933208465576, -0.12385260313749313, -0.1030958741903305, -0.08233914524316788, -0.06158241629600525, -0.04082568734884262, -0.020068958401679993, 0.0006877779960632324, 0.021444499492645264, 0.04220122843980789, 0.06295795738697052, 0.08371468633413315, 0.10447141528129578, 0.1252281367778778, 0.14598487317562103, 0.16674160957336426, 0.1874983310699463, 0.20825505256652832, 0.22901178896427155, 0.24976852536201477, 0.2705252468585968, 0.29128196835517883, 0.31203871965408325, 0.3327954411506653, 0.3535521626472473, 0.37430888414382935, 0.3950656056404114, 0.4158223569393158, 0.4365790784358978, 0.45733579993247986, 0.4780925512313843, 0.4988492727279663, 0.5196059942245483]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 0.0, 6.0, 5.0, 7.0, 11.0, 12.0, 8.0, 10.0, 10.0, 10.0, 21.0, 17.0, 22.0, 25.0, 30.0, 25.0, 24.0, 33.0, 32.0, 36.0, 46.0, 47.0, 36.0, 33.0, 40.0, 36.0, 40.0, 36.0, 44.0, 41.0, 26.0, 28.0, 31.0, 24.0, 15.0, 17.0, 20.0, 20.0, 15.0, 9.0, 13.0, 9.0, 5.0, 7.0, 6.0, 2.0, 1.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5575844049453735, -0.5409726500511169, -0.5243608951568604, -0.5077491402626038, -0.49113738536834717, -0.4745256304740906, -0.45791390538215637, -0.4413021504878998, -0.4246903955936432, -0.4080786406993866, -0.39146688580513, -0.3748551309108734, -0.3582434058189392, -0.3416316509246826, -0.325019896030426, -0.30840814113616943, -0.29179638624191284, -0.27518463134765625, -0.25857287645339966, -0.24196113646030426, -0.22534938156604767, -0.20873762667179108, -0.19212588667869568, -0.1755141317844391, -0.1589023768901825, -0.1422906219959259, -0.1256788671016693, -0.10906712710857391, -0.09245537221431732, -0.07584361732006073, -0.059231869876384735, -0.04262012243270874, -0.02600836753845215, -0.009396616369485855, 0.007215134799480438, 0.02382688596844673, 0.040438637137413025, 0.05705039203166962, 0.07366213947534561, 0.0902738869190216, 0.1068856418132782, 0.12349739670753479, 0.14010915160179138, 0.15672089159488678, 0.17333264648914337, 0.18994440138339996, 0.20655614137649536, 0.22316789627075195, 0.23977965116500854, 0.25639140605926514, 0.27300316095352173, 0.2896149158477783, 0.3062266707420349, 0.3228384256362915, 0.3394501507282257, 0.3560619056224823, 0.3726736605167389, 0.3892854154109955, 0.4058971703052521, 0.42250892519950867, 0.43912065029144287, 0.45573240518569946, 0.47234416007995605, 0.48895591497421265, 0.5055676698684692]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 10.0, 14.0, 15.0, 18.0, 31.0, 43.0, 44.0, 64.0, 122.0, 154.0, 225.0, 372.0, 496.0, 684.0, 1004.0, 1492.0, 2347.0, 3762.0, 6234.0, 1009596.0, 8782.0, 5288.0, 3295.0, 2125.0, 1369.0, 980.0, 635.0, 418.0, 294.0, 218.0, 153.0, 93.0, 76.0, 48.0, 28.0, 20.0, 14.0, 9.0, 12.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5183072090148926, -0.5015133023262024, -0.4847193956375122, -0.467925488948822, -0.45113155245780945, -0.43433764576911926, -0.4175437390804291, -0.4007498323917389, -0.3839558959007263, -0.36716198921203613, -0.35036808252334595, -0.33357417583465576, -0.3167802393436432, -0.299986332654953, -0.2831924259662628, -0.26639851927757263, -0.24960461258888245, -0.23281070590019226, -0.21601678431034088, -0.1992228776216507, -0.18242895603179932, -0.16563504934310913, -0.14884114265441895, -0.13204723596572876, -0.11525331437587738, -0.0984594002366066, -0.08166548609733582, -0.06487157940864563, -0.04807766526937485, -0.031283751130104065, -0.01448984444141388, 0.002304069697856903, 0.019097983837127686, 0.03589189797639847, 0.05268580839037895, 0.06947971880435944, 0.08627363294363022, 0.103067547082901, 0.11986145377159119, 0.13665536046028137, 0.15344928205013275, 0.17024318873882294, 0.18703711032867432, 0.2038310170173645, 0.2206249237060547, 0.23741884529590607, 0.25421273708343506, 0.27100667357444763, 0.2878005802631378, 0.304594486951828, 0.3213883936405182, 0.33818233013153076, 0.35497623682022095, 0.37177014350891113, 0.3885640501976013, 0.4053579568862915, 0.4221518635749817, 0.4389457702636719, 0.45573967695236206, 0.47253358364105225, 0.4893275201320648, 0.5061213970184326, 0.5229153633117676, 0.5397092700004578, 0.556503176689148]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 6.0, 10.0, 21.0, 39.0, 54.0, 81.0, 202.0, 346.0, 632.0, 1153.0, 2073.0, 4051.0, 10658.0, 51404888.0, 33277.0, 6109.0, 3075.0, 1605.0, 892.0, 490.0, 281.0, 167.0, 86.0, 44.0, 31.0, 18.0, 14.0, 9.0, 5.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65234375, -5.455806255340576, -5.259268760681152, -5.06273078918457, -4.8661932945251465, -4.669655799865723, -4.473118305206299, -4.276580810546875, -4.080043315887451, -3.8835058212280273, -3.6869680881500244, -3.4904305934906006, -3.2938930988311768, -3.097355365753174, -2.90081787109375, -2.704280376434326, -2.5077426433563232, -2.3112051486968994, -2.1146674156188965, -1.9181299209594727, -1.7215924263000488, -1.5250548124313354, -1.328517198562622, -1.1319797039031982, -0.9354420900344849, -0.7389045357704163, -0.5423669815063477, -0.3458293676376343, -0.14929181337356567, 0.04724574089050293, 0.2437833547592163, 0.44032084941864014, 0.6368584632873535, 0.8333960175514221, 1.0299335718154907, 1.226471185684204, 1.423008680343628, 1.6195462942123413, 1.8160839080810547, 2.0126214027404785, 2.2091588973999023, 2.405696392059326, 2.602234125137329, 2.798771619796753, 2.9953091144561768, 3.1918468475341797, 3.3883843421936035, 3.5849218368530273, 3.7814595699310303, 3.977997064590454, 4.174534797668457, 4.371072292327881, 4.567609786987305, 4.7641472816467285, 4.960684776306152, 5.157222747802734, 5.353760242462158, 5.550297737121582, 5.746835231781006, 5.94337272644043, 6.139910697937012, 6.3364481925964355, 6.532985687255859, 6.729523181915283, 6.926060676574707]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 11.0, 12.0, 16.0, 34.0, 60.0, 88.0, 157.0, 257.0, 360.0, 673.0, 994.0, 1613.0, 2744.0, 4405.0, 7380.0, 12715.0, 21183.0, 36544.0, 61043.0, 101888.0, 160428.0, 236500.0, 324469.0, 531979.0, 3229397.0, 565899.0, 329037.0, 240176.0, 163671.0, 103322.0, 63526.0, 37204.0, 21588.0, 13079.0, 7506.0, 4574.0, 2702.0, 1595.0, 1049.0, 617.0, 379.0, 207.0, 126.0, 89.0, 52.0, 39.0, 17.0, 15.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.54833984375, -0.53094482421875, -0.5135498046875, -0.49615478515625, -0.478759765625, -0.46136474609375, -0.4439697265625, -0.42657470703125, -0.4091796875, -0.39178466796875, -0.3743896484375, -0.35699462890625, -0.339599609375, -0.32220458984375, -0.3048095703125, -0.28741455078125, -0.27001953125, -0.25262451171875, -0.2352294921875, -0.21783447265625, -0.200439453125, -0.18304443359375, -0.1656494140625, -0.14825439453125, -0.130859375, -0.11346435546875, -0.0960693359375, -0.07867431640625, -0.061279296875, -0.04388427734375, -0.0264892578125, -0.00909423828125, 0.00830078125, 0.02569580078125, 0.0430908203125, 0.06048583984375, 0.077880859375, 0.09527587890625, 0.1126708984375, 0.13006591796875, 0.1474609375, 0.16485595703125, 0.1822509765625, 0.19964599609375, 0.217041015625, 0.23443603515625, 0.2518310546875, 0.26922607421875, 0.28662109375, 0.30401611328125, 0.3214111328125, 0.33880615234375, 0.356201171875, 0.37359619140625, 0.3909912109375, 0.40838623046875, 0.42578125, 0.44317626953125, 0.4605712890625, 0.47796630859375, 0.495361328125, 0.51275634765625, 0.5301513671875, 0.54754638671875, 0.56494140625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 6.0, 1.0, 8.0, 7.0, 12.0, 12.0, 16.0, 16.0, 17.0, 33.0, 27.0, 33.0, 39.0, 59.0, 44.0, 50.0, 45.0, 117.0, 798.0, 253.0, 63.0, 51.0, 54.0, 45.0, 29.0, 40.0, 23.0, 22.0, 23.0, 19.0, 25.0, 6.0, 7.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44140625, -4.28680419921875, -4.1322021484375, -3.97760009765625, -3.822998046875, -3.66839599609375, -3.5137939453125, -3.35919189453125, -3.20458984375, -3.04998779296875, -2.8953857421875, -2.74078369140625, -2.586181640625, -2.43157958984375, -2.2769775390625, -2.12237548828125, -1.9677734375, -1.81317138671875, -1.6585693359375, -1.50396728515625, -1.349365234375, -1.19476318359375, -1.0401611328125, -0.88555908203125, -0.73095703125, -0.57635498046875, -0.4217529296875, -0.26715087890625, -0.112548828125, 0.04205322265625, 0.1966552734375, 0.35125732421875, 0.505859375, 0.66046142578125, 0.8150634765625, 0.96966552734375, 1.124267578125, 1.27886962890625, 1.4334716796875, 1.58807373046875, 1.74267578125, 1.89727783203125, 2.0518798828125, 2.20648193359375, 2.361083984375, 2.51568603515625, 2.6702880859375, 2.82489013671875, 2.9794921875, 3.13409423828125, 3.2886962890625, 3.44329833984375, 3.597900390625, 3.75250244140625, 3.9071044921875, 4.06170654296875, 4.21630859375, 4.37091064453125, 4.5255126953125, 4.68011474609375, 4.834716796875, 4.98931884765625, 5.1439208984375, 5.29852294921875, 5.453125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 7.0, 18.0, 26.0, 31.0, 78.0, 143.0, 283.0, 481.0, 857.0, 1616.0, 2745.0, 4801.0, 8220.0, 13815.0, 22881.0, 36162.0, 55233.0, 83053.0, 118733.0, 161470.0, 210079.0, 256878.0, 306615.0, 2030191.0, 1724125.0, 299246.0, 251881.0, 205778.0, 158386.0, 115020.0, 80411.0, 53732.0, 34704.0, 21659.0, 13314.0, 7965.0, 4743.0, 2716.0, 1426.0, 842.0, 436.0, 272.0, 168.0, 99.0, 46.0, 27.0, 18.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.302001953125, -0.2912025451660156, -0.28040313720703125, -0.2696037292480469, -0.2588043212890625, -0.24800491333007812, -0.23720550537109375, -0.22640609741210938, -0.215606689453125, -0.20480728149414062, -0.19400787353515625, -0.18320846557617188, -0.1724090576171875, -0.16160964965820312, -0.15081024169921875, -0.14001083374023438, -0.12921142578125, -0.11841201782226562, -0.10761260986328125, -0.09681320190429688, -0.0860137939453125, -0.07521438598632812, -0.06441497802734375, -0.053615570068359375, -0.042816162109375, -0.032016754150390625, -0.02121734619140625, -0.010417938232421875, 0.0003814697265625, 0.011180877685546875, 0.02198028564453125, 0.032779693603515625, 0.0435791015625, 0.054378509521484375, 0.06517791748046875, 0.07597732543945312, 0.0867767333984375, 0.09757614135742188, 0.10837554931640625, 0.11917495727539062, 0.129974365234375, 0.14077377319335938, 0.15157318115234375, 0.16237258911132812, 0.1731719970703125, 0.18397140502929688, 0.19477081298828125, 0.20557022094726562, 0.21636962890625, 0.22716903686523438, 0.23796844482421875, 0.24876785278320312, 0.2595672607421875, 0.2703666687011719, 0.28116607666015625, 0.2919654846191406, 0.302764892578125, 0.3135643005371094, 0.32436370849609375, 0.3351631164550781, 0.3459625244140625, 0.3567619323730469, 0.36756134033203125, 0.3783607482910156, 0.38916015625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 3.0, 8.0, 1.0, 7.0, 10.0, 10.0, 8.0, 11.0, 14.0, 23.0, 15.0, 25.0, 23.0, 26.0, 33.0, 43.0, 36.0, 31.0, 42.0, 31.0, 39.0, 65.0, 499.0, 537.0, 54.0, 31.0, 33.0, 36.0, 29.0, 23.0, 27.0, 30.0, 26.0, 18.0, 25.0, 24.0, 19.0, 13.0, 19.0, 13.0, 16.0, 7.0, 8.0, 9.0, 7.0, 6.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.140625, -3.042633056640625, -2.94464111328125, -2.846649169921875, -2.7486572265625, -2.650665283203125, -2.55267333984375, -2.454681396484375, -2.356689453125, -2.258697509765625, -2.16070556640625, -2.062713623046875, -1.9647216796875, -1.866729736328125, -1.76873779296875, -1.670745849609375, -1.57275390625, -1.474761962890625, -1.37677001953125, -1.278778076171875, -1.1807861328125, -1.082794189453125, -0.98480224609375, -0.886810302734375, -0.788818359375, -0.690826416015625, -0.59283447265625, -0.494842529296875, -0.3968505859375, -0.298858642578125, -0.20086669921875, -0.102874755859375, -0.0048828125, 0.093109130859375, 0.19110107421875, 0.289093017578125, 0.3870849609375, 0.485076904296875, 0.58306884765625, 0.681060791015625, 0.779052734375, 0.877044677734375, 0.97503662109375, 1.073028564453125, 1.1710205078125, 1.269012451171875, 1.36700439453125, 1.464996337890625, 1.56298828125, 1.660980224609375, 1.75897216796875, 1.856964111328125, 1.9549560546875, 2.052947998046875, 2.15093994140625, 2.248931884765625, 2.346923828125, 2.444915771484375, 2.54290771484375, 2.640899658203125, 2.7388916015625, 2.836883544921875, 2.93487548828125, 3.032867431640625, 3.130859375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 5.0, 12.0, 17.0, 19.0, 29.0, 36.0, 61.0, 66.0, 99.0, 135.0, 211.0, 264.0, 363.0, 573.0, 798.0, 1238.0, 2014.0, 3645.0, 7434.0, 17970.0, 46947.0, 112513.0, 4123134.0, 1780856.0, 112205.0, 46100.0, 17823.0, 7366.0, 3538.0, 1976.0, 1278.0, 779.0, 542.0, 362.0, 271.0, 220.0, 159.0, 101.0, 80.0, 58.0, 37.0, 35.0, 18.0, 12.0, 14.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5537109375, -1.5001220703125, -1.446533203125, -1.3929443359375, -1.33935546875, -1.2857666015625, -1.232177734375, -1.1785888671875, -1.125, -1.0714111328125, -1.017822265625, -0.9642333984375, -0.91064453125, -0.8570556640625, -0.803466796875, -0.7498779296875, -0.6962890625, -0.6427001953125, -0.589111328125, -0.5355224609375, -0.48193359375, -0.4283447265625, -0.374755859375, -0.3211669921875, -0.267578125, -0.2139892578125, -0.160400390625, -0.1068115234375, -0.05322265625, 0.0003662109375, 0.053955078125, 0.1075439453125, 0.1611328125, 0.2147216796875, 0.268310546875, 0.3218994140625, 0.37548828125, 0.4290771484375, 0.482666015625, 0.5362548828125, 0.58984375, 0.6434326171875, 0.697021484375, 0.7506103515625, 0.80419921875, 0.8577880859375, 0.911376953125, 0.9649658203125, 1.0185546875, 1.0721435546875, 1.125732421875, 1.1793212890625, 1.23291015625, 1.2864990234375, 1.340087890625, 1.3936767578125, 1.447265625, 1.5008544921875, 1.554443359375, 1.6080322265625, 1.66162109375, 1.7152099609375, 1.768798828125, 1.8223876953125, 1.8759765625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 0.0, 2.0, 5.0, 7.0, 5.0, 10.0, 8.0, 6.0, 20.0, 20.0, 22.0, 24.0, 18.0, 31.0, 29.0, 32.0, 45.0, 45.0, 34.0, 49.0, 102.0, 841.0, 206.0, 54.0, 46.0, 28.0, 40.0, 42.0, 38.0, 22.0, 35.0, 23.0, 19.0, 25.0, 14.0, 10.0, 10.0, 16.0, 7.0, 8.0, 12.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.53125, -3.41607666015625, -3.3009033203125, -3.18572998046875, -3.070556640625, -2.95538330078125, -2.8402099609375, -2.72503662109375, -2.60986328125, -2.49468994140625, -2.3795166015625, -2.26434326171875, -2.149169921875, -2.03399658203125, -1.9188232421875, -1.80364990234375, -1.6884765625, -1.57330322265625, -1.4581298828125, -1.34295654296875, -1.227783203125, -1.11260986328125, -0.9974365234375, -0.88226318359375, -0.76708984375, -0.65191650390625, -0.5367431640625, -0.42156982421875, -0.306396484375, -0.19122314453125, -0.0760498046875, 0.03912353515625, 0.154296875, 0.26947021484375, 0.3846435546875, 0.49981689453125, 0.614990234375, 0.73016357421875, 0.8453369140625, 0.96051025390625, 1.07568359375, 1.19085693359375, 1.3060302734375, 1.42120361328125, 1.536376953125, 1.65155029296875, 1.7667236328125, 1.88189697265625, 1.9970703125, 2.11224365234375, 2.2274169921875, 2.34259033203125, 2.457763671875, 2.57293701171875, 2.6881103515625, 2.80328369140625, 2.91845703125, 3.03363037109375, 3.1488037109375, 3.26397705078125, 3.379150390625, 3.49432373046875, 3.6094970703125, 3.72467041015625, 3.83984375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 7.0, 8.0, 9.0, 24.0, 36.0, 59.0, 96.0, 140.0, 203.0, 152.0, 80.0, 70.0, 42.0, 25.0, 19.0, 9.0, 2.0, 6.0, 2.0, 3.0, 1.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.538033485412598, -11.14929485321045, -10.760555267333984, -10.371816635131836, -9.983078002929688, -9.594338417053223, -9.205599784851074, -8.81686019897461, -8.428121566772461, -8.039382934570312, -7.650643348693848, -7.261904716491699, -6.873165607452393, -6.484426498413086, -6.0956878662109375, -5.706948757171631, -5.318209648132324, -4.929470539093018, -4.540731430053711, -4.1519927978515625, -3.763253688812256, -3.374514579772949, -2.9857757091522217, -2.597036838531494, -2.2082977294921875, -1.8195587396621704, -1.4308197498321533, -1.0420807600021362, -0.6533417701721191, -0.26460278034210205, 0.12413620948791504, 0.5128750801086426, 0.9016132354736328, 1.29035222530365, 1.679091215133667, 2.0678300857543945, 2.456569194793701, 2.845308303833008, 3.2340471744537354, 3.622786045074463, 4.0115251541137695, 4.400264263153076, 4.789003372192383, 5.177742004394531, 5.566481113433838, 5.9552202224731445, 6.343958854675293, 6.7326979637146, 7.121437072753906, 7.510176181793213, 7.8989152908325195, 8.287653923034668, 8.676393508911133, 9.065132141113281, 9.45387077331543, 9.842609405517578, 10.231348991394043, 10.620087623596191, 11.008827209472656, 11.397565841674805, 11.786304473876953, 12.175044059753418, 12.563782691955566, 12.952522277832031, 13.34126091003418]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 5.0, 7.0, 9.0, 7.0, 17.0, 9.0, 15.0, 24.0, 31.0, 23.0, 47.0, 53.0, 67.0, 53.0, 92.0, 94.0, 75.0, 69.0, 60.0, 47.0, 34.0, 35.0, 26.0, 28.0, 15.0, 19.0, 10.0, 4.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.305809020996094, -15.819100379943848, -15.332390785217285, -14.845682144165039, -14.358972549438477, -13.87226390838623, -13.385554313659668, -12.898845672607422, -12.41213607788086, -11.925427436828613, -11.43871784210205, -10.952009201049805, -10.465299606323242, -9.978590965270996, -9.491881370544434, -9.005172729492188, -8.518463134765625, -8.031754493713379, -7.545044898986816, -7.058335781097412, -6.571626663208008, -6.084918022155762, -5.598208427429199, -5.111499786376953, -4.624791145324707, -4.138082027435303, -3.6513729095458984, -3.164663791656494, -2.67795467376709, -2.1912457942962646, -1.7045366764068604, -1.217827558517456, -0.7311182022094727, -0.24440911412239075, 0.24229997396469116, 0.7290090322494507, 1.215718150138855, 1.7024271488189697, 2.189136266708374, 2.6758453845977783, 3.1625545024871826, 3.649263620376587, 4.135972499847412, 4.622681617736816, 5.109390735626221, 5.596099853515625, 6.082808971405029, 6.569518089294434, 7.056227207183838, 7.542936325073242, 8.029644966125488, 8.51635456085205, 9.003063201904297, 9.48977279663086, 9.976481437683105, 10.463191032409668, 10.949899673461914, 11.43660831451416, 11.923317909240723, 12.410026550292969, 12.896736145019531, 13.383444786071777, 13.87015438079834, 14.356863021850586, 14.843572616577148]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 10.0, 9.0, 17.0, 27.0, 41.0, 66.0, 93.0, 137.0, 250.0, 440.0, 716.0, 1421.0, 2811.0, 6276.0, 16505.0, 58716.0, 3716206.0, 322403.0, 41411.0, 14089.0, 6034.0, 2864.0, 1519.0, 855.0, 500.0, 295.0, 193.0, 131.0, 73.0, 46.0, 44.0, 20.0, 19.0, 13.0, 9.0, 4.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1336669921875, -0.1294708251953125, -0.125274658203125, -0.1210784912109375, -0.11688232421875, -0.1126861572265625, -0.108489990234375, -0.1042938232421875, -0.10009765625, -0.0959014892578125, -0.091705322265625, -0.0875091552734375, -0.08331298828125, -0.0791168212890625, -0.074920654296875, -0.0707244873046875, -0.0665283203125, -0.0623321533203125, -0.058135986328125, -0.0539398193359375, -0.04974365234375, -0.0455474853515625, -0.041351318359375, -0.0371551513671875, -0.032958984375, -0.0287628173828125, -0.024566650390625, -0.0203704833984375, -0.01617431640625, -0.0119781494140625, -0.007781982421875, -0.0035858154296875, 0.0006103515625, 0.0048065185546875, 0.009002685546875, 0.0131988525390625, 0.01739501953125, 0.0215911865234375, 0.025787353515625, 0.0299835205078125, 0.0341796875, 0.0383758544921875, 0.042572021484375, 0.0467681884765625, 0.05096435546875, 0.0551605224609375, 0.059356689453125, 0.0635528564453125, 0.0677490234375, 0.0719451904296875, 0.076141357421875, 0.0803375244140625, 0.08453369140625, 0.0887298583984375, 0.092926025390625, 0.0971221923828125, 0.101318359375, 0.1055145263671875, 0.109710693359375, 0.1139068603515625, 0.11810302734375, 0.1222991943359375, 0.126495361328125, 0.1306915283203125, 0.1348876953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 9.0, 4.0, 2.0, 9.0, 4.0, 6.0, 8.0, 14.0, 11.0, 11.0, 24.0, 49.0, 259.0, 395.0, 55.0, 21.0, 15.0, 21.0, 9.0, 8.0, 10.0, 6.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 6.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033050537109375, -0.03179597854614258, -0.030541419982910156, -0.029286861419677734, -0.028032302856445312, -0.02677774429321289, -0.02552318572998047, -0.024268627166748047, -0.023014068603515625, -0.021759510040283203, -0.02050495147705078, -0.01925039291381836, -0.017995834350585938, -0.016741275787353516, -0.015486717224121094, -0.014232158660888672, -0.01297760009765625, -0.011723041534423828, -0.010468482971191406, -0.009213924407958984, -0.007959365844726562, -0.006704807281494141, -0.005450248718261719, -0.004195690155029297, -0.002941131591796875, -0.0016865730285644531, -0.00043201446533203125, 0.0008225440979003906, 0.0020771026611328125, 0.0033316612243652344, 0.004586219787597656, 0.005840778350830078, 0.0070953369140625, 0.008349895477294922, 0.009604454040527344, 0.010859012603759766, 0.012113571166992188, 0.01336812973022461, 0.014622688293457031, 0.015877246856689453, 0.017131805419921875, 0.018386363983154297, 0.01964092254638672, 0.02089548110961914, 0.022150039672851562, 0.023404598236083984, 0.024659156799316406, 0.025913715362548828, 0.02716827392578125, 0.028422832489013672, 0.029677391052246094, 0.030931949615478516, 0.03218650817871094, 0.03344106674194336, 0.03469562530517578, 0.0359501838684082, 0.037204742431640625, 0.03845930099487305, 0.03971385955810547, 0.04096841812133789, 0.04222297668457031, 0.043477535247802734, 0.044732093811035156, 0.04598665237426758, 0.0472412109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 6.0, 6.0, 6.0, 11.0, 16.0, 16.0, 16.0, 24.0, 35.0, 46.0, 67.0, 104.0, 159.0, 234.0, 385.0, 743.0, 1473.0, 3436.0, 8370.0, 22526.0, 67283.0, 247533.0, 1545534.0, 1902663.0, 279091.0, 73924.0, 24199.0, 8961.0, 3777.0, 1650.0, 792.0, 424.0, 212.0, 170.0, 93.0, 64.0, 48.0, 48.0, 32.0, 22.0, 16.0, 16.0, 13.0, 10.0, 9.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.08154296875, -0.07907485961914062, -0.07660675048828125, -0.07413864135742188, -0.0716705322265625, -0.06920242309570312, -0.06673431396484375, -0.06426620483398438, -0.061798095703125, -0.059329986572265625, -0.05686187744140625, -0.054393768310546875, -0.0519256591796875, -0.049457550048828125, -0.04698944091796875, -0.044521331787109375, -0.04205322265625, -0.039585113525390625, -0.03711700439453125, -0.034648895263671875, -0.0321807861328125, -0.029712677001953125, -0.02724456787109375, -0.024776458740234375, -0.022308349609375, -0.019840240478515625, -0.01737213134765625, -0.014904022216796875, -0.0124359130859375, -0.009967803955078125, -0.00749969482421875, -0.005031585693359375, -0.0025634765625, -9.5367431640625e-05, 0.00237274169921875, 0.004840850830078125, 0.0073089599609375, 0.009777069091796875, 0.01224517822265625, 0.014713287353515625, 0.017181396484375, 0.019649505615234375, 0.02211761474609375, 0.024585723876953125, 0.0270538330078125, 0.029521942138671875, 0.03199005126953125, 0.034458160400390625, 0.03692626953125, 0.039394378662109375, 0.04186248779296875, 0.044330596923828125, 0.0467987060546875, 0.049266815185546875, 0.05173492431640625, 0.054203033447265625, 0.056671142578125, 0.059139251708984375, 0.06160736083984375, 0.06407546997070312, 0.0665435791015625, 0.06901168823242188, 0.07147979736328125, 0.07394790649414062, 0.076416015625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 12.0, 5.0, 8.0, 21.0, 16.0, 22.0, 27.0, 33.0, 39.0, 61.0, 79.0, 93.0, 136.0, 187.0, 275.0, 463.0, 824.0, 562.0, 357.0, 214.0, 159.0, 116.0, 78.0, 58.0, 33.0, 34.0, 35.0, 19.0, 21.0, 17.0, 13.0, 6.0, 9.0, 7.0, 7.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029388427734375, -0.028324604034423828, -0.027260780334472656, -0.026196956634521484, -0.025133132934570312, -0.02406930923461914, -0.02300548553466797, -0.021941661834716797, -0.020877838134765625, -0.019814014434814453, -0.01875019073486328, -0.01768636703491211, -0.016622543334960938, -0.015558719635009766, -0.014494895935058594, -0.013431072235107422, -0.01236724853515625, -0.011303424835205078, -0.010239601135253906, -0.009175777435302734, -0.008111953735351562, -0.007048130035400391, -0.005984306335449219, -0.004920482635498047, -0.003856658935546875, -0.002792835235595703, -0.0017290115356445312, -0.0006651878356933594, 0.0003986358642578125, 0.0014624595642089844, 0.0025262832641601562, 0.003590106964111328, 0.0046539306640625, 0.005717754364013672, 0.006781578063964844, 0.007845401763916016, 0.008909225463867188, 0.00997304916381836, 0.011036872863769531, 0.012100696563720703, 0.013164520263671875, 0.014228343963623047, 0.015292167663574219, 0.01635599136352539, 0.017419815063476562, 0.018483638763427734, 0.019547462463378906, 0.020611286163330078, 0.02167510986328125, 0.022738933563232422, 0.023802757263183594, 0.024866580963134766, 0.025930404663085938, 0.02699422836303711, 0.02805805206298828, 0.029121875762939453, 0.030185699462890625, 0.031249523162841797, 0.03231334686279297, 0.03337717056274414, 0.03444099426269531, 0.035504817962646484, 0.036568641662597656, 0.03763246536254883, 0.0386962890625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 11.0, 46.0, 108.0, 195.0, 225.0, 197.0, 111.0, 66.0, 26.0, 6.0, 1.0, 1.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.389734148979187, -0.3784733712673187, -0.36721259355545044, -0.35595181584358215, -0.34469103813171387, -0.3334302604198456, -0.3221694827079773, -0.3109087347984314, -0.2996479272842407, -0.28838714957237244, -0.27712637186050415, -0.26586559414863586, -0.2546048164367676, -0.2433440387248993, -0.2320832759141922, -0.2208224982023239, -0.20956173539161682, -0.19830095767974854, -0.18704017996788025, -0.17577940225601196, -0.16451862454414368, -0.1532578468322754, -0.1419970840215683, -0.1307363063097, -0.11947552859783173, -0.10821475088596344, -0.09695397317409515, -0.08569320291280746, -0.07443242520093918, -0.06317164748907089, -0.0519108772277832, -0.04065009951591492, -0.02938932180404663, -0.018128545954823494, -0.006867770105600357, 0.004393003880977631, 0.015653781592845917, 0.026914559304714203, 0.03817532956600189, 0.04943610727787018, 0.060696884989738464, 0.07195766270160675, 0.08321844041347504, 0.09447921067476273, 0.10573998838663101, 0.1170007660984993, 0.128261536359787, 0.13952231407165527, 0.15078309178352356, 0.16204386949539185, 0.17330464720726013, 0.18456542491912842, 0.1958262026309967, 0.207086980342865, 0.21834774315357208, 0.22960852086544037, 0.24086929857730865, 0.25213006138801575, 0.26339083909988403, 0.2746516168117523, 0.2859123945236206, 0.2971731722354889, 0.3084339499473572, 0.31969472765922546, 0.33095550537109375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 14.0, 15.0, 33.0, 28.0, 34.0, 48.0, 59.0, 63.0, 72.0, 62.0, 74.0, 72.0, 64.0, 65.0, 53.0, 63.0, 45.0, 32.0, 24.0, 20.0, 16.0, 11.0, 5.0, 2.0, 6.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.3145880699157715, -0.30716803669929504, -0.2997480034828186, -0.29232797026634216, -0.2849079370498657, -0.27748793363571167, -0.27006787061691284, -0.2626478672027588, -0.25522783398628235, -0.2478078007698059, -0.24038776755332947, -0.23296773433685303, -0.22554771602153778, -0.21812768280506134, -0.2107076495885849, -0.20328761637210846, -0.19586758315563202, -0.18844754993915558, -0.18102751672267914, -0.1736074984073639, -0.16618746519088745, -0.158767431974411, -0.15134739875793457, -0.14392736554145813, -0.1365073323249817, -0.12908729910850525, -0.1216672733426094, -0.11424724012613297, -0.10682721436023712, -0.09940718114376068, -0.09198714792728424, -0.0845671147108078, -0.07714709639549255, -0.06972706317901611, -0.06230703741312027, -0.05488700419664383, -0.04746697470545769, -0.040046945214271545, -0.032626911997795105, -0.025206882506608963, -0.01778685301542282, -0.010366822592914104, -0.002946792170405388, 0.004473239183425903, 0.011893268674612045, 0.019313298165798187, 0.026733331382274628, 0.03415336087346077, 0.04157339036464691, 0.048993419855833054, 0.056413449347019196, 0.06383348256349564, 0.07125350832939148, 0.07867354154586792, 0.08609357476234436, 0.0935136079788208, 0.10093363374471664, 0.10835366696119308, 0.11577369272708893, 0.12319372594356537, 0.1306137591600418, 0.13803377747535706, 0.1454538106918335, 0.15287384390830994, 0.16029387712478638]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 7.0, 12.0, 17.0, 37.0, 46.0, 79.0, 110.0, 149.0, 248.0, 383.0, 552.0, 896.0, 1377.0, 2228.0, 3383.0, 5525.0, 9189.0, 16837.0, 32272.0, 117419.0, 741384.0, 57861.0, 24729.0, 13490.0, 7766.0, 4559.0, 2776.0, 1800.0, 1183.0, 770.0, 465.0, 358.0, 226.0, 145.0, 87.0, 59.0, 34.0, 21.0, 21.0, 16.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1070556640625, -0.1036367416381836, -0.10021781921386719, -0.09679889678955078, -0.09337997436523438, -0.08996105194091797, -0.08654212951660156, -0.08312320709228516, -0.07970428466796875, -0.07628536224365234, -0.07286643981933594, -0.06944751739501953, -0.06602859497070312, -0.06260967254638672, -0.05919075012207031, -0.055771827697753906, -0.0523529052734375, -0.048933982849121094, -0.04551506042480469, -0.04209613800048828, -0.038677215576171875, -0.03525829315185547, -0.03183937072753906, -0.028420448303222656, -0.02500152587890625, -0.021582603454589844, -0.018163681030273438, -0.014744758605957031, -0.011325836181640625, -0.007906913757324219, -0.0044879913330078125, -0.0010690689086914062, 0.002349853515625, 0.005768775939941406, 0.009187698364257812, 0.012606620788574219, 0.016025543212890625, 0.01944446563720703, 0.022863388061523438, 0.026282310485839844, 0.02970123291015625, 0.033120155334472656, 0.03653907775878906, 0.03995800018310547, 0.043376922607421875, 0.04679584503173828, 0.05021476745605469, 0.053633689880371094, 0.0570526123046875, 0.060471534729003906, 0.06389045715332031, 0.06730937957763672, 0.07072830200195312, 0.07414722442626953, 0.07756614685058594, 0.08098506927490234, 0.08440399169921875, 0.08782291412353516, 0.09124183654785156, 0.09466075897216797, 0.09807968139648438, 0.10149860382080078, 0.10491752624511719, 0.1083364486694336, 0.11175537109375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 10.0, 3.0, 10.0, 7.0, 10.0, 13.0, 10.0, 10.0, 35.0, 115.0, 426.0, 174.0, 43.0, 23.0, 15.0, 17.0, 12.0, 9.0, 5.0, 5.0, 6.0, 6.0, 2.0, 6.0, 5.0, 1.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035400390625, -0.03408527374267578, -0.03277015686035156, -0.031455039978027344, -0.030139923095703125, -0.028824806213378906, -0.027509689331054688, -0.02619457244873047, -0.02487945556640625, -0.02356433868408203, -0.022249221801757812, -0.020934104919433594, -0.019618988037109375, -0.018303871154785156, -0.016988754272460938, -0.01567363739013672, -0.0143585205078125, -0.013043403625488281, -0.011728286743164062, -0.010413169860839844, -0.009098052978515625, -0.007782936096191406, -0.0064678192138671875, -0.005152702331542969, -0.00383758544921875, -0.0025224685668945312, -0.0012073516845703125, 0.00010776519775390625, 0.001422882080078125, 0.0027379989624023438, 0.0040531158447265625, 0.005368232727050781, 0.006683349609375, 0.007998466491699219, 0.009313583374023438, 0.010628700256347656, 0.011943817138671875, 0.013258934020996094, 0.014574050903320312, 0.01588916778564453, 0.01720428466796875, 0.01851940155029297, 0.019834518432617188, 0.021149635314941406, 0.022464752197265625, 0.023779869079589844, 0.025094985961914062, 0.02641010284423828, 0.0277252197265625, 0.02904033660888672, 0.030355453491210938, 0.031670570373535156, 0.032985687255859375, 0.034300804138183594, 0.03561592102050781, 0.03693103790283203, 0.03824615478515625, 0.03956127166748047, 0.04087638854980469, 0.042191505432128906, 0.043506622314453125, 0.044821739196777344, 0.04613685607910156, 0.04745197296142578, 0.04876708984375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 10.0, 5.0, 12.0, 17.0, 16.0, 28.0, 27.0, 38.0, 58.0, 73.0, 124.0, 202.0, 360.0, 633.0, 1452.0, 3814.0, 12583.0, 51948.0, 282682.0, 537612.0, 120622.0, 25175.0, 6756.0, 2179.0, 889.0, 431.0, 295.0, 163.0, 96.0, 75.0, 59.0, 36.0, 21.0, 18.0, 20.0, 8.0, 8.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12451171875, -0.12076759338378906, -0.11702346801757812, -0.11327934265136719, -0.10953521728515625, -0.10579109191894531, -0.10204696655273438, -0.09830284118652344, -0.0945587158203125, -0.09081459045410156, -0.08707046508789062, -0.08332633972167969, -0.07958221435546875, -0.07583808898925781, -0.07209396362304688, -0.06834983825683594, -0.064605712890625, -0.06086158752441406, -0.057117462158203125, -0.05337333679199219, -0.04962921142578125, -0.04588508605957031, -0.042140960693359375, -0.03839683532714844, -0.0346527099609375, -0.030908584594726562, -0.027164459228515625, -0.023420333862304688, -0.01967620849609375, -0.015932083129882812, -0.012187957763671875, -0.008443832397460938, -0.00469970703125, -0.0009555816650390625, 0.002788543701171875, 0.0065326690673828125, 0.01027679443359375, 0.014020919799804688, 0.017765045166015625, 0.021509170532226562, 0.0252532958984375, 0.028997421264648438, 0.032741546630859375, 0.03648567199707031, 0.04022979736328125, 0.04397392272949219, 0.047718048095703125, 0.05146217346191406, 0.055206298828125, 0.05895042419433594, 0.06269454956054688, 0.06643867492675781, 0.07018280029296875, 0.07392692565917969, 0.07767105102539062, 0.08141517639160156, 0.0851593017578125, 0.08890342712402344, 0.09264755249023438, 0.09639167785644531, 0.10013580322265625, 0.10387992858886719, 0.10762405395507812, 0.11136817932128906, 0.1151123046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 2.0, 7.0, 6.0, 16.0, 11.0, 14.0, 5.0, 21.0, 16.0, 26.0, 26.0, 42.0, 45.0, 42.0, 40.0, 38.0, 41.0, 56.0, 42.0, 50.0, 42.0, 49.0, 55.0, 34.0, 43.0, 36.0, 46.0, 30.0, 24.0, 27.0, 17.0, 11.0, 8.0, 12.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1649169921875, -0.1600475311279297, -0.15517807006835938, -0.15030860900878906, -0.14543914794921875, -0.14056968688964844, -0.13570022583007812, -0.1308307647705078, -0.1259613037109375, -0.12109184265136719, -0.11622238159179688, -0.11135292053222656, -0.10648345947265625, -0.10161399841308594, -0.09674453735351562, -0.09187507629394531, -0.087005615234375, -0.08213615417480469, -0.07726669311523438, -0.07239723205566406, -0.06752777099609375, -0.06265830993652344, -0.057788848876953125, -0.05291938781738281, -0.0480499267578125, -0.04318046569824219, -0.038311004638671875, -0.03344154357910156, -0.02857208251953125, -0.023702621459960938, -0.018833160400390625, -0.013963699340820312, -0.00909423828125, -0.0042247772216796875, 0.000644683837890625, 0.0055141448974609375, 0.01038360595703125, 0.015253067016601562, 0.020122528076171875, 0.024991989135742188, 0.0298614501953125, 0.03473091125488281, 0.039600372314453125, 0.04446983337402344, 0.04933929443359375, 0.05420875549316406, 0.059078216552734375, 0.06394767761230469, 0.068817138671875, 0.07368659973144531, 0.07855606079101562, 0.08342552185058594, 0.08829498291015625, 0.09316444396972656, 0.09803390502929688, 0.10290336608886719, 0.1077728271484375, 0.11264228820800781, 0.11751174926757812, 0.12238121032714844, 0.12725067138671875, 0.13212013244628906, 0.13698959350585938, 0.1418590545654297, 0.146728515625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 10.0, 15.0, 18.0, 19.0, 29.0, 37.0, 70.0, 100.0, 190.0, 310.0, 569.0, 1081.0, 2306.0, 6047.0, 20664.0, 132259.0, 711004.0, 141330.0, 21619.0, 6087.0, 2320.0, 1069.0, 553.0, 295.0, 196.0, 115.0, 65.0, 55.0, 37.0, 19.0, 13.0, 12.0, 10.0, 12.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10064697265625, -0.09745311737060547, -0.09425926208496094, -0.0910654067993164, -0.08787155151367188, -0.08467769622802734, -0.08148384094238281, -0.07828998565673828, -0.07509613037109375, -0.07190227508544922, -0.06870841979980469, -0.06551456451416016, -0.062320709228515625, -0.059126853942871094, -0.05593299865722656, -0.05273914337158203, -0.0495452880859375, -0.04635143280029297, -0.04315757751464844, -0.039963722229003906, -0.036769866943359375, -0.033576011657714844, -0.030382156372070312, -0.02718830108642578, -0.02399444580078125, -0.02080059051513672, -0.017606735229492188, -0.014412879943847656, -0.011219024658203125, -0.008025169372558594, -0.0048313140869140625, -0.0016374588012695312, 0.001556396484375, 0.004750251770019531, 0.007944107055664062, 0.011137962341308594, 0.014331817626953125, 0.017525672912597656, 0.020719528198242188, 0.02391338348388672, 0.02710723876953125, 0.03030109405517578, 0.03349494934082031, 0.036688804626464844, 0.039882659912109375, 0.043076515197753906, 0.04627037048339844, 0.04946422576904297, 0.0526580810546875, 0.05585193634033203, 0.05904579162597656, 0.062239646911621094, 0.06543350219726562, 0.06862735748291016, 0.07182121276855469, 0.07501506805419922, 0.07820892333984375, 0.08140277862548828, 0.08459663391113281, 0.08779048919677734, 0.09098434448242188, 0.0941781997680664, 0.09737205505371094, 0.10056591033935547, 0.103759765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 14.0, 14.0, 19.0, 30.0, 25.0, 42.0, 49.0, 61.0, 85.0, 76.0, 113.0, 88.0, 73.0, 60.0, 50.0, 38.0, 40.0, 27.0, 24.0, 17.0, 6.0, 14.0, 7.0, 6.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.937980651855469e-05, -6.725545972585678e-05, -6.513111293315887e-05, -6.300676614046097e-05, -6.088241934776306e-05, -5.8758072555065155e-05, -5.663372576236725e-05, -5.450937896966934e-05, -5.2385032176971436e-05, -5.026068538427353e-05, -4.813633859157562e-05, -4.6011991798877716e-05, -4.388764500617981e-05, -4.17632982134819e-05, -3.9638951420783997e-05, -3.751460462808609e-05, -3.5390257835388184e-05, -3.326591104269028e-05, -3.114156424999237e-05, -2.9017217457294464e-05, -2.6892870664596558e-05, -2.476852387189865e-05, -2.2644177079200745e-05, -2.0519830286502838e-05, -1.839548349380493e-05, -1.6271136701107025e-05, -1.4146789908409119e-05, -1.2022443115711212e-05, -9.898096323013306e-06, -7.7737495303154e-06, -5.649402737617493e-06, -3.525055944919586e-06, -1.4007091522216797e-06, 7.236376404762268e-07, 2.8479844331741333e-06, 4.97233122587204e-06, 7.096678018569946e-06, 9.221024811267853e-06, 1.134537160396576e-05, 1.3469718396663666e-05, 1.5594065189361572e-05, 1.771841198205948e-05, 1.9842758774757385e-05, 2.1967105567455292e-05, 2.4091452360153198e-05, 2.6215799152851105e-05, 2.834014594554901e-05, 3.0464492738246918e-05, 3.2588839530944824e-05, 3.471318632364273e-05, 3.683753311634064e-05, 3.8961879909038544e-05, 4.108622670173645e-05, 4.321057349443436e-05, 4.533492028713226e-05, 4.745926707983017e-05, 4.9583613872528076e-05, 5.170796066522598e-05, 5.383230745792389e-05, 5.5956654250621796e-05, 5.80810010433197e-05, 6.020534783601761e-05, 6.232969462871552e-05, 6.445404142141342e-05, 6.657838821411133e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 10.0, 17.0, 28.0, 42.0, 46.0, 70.0, 127.0, 227.0, 369.0, 666.0, 1467.0, 3345.0, 9386.0, 34111.0, 201537.0, 608187.0, 147780.0, 27437.0, 8088.0, 2860.0, 1235.0, 667.0, 341.0, 189.0, 106.0, 66.0, 39.0, 32.0, 17.0, 11.0, 7.0, 10.0, 7.0, 5.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09368896484375, -0.09096717834472656, -0.08824539184570312, -0.08552360534667969, -0.08280181884765625, -0.08008003234863281, -0.07735824584960938, -0.07463645935058594, -0.0719146728515625, -0.06919288635253906, -0.06647109985351562, -0.06374931335449219, -0.06102752685546875, -0.05830574035644531, -0.055583953857421875, -0.05286216735839844, -0.050140380859375, -0.04741859436035156, -0.044696807861328125, -0.04197502136230469, -0.03925323486328125, -0.03653144836425781, -0.033809661865234375, -0.031087875366210938, -0.0283660888671875, -0.025644302368164062, -0.022922515869140625, -0.020200729370117188, -0.01747894287109375, -0.014757156372070312, -0.012035369873046875, -0.009313583374023438, -0.006591796875, -0.0038700103759765625, -0.001148223876953125, 0.0015735626220703125, 0.00429534912109375, 0.0070171356201171875, 0.009738922119140625, 0.012460708618164062, 0.0151824951171875, 0.017904281616210938, 0.020626068115234375, 0.023347854614257812, 0.02606964111328125, 0.028791427612304688, 0.031513214111328125, 0.03423500061035156, 0.036956787109375, 0.03967857360839844, 0.042400360107421875, 0.04512214660644531, 0.04784393310546875, 0.05056571960449219, 0.053287506103515625, 0.05600929260253906, 0.0587310791015625, 0.06145286560058594, 0.06417465209960938, 0.06689643859863281, 0.06961822509765625, 0.07234001159667969, 0.07506179809570312, 0.07778358459472656, 0.08050537109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 3.0, 9.0, 12.0, 13.0, 32.0, 34.0, 46.0, 60.0, 88.0, 103.0, 108.0, 99.0, 96.0, 71.0, 59.0, 51.0, 20.0, 17.0, 21.0, 17.0, 8.0, 6.0, 7.0, 3.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09527587890625, -0.0922842025756836, -0.08929252624511719, -0.08630084991455078, -0.08330917358398438, -0.08031749725341797, -0.07732582092285156, -0.07433414459228516, -0.07134246826171875, -0.06835079193115234, -0.06535911560058594, -0.06236743927001953, -0.059375762939453125, -0.05638408660888672, -0.05339241027832031, -0.050400733947753906, -0.0474090576171875, -0.044417381286621094, -0.04142570495605469, -0.03843402862548828, -0.035442352294921875, -0.03245067596435547, -0.029458999633789062, -0.026467323303222656, -0.02347564697265625, -0.020483970642089844, -0.017492294311523438, -0.014500617980957031, -0.011508941650390625, -0.008517265319824219, -0.0055255889892578125, -0.0025339126586914062, 0.000457763671875, 0.0034494400024414062, 0.0064411163330078125, 0.009432792663574219, 0.012424468994140625, 0.015416145324707031, 0.018407821655273438, 0.021399497985839844, 0.02439117431640625, 0.027382850646972656, 0.030374526977539062, 0.03336620330810547, 0.036357879638671875, 0.03934955596923828, 0.04234123229980469, 0.045332908630371094, 0.0483245849609375, 0.051316261291503906, 0.05430793762207031, 0.05729961395263672, 0.060291290283203125, 0.06328296661376953, 0.06627464294433594, 0.06926631927490234, 0.07225799560546875, 0.07524967193603516, 0.07824134826660156, 0.08123302459716797, 0.08422470092773438, 0.08721637725830078, 0.09020805358886719, 0.0931997299194336, 0.09619140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 18.0, 39.0, 155.0, 423.0, 247.0, 74.0, 27.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6697742938995361, -1.6020219326019287, -1.5342695713043213, -1.4665172100067139, -1.3987648487091064, -1.331012487411499, -1.2632602453231812, -1.1955078840255737, -1.1277555227279663, -1.0600031614303589, -0.9922508001327515, -0.9244984984397888, -0.8567461371421814, -0.788993775844574, -0.7212414741516113, -0.6534891128540039, -0.5857367515563965, -0.5179843902587891, -0.45023205876350403, -0.382479727268219, -0.3147273659706116, -0.24697500467300415, -0.17922267317771912, -0.11147034168243408, -0.04371798038482666, 0.024034366011619568, 0.0917867124080658, 0.15953905880451202, 0.22729140520095825, 0.2950437664985657, 0.3627960979938507, 0.43054842948913574, 0.49830102920532227, 0.5660533905029297, 0.6338057518005371, 0.7015580534934998, 0.7693104147911072, 0.8370627760887146, 0.9048150777816772, 0.9725674390792847, 1.040319800376892, 1.1080721616744995, 1.175824522972107, 1.2435768842697144, 1.3113291263580322, 1.3790814876556396, 1.446833848953247, 1.5145862102508545, 1.582338571548462, 1.6500909328460693, 1.7178432941436768, 1.7855956554412842, 1.8533480167388916, 1.921100378036499, 1.988852620124817, 2.0566048622131348, 2.124357223510742, 2.1921095848083496, 2.259861946105957, 2.3276143074035645, 2.395366668701172, 2.4631190299987793, 2.5308713912963867, 2.598623752593994, 2.6663761138916016]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 5.0, 9.0, 20.0, 17.0, 36.0, 77.0, 102.0, 149.0, 172.0, 124.0, 95.0, 48.0, 32.0, 18.0, 11.0, 8.0, 5.0, 2.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.358370304107666, -2.277796745300293, -2.197222948074341, -2.1166493892669678, -2.0360758304595947, -1.9555021524429321, -1.8749284744262695, -1.7943549156188965, -1.7137812376022339, -1.6332075595855713, -1.5526340007781982, -1.4720603227615356, -1.391486644744873, -1.3109130859375, -1.2303394079208374, -1.1497657299041748, -1.0691921710968018, -0.9886185526847839, -0.9080449342727661, -0.8274712562561035, -0.7468976378440857, -0.6663240194320679, -0.5857503414154053, -0.5051767230033875, -0.42460310459136963, -0.3440294861793518, -0.2634558379650116, -0.18288220465183258, -0.10230857133865356, -0.021734952926635742, 0.05883869528770447, 0.13941234350204468, 0.2199862003326416, 0.3005598187446594, 0.38113346695899963, 0.46170711517333984, 0.5422807335853577, 0.6228543519973755, 0.7034280300140381, 0.7840016484260559, 0.8645752668380737, 0.9451488852500916, 1.0257225036621094, 1.106296181678772, 1.1868698596954346, 1.2674434185028076, 1.3480170965194702, 1.4285907745361328, 1.5091643333435059, 1.5897380113601685, 1.6703115701675415, 1.750885248184204, 1.8314588069915771, 1.9120324850082397, 1.9926061630249023, 2.0731797218322754, 2.1537532806396484, 2.2343268394470215, 2.3149006366729736, 2.3954741954803467, 2.4760477542877197, 2.556621551513672, 2.637195110321045, 2.717768669128418, 2.79834246635437]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 15.0, 23.0, 40.0, 59.0, 108.0, 175.0, 274.0, 552.0, 1007.0, 1830.0, 3658.0, 8121.0, 22266.0, 103346.0, 3837715.0, 162614.0, 30421.0, 10963.0, 4888.0, 2523.0, 1414.0, 793.0, 485.0, 303.0, 215.0, 150.0, 96.0, 71.0, 40.0, 34.0, 20.0, 15.0, 15.0, 9.0, 8.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2498779296875, -0.23972129821777344, -0.22956466674804688, -0.2194080352783203, -0.20925140380859375, -0.1990947723388672, -0.18893814086914062, -0.17878150939941406, -0.1686248779296875, -0.15846824645996094, -0.14831161499023438, -0.1381549835205078, -0.12799835205078125, -0.11784172058105469, -0.10768508911132812, -0.09752845764160156, -0.087371826171875, -0.07721519470214844, -0.06705856323242188, -0.05690193176269531, -0.04674530029296875, -0.03658866882324219, -0.026432037353515625, -0.016275405883789062, -0.0061187744140625, 0.0040378570556640625, 0.014194488525390625, 0.024351119995117188, 0.03450775146484375, 0.04466438293457031, 0.054821014404296875, 0.06497764587402344, 0.07513427734375, 0.08529090881347656, 0.09544754028320312, 0.10560417175292969, 0.11576080322265625, 0.1259174346923828, 0.13607406616210938, 0.14623069763183594, 0.1563873291015625, 0.16654396057128906, 0.17670059204101562, 0.1868572235107422, 0.19701385498046875, 0.2071704864501953, 0.21732711791992188, 0.22748374938964844, 0.237640380859375, 0.24779701232910156, 0.2579536437988281, 0.2681102752685547, 0.27826690673828125, 0.2884235382080078, 0.2985801696777344, 0.30873680114746094, 0.3188934326171875, 0.32905006408691406, 0.3392066955566406, 0.3493633270263672, 0.35951995849609375, 0.3696765899658203, 0.3798332214355469, 0.38998985290527344, 0.400146484375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 7.0, 12.0, 11.0, 3.0, 7.0, 5.0, 11.0, 15.0, 23.0, 43.0, 106.0, 249.0, 243.0, 86.0, 50.0, 28.0, 13.0, 16.0, 8.0, 12.0, 4.0, 5.0, 9.0, 8.0, 2.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0264129638671875, -0.02527642250061035, -0.024139881134033203, -0.023003339767456055, -0.021866798400878906, -0.020730257034301758, -0.01959371566772461, -0.01845717430114746, -0.017320632934570312, -0.016184091567993164, -0.015047550201416016, -0.013911008834838867, -0.012774467468261719, -0.01163792610168457, -0.010501384735107422, -0.009364843368530273, -0.008228302001953125, -0.0070917606353759766, -0.005955219268798828, -0.00481867790222168, -0.0036821365356445312, -0.002545595169067383, -0.0014090538024902344, -0.00027251243591308594, 0.0008640289306640625, 0.002000570297241211, 0.0031371116638183594, 0.004273653030395508, 0.005410194396972656, 0.006546735763549805, 0.007683277130126953, 0.008819818496704102, 0.00995635986328125, 0.011092901229858398, 0.012229442596435547, 0.013365983963012695, 0.014502525329589844, 0.015639066696166992, 0.01677560806274414, 0.01791214942932129, 0.019048690795898438, 0.020185232162475586, 0.021321773529052734, 0.022458314895629883, 0.02359485626220703, 0.02473139762878418, 0.025867938995361328, 0.027004480361938477, 0.028141021728515625, 0.029277563095092773, 0.030414104461669922, 0.03155064582824707, 0.03268718719482422, 0.03382372856140137, 0.034960269927978516, 0.036096811294555664, 0.03723335266113281, 0.03836989402770996, 0.03950643539428711, 0.04064297676086426, 0.041779518127441406, 0.042916059494018555, 0.0440526008605957, 0.04518914222717285, 0.04632568359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 5.0, 8.0, 7.0, 10.0, 18.0, 18.0, 20.0, 32.0, 74.0, 117.0, 229.0, 495.0, 988.0, 2463.0, 6997.0, 26518.0, 146049.0, 2768118.0, 1119661.0, 94178.0, 19174.0, 5437.0, 1876.0, 876.0, 354.0, 238.0, 118.0, 64.0, 56.0, 25.0, 19.0, 11.0, 5.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2646484375, -0.2570629119873047, -0.24947738647460938, -0.24189186096191406, -0.23430633544921875, -0.22672080993652344, -0.21913528442382812, -0.2115497589111328, -0.2039642333984375, -0.1963787078857422, -0.18879318237304688, -0.18120765686035156, -0.17362213134765625, -0.16603660583496094, -0.15845108032226562, -0.1508655548095703, -0.143280029296875, -0.1356945037841797, -0.12810897827148438, -0.12052345275878906, -0.11293792724609375, -0.10535240173339844, -0.09776687622070312, -0.09018135070800781, -0.0825958251953125, -0.07501029968261719, -0.06742477416992188, -0.05983924865722656, -0.05225372314453125, -0.04466819763183594, -0.037082672119140625, -0.029497146606445312, -0.02191162109375, -0.014326095581054688, -0.006740570068359375, 0.0008449554443359375, 0.00843048095703125, 0.016016006469726562, 0.023601531982421875, 0.031187057495117188, 0.0387725830078125, 0.04635810852050781, 0.053943634033203125, 0.06152915954589844, 0.06911468505859375, 0.07670021057128906, 0.08428573608398438, 0.09187126159667969, 0.099456787109375, 0.10704231262207031, 0.11462783813476562, 0.12221336364746094, 0.12979888916015625, 0.13738441467285156, 0.14496994018554688, 0.1525554656982422, 0.1601409912109375, 0.1677265167236328, 0.17531204223632812, 0.18289756774902344, 0.19048309326171875, 0.19806861877441406, 0.20565414428710938, 0.2132396697998047, 0.2208251953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 7.0, 11.0, 10.0, 17.0, 27.0, 35.0, 43.0, 56.0, 111.0, 180.0, 294.0, 620.0, 1366.0, 541.0, 271.0, 153.0, 103.0, 63.0, 42.0, 34.0, 17.0, 12.0, 17.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037353515625, -0.036038875579833984, -0.03472423553466797, -0.03340959548950195, -0.03209495544433594, -0.030780315399169922, -0.029465675354003906, -0.02815103530883789, -0.026836395263671875, -0.02552175521850586, -0.024207115173339844, -0.022892475128173828, -0.021577835083007812, -0.020263195037841797, -0.01894855499267578, -0.017633914947509766, -0.01631927490234375, -0.015004634857177734, -0.013689994812011719, -0.012375354766845703, -0.011060714721679688, -0.009746074676513672, -0.008431434631347656, -0.007116794586181641, -0.005802154541015625, -0.004487514495849609, -0.0031728744506835938, -0.0018582344055175781, -0.0005435943603515625, 0.0007710456848144531, 0.0020856857299804688, 0.0034003257751464844, 0.0047149658203125, 0.006029605865478516, 0.007344245910644531, 0.008658885955810547, 0.009973526000976562, 0.011288166046142578, 0.012602806091308594, 0.01391744613647461, 0.015232086181640625, 0.01654672622680664, 0.017861366271972656, 0.019176006317138672, 0.020490646362304688, 0.021805286407470703, 0.02311992645263672, 0.024434566497802734, 0.02574920654296875, 0.027063846588134766, 0.02837848663330078, 0.029693126678466797, 0.031007766723632812, 0.03232240676879883, 0.033637046813964844, 0.03495168685913086, 0.036266326904296875, 0.03758096694946289, 0.038895606994628906, 0.04021024703979492, 0.04152488708496094, 0.04283952713012695, 0.04415416717529297, 0.045468807220458984, 0.046783447265625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 9.0, 28.0, 99.0, 261.0, 338.0, 181.0, 59.0, 14.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20842024683952332, -0.19268736243247986, -0.1769544780254364, -0.16122160851955414, -0.14548872411251068, -0.12975583970546722, -0.11402296274900436, -0.0982900857925415, -0.08255720138549805, -0.06682431697845459, -0.05109144002199173, -0.03535855934023857, -0.019625678658485413, -0.0038927942514419556, 0.011840082705020905, 0.027572959661483765, 0.04330584406852722, 0.05903872475028038, 0.07477160543203354, 0.0905044823884964, 0.10623736679553986, 0.12197025120258331, 0.13770312070846558, 0.15343600511550903, 0.1691688895225525, 0.18490177392959595, 0.2006346583366394, 0.21636752784252167, 0.23210041224956512, 0.24783329665660858, 0.26356616616249084, 0.2792990505695343, 0.29503196477890015, 0.3107648491859436, 0.32649773359298706, 0.3422306180000305, 0.357963502407074, 0.37369638681411743, 0.3894292414188385, 0.40516212582588196, 0.4208950102329254, 0.43662789463996887, 0.45236077904701233, 0.4680936634540558, 0.48382651805877686, 0.4995594024658203, 0.5152922868728638, 0.5310251712799072, 0.5467580556869507, 0.5624909400939941, 0.5782238245010376, 0.593956708908081, 0.6096895933151245, 0.625422477722168, 0.6411553621292114, 0.6568882465362549, 0.6726211309432983, 0.6883540153503418, 0.7040868997573853, 0.7198197841644287, 0.7355526685714722, 0.7512855529785156, 0.7670184373855591, 0.7827513217926025, 0.7984841465950012]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 12.0, 8.0, 5.0, 8.0, 13.0, 13.0, 19.0, 28.0, 27.0, 34.0, 37.0, 59.0, 79.0, 59.0, 67.0, 68.0, 51.0, 62.0, 58.0, 49.0, 50.0, 41.0, 25.0, 22.0, 17.0, 17.0, 16.0, 12.0, 5.0, 2.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1761237382888794, -0.17084665596485138, -0.16556957364082336, -0.16029249131679535, -0.15501540899276733, -0.1497383415699005, -0.1444612592458725, -0.13918417692184448, -0.13390709459781647, -0.12863001227378845, -0.12335292994976044, -0.11807585507631302, -0.112798772752285, -0.10752169042825699, -0.10224461555480957, -0.09696753323078156, -0.09169045090675354, -0.08641336858272552, -0.08113628625869751, -0.07585921138525009, -0.07058212906122208, -0.06530504673719406, -0.060027968138456345, -0.05475088953971863, -0.04947380721569061, -0.0441967248916626, -0.03891964629292488, -0.033642567694187164, -0.02836548537015915, -0.023088404908776283, -0.017811324447393417, -0.0125342458486557, -0.0072571635246276855, -0.0019800830632448196, 0.0032969973981380463, 0.008574077859520912, 0.013851158320903778, 0.019128238782286644, 0.02440531924366951, 0.029682397842407227, 0.03495948016643524, 0.04023656249046326, 0.045513641089200974, 0.05079071968793869, 0.056067802011966705, 0.06134488433599472, 0.06662195920944214, 0.07189904153347015, 0.07717612385749817, 0.08245320618152618, 0.0877302885055542, 0.09300736337900162, 0.09828444570302963, 0.10356152802705765, 0.10883860290050507, 0.11411568522453308, 0.1193927675485611, 0.12466984987258911, 0.12994693219661713, 0.13522401452064514, 0.14050108194351196, 0.14577816426753998, 0.151055246591568, 0.156332328915596, 0.16160941123962402]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 14.0, 16.0, 8.0, 31.0, 41.0, 55.0, 73.0, 147.0, 199.0, 315.0, 463.0, 843.0, 1517.0, 2878.0, 5723.0, 12987.0, 33880.0, 184311.0, 691728.0, 72686.0, 22046.0, 9374.0, 4240.0, 2189.0, 1098.0, 659.0, 379.0, 214.0, 150.0, 78.0, 79.0, 39.0, 30.0, 16.0, 17.0, 10.0, 11.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.209228515625, -0.2031269073486328, -0.19702529907226562, -0.19092369079589844, -0.18482208251953125, -0.17872047424316406, -0.17261886596679688, -0.1665172576904297, -0.1604156494140625, -0.1543140411376953, -0.14821243286132812, -0.14211082458496094, -0.13600921630859375, -0.12990760803222656, -0.12380599975585938, -0.11770439147949219, -0.111602783203125, -0.10550117492675781, -0.09939956665039062, -0.09329795837402344, -0.08719635009765625, -0.08109474182128906, -0.07499313354492188, -0.06889152526855469, -0.0627899169921875, -0.05668830871582031, -0.050586700439453125, -0.04448509216308594, -0.03838348388671875, -0.03228187561035156, -0.026180267333984375, -0.020078659057617188, -0.01397705078125, -0.007875442504882812, -0.001773834228515625, 0.0043277740478515625, 0.01042938232421875, 0.016530990600585938, 0.022632598876953125, 0.028734207153320312, 0.0348358154296875, 0.04093742370605469, 0.047039031982421875, 0.05314064025878906, 0.05924224853515625, 0.06534385681152344, 0.07144546508789062, 0.07754707336425781, 0.083648681640625, 0.08975028991699219, 0.09585189819335938, 0.10195350646972656, 0.10805511474609375, 0.11415672302246094, 0.12025833129882812, 0.1263599395751953, 0.1324615478515625, 0.1385631561279297, 0.14466476440429688, 0.15076637268066406, 0.15686798095703125, 0.16296958923339844, 0.16907119750976562, 0.1751728057861328, 0.1812744140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 1.0, 11.0, 3.0, 6.0, 6.0, 11.0, 15.0, 14.0, 27.0, 41.0, 76.0, 171.0, 213.0, 164.0, 80.0, 43.0, 28.0, 13.0, 11.0, 12.0, 10.0, 5.0, 6.0, 1.0, 10.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0226287841796875, -0.021587610244750977, -0.020546436309814453, -0.01950526237487793, -0.018464088439941406, -0.017422914505004883, -0.01638174057006836, -0.015340566635131836, -0.014299392700195312, -0.013258218765258789, -0.012217044830322266, -0.011175870895385742, -0.010134696960449219, -0.009093523025512695, -0.008052349090576172, -0.0070111751556396484, -0.005970001220703125, -0.0049288272857666016, -0.003887653350830078, -0.0028464794158935547, -0.0018053054809570312, -0.0007641315460205078, 0.0002770423889160156, 0.001318216323852539, 0.0023593902587890625, 0.003400564193725586, 0.004441738128662109, 0.005482912063598633, 0.006524085998535156, 0.00756525993347168, 0.008606433868408203, 0.009647607803344727, 0.01068878173828125, 0.011729955673217773, 0.012771129608154297, 0.01381230354309082, 0.014853477478027344, 0.015894651412963867, 0.01693582534790039, 0.017976999282836914, 0.019018173217773438, 0.02005934715270996, 0.021100521087646484, 0.022141695022583008, 0.02318286895751953, 0.024224042892456055, 0.025265216827392578, 0.0263063907623291, 0.027347564697265625, 0.02838873863220215, 0.029429912567138672, 0.030471086502075195, 0.03151226043701172, 0.03255343437194824, 0.033594608306884766, 0.03463578224182129, 0.03567695617675781, 0.036718130111694336, 0.03775930404663086, 0.03880047798156738, 0.039841651916503906, 0.04088282585144043, 0.04192399978637695, 0.04296517372131348, 0.04400634765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 7.0, 9.0, 27.0, 29.0, 46.0, 73.0, 118.0, 277.0, 476.0, 1112.0, 3023.0, 10420.0, 57537.0, 477385.0, 430440.0, 52129.0, 10093.0, 3055.0, 1184.0, 526.0, 224.0, 162.0, 77.0, 42.0, 29.0, 19.0, 13.0, 4.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1614990234375, -0.15628433227539062, -0.15106964111328125, -0.14585494995117188, -0.1406402587890625, -0.13542556762695312, -0.13021087646484375, -0.12499618530273438, -0.119781494140625, -0.11456680297851562, -0.10935211181640625, -0.10413742065429688, -0.0989227294921875, -0.09370803833007812, -0.08849334716796875, -0.08327865600585938, -0.07806396484375, -0.07284927368164062, -0.06763458251953125, -0.062419891357421875, -0.0572052001953125, -0.051990509033203125, -0.04677581787109375, -0.041561126708984375, -0.036346435546875, -0.031131744384765625, -0.02591705322265625, -0.020702362060546875, -0.0154876708984375, -0.010272979736328125, -0.00505828857421875, 0.000156402587890625, 0.00537109375, 0.010585784912109375, 0.01580047607421875, 0.021015167236328125, 0.0262298583984375, 0.031444549560546875, 0.03665924072265625, 0.041873931884765625, 0.047088623046875, 0.052303314208984375, 0.05751800537109375, 0.06273269653320312, 0.0679473876953125, 0.07316207885742188, 0.07837677001953125, 0.08359146118164062, 0.08880615234375, 0.09402084350585938, 0.09923553466796875, 0.10445022583007812, 0.1096649169921875, 0.11487960815429688, 0.12009429931640625, 0.12530899047851562, 0.130523681640625, 0.13573837280273438, 0.14095306396484375, 0.14616775512695312, 0.1513824462890625, 0.15659713745117188, 0.16181182861328125, 0.16702651977539062, 0.1722412109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 6.0, 8.0, 16.0, 7.0, 19.0, 16.0, 23.0, 29.0, 26.0, 32.0, 37.0, 43.0, 31.0, 46.0, 39.0, 49.0, 47.0, 55.0, 44.0, 43.0, 38.0, 41.0, 36.0, 34.0, 38.0, 36.0, 16.0, 26.0, 19.0, 20.0, 15.0, 16.0, 9.0, 9.0, 5.0, 2.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.09246826171875, -0.08959674835205078, -0.08672523498535156, -0.08385372161865234, -0.08098220825195312, -0.0781106948852539, -0.07523918151855469, -0.07236766815185547, -0.06949615478515625, -0.06662464141845703, -0.06375312805175781, -0.060881614685058594, -0.058010101318359375, -0.055138587951660156, -0.05226707458496094, -0.04939556121826172, -0.0465240478515625, -0.04365253448486328, -0.04078102111816406, -0.037909507751464844, -0.035037994384765625, -0.032166481018066406, -0.029294967651367188, -0.02642345428466797, -0.02355194091796875, -0.02068042755126953, -0.017808914184570312, -0.014937400817871094, -0.012065887451171875, -0.009194374084472656, -0.0063228607177734375, -0.0034513473510742188, -0.000579833984375, 0.0022916793823242188, 0.0051631927490234375, 0.008034706115722656, 0.010906219482421875, 0.013777732849121094, 0.016649246215820312, 0.01952075958251953, 0.02239227294921875, 0.02526378631591797, 0.028135299682617188, 0.031006813049316406, 0.033878326416015625, 0.036749839782714844, 0.03962135314941406, 0.04249286651611328, 0.0453643798828125, 0.04823589324951172, 0.05110740661621094, 0.053978919982910156, 0.056850433349609375, 0.059721946716308594, 0.06259346008300781, 0.06546497344970703, 0.06833648681640625, 0.07120800018310547, 0.07407951354980469, 0.0769510269165039, 0.07982254028320312, 0.08269405364990234, 0.08556556701660156, 0.08843708038330078, 0.09130859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 7.0, 8.0, 22.0, 21.0, 51.0, 92.0, 173.0, 349.0, 775.0, 1945.0, 6418.0, 31088.0, 296824.0, 622466.0, 71496.0, 11666.0, 3044.0, 1146.0, 451.0, 219.0, 110.0, 67.0, 40.0, 23.0, 12.0, 11.0, 9.0, 1.0, 6.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.204345703125, -0.19854164123535156, -0.19273757934570312, -0.1869335174560547, -0.18112945556640625, -0.1753253936767578, -0.16952133178710938, -0.16371726989746094, -0.1579132080078125, -0.15210914611816406, -0.14630508422851562, -0.1405010223388672, -0.13469696044921875, -0.1288928985595703, -0.12308883666992188, -0.11728477478027344, -0.111480712890625, -0.10567665100097656, -0.09987258911132812, -0.09406852722167969, -0.08826446533203125, -0.08246040344238281, -0.07665634155273438, -0.07085227966308594, -0.0650482177734375, -0.05924415588378906, -0.053440093994140625, -0.04763603210449219, -0.04183197021484375, -0.03602790832519531, -0.030223846435546875, -0.024419784545898438, -0.01861572265625, -0.012811660766601562, -0.007007598876953125, -0.0012035369873046875, 0.00460052490234375, 0.010404586791992188, 0.016208648681640625, 0.022012710571289062, 0.0278167724609375, 0.03362083435058594, 0.039424896240234375, 0.04522895812988281, 0.05103302001953125, 0.05683708190917969, 0.06264114379882812, 0.06844520568847656, 0.074249267578125, 0.08005332946777344, 0.08585739135742188, 0.09166145324707031, 0.09746551513671875, 0.10326957702636719, 0.10907363891601562, 0.11487770080566406, 0.1206817626953125, 0.12648582458496094, 0.13228988647460938, 0.1380939483642578, 0.14389801025390625, 0.1497020721435547, 0.15550613403320312, 0.16131019592285156, 0.1671142578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 7.0, 17.0, 10.0, 11.0, 26.0, 39.0, 51.0, 61.0, 91.0, 106.0, 113.0, 110.0, 91.0, 70.0, 49.0, 36.0, 31.0, 21.0, 26.0, 6.0, 3.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.196996688842773e-05, -8.819904178380966e-05, -8.442811667919159e-05, -8.065719157457352e-05, -7.688626646995544e-05, -7.311534136533737e-05, -6.93444162607193e-05, -6.557349115610123e-05, -6.180256605148315e-05, -5.803164094686508e-05, -5.426071584224701e-05, -5.048979073762894e-05, -4.6718865633010864e-05, -4.294794052839279e-05, -3.917701542377472e-05, -3.540609031915665e-05, -3.1635165214538574e-05, -2.7864240109920502e-05, -2.409331500530243e-05, -2.0322389900684357e-05, -1.6551464796066284e-05, -1.2780539691448212e-05, -9.00961458683014e-06, -5.238689482212067e-06, -1.4677643775939941e-06, 2.3031607270240784e-06, 6.074085831642151e-06, 9.845010936260223e-06, 1.3615936040878296e-05, 1.738686114549637e-05, 2.115778625011444e-05, 2.4928711354732513e-05, 2.8699636459350586e-05, 3.247056156396866e-05, 3.624148666858673e-05, 4.0012411773204803e-05, 4.3783336877822876e-05, 4.755426198244095e-05, 5.132518708705902e-05, 5.5096112191677094e-05, 5.8867037296295166e-05, 6.263796240091324e-05, 6.640888750553131e-05, 7.017981261014938e-05, 7.395073771476746e-05, 7.772166281938553e-05, 8.14925879240036e-05, 8.526351302862167e-05, 8.903443813323975e-05, 9.280536323785782e-05, 9.657628834247589e-05, 0.00010034721344709396, 0.00010411813855171204, 0.00010788906365633011, 0.00011165998876094818, 0.00011543091386556625, 0.00011920183897018433, 0.0001229727640748024, 0.00012674368917942047, 0.00013051461428403854, 0.00013428553938865662, 0.0001380564644932747, 0.00014182738959789276, 0.00014559831470251083, 0.0001493692398071289]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 17.0, 12.0, 18.0, 30.0, 45.0, 65.0, 108.0, 169.0, 301.0, 561.0, 1001.0, 2202.0, 5517.0, 16139.0, 61198.0, 268637.0, 475423.0, 160209.0, 37659.0, 11178.0, 4094.0, 1802.0, 960.0, 470.0, 274.0, 169.0, 89.0, 72.0, 39.0, 32.0, 23.0, 15.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10064697265625, -0.0972137451171875, -0.093780517578125, -0.0903472900390625, -0.0869140625, -0.0834808349609375, -0.080047607421875, -0.0766143798828125, -0.07318115234375, -0.0697479248046875, -0.066314697265625, -0.0628814697265625, -0.0594482421875, -0.0560150146484375, -0.052581787109375, -0.0491485595703125, -0.04571533203125, -0.0422821044921875, -0.038848876953125, -0.0354156494140625, -0.031982421875, -0.0285491943359375, -0.025115966796875, -0.0216827392578125, -0.01824951171875, -0.0148162841796875, -0.011383056640625, -0.0079498291015625, -0.0045166015625, -0.0010833740234375, 0.002349853515625, 0.0057830810546875, 0.00921630859375, 0.0126495361328125, 0.016082763671875, 0.0195159912109375, 0.02294921875, 0.0263824462890625, 0.029815673828125, 0.0332489013671875, 0.03668212890625, 0.0401153564453125, 0.043548583984375, 0.0469818115234375, 0.0504150390625, 0.0538482666015625, 0.057281494140625, 0.0607147216796875, 0.06414794921875, 0.0675811767578125, 0.071014404296875, 0.0744476318359375, 0.077880859375, 0.0813140869140625, 0.084747314453125, 0.0881805419921875, 0.09161376953125, 0.0950469970703125, 0.098480224609375, 0.1019134521484375, 0.1053466796875, 0.1087799072265625, 0.112213134765625, 0.1156463623046875, 0.11907958984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 10.0, 6.0, 11.0, 18.0, 21.0, 36.0, 36.0, 38.0, 61.0, 69.0, 85.0, 106.0, 86.0, 67.0, 63.0, 59.0, 47.0, 45.0, 27.0, 25.0, 23.0, 11.0, 9.0, 8.0, 10.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0635986328125, -0.06102466583251953, -0.05845069885253906, -0.055876731872558594, -0.053302764892578125, -0.050728797912597656, -0.04815483093261719, -0.04558086395263672, -0.04300689697265625, -0.04043292999267578, -0.03785896301269531, -0.035284996032714844, -0.032711029052734375, -0.030137062072753906, -0.027563095092773438, -0.02498912811279297, -0.0224151611328125, -0.01984119415283203, -0.017267227172851562, -0.014693260192871094, -0.012119293212890625, -0.009545326232910156, -0.0069713592529296875, -0.004397392272949219, -0.00182342529296875, 0.0007505416870117188, 0.0033245086669921875, 0.005898475646972656, 0.008472442626953125, 0.011046409606933594, 0.013620376586914062, 0.01619434356689453, 0.018768310546875, 0.02134227752685547, 0.023916244506835938, 0.026490211486816406, 0.029064178466796875, 0.031638145446777344, 0.03421211242675781, 0.03678607940673828, 0.03936004638671875, 0.04193401336669922, 0.04450798034667969, 0.047081947326660156, 0.049655914306640625, 0.052229881286621094, 0.05480384826660156, 0.05737781524658203, 0.0599517822265625, 0.06252574920654297, 0.06509971618652344, 0.0676736831665039, 0.07024765014648438, 0.07282161712646484, 0.07539558410644531, 0.07796955108642578, 0.08054351806640625, 0.08311748504638672, 0.08569145202636719, 0.08826541900634766, 0.09083938598632812, 0.0934133529663086, 0.09598731994628906, 0.09856128692626953, 0.10113525390625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 21.0, 121.0, 438.0, 353.0, 48.0, 14.0, 5.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1782442331314087, -1.1036667823791504, -1.029089331626892, -0.9545119404792786, -0.8799344897270203, -0.805357038974762, -0.7307796478271484, -0.6562021970748901, -0.5816247463226318, -0.5070472955703735, -0.4324698746204376, -0.3578924536705017, -0.2833150029182434, -0.2087375521659851, -0.1341601312160492, -0.05958271026611328, 0.01499474048614502, 0.08957217633724213, 0.16414961218833923, 0.23872704803943634, 0.31330448389053345, 0.38788193464279175, 0.46245935559272766, 0.5370367765426636, 0.6116142272949219, 0.6861916780471802, 0.7607691287994385, 0.835346519947052, 0.9099239706993103, 0.9845014214515686, 1.0590788125991821, 1.1336562633514404, 1.2082338333129883, 1.2828112840652466, 1.3573887348175049, 1.4319661855697632, 1.5065436363220215, 1.5811209678649902, 1.6556984186172485, 1.7302758693695068, 1.8048533201217651, 1.8794307708740234, 1.9540082216262817, 2.02858567237854, 2.103163003921509, 2.1777405738830566, 2.2523179054260254, 2.326895236968994, 2.401472806930542, 2.4760501384735107, 2.5506277084350586, 2.6252050399780273, 2.699782609939575, 2.774359941482544, 2.848937511444092, 2.9235148429870605, 2.9980921745300293, 3.072669506072998, 3.147247076034546, 3.2218244075775146, 3.2964019775390625, 3.3709793090820312, 3.445556879043579, 3.520134210586548, 3.5947117805480957]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 8.0, 2.0, 10.0, 10.0, 31.0, 23.0, 36.0, 57.0, 73.0, 87.0, 103.0, 88.0, 94.0, 85.0, 57.0, 56.0, 47.0, 40.0, 25.0, 19.0, 9.0, 14.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0531800985336304, -1.0190048217773438, -0.9848296642303467, -0.9506543874740601, -0.9164791703224182, -0.8823039531707764, -0.8481286764144897, -0.8139534592628479, -0.779778242111206, -0.7456030249595642, -0.7114278078079224, -0.6772525310516357, -0.6430773138999939, -0.608902096748352, -0.5747268199920654, -0.5405516028404236, -0.5063763856887817, -0.4722011685371399, -0.43802592158317566, -0.4038506746292114, -0.3696754574775696, -0.33550024032592773, -0.3013249933719635, -0.26714974641799927, -0.23297452926635742, -0.19879929721355438, -0.16462406516075134, -0.1304488331079483, -0.09627360105514526, -0.062098369002342224, -0.027923136949539185, 0.006252095103263855, 0.040427446365356445, 0.07460267841815948, 0.10877791047096252, 0.14295314252376556, 0.1771283745765686, 0.21130360662937164, 0.24547883868217468, 0.2796540856361389, 0.31382930278778076, 0.3480045199394226, 0.38217976689338684, 0.4163550138473511, 0.4505302309989929, 0.48470544815063477, 0.5188807249069214, 0.5530559420585632, 0.5872311592102051, 0.6214063763618469, 0.6555815935134888, 0.6897568702697754, 0.7239320874214172, 0.7581073045730591, 0.7922825813293457, 0.8264577984809875, 0.8606330156326294, 0.8948082327842712, 0.9289834499359131, 0.9631587266921997, 0.9973339438438416, 1.0315091609954834, 1.06568443775177, 1.099859595298767, 1.1340348720550537]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 15.0, 22.0, 41.0, 52.0, 73.0, 124.0, 136.0, 233.0, 359.0, 625.0, 1073.0, 1709.0, 3017.0, 6392.0, 18105.0, 80523.0, 3631899.0, 386089.0, 38859.0, 12218.0, 5221.0, 2633.0, 1518.0, 998.0, 664.0, 487.0, 299.0, 245.0, 165.0, 118.0, 101.0, 62.0, 38.0, 30.0, 24.0, 20.0, 17.0, 11.0, 9.0, 13.0, 6.0, 8.0, 7.0, 7.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.276123046875, -0.26451873779296875, -0.2529144287109375, -0.24131011962890625, -0.229705810546875, -0.21810150146484375, -0.2064971923828125, -0.19489288330078125, -0.18328857421875, -0.17168426513671875, -0.1600799560546875, -0.14847564697265625, -0.136871337890625, -0.12526702880859375, -0.1136627197265625, -0.10205841064453125, -0.0904541015625, -0.07884979248046875, -0.0672454833984375, -0.05564117431640625, -0.044036865234375, -0.03243255615234375, -0.0208282470703125, -0.00922393798828125, 0.00238037109375, 0.01398468017578125, 0.0255889892578125, 0.03719329833984375, 0.048797607421875, 0.06040191650390625, 0.0720062255859375, 0.08361053466796875, 0.09521484375, 0.10681915283203125, 0.1184234619140625, 0.13002777099609375, 0.141632080078125, 0.15323638916015625, 0.1648406982421875, 0.17644500732421875, 0.18804931640625, 0.19965362548828125, 0.2112579345703125, 0.22286224365234375, 0.234466552734375, 0.24607086181640625, 0.2576751708984375, 0.26927947998046875, 0.2808837890625, 0.29248809814453125, 0.3040924072265625, 0.31569671630859375, 0.327301025390625, 0.33890533447265625, 0.3505096435546875, 0.36211395263671875, 0.37371826171875, 0.38532257080078125, 0.3969268798828125, 0.40853118896484375, 0.420135498046875, 0.43173980712890625, 0.4433441162109375, 0.45494842529296875, 0.466552734375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 7.0, 1.0, 2.0, 4.0, 4.0, 10.0, 10.0, 14.0, 15.0, 19.0, 34.0, 70.0, 117.0, 192.0, 191.0, 128.0, 57.0, 34.0, 22.0, 17.0, 11.0, 10.0, 7.0, 10.0, 5.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027313232421875, -0.026135921478271484, -0.02495861053466797, -0.023781299591064453, -0.022603988647460938, -0.021426677703857422, -0.020249366760253906, -0.01907205581665039, -0.017894744873046875, -0.01671743392944336, -0.015540122985839844, -0.014362812042236328, -0.013185501098632812, -0.012008190155029297, -0.010830879211425781, -0.009653568267822266, -0.00847625732421875, -0.007298946380615234, -0.006121635437011719, -0.004944324493408203, -0.0037670135498046875, -0.002589702606201172, -0.0014123916625976562, -0.00023508071899414062, 0.000942230224609375, 0.0021195411682128906, 0.0032968521118164062, 0.004474163055419922, 0.0056514739990234375, 0.006828784942626953, 0.008006095886230469, 0.009183406829833984, 0.0103607177734375, 0.011538028717041016, 0.012715339660644531, 0.013892650604248047, 0.015069961547851562, 0.016247272491455078, 0.017424583435058594, 0.01860189437866211, 0.019779205322265625, 0.02095651626586914, 0.022133827209472656, 0.023311138153076172, 0.024488449096679688, 0.025665760040283203, 0.02684307098388672, 0.028020381927490234, 0.02919769287109375, 0.030375003814697266, 0.03155231475830078, 0.0327296257019043, 0.03390693664550781, 0.03508424758911133, 0.036261558532714844, 0.03743886947631836, 0.038616180419921875, 0.03979349136352539, 0.040970802307128906, 0.04214811325073242, 0.04332542419433594, 0.04450273513793945, 0.04568004608154297, 0.046857357025146484, 0.04803466796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 12.0, 10.0, 12.0, 16.0, 26.0, 44.0, 84.0, 132.0, 361.0, 1006.0, 4182.0, 28231.0, 987988.0, 3119339.0, 44944.0, 5734.0, 1332.0, 400.0, 171.0, 91.0, 45.0, 37.0, 24.0, 12.0, 8.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4853515625, -0.4697418212890625, -0.454132080078125, -0.4385223388671875, -0.42291259765625, -0.4073028564453125, -0.391693115234375, -0.3760833740234375, -0.3604736328125, -0.3448638916015625, -0.329254150390625, -0.3136444091796875, -0.29803466796875, -0.2824249267578125, -0.266815185546875, -0.2512054443359375, -0.235595703125, -0.2199859619140625, -0.204376220703125, -0.1887664794921875, -0.17315673828125, -0.1575469970703125, -0.141937255859375, -0.1263275146484375, -0.1107177734375, -0.0951080322265625, -0.079498291015625, -0.0638885498046875, -0.04827880859375, -0.0326690673828125, -0.017059326171875, -0.0014495849609375, 0.01416015625, 0.0297698974609375, 0.045379638671875, 0.0609893798828125, 0.07659912109375, 0.0922088623046875, 0.107818603515625, 0.1234283447265625, 0.1390380859375, 0.1546478271484375, 0.170257568359375, 0.1858673095703125, 0.20147705078125, 0.2170867919921875, 0.232696533203125, 0.2483062744140625, 0.263916015625, 0.2795257568359375, 0.295135498046875, 0.3107452392578125, 0.32635498046875, 0.3419647216796875, 0.357574462890625, 0.3731842041015625, 0.3887939453125, 0.4044036865234375, 0.420013427734375, 0.4356231689453125, 0.45123291015625, 0.4668426513671875, 0.482452392578125, 0.4980621337890625, 0.513671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 3.0, 9.0, 11.0, 25.0, 48.0, 43.0, 74.0, 126.0, 227.0, 399.0, 1180.0, 999.0, 374.0, 201.0, 126.0, 65.0, 38.0, 29.0, 25.0, 15.0, 10.0, 9.0, 8.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.05126953125, -0.04966545104980469, -0.048061370849609375, -0.04645729064941406, -0.04485321044921875, -0.04324913024902344, -0.041645050048828125, -0.04004096984863281, -0.0384368896484375, -0.03683280944824219, -0.035228729248046875, -0.03362464904785156, -0.03202056884765625, -0.030416488647460938, -0.028812408447265625, -0.027208328247070312, -0.025604248046875, -0.024000167846679688, -0.022396087646484375, -0.020792007446289062, -0.01918792724609375, -0.017583847045898438, -0.015979766845703125, -0.014375686645507812, -0.0127716064453125, -0.011167526245117188, -0.009563446044921875, -0.007959365844726562, -0.00635528564453125, -0.0047512054443359375, -0.003147125244140625, -0.0015430450439453125, 6.103515625e-05, 0.0016651153564453125, 0.003269195556640625, 0.0048732757568359375, 0.00647735595703125, 0.008081436157226562, 0.009685516357421875, 0.011289596557617188, 0.0128936767578125, 0.014497756958007812, 0.016101837158203125, 0.017705917358398438, 0.01930999755859375, 0.020914077758789062, 0.022518157958984375, 0.024122238159179688, 0.025726318359375, 0.027330398559570312, 0.028934478759765625, 0.030538558959960938, 0.03214263916015625, 0.03374671936035156, 0.035350799560546875, 0.03695487976074219, 0.0385589599609375, 0.04016304016113281, 0.041767120361328125, 0.04337120056152344, 0.04497528076171875, 0.04657936096191406, 0.048183441162109375, 0.04978752136230469, 0.0513916015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 10.0, 21.0, 36.0, 49.0, 122.0, 194.0, 197.0, 162.0, 103.0, 52.0, 27.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23055657744407654, -0.2192464917898178, -0.20793640613555908, -0.19662630558013916, -0.18531623482704163, -0.1740061342716217, -0.16269604861736298, -0.15138596296310425, -0.14007587730884552, -0.1287657916545868, -0.11745570600032806, -0.10614561289548874, -0.09483552724123001, -0.08352544158697128, -0.07221534848213196, -0.06090526282787323, -0.0495951771736145, -0.038285091519355774, -0.026975002139806747, -0.01566491276025772, -0.004354827105998993, 0.006955258548259735, 0.01826535165309906, 0.029575437307357788, 0.040885522961616516, 0.052195608615875244, 0.06350569427013397, 0.0748157873749733, 0.08612587302923203, 0.09743595868349075, 0.10874605178833008, 0.1200561374425888, 0.13136622309684753, 0.14267630875110626, 0.153986394405365, 0.1652964949607849, 0.17660656571388245, 0.18791666626930237, 0.1992267519235611, 0.21053683757781982, 0.22184692323207855, 0.23315700888633728, 0.244467094540596, 0.25577718019485474, 0.26708728075027466, 0.2783973515033722, 0.2897074520587921, 0.30101752281188965, 0.31232762336730957, 0.3236377239227295, 0.334947794675827, 0.34625789523124695, 0.3575679659843445, 0.3688780665397644, 0.3801881670951843, 0.39149823784828186, 0.4028083086013794, 0.4141184091567993, 0.42542847990989685, 0.4367385804653168, 0.4480486512184143, 0.45935875177383423, 0.47066885232925415, 0.4819789230823517, 0.4932890236377716]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 5.0, 13.0, 8.0, 17.0, 16.0, 29.0, 33.0, 40.0, 42.0, 69.0, 69.0, 75.0, 44.0, 57.0, 92.0, 61.0, 60.0, 52.0, 47.0, 30.0, 40.0, 33.0, 15.0, 9.0, 16.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.190393328666687, -0.18349000811576843, -0.17658667266368866, -0.16968335211277008, -0.1627800166606903, -0.15587669610977173, -0.14897337555885315, -0.14207004010677338, -0.1351667046546936, -0.12826338410377502, -0.12136004865169525, -0.11445672810077667, -0.1075533926486969, -0.10065007209777832, -0.09374674409627914, -0.08684341609477997, -0.07994009554386139, -0.07303676754236221, -0.06613343954086304, -0.05923011526465416, -0.052326787263154984, -0.04542345926165581, -0.03852013498544693, -0.031616806983947754, -0.024713478982448578, -0.017810150980949402, -0.010906824842095375, -0.004003498703241348, 0.0028998292982578278, 0.009803157299757004, 0.01670648157596588, 0.023609809577465057, 0.030513137578964233, 0.03741646558046341, 0.044319793581962585, 0.05122311785817146, 0.05812644585967064, 0.06502977013587952, 0.07193309813737869, 0.07883642613887787, 0.08573975414037704, 0.09264308214187622, 0.0995464101433754, 0.10644973814487457, 0.11335305869579315, 0.12025639414787292, 0.1271597146987915, 0.13406303524971008, 0.14096637070178986, 0.14786969125270844, 0.1547730267047882, 0.1616763472557068, 0.16857968270778656, 0.17548300325870514, 0.1823863387107849, 0.1892896592617035, 0.19619297981262207, 0.20309630036354065, 0.20999963581562042, 0.216902956366539, 0.22380629181861877, 0.23070961236953735, 0.23761293292045593, 0.2445162683725357, 0.2514196038246155]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 10.0, 4.0, 11.0, 14.0, 32.0, 48.0, 56.0, 98.0, 150.0, 253.0, 402.0, 644.0, 1341.0, 2765.0, 6072.0, 17860.0, 80985.0, 634008.0, 250102.0, 34985.0, 10445.0, 4107.0, 1921.0, 935.0, 514.0, 302.0, 182.0, 112.0, 69.0, 55.0, 27.0, 11.0, 14.0, 11.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3095703125, -0.3006629943847656, -0.29175567626953125, -0.2828483581542969, -0.2739410400390625, -0.2650337219238281, -0.25612640380859375, -0.24721908569335938, -0.238311767578125, -0.22940444946289062, -0.22049713134765625, -0.21158981323242188, -0.2026824951171875, -0.19377517700195312, -0.18486785888671875, -0.17596054077148438, -0.16705322265625, -0.15814590454101562, -0.14923858642578125, -0.14033126831054688, -0.1314239501953125, -0.12251663208007812, -0.11360931396484375, -0.10470199584960938, -0.095794677734375, -0.08688735961914062, -0.07798004150390625, -0.06907272338867188, -0.0601654052734375, -0.051258087158203125, -0.04235076904296875, -0.033443450927734375, -0.0245361328125, -0.015628814697265625, -0.00672149658203125, 0.002185821533203125, 0.0110931396484375, 0.020000457763671875, 0.02890777587890625, 0.037815093994140625, 0.046722412109375, 0.055629730224609375, 0.06453704833984375, 0.07344436645507812, 0.0823516845703125, 0.09125900268554688, 0.10016632080078125, 0.10907363891601562, 0.11798095703125, 0.12688827514648438, 0.13579559326171875, 0.14470291137695312, 0.1536102294921875, 0.16251754760742188, 0.17142486572265625, 0.18033218383789062, 0.189239501953125, 0.19814682006835938, 0.20705413818359375, 0.21596145629882812, 0.2248687744140625, 0.23377609252929688, 0.24268341064453125, 0.2515907287597656, 0.260498046875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 9.0, 5.0, 2.0, 10.0, 7.0, 13.0, 25.0, 35.0, 67.0, 122.0, 139.0, 187.0, 136.0, 89.0, 54.0, 36.0, 15.0, 16.0, 9.0, 5.0, 8.0, 3.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026641845703125, -0.025508880615234375, -0.02437591552734375, -0.023242950439453125, -0.0221099853515625, -0.020977020263671875, -0.01984405517578125, -0.018711090087890625, -0.017578125, -0.016445159912109375, -0.01531219482421875, -0.014179229736328125, -0.0130462646484375, -0.011913299560546875, -0.01078033447265625, -0.009647369384765625, -0.008514404296875, -0.007381439208984375, -0.00624847412109375, -0.005115509033203125, -0.0039825439453125, -0.002849578857421875, -0.00171661376953125, -0.000583648681640625, 0.00054931640625, 0.001682281494140625, 0.00281524658203125, 0.003948211669921875, 0.0050811767578125, 0.006214141845703125, 0.00734710693359375, 0.008480072021484375, 0.009613037109375, 0.010746002197265625, 0.01187896728515625, 0.013011932373046875, 0.0141448974609375, 0.015277862548828125, 0.01641082763671875, 0.017543792724609375, 0.0186767578125, 0.019809722900390625, 0.02094268798828125, 0.022075653076171875, 0.0232086181640625, 0.024341583251953125, 0.02547454833984375, 0.026607513427734375, 0.027740478515625, 0.028873443603515625, 0.03000640869140625, 0.031139373779296875, 0.0322723388671875, 0.033405303955078125, 0.03453826904296875, 0.035671234130859375, 0.03680419921875, 0.037937164306640625, 0.03907012939453125, 0.040203094482421875, 0.0413360595703125, 0.042469024658203125, 0.04360198974609375, 0.044734954833984375, 0.045867919921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 8.0, 9.0, 8.0, 12.0, 16.0, 22.0, 23.0, 45.0, 56.0, 91.0, 110.0, 136.0, 235.0, 351.0, 608.0, 946.0, 2047.0, 5641.0, 20901.0, 99329.0, 428665.0, 379223.0, 82662.0, 17996.0, 5079.0, 1775.0, 920.0, 533.0, 331.0, 220.0, 149.0, 106.0, 66.0, 56.0, 38.0, 27.0, 34.0, 8.0, 20.0, 11.0, 8.0, 7.0, 4.0, 6.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.2344970703125, -0.22758865356445312, -0.22068023681640625, -0.21377182006835938, -0.2068634033203125, -0.19995498657226562, -0.19304656982421875, -0.18613815307617188, -0.179229736328125, -0.17232131958007812, -0.16541290283203125, -0.15850448608398438, -0.1515960693359375, -0.14468765258789062, -0.13777923583984375, -0.13087081909179688, -0.12396240234375, -0.11705398559570312, -0.11014556884765625, -0.10323715209960938, -0.0963287353515625, -0.08942031860351562, -0.08251190185546875, -0.07560348510742188, -0.068695068359375, -0.061786651611328125, -0.05487823486328125, -0.047969818115234375, -0.0410614013671875, -0.034152984619140625, -0.02724456787109375, -0.020336151123046875, -0.013427734375, -0.006519317626953125, 0.00038909912109375, 0.007297515869140625, 0.0142059326171875, 0.021114349365234375, 0.02802276611328125, 0.034931182861328125, 0.041839599609375, 0.048748016357421875, 0.05565643310546875, 0.06256484985351562, 0.0694732666015625, 0.07638168334960938, 0.08329010009765625, 0.09019851684570312, 0.09710693359375, 0.10401535034179688, 0.11092376708984375, 0.11783218383789062, 0.1247406005859375, 0.13164901733398438, 0.13855743408203125, 0.14546585083007812, 0.152374267578125, 0.15928268432617188, 0.16619110107421875, 0.17309951782226562, 0.1800079345703125, 0.18691635131835938, 0.19382476806640625, 0.20073318481445312, 0.2076416015625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 8.0, 8.0, 14.0, 20.0, 12.0, 22.0, 33.0, 26.0, 31.0, 32.0, 44.0, 38.0, 32.0, 48.0, 42.0, 50.0, 53.0, 36.0, 37.0, 45.0, 41.0, 43.0, 39.0, 29.0, 24.0, 28.0, 22.0, 21.0, 18.0, 18.0, 14.0, 15.0, 6.0, 9.0, 6.0, 6.0, 0.0, 4.0, 7.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.104736328125, -0.1015481948852539, -0.09836006164550781, -0.09517192840576172, -0.09198379516601562, -0.08879566192626953, -0.08560752868652344, -0.08241939544677734, -0.07923126220703125, -0.07604312896728516, -0.07285499572753906, -0.06966686248779297, -0.06647872924804688, -0.06329059600830078, -0.06010246276855469, -0.056914329528808594, -0.0537261962890625, -0.050538063049316406, -0.04734992980957031, -0.04416179656982422, -0.040973663330078125, -0.03778553009033203, -0.03459739685058594, -0.031409263610839844, -0.02822113037109375, -0.025032997131347656, -0.021844863891601562, -0.01865673065185547, -0.015468597412109375, -0.012280464172363281, -0.009092330932617188, -0.005904197692871094, -0.002716064453125, 0.00047206878662109375, 0.0036602020263671875, 0.006848335266113281, 0.010036468505859375, 0.013224601745605469, 0.016412734985351562, 0.019600868225097656, 0.02278900146484375, 0.025977134704589844, 0.029165267944335938, 0.03235340118408203, 0.035541534423828125, 0.03872966766357422, 0.04191780090332031, 0.045105934143066406, 0.0482940673828125, 0.051482200622558594, 0.05467033386230469, 0.05785846710205078, 0.061046600341796875, 0.06423473358154297, 0.06742286682128906, 0.07061100006103516, 0.07379913330078125, 0.07698726654052734, 0.08017539978027344, 0.08336353302001953, 0.08655166625976562, 0.08973979949951172, 0.09292793273925781, 0.0961160659790039, 0.09930419921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 11.0, 14.0, 19.0, 39.0, 49.0, 98.0, 147.0, 283.0, 577.0, 1304.0, 3469.0, 10326.0, 35400.0, 138259.0, 448897.0, 302546.0, 76231.0, 20347.0, 6317.0, 2298.0, 936.0, 411.0, 244.0, 128.0, 77.0, 29.0, 27.0, 17.0, 13.0, 11.0, 9.0, 9.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.133056640625, -0.12873458862304688, -0.12441253662109375, -0.12009048461914062, -0.1157684326171875, -0.11144638061523438, -0.10712432861328125, -0.10280227661132812, -0.098480224609375, -0.09415817260742188, -0.08983612060546875, -0.08551406860351562, -0.0811920166015625, -0.07686996459960938, -0.07254791259765625, -0.06822586059570312, -0.06390380859375, -0.059581756591796875, -0.05525970458984375, -0.050937652587890625, -0.0466156005859375, -0.042293548583984375, -0.03797149658203125, -0.033649444580078125, -0.029327392578125, -0.025005340576171875, -0.02068328857421875, -0.016361236572265625, -0.0120391845703125, -0.007717132568359375, -0.00339508056640625, 0.000926971435546875, 0.0052490234375, 0.009571075439453125, 0.01389312744140625, 0.018215179443359375, 0.0225372314453125, 0.026859283447265625, 0.03118133544921875, 0.035503387451171875, 0.039825439453125, 0.044147491455078125, 0.04846954345703125, 0.052791595458984375, 0.0571136474609375, 0.061435699462890625, 0.06575775146484375, 0.07007980346679688, 0.07440185546875, 0.07872390747070312, 0.08304595947265625, 0.08736801147460938, 0.0916900634765625, 0.09601211547851562, 0.10033416748046875, 0.10465621948242188, 0.108978271484375, 0.11330032348632812, 0.11762237548828125, 0.12194442749023438, 0.1262664794921875, 0.13058853149414062, 0.13491058349609375, 0.13923263549804688, 0.1435546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 12.0, 4.0, 7.0, 13.0, 12.0, 26.0, 32.0, 53.0, 58.0, 76.0, 97.0, 102.0, 126.0, 101.0, 81.0, 78.0, 40.0, 26.0, 18.0, 16.0, 10.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001957416534423828, -0.0001909509301185608, -0.00018616020679473877, -0.00018136948347091675, -0.00017657876014709473, -0.0001717880368232727, -0.00016699731349945068, -0.00016220659017562866, -0.00015741586685180664, -0.00015262514352798462, -0.0001478344202041626, -0.00014304369688034058, -0.00013825297355651855, -0.00013346225023269653, -0.0001286715269088745, -0.0001238808035850525, -0.00011909008026123047, -0.00011429935693740845, -0.00010950863361358643, -0.0001047179102897644, -9.992718696594238e-05, -9.513646364212036e-05, -9.034574031829834e-05, -8.555501699447632e-05, -8.07642936706543e-05, -7.597357034683228e-05, -7.118284702301025e-05, -6.639212369918823e-05, -6.160140037536621e-05, -5.681067705154419e-05, -5.201995372772217e-05, -4.7229230403900146e-05, -4.2438507080078125e-05, -3.7647783756256104e-05, -3.285706043243408e-05, -2.806633710861206e-05, -2.327561378479004e-05, -1.8484890460968018e-05, -1.3694167137145996e-05, -8.903443813323975e-06, -4.112720489501953e-06, 6.780028343200684e-07, 5.46872615814209e-06, 1.0259449481964111e-05, 1.5050172805786133e-05, 1.9840896129608154e-05, 2.4631619453430176e-05, 2.9422342777252197e-05, 3.421306610107422e-05, 3.900378942489624e-05, 4.379451274871826e-05, 4.858523607254028e-05, 5.3375959396362305e-05, 5.8166682720184326e-05, 6.295740604400635e-05, 6.774812936782837e-05, 7.253885269165039e-05, 7.732957601547241e-05, 8.212029933929443e-05, 8.691102266311646e-05, 9.170174598693848e-05, 9.64924693107605e-05, 0.00010128319263458252, 0.00010607391595840454, 0.00011086463928222656]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 12.0, 9.0, 18.0, 38.0, 45.0, 95.0, 176.0, 330.0, 785.0, 1996.0, 8084.0, 64900.0, 684823.0, 259438.0, 21568.0, 3944.0, 1227.0, 512.0, 220.0, 135.0, 79.0, 39.0, 25.0, 15.0, 10.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2010498046875, -0.1929302215576172, -0.18481063842773438, -0.17669105529785156, -0.16857147216796875, -0.16045188903808594, -0.15233230590820312, -0.1442127227783203, -0.1360931396484375, -0.1279735565185547, -0.11985397338867188, -0.11173439025878906, -0.10361480712890625, -0.09549522399902344, -0.08737564086914062, -0.07925605773925781, -0.071136474609375, -0.06301689147949219, -0.054897308349609375, -0.04677772521972656, -0.03865814208984375, -0.030538558959960938, -0.022418975830078125, -0.014299392700195312, -0.0061798095703125, 0.0019397735595703125, 0.010059356689453125, 0.018178939819335938, 0.02629852294921875, 0.03441810607910156, 0.042537689208984375, 0.05065727233886719, 0.05877685546875, 0.06689643859863281, 0.07501602172851562, 0.08313560485839844, 0.09125518798828125, 0.09937477111816406, 0.10749435424804688, 0.11561393737792969, 0.1237335205078125, 0.1318531036376953, 0.13997268676757812, 0.14809226989746094, 0.15621185302734375, 0.16433143615722656, 0.17245101928710938, 0.1805706024169922, 0.188690185546875, 0.1968097686767578, 0.20492935180664062, 0.21304893493652344, 0.22116851806640625, 0.22928810119628906, 0.23740768432617188, 0.2455272674560547, 0.2536468505859375, 0.2617664337158203, 0.2698860168457031, 0.27800559997558594, 0.28612518310546875, 0.29424476623535156, 0.3023643493652344, 0.3104839324951172, 0.318603515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 1.0, 5.0, 7.0, 10.0, 25.0, 29.0, 43.0, 40.0, 80.0, 109.0, 119.0, 112.0, 121.0, 86.0, 60.0, 42.0, 29.0, 24.0, 17.0, 8.0, 10.0, 9.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09344482421875, -0.0897531509399414, -0.08606147766113281, -0.08236980438232422, -0.07867813110351562, -0.07498645782470703, -0.07129478454589844, -0.06760311126708984, -0.06391143798828125, -0.060219764709472656, -0.05652809143066406, -0.05283641815185547, -0.049144744873046875, -0.04545307159423828, -0.04176139831542969, -0.038069725036621094, -0.0343780517578125, -0.030686378479003906, -0.026994705200195312, -0.02330303192138672, -0.019611358642578125, -0.01591968536376953, -0.012228012084960938, -0.008536338806152344, -0.00484466552734375, -0.0011529922485351562, 0.0025386810302734375, 0.006230354309082031, 0.009922027587890625, 0.013613700866699219, 0.017305374145507812, 0.020997047424316406, 0.024688720703125, 0.028380393981933594, 0.03207206726074219, 0.03576374053955078, 0.039455413818359375, 0.04314708709716797, 0.04683876037597656, 0.050530433654785156, 0.05422210693359375, 0.057913780212402344, 0.06160545349121094, 0.06529712677001953, 0.06898880004882812, 0.07268047332763672, 0.07637214660644531, 0.0800638198852539, 0.0837554931640625, 0.0874471664428711, 0.09113883972167969, 0.09483051300048828, 0.09852218627929688, 0.10221385955810547, 0.10590553283691406, 0.10959720611572266, 0.11328887939453125, 0.11698055267333984, 0.12067222595214844, 0.12436389923095703, 0.12805557250976562, 0.13174724578857422, 0.1354389190673828, 0.1391305923461914, 0.142822265625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 7.0, 20.0, 166.0, 540.0, 237.0, 37.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0903329849243164, -0.9469664096832275, -0.8035998344421387, -0.6602333188056946, -0.5168667435646057, -0.37350016832351685, -0.23013365268707275, -0.08676707744598389, 0.05659949779510498, 0.19996605813503265, 0.3433326184749603, 0.4866991639137268, 0.6300657391548157, 0.7734323143959045, 0.9167988300323486, 1.0601654052734375, 1.2035319805145264, 1.3468985557556152, 1.490265130996704, 1.633631706237793, 1.7769982814788818, 1.9203648567199707, 2.0637311935424805, 2.2070980072021484, 2.350464344024658, 2.493830919265747, 2.637197494506836, 2.780564069747925, 2.9239306449890137, 3.0672972202301025, 3.2106637954711914, 3.354030132293701, 3.497396945953369, 3.640763521194458, 3.784130096435547, 3.9274966716766357, 4.070863246917725, 4.214229583740234, 4.357596397399902, 4.500962734222412, 4.64432954788208, 4.78769588470459, 4.931062698364258, 5.074429035186768, 5.2177958488464355, 5.361162185668945, 5.504528999328613, 5.647895336151123, 5.791261672973633, 5.934628009796143, 6.0779948234558105, 6.22136116027832, 6.364727973937988, 6.508094310760498, 6.651461124420166, 6.794827461242676, 6.938194274902344, 7.0815606117248535, 7.2249274253845215, 7.368293762207031, 7.511660575866699, 7.655026912689209, 7.798393726348877, 7.941760063171387, 8.085126876831055]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 13.0, 16.0, 17.0, 13.0, 23.0, 21.0, 30.0, 31.0, 31.0, 40.0, 49.0, 44.0, 46.0, 46.0, 58.0, 50.0, 53.0, 45.0, 49.0, 33.0, 28.0, 42.0, 29.0, 29.0, 25.0, 24.0, 22.0, 14.0, 19.0, 8.0, 6.0, 11.0, 1.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8151053190231323, -0.7894560694694519, -0.7638068199157715, -0.7381575107574463, -0.7125082612037659, -0.6868590116500854, -0.6612097024917603, -0.6355604529380798, -0.6099112033843994, -0.584261953830719, -0.5586127042770386, -0.5329633951187134, -0.507314145565033, -0.48166489601135254, -0.45601561665534973, -0.4303663372993469, -0.4047170877456665, -0.3790678381919861, -0.3534185588359833, -0.32776927947998047, -0.30212002992630005, -0.27647078037261963, -0.2508215010166168, -0.2251722365617752, -0.1995229721069336, -0.17387370765209198, -0.14822444319725037, -0.12257517874240875, -0.09692591428756714, -0.07127664983272552, -0.04562738537788391, -0.019978120923042297, 0.005671143531799316, 0.03132040798664093, 0.056969672441482544, 0.08261893689632416, 0.10826820135116577, 0.13391746580600739, 0.159566730260849, 0.1852159947156906, 0.21086525917053223, 0.23651452362537384, 0.26216378808021545, 0.28781306743621826, 0.3134623169898987, 0.3391115665435791, 0.3647608458995819, 0.3904101252555847, 0.41605937480926514, 0.44170862436294556, 0.46735790371894836, 0.49300718307495117, 0.5186564326286316, 0.544305682182312, 0.5699549913406372, 0.5956042408943176, 0.621253490447998, 0.6469027400016785, 0.6725519895553589, 0.6982012987136841, 0.7238505482673645, 0.7494997978210449, 0.7751491069793701, 0.8007983565330505, 0.826447606086731]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 8.0, 14.0, 14.0, 33.0, 57.0, 113.0, 252.0, 673.0, 1964.0, 9694.0, 146721.0, 3978404.0, 46697.0, 6299.0, 1818.0, 719.0, 331.0, 175.0, 113.0, 58.0, 42.0, 18.0, 13.0, 12.0, 11.0, 9.0, 4.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5094223022460938, -0.4875946044921875, -0.46576690673828125, -0.443939208984375, -0.42211151123046875, -0.4002838134765625, -0.37845611572265625, -0.35662841796875, -0.33480072021484375, -0.3129730224609375, -0.29114532470703125, -0.269317626953125, -0.24748992919921875, -0.2256622314453125, -0.20383453369140625, -0.1820068359375, -0.16017913818359375, -0.1383514404296875, -0.11652374267578125, -0.094696044921875, -0.07286834716796875, -0.0510406494140625, -0.02921295166015625, -0.00738525390625, 0.01444244384765625, 0.0362701416015625, 0.05809783935546875, 0.079925537109375, 0.10175323486328125, 0.1235809326171875, 0.14540863037109375, 0.167236328125, 0.18906402587890625, 0.2108917236328125, 0.23271942138671875, 0.254547119140625, 0.27637481689453125, 0.2982025146484375, 0.32003021240234375, 0.34185791015625, 0.36368560791015625, 0.3855133056640625, 0.40734100341796875, 0.429168701171875, 0.45099639892578125, 0.4728240966796875, 0.49465179443359375, 0.5164794921875, 0.5383071899414062, 0.5601348876953125, 0.5819625854492188, 0.603790283203125, 0.6256179809570312, 0.6474456787109375, 0.6692733764648438, 0.69110107421875, 0.7129287719726562, 0.7347564697265625, 0.7565841674804688, 0.778411865234375, 0.8002395629882812, 0.8220672607421875, 0.8438949584960938, 0.86572265625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 4.0, 5.0, 10.0, 14.0, 22.0, 32.0, 49.0, 83.0, 100.0, 115.0, 141.0, 127.0, 98.0, 52.0, 45.0, 33.0, 17.0, 15.0, 8.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03192138671875, -0.03061532974243164, -0.02930927276611328, -0.028003215789794922, -0.026697158813476562, -0.025391101837158203, -0.024085044860839844, -0.022778987884521484, -0.021472930908203125, -0.020166873931884766, -0.018860816955566406, -0.017554759979248047, -0.016248703002929688, -0.014942646026611328, -0.013636589050292969, -0.01233053207397461, -0.01102447509765625, -0.00971841812133789, -0.008412361145019531, -0.007106304168701172, -0.0058002471923828125, -0.004494190216064453, -0.0031881332397460938, -0.0018820762634277344, -0.000576019287109375, 0.0007300376892089844, 0.0020360946655273438, 0.003342151641845703, 0.0046482086181640625, 0.005954265594482422, 0.007260322570800781, 0.00856637954711914, 0.0098724365234375, 0.01117849349975586, 0.012484550476074219, 0.013790607452392578, 0.015096664428710938, 0.016402721405029297, 0.017708778381347656, 0.019014835357666016, 0.020320892333984375, 0.021626949310302734, 0.022933006286621094, 0.024239063262939453, 0.025545120239257812, 0.026851177215576172, 0.02815723419189453, 0.02946329116821289, 0.03076934814453125, 0.03207540512084961, 0.03338146209716797, 0.03468751907348633, 0.03599357604980469, 0.03729963302612305, 0.038605690002441406, 0.039911746978759766, 0.041217803955078125, 0.042523860931396484, 0.043829917907714844, 0.0451359748840332, 0.04644203186035156, 0.04774808883666992, 0.04905414581298828, 0.05036020278930664, 0.051666259765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 14.0, 20.0, 33.0, 42.0, 78.0, 104.0, 158.0, 284.0, 549.0, 1175.0, 2872.0, 8281.0, 32217.0, 197484.0, 3243902.0, 615722.0, 67908.0, 15114.0, 4719.0, 1777.0, 785.0, 407.0, 246.0, 134.0, 94.0, 44.0, 23.0, 30.0, 18.0, 10.0, 8.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28369140625, -0.274749755859375, -0.26580810546875, -0.256866455078125, -0.2479248046875, -0.238983154296875, -0.23004150390625, -0.221099853515625, -0.212158203125, -0.203216552734375, -0.19427490234375, -0.185333251953125, -0.1763916015625, -0.167449951171875, -0.15850830078125, -0.149566650390625, -0.140625, -0.131683349609375, -0.12274169921875, -0.113800048828125, -0.1048583984375, -0.095916748046875, -0.08697509765625, -0.078033447265625, -0.069091796875, -0.060150146484375, -0.05120849609375, -0.042266845703125, -0.0333251953125, -0.024383544921875, -0.01544189453125, -0.006500244140625, 0.00244140625, 0.011383056640625, 0.02032470703125, 0.029266357421875, 0.0382080078125, 0.047149658203125, 0.05609130859375, 0.065032958984375, 0.073974609375, 0.082916259765625, 0.09185791015625, 0.100799560546875, 0.1097412109375, 0.118682861328125, 0.12762451171875, 0.136566162109375, 0.1455078125, 0.154449462890625, 0.16339111328125, 0.172332763671875, 0.1812744140625, 0.190216064453125, 0.19915771484375, 0.208099365234375, 0.217041015625, 0.225982666015625, 0.23492431640625, 0.243865966796875, 0.2528076171875, 0.261749267578125, 0.27069091796875, 0.279632568359375, 0.28857421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 4.0, 8.0, 10.0, 9.0, 25.0, 23.0, 30.0, 60.0, 107.0, 119.0, 186.0, 379.0, 1064.0, 1072.0, 367.0, 181.0, 127.0, 87.0, 57.0, 35.0, 27.0, 20.0, 10.0, 13.0, 12.0, 5.0, 2.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.055877685546875, -0.054131507873535156, -0.05238533020019531, -0.05063915252685547, -0.048892974853515625, -0.04714679718017578, -0.04540061950683594, -0.043654441833496094, -0.04190826416015625, -0.040162086486816406, -0.03841590881347656, -0.03666973114013672, -0.034923553466796875, -0.03317737579345703, -0.03143119812011719, -0.029685020446777344, -0.0279388427734375, -0.026192665100097656, -0.024446487426757812, -0.02270030975341797, -0.020954132080078125, -0.01920795440673828, -0.017461776733398438, -0.015715599060058594, -0.01396942138671875, -0.012223243713378906, -0.010477066040039062, -0.008730888366699219, -0.006984710693359375, -0.005238533020019531, -0.0034923553466796875, -0.0017461776733398438, 0.0, 0.0017461776733398438, 0.0034923553466796875, 0.005238533020019531, 0.006984710693359375, 0.008730888366699219, 0.010477066040039062, 0.012223243713378906, 0.01396942138671875, 0.015715599060058594, 0.017461776733398438, 0.01920795440673828, 0.020954132080078125, 0.02270030975341797, 0.024446487426757812, 0.026192665100097656, 0.0279388427734375, 0.029685020446777344, 0.03143119812011719, 0.03317737579345703, 0.034923553466796875, 0.03666973114013672, 0.03841590881347656, 0.040162086486816406, 0.04190826416015625, 0.043654441833496094, 0.04540061950683594, 0.04714679718017578, 0.048892974853515625, 0.05063915252685547, 0.05238533020019531, 0.054131507873535156, 0.055877685546875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 10.0, 27.0, 60.0, 160.0, 278.0, 278.0, 126.0, 45.0, 22.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46466049551963806, -0.4400393068790436, -0.4154181480407715, -0.390796959400177, -0.3661757707595825, -0.3415546119213104, -0.31693342328071594, -0.29231226444244385, -0.26769107580184937, -0.24306990206241608, -0.2184487283229828, -0.1938275396823883, -0.16920636594295502, -0.14458519220352173, -0.11996400356292725, -0.09534282982349396, -0.07072165608406067, -0.04610047861933708, -0.021479301154613495, 0.0031418800354003906, 0.02776305377483368, 0.05238422751426697, 0.07700541615486145, 0.10162658989429474, 0.12624776363372803, 0.15086893737316132, 0.1754901111125946, 0.2001112997531891, 0.22473247349262238, 0.24935364723205566, 0.27397483587265015, 0.29859602451324463, 0.32321715354919434, 0.3478383421897888, 0.3724595010280609, 0.3970806896686554, 0.4217018485069275, 0.446323037147522, 0.47094422578811646, 0.49556541442871094, 0.5201865434646606, 0.5448077321052551, 0.5694289207458496, 0.5940500497817993, 0.6186712384223938, 0.6432924270629883, 0.6679136157035828, 0.6925348043441772, 0.7171559929847717, 0.7417771816253662, 0.7663983702659607, 0.7910195589065552, 0.8156406879425049, 0.8402618765830994, 0.8648830652236938, 0.8895042538642883, 0.9141254425048828, 0.9387466311454773, 0.9633678197860718, 0.9879889488220215, 1.0126101970672607, 1.0372313261032104, 1.0618524551391602, 1.0864737033843994, 1.1110948324203491]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 10.0, 12.0, 10.0, 13.0, 15.0, 30.0, 36.0, 27.0, 37.0, 40.0, 34.0, 59.0, 43.0, 50.0, 47.0, 59.0, 46.0, 47.0, 45.0, 52.0, 54.0, 47.0, 35.0, 26.0, 24.0, 28.0, 22.0, 15.0, 11.0, 9.0, 7.0, 7.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21724176406860352, -0.20990778505802155, -0.20257382094860077, -0.1952398419380188, -0.18790587782859802, -0.18057189881801605, -0.17323791980743408, -0.1659039556980133, -0.15856999158859253, -0.15123601257801056, -0.14390204846858978, -0.1365680694580078, -0.12923410534858704, -0.12190012633800507, -0.11456615477800369, -0.10723218321800232, -0.09989820420742035, -0.09256423264741898, -0.0852302610874176, -0.07789628207683563, -0.07056231796741486, -0.06322833895683289, -0.05589436739683151, -0.04856039583683014, -0.041226424276828766, -0.03389245271682739, -0.02655847929418087, -0.019224505871534348, -0.011890534311532974, -0.004556562751531601, 0.002777412533760071, 0.010111384093761444, 0.017445355653762817, 0.02477932721376419, 0.032113298773765564, 0.039447274059057236, 0.04678124561905861, 0.05411521717905998, 0.061449192464351654, 0.06878316402435303, 0.0761171355843544, 0.08345110714435577, 0.09078507870435715, 0.09811905026435852, 0.10545302927494049, 0.11278699338436127, 0.12012097239494324, 0.127454936504364, 0.13478891551494598, 0.14212289452552795, 0.14945685863494873, 0.1567908376455307, 0.16412480175495148, 0.17145878076553345, 0.17879274487495422, 0.1861267238855362, 0.19346070289611816, 0.20079468190670013, 0.2081286460161209, 0.21546262502670288, 0.22279658913612366, 0.23013056814670563, 0.2374645471572876, 0.24479851126670837, 0.25213247537612915]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 6.0, 11.0, 21.0, 27.0, 46.0, 72.0, 103.0, 194.0, 328.0, 602.0, 1051.0, 2283.0, 5206.0, 16183.0, 71798.0, 368521.0, 454566.0, 95551.0, 20430.0, 6194.0, 2545.0, 1206.0, 633.0, 393.0, 230.0, 129.0, 78.0, 41.0, 30.0, 19.0, 12.0, 12.0, 5.0, 4.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.246826171875, -0.2391338348388672, -0.23144149780273438, -0.22374916076660156, -0.21605682373046875, -0.20836448669433594, -0.20067214965820312, -0.1929798126220703, -0.1852874755859375, -0.1775951385498047, -0.16990280151367188, -0.16221046447753906, -0.15451812744140625, -0.14682579040527344, -0.13913345336914062, -0.1314411163330078, -0.123748779296875, -0.11605644226074219, -0.10836410522460938, -0.10067176818847656, -0.09297943115234375, -0.08528709411621094, -0.07759475708007812, -0.06990242004394531, -0.0622100830078125, -0.05451774597167969, -0.046825408935546875, -0.03913307189941406, -0.03144073486328125, -0.023748397827148438, -0.016056060791015625, -0.008363723754882812, -0.00067138671875, 0.0070209503173828125, 0.014713287353515625, 0.022405624389648438, 0.03009796142578125, 0.03779029846191406, 0.045482635498046875, 0.05317497253417969, 0.0608673095703125, 0.06855964660644531, 0.07625198364257812, 0.08394432067871094, 0.09163665771484375, 0.09932899475097656, 0.10702133178710938, 0.11471366882324219, 0.122406005859375, 0.1300983428955078, 0.13779067993164062, 0.14548301696777344, 0.15317535400390625, 0.16086769104003906, 0.16856002807617188, 0.1762523651123047, 0.1839447021484375, 0.1916370391845703, 0.19932937622070312, 0.20702171325683594, 0.21471405029296875, 0.22240638732910156, 0.23009872436523438, 0.2377910614013672, 0.2454833984375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 7.0, 10.0, 28.0, 38.0, 63.0, 82.0, 118.0, 135.0, 130.0, 103.0, 90.0, 74.0, 35.0, 26.0, 15.0, 10.0, 8.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0362548828125, -0.03481149673461914, -0.03336811065673828, -0.03192472457885742, -0.030481338500976562, -0.029037952423095703, -0.027594566345214844, -0.026151180267333984, -0.024707794189453125, -0.023264408111572266, -0.021821022033691406, -0.020377635955810547, -0.018934249877929688, -0.017490863800048828, -0.01604747772216797, -0.01460409164428711, -0.01316070556640625, -0.01171731948852539, -0.010273933410644531, -0.008830547332763672, -0.0073871612548828125, -0.005943775177001953, -0.004500389099121094, -0.0030570030212402344, -0.001613616943359375, -0.00017023086547851562, 0.0012731552124023438, 0.002716541290283203, 0.0041599273681640625, 0.005603313446044922, 0.007046699523925781, 0.00849008560180664, 0.0099334716796875, 0.01137685775756836, 0.012820243835449219, 0.014263629913330078, 0.015707015991210938, 0.017150402069091797, 0.018593788146972656, 0.020037174224853516, 0.021480560302734375, 0.022923946380615234, 0.024367332458496094, 0.025810718536376953, 0.027254104614257812, 0.028697490692138672, 0.03014087677001953, 0.03158426284790039, 0.03302764892578125, 0.03447103500366211, 0.03591442108154297, 0.03735780715942383, 0.03880119323730469, 0.04024457931518555, 0.041687965393066406, 0.043131351470947266, 0.044574737548828125, 0.046018123626708984, 0.047461509704589844, 0.0489048957824707, 0.05034828186035156, 0.05179166793823242, 0.05323505401611328, 0.05467844009399414, 0.056121826171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 10.0, 12.0, 13.0, 16.0, 32.0, 34.0, 53.0, 89.0, 111.0, 142.0, 206.0, 392.0, 528.0, 1079.0, 2285.0, 7582.0, 35144.0, 185977.0, 563383.0, 200692.0, 37642.0, 7719.0, 2502.0, 1094.0, 632.0, 351.0, 256.0, 165.0, 99.0, 92.0, 51.0, 49.0, 31.0, 20.0, 21.0, 13.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.277099609375, -0.2688331604003906, -0.26056671142578125, -0.2523002624511719, -0.2440338134765625, -0.23576736450195312, -0.22750091552734375, -0.21923446655273438, -0.210968017578125, -0.20270156860351562, -0.19443511962890625, -0.18616867065429688, -0.1779022216796875, -0.16963577270507812, -0.16136932373046875, -0.15310287475585938, -0.14483642578125, -0.13656997680664062, -0.12830352783203125, -0.12003707885742188, -0.1117706298828125, -0.10350418090820312, -0.09523773193359375, -0.08697128295898438, -0.078704833984375, -0.07043838500976562, -0.06217193603515625, -0.053905487060546875, -0.0456390380859375, -0.037372589111328125, -0.02910614013671875, -0.020839691162109375, -0.0125732421875, -0.004306793212890625, 0.00395965576171875, 0.012226104736328125, 0.0204925537109375, 0.028759002685546875, 0.03702545166015625, 0.045291900634765625, 0.053558349609375, 0.061824798583984375, 0.07009124755859375, 0.07835769653320312, 0.0866241455078125, 0.09489059448242188, 0.10315704345703125, 0.11142349243164062, 0.11968994140625, 0.12795639038085938, 0.13622283935546875, 0.14448928833007812, 0.1527557373046875, 0.16102218627929688, 0.16928863525390625, 0.17755508422851562, 0.185821533203125, 0.19408798217773438, 0.20235443115234375, 0.21062088012695312, 0.2188873291015625, 0.22715377807617188, 0.23542022705078125, 0.24368667602539062, 0.251953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 6.0, 14.0, 14.0, 14.0, 11.0, 24.0, 28.0, 21.0, 29.0, 37.0, 27.0, 38.0, 41.0, 48.0, 40.0, 42.0, 36.0, 43.0, 43.0, 43.0, 49.0, 45.0, 35.0, 36.0, 29.0, 35.0, 24.0, 25.0, 32.0, 14.0, 16.0, 13.0, 10.0, 1.0, 8.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1168212890625, -0.11263275146484375, -0.1084442138671875, -0.10425567626953125, -0.100067138671875, -0.09587860107421875, -0.0916900634765625, -0.08750152587890625, -0.08331298828125, -0.07912445068359375, -0.0749359130859375, -0.07074737548828125, -0.066558837890625, -0.06237030029296875, -0.0581817626953125, -0.05399322509765625, -0.0498046875, -0.04561614990234375, -0.0414276123046875, -0.03723907470703125, -0.033050537109375, -0.02886199951171875, -0.0246734619140625, -0.02048492431640625, -0.01629638671875, -0.01210784912109375, -0.0079193115234375, -0.00373077392578125, 0.000457763671875, 0.00464630126953125, 0.0088348388671875, 0.01302337646484375, 0.0172119140625, 0.02140045166015625, 0.0255889892578125, 0.02977752685546875, 0.033966064453125, 0.03815460205078125, 0.0423431396484375, 0.04653167724609375, 0.05072021484375, 0.05490875244140625, 0.0590972900390625, 0.06328582763671875, 0.067474365234375, 0.07166290283203125, 0.0758514404296875, 0.08003997802734375, 0.084228515625, 0.08841705322265625, 0.0926055908203125, 0.09679412841796875, 0.100982666015625, 0.10517120361328125, 0.1093597412109375, 0.11354827880859375, 0.11773681640625, 0.12192535400390625, 0.1261138916015625, 0.13030242919921875, 0.134490966796875, 0.13867950439453125, 0.1428680419921875, 0.14705657958984375, 0.1512451171875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 10.0, 11.0, 16.0, 26.0, 56.0, 83.0, 90.0, 183.0, 253.0, 402.0, 615.0, 1064.0, 1795.0, 3153.0, 5992.0, 12668.0, 33084.0, 108619.0, 439013.0, 316686.0, 77593.0, 25128.0, 10346.0, 4946.0, 2700.0, 1514.0, 950.0, 554.0, 351.0, 257.0, 138.0, 79.0, 58.0, 46.0, 21.0, 17.0, 13.0, 7.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.1522216796875, -0.14820194244384766, -0.1441822052001953, -0.14016246795654297, -0.13614273071289062, -0.13212299346923828, -0.12810325622558594, -0.1240835189819336, -0.12006378173828125, -0.1160440444946289, -0.11202430725097656, -0.10800457000732422, -0.10398483276367188, -0.09996509552001953, -0.09594535827636719, -0.09192562103271484, -0.0879058837890625, -0.08388614654541016, -0.07986640930175781, -0.07584667205810547, -0.07182693481445312, -0.06780719757080078, -0.06378746032714844, -0.059767723083496094, -0.05574798583984375, -0.051728248596191406, -0.04770851135253906, -0.04368877410888672, -0.039669036865234375, -0.03564929962158203, -0.03162956237792969, -0.027609825134277344, -0.023590087890625, -0.019570350646972656, -0.015550613403320312, -0.011530876159667969, -0.007511138916015625, -0.0034914016723632812, 0.0005283355712890625, 0.004548072814941406, 0.00856781005859375, 0.012587547302246094, 0.016607284545898438, 0.02062702178955078, 0.024646759033203125, 0.02866649627685547, 0.03268623352050781, 0.036705970764160156, 0.0407257080078125, 0.044745445251464844, 0.04876518249511719, 0.05278491973876953, 0.056804656982421875, 0.06082439422607422, 0.06484413146972656, 0.0688638687133789, 0.07288360595703125, 0.0769033432006836, 0.08092308044433594, 0.08494281768798828, 0.08896255493164062, 0.09298229217529297, 0.09700202941894531, 0.10102176666259766, 0.10504150390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 4.0, 12.0, 11.0, 15.0, 27.0, 28.0, 42.0, 49.0, 63.0, 79.0, 68.0, 104.0, 83.0, 86.0, 72.0, 61.0, 46.0, 35.0, 31.0, 22.0, 10.0, 9.0, 9.0, 5.0, 4.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.939338684082031e-05, -7.642991840839386e-05, -7.346644997596741e-05, -7.050298154354095e-05, -6.75395131111145e-05, -6.457604467868805e-05, -6.16125762462616e-05, -5.8649107813835144e-05, -5.568563938140869e-05, -5.272217094898224e-05, -4.9758702516555786e-05, -4.6795234084129333e-05, -4.383176565170288e-05, -4.086829721927643e-05, -3.7904828786849976e-05, -3.494136035442352e-05, -3.197789192199707e-05, -2.9014423489570618e-05, -2.6050955057144165e-05, -2.3087486624717712e-05, -2.012401819229126e-05, -1.7160549759864807e-05, -1.4197081327438354e-05, -1.1233612895011902e-05, -8.27014446258545e-06, -5.306676030158997e-06, -2.343207597732544e-06, 6.202608346939087e-07, 3.5837292671203613e-06, 6.547197699546814e-06, 9.510666131973267e-06, 1.247413456439972e-05, 1.5437602996826172e-05, 1.8401071429252625e-05, 2.1364539861679077e-05, 2.432800829410553e-05, 2.7291476726531982e-05, 3.0254945158958435e-05, 3.321841359138489e-05, 3.618188202381134e-05, 3.914535045623779e-05, 4.2108818888664246e-05, 4.50722873210907e-05, 4.803575575351715e-05, 5.0999224185943604e-05, 5.3962692618370056e-05, 5.692616105079651e-05, 5.988962948322296e-05, 6.285309791564941e-05, 6.581656634807587e-05, 6.878003478050232e-05, 7.174350321292877e-05, 7.470697164535522e-05, 7.767044007778168e-05, 8.063390851020813e-05, 8.359737694263458e-05, 8.656084537506104e-05, 8.952431380748749e-05, 9.248778223991394e-05, 9.545125067234039e-05, 9.841471910476685e-05, 0.0001013781875371933, 0.00010434165596961975, 0.0001073051244020462, 0.00011026859283447266]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 11.0, 5.0, 14.0, 16.0, 17.0, 34.0, 50.0, 93.0, 129.0, 254.0, 518.0, 1198.0, 3362.0, 11996.0, 78885.0, 745973.0, 177455.0, 20409.0, 4977.0, 1671.0, 689.0, 313.0, 147.0, 109.0, 61.0, 47.0, 27.0, 19.0, 19.0, 7.0, 8.0, 2.0, 3.0, 7.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2371826171875, -0.2294483184814453, -0.22171401977539062, -0.21397972106933594, -0.20624542236328125, -0.19851112365722656, -0.19077682495117188, -0.1830425262451172, -0.1753082275390625, -0.1675739288330078, -0.15983963012695312, -0.15210533142089844, -0.14437103271484375, -0.13663673400878906, -0.12890243530273438, -0.12116813659667969, -0.113433837890625, -0.10569953918457031, -0.09796524047851562, -0.09023094177246094, -0.08249664306640625, -0.07476234436035156, -0.06702804565429688, -0.05929374694824219, -0.0515594482421875, -0.04382514953613281, -0.036090850830078125, -0.028356552124023438, -0.02062225341796875, -0.012887954711914062, -0.005153656005859375, 0.0025806427001953125, 0.01031494140625, 0.018049240112304688, 0.025783538818359375, 0.03351783752441406, 0.04125213623046875, 0.04898643493652344, 0.056720733642578125, 0.06445503234863281, 0.0721893310546875, 0.07992362976074219, 0.08765792846679688, 0.09539222717285156, 0.10312652587890625, 0.11086082458496094, 0.11859512329101562, 0.1263294219970703, 0.134063720703125, 0.1417980194091797, 0.14953231811523438, 0.15726661682128906, 0.16500091552734375, 0.17273521423339844, 0.18046951293945312, 0.1882038116455078, 0.1959381103515625, 0.2036724090576172, 0.21140670776367188, 0.21914100646972656, 0.22687530517578125, 0.23460960388183594, 0.24234390258789062, 0.2500782012939453, 0.2578125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 10.0, 11.0, 19.0, 20.0, 22.0, 24.0, 26.0, 31.0, 47.0, 74.0, 118.0, 127.0, 109.0, 81.0, 62.0, 44.0, 43.0, 24.0, 28.0, 9.0, 10.0, 14.0, 13.0, 5.0, 9.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09698486328125, -0.09393882751464844, -0.09089279174804688, -0.08784675598144531, -0.08480072021484375, -0.08175468444824219, -0.07870864868164062, -0.07566261291503906, -0.0726165771484375, -0.06957054138183594, -0.06652450561523438, -0.06347846984863281, -0.06043243408203125, -0.05738639831542969, -0.054340362548828125, -0.05129432678222656, -0.048248291015625, -0.04520225524902344, -0.042156219482421875, -0.03911018371582031, -0.03606414794921875, -0.03301811218261719, -0.029972076416015625, -0.026926040649414062, -0.0238800048828125, -0.020833969116210938, -0.017787933349609375, -0.014741897583007812, -0.01169586181640625, -0.008649826049804688, -0.005603790283203125, -0.0025577545166015625, 0.00048828125, 0.0035343170166015625, 0.006580352783203125, 0.009626388549804688, 0.01267242431640625, 0.015718460083007812, 0.018764495849609375, 0.021810531616210938, 0.0248565673828125, 0.027902603149414062, 0.030948638916015625, 0.03399467468261719, 0.03704071044921875, 0.04008674621582031, 0.043132781982421875, 0.04617881774902344, 0.049224853515625, 0.05227088928222656, 0.055316925048828125, 0.05836296081542969, 0.06140899658203125, 0.06445503234863281, 0.06750106811523438, 0.07054710388183594, 0.0735931396484375, 0.07663917541503906, 0.07968521118164062, 0.08273124694824219, 0.08577728271484375, 0.08882331848144531, 0.09186935424804688, 0.09491539001464844, 0.09796142578125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 13.0, 20.0, 76.0, 204.0, 299.0, 247.0, 97.0, 32.0, 10.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6724709272384644, -1.5774142742156982, -1.4823575019836426, -1.3873008489608765, -1.2922441959381104, -1.1971874237060547, -1.1021307706832886, -1.0070741176605225, -0.9120173454284668, -0.8169606328010559, -0.721903920173645, -0.6268472671508789, -0.531790554523468, -0.43673384189605713, -0.341677188873291, -0.24662047624588013, -0.15156376361846924, -0.05650706589221954, 0.03854963183403015, 0.13360631465911865, 0.22866302728652954, 0.32371973991394043, 0.41877639293670654, 0.5138331055641174, 0.6088898181915283, 0.7039465308189392, 0.7990032434463501, 0.8940598964691162, 0.9891166090965271, 1.084173321723938, 1.179229974746704, 1.2742867469787598, 1.3693432807922363, 1.4643999338150024, 1.559456706047058, 1.6545133590698242, 1.7495701313018799, 1.844626784324646, 1.939683437347412, 2.0347402095794678, 2.1297969818115234, 2.224853754043579, 2.3199102878570557, 2.4149670600891113, 2.510023832321167, 2.6050806045532227, 2.700137138366699, 2.795193910598755, 2.8902504444122314, 2.985307216644287, 3.0803637504577637, 3.1754205226898193, 3.270477294921875, 3.3655338287353516, 3.4605906009674072, 3.555647373199463, 3.6507039070129395, 3.745760679244995, 3.8408172130584717, 3.9358739852905273, 4.030930519104004, 4.125987529754639, 4.221044063568115, 4.316100597381592, 4.411157608032227]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 2.0, 12.0, 5.0, 8.0, 9.0, 10.0, 14.0, 12.0, 17.0, 21.0, 24.0, 26.0, 27.0, 40.0, 47.0, 30.0, 44.0, 36.0, 31.0, 46.0, 37.0, 37.0, 34.0, 36.0, 43.0, 40.0, 40.0, 41.0, 34.0, 41.0, 21.0, 27.0, 20.0, 10.0, 8.0, 10.0, 8.0, 13.0, 7.0, 5.0, 8.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8363328576087952, -0.8103107213973999, -0.7842886447906494, -0.7582665085792542, -0.7322444319725037, -0.7062222957611084, -0.6802002191543579, -0.6541780829429626, -0.6281559467315674, -0.6021338105201721, -0.5761117339134216, -0.5500895977020264, -0.5240675210952759, -0.4980453848838806, -0.47202327847480774, -0.44600117206573486, -0.4199790954589844, -0.3939569890499115, -0.3679348826408386, -0.34191274642944336, -0.31589066982269287, -0.2898685336112976, -0.26384642720222473, -0.23782432079315186, -0.21180221438407898, -0.1857801079750061, -0.15975800156593323, -0.13373588025569916, -0.10771377384662628, -0.0816916674375534, -0.055669546127319336, -0.02964743971824646, -0.0036252737045288086, 0.022396836429834366, 0.04841894656419754, 0.07444106042385101, 0.10046316683292389, 0.12648527324199677, 0.15250739455223083, 0.1785295009613037, 0.2045516073703766, 0.23057371377944946, 0.25659582018852234, 0.2826179265975952, 0.3086400628089905, 0.33466213941574097, 0.36068427562713623, 0.3867063820362091, 0.412728488445282, 0.43875059485435486, 0.46477270126342773, 0.490794837474823, 0.5168169140815735, 0.5428390502929688, 0.5688611268997192, 0.5948832631111145, 0.6209053993225098, 0.646927535533905, 0.6729496121406555, 0.6989717483520508, 0.7249938249588013, 0.7510159611701965, 0.7770380973815918, 0.8030601739883423, 0.8290822505950928]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 9.0, 16.0, 16.0, 51.0, 95.0, 196.0, 427.0, 1072.0, 3697.0, 20430.0, 383433.0, 3720993.0, 53244.0, 7164.0, 1992.0, 725.0, 329.0, 161.0, 89.0, 44.0, 27.0, 27.0, 14.0, 12.0, 4.0, 3.0, 5.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.325439453125, -0.3125267028808594, -0.29961395263671875, -0.2867012023925781, -0.2737884521484375, -0.2608757019042969, -0.24796295166015625, -0.23505020141601562, -0.222137451171875, -0.20922470092773438, -0.19631195068359375, -0.18339920043945312, -0.1704864501953125, -0.15757369995117188, -0.14466094970703125, -0.13174819946289062, -0.11883544921875, -0.10592269897460938, -0.09300994873046875, -0.08009719848632812, -0.0671844482421875, -0.054271697998046875, -0.04135894775390625, -0.028446197509765625, -0.015533447265625, -0.002620697021484375, 0.01029205322265625, 0.023204803466796875, 0.0361175537109375, 0.049030303955078125, 0.06194305419921875, 0.07485580444335938, 0.0877685546875, 0.10068130493164062, 0.11359405517578125, 0.12650680541992188, 0.1394195556640625, 0.15233230590820312, 0.16524505615234375, 0.17815780639648438, 0.191070556640625, 0.20398330688476562, 0.21689605712890625, 0.22980880737304688, 0.2427215576171875, 0.2556343078613281, 0.26854705810546875, 0.2814598083496094, 0.29437255859375, 0.3072853088378906, 0.32019805908203125, 0.3331108093261719, 0.3460235595703125, 0.3589363098144531, 0.37184906005859375, 0.3847618103027344, 0.397674560546875, 0.4105873107910156, 0.42350006103515625, 0.4364128112792969, 0.4493255615234375, 0.4622383117675781, 0.47515106201171875, 0.4880638122558594, 0.5009765625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 7.0, 6.0, 8.0, 32.0, 26.0, 37.0, 66.0, 79.0, 104.0, 119.0, 104.0, 104.0, 88.0, 66.0, 46.0, 43.0, 26.0, 12.0, 10.0, 5.0, 5.0, 7.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042327880859375, -0.04071760177612305, -0.039107322692871094, -0.03749704360961914, -0.03588676452636719, -0.034276485443115234, -0.03266620635986328, -0.031055927276611328, -0.029445648193359375, -0.027835369110107422, -0.02622509002685547, -0.024614810943603516, -0.023004531860351562, -0.02139425277709961, -0.019783973693847656, -0.018173694610595703, -0.01656341552734375, -0.014953136444091797, -0.013342857360839844, -0.01173257827758789, -0.010122299194335938, -0.008512020111083984, -0.006901741027832031, -0.005291461944580078, -0.003681182861328125, -0.002070903778076172, -0.00046062469482421875, 0.0011496543884277344, 0.0027599334716796875, 0.004370212554931641, 0.005980491638183594, 0.007590770721435547, 0.0092010498046875, 0.010811328887939453, 0.012421607971191406, 0.01403188705444336, 0.015642166137695312, 0.017252445220947266, 0.01886272430419922, 0.020473003387451172, 0.022083282470703125, 0.023693561553955078, 0.02530384063720703, 0.026914119720458984, 0.028524398803710938, 0.03013467788696289, 0.031744956970214844, 0.0333552360534668, 0.03496551513671875, 0.0365757942199707, 0.038186073303222656, 0.03979635238647461, 0.04140663146972656, 0.043016910552978516, 0.04462718963623047, 0.04623746871948242, 0.047847747802734375, 0.04945802688598633, 0.05106830596923828, 0.052678585052490234, 0.05428886413574219, 0.05589914321899414, 0.057509422302246094, 0.05911970138549805, 0.06072998046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 9.0, 15.0, 25.0, 31.0, 47.0, 84.0, 117.0, 176.0, 382.0, 668.0, 1420.0, 3171.0, 7973.0, 23862.0, 96491.0, 664223.0, 3081002.0, 243107.0, 48746.0, 13811.0, 4756.0, 2014.0, 881.0, 511.0, 253.0, 142.0, 102.0, 84.0, 36.0, 27.0, 30.0, 17.0, 16.0, 8.0, 13.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.203125, -0.1970195770263672, -0.19091415405273438, -0.18480873107910156, -0.17870330810546875, -0.17259788513183594, -0.16649246215820312, -0.1603870391845703, -0.1542816162109375, -0.1481761932373047, -0.14207077026367188, -0.13596534729003906, -0.12985992431640625, -0.12375450134277344, -0.11764907836914062, -0.11154365539550781, -0.105438232421875, -0.09933280944824219, -0.09322738647460938, -0.08712196350097656, -0.08101654052734375, -0.07491111755371094, -0.06880569458007812, -0.06270027160644531, -0.0565948486328125, -0.05048942565917969, -0.044384002685546875, -0.03827857971191406, -0.03217315673828125, -0.026067733764648438, -0.019962310791015625, -0.013856887817382812, -0.00775146484375, -0.0016460418701171875, 0.004459381103515625, 0.010564804077148438, 0.01667022705078125, 0.022775650024414062, 0.028881072998046875, 0.03498649597167969, 0.0410919189453125, 0.04719734191894531, 0.053302764892578125, 0.05940818786621094, 0.06551361083984375, 0.07161903381347656, 0.07772445678710938, 0.08382987976074219, 0.089935302734375, 0.09604072570800781, 0.10214614868164062, 0.10825157165527344, 0.11435699462890625, 0.12046241760253906, 0.12656784057617188, 0.1326732635498047, 0.1387786865234375, 0.1448841094970703, 0.15098953247070312, 0.15709495544433594, 0.16320037841796875, 0.16930580139160156, 0.17541122436523438, 0.1815166473388672, 0.1876220703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 8.0, 7.0, 8.0, 18.0, 18.0, 29.0, 38.0, 52.0, 111.0, 188.0, 450.0, 1563.0, 870.0, 331.0, 140.0, 80.0, 65.0, 40.0, 16.0, 16.0, 14.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044189453125, -0.04195976257324219, -0.039730072021484375, -0.03750038146972656, -0.03527069091796875, -0.03304100036621094, -0.030811309814453125, -0.028581619262695312, -0.0263519287109375, -0.024122238159179688, -0.021892547607421875, -0.019662857055664062, -0.01743316650390625, -0.015203475952148438, -0.012973785400390625, -0.010744094848632812, -0.008514404296875, -0.0062847137451171875, -0.004055023193359375, -0.0018253326416015625, 0.00040435791015625, 0.0026340484619140625, 0.004863739013671875, 0.0070934295654296875, 0.0093231201171875, 0.011552810668945312, 0.013782501220703125, 0.016012191772460938, 0.01824188232421875, 0.020471572875976562, 0.022701263427734375, 0.024930953979492188, 0.02716064453125, 0.029390335083007812, 0.031620025634765625, 0.03384971618652344, 0.03607940673828125, 0.03830909729003906, 0.040538787841796875, 0.04276847839355469, 0.0449981689453125, 0.04722785949707031, 0.049457550048828125, 0.05168724060058594, 0.05391693115234375, 0.05614662170410156, 0.058376312255859375, 0.06060600280761719, 0.062835693359375, 0.06506538391113281, 0.06729507446289062, 0.06952476501464844, 0.07175445556640625, 0.07398414611816406, 0.07621383666992188, 0.07844352722167969, 0.0806732177734375, 0.08290290832519531, 0.08513259887695312, 0.08736228942871094, 0.08959197998046875, 0.09182167053222656, 0.09405136108398438, 0.09628105163574219, 0.0985107421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 12.0, 32.0, 67.0, 152.0, 186.0, 271.0, 164.0, 79.0, 33.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.0670428276062012, -1.0469731092453003, -1.0269032716751099, -1.006833553314209, -0.9867637157440186, -0.9666939377784729, -0.9466241598129272, -0.9265544414520264, -0.9064846038818359, -0.8864148259162903, -0.8663450479507446, -0.846275269985199, -0.8262054920196533, -0.8061357140541077, -0.786065936088562, -0.7659962177276611, -0.7459264397621155, -0.7258566617965698, -0.7057868838310242, -0.6857171058654785, -0.6656473278999329, -0.6455775499343872, -0.6255077719688416, -0.6054379940032959, -0.585368275642395, -0.5652984976768494, -0.5452287197113037, -0.5251589417457581, -0.5050891637802124, -0.48501938581466675, -0.4649496376514435, -0.4448798596858978, -0.4248100519180298, -0.40474027395248413, -0.3846704959869385, -0.3646007180213928, -0.34453094005584717, -0.3244611620903015, -0.30439141392707825, -0.2843216359615326, -0.2642518877983093, -0.24418210983276367, -0.22411233186721802, -0.20404256880283356, -0.1839727908372879, -0.16390301287174225, -0.1438332498073578, -0.12376347184181213, -0.10369367897510529, -0.08362390100955963, -0.06355413049459457, -0.04348435625433922, -0.023414582014083862, -0.003344804048538208, 0.01672496646642685, 0.03679473698139191, 0.05686451494693756, 0.07693429291248322, 0.09700406342744827, 0.11707383394241333, 0.13714361190795898, 0.15721338987350464, 0.1772831678390503, 0.19735293090343475, 0.2174227088689804]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 11.0, 7.0, 11.0, 6.0, 16.0, 15.0, 21.0, 16.0, 16.0, 26.0, 23.0, 22.0, 26.0, 33.0, 42.0, 36.0, 40.0, 28.0, 36.0, 37.0, 42.0, 40.0, 40.0, 30.0, 28.0, 43.0, 31.0, 35.0, 28.0, 40.0, 19.0, 17.0, 18.0, 20.0, 16.0, 9.0, 17.0, 11.0, 7.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14853399991989136, -0.14352990686893463, -0.1385258138179779, -0.13352172076702118, -0.12851762771606445, -0.12351353466510773, -0.118509441614151, -0.11350534856319427, -0.10850125551223755, -0.10349716246128082, -0.0984930694103241, -0.09348897635936737, -0.08848488330841064, -0.08348079025745392, -0.07847669720649719, -0.07347260415554047, -0.06846851110458374, -0.06346441805362701, -0.05846032500267029, -0.05345623195171356, -0.048452138900756836, -0.04344804584980011, -0.038443952798843384, -0.03343985974788666, -0.02843576669692993, -0.023431673645973206, -0.01842758059501648, -0.013423487544059753, -0.008419394493103027, -0.0034153014421463013, 0.0015887916088104248, 0.006592884659767151, 0.011596977710723877, 0.016601070761680603, 0.02160516381263733, 0.026609256863594055, 0.03161334991455078, 0.03661744296550751, 0.04162153601646423, 0.04662562906742096, 0.051629722118377686, 0.05663381516933441, 0.06163790822029114, 0.06664200127124786, 0.07164609432220459, 0.07665018737316132, 0.08165428042411804, 0.08665837347507477, 0.0916624665260315, 0.09666655957698822, 0.10167065262794495, 0.10667474567890167, 0.1116788387298584, 0.11668293178081512, 0.12168702483177185, 0.12669111788272858, 0.1316952109336853, 0.13669930398464203, 0.14170339703559875, 0.14670749008655548, 0.1517115831375122, 0.15671567618846893, 0.16171976923942566, 0.16672386229038239, 0.1717279553413391]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 9.0, 10.0, 13.0, 21.0, 27.0, 20.0, 48.0, 78.0, 117.0, 166.0, 256.0, 411.0, 741.0, 1273.0, 2680.0, 5710.0, 13919.0, 36477.0, 100504.0, 264895.0, 358574.0, 164119.0, 59608.0, 22061.0, 8823.0, 3760.0, 1742.0, 991.0, 535.0, 357.0, 210.0, 139.0, 82.0, 52.0, 44.0, 24.0, 17.0, 13.0, 5.0, 5.0, 5.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.13818359375, -0.1338977813720703, -0.12961196899414062, -0.12532615661621094, -0.12104034423828125, -0.11675453186035156, -0.11246871948242188, -0.10818290710449219, -0.1038970947265625, -0.09961128234863281, -0.09532546997070312, -0.09103965759277344, -0.08675384521484375, -0.08246803283691406, -0.07818222045898438, -0.07389640808105469, -0.069610595703125, -0.06532478332519531, -0.061038970947265625, -0.05675315856933594, -0.05246734619140625, -0.04818153381347656, -0.043895721435546875, -0.03960990905761719, -0.0353240966796875, -0.031038284301757812, -0.026752471923828125, -0.022466659545898438, -0.01818084716796875, -0.013895034790039062, -0.009609222412109375, -0.0053234100341796875, -0.00103759765625, 0.0032482147216796875, 0.007534027099609375, 0.011819839477539062, 0.01610565185546875, 0.020391464233398438, 0.024677276611328125, 0.028963088989257812, 0.0332489013671875, 0.03753471374511719, 0.041820526123046875, 0.04610633850097656, 0.05039215087890625, 0.05467796325683594, 0.058963775634765625, 0.06324958801269531, 0.067535400390625, 0.07182121276855469, 0.07610702514648438, 0.08039283752441406, 0.08467864990234375, 0.08896446228027344, 0.09325027465820312, 0.09753608703613281, 0.1018218994140625, 0.10610771179199219, 0.11039352416992188, 0.11467933654785156, 0.11896514892578125, 0.12325096130371094, 0.12753677368164062, 0.1318225860595703, 0.1361083984375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 3.0, 10.0, 27.0, 31.0, 36.0, 64.0, 75.0, 87.0, 102.0, 104.0, 91.0, 105.0, 75.0, 62.0, 42.0, 32.0, 14.0, 16.0, 12.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0423583984375, -0.040711402893066406, -0.03906440734863281, -0.03741741180419922, -0.035770416259765625, -0.03412342071533203, -0.03247642517089844, -0.030829429626464844, -0.02918243408203125, -0.027535438537597656, -0.025888442993164062, -0.02424144744873047, -0.022594451904296875, -0.02094745635986328, -0.019300460815429688, -0.017653465270996094, -0.0160064697265625, -0.014359474182128906, -0.012712478637695312, -0.011065483093261719, -0.009418487548828125, -0.007771492004394531, -0.0061244964599609375, -0.004477500915527344, -0.00283050537109375, -0.0011835098266601562, 0.0004634857177734375, 0.0021104812622070312, 0.003757476806640625, 0.005404472351074219, 0.0070514678955078125, 0.008698463439941406, 0.010345458984375, 0.011992454528808594, 0.013639450073242188, 0.015286445617675781, 0.016933441162109375, 0.01858043670654297, 0.020227432250976562, 0.021874427795410156, 0.02352142333984375, 0.025168418884277344, 0.026815414428710938, 0.02846240997314453, 0.030109405517578125, 0.03175640106201172, 0.03340339660644531, 0.035050392150878906, 0.0366973876953125, 0.038344383239746094, 0.03999137878417969, 0.04163837432861328, 0.043285369873046875, 0.04493236541748047, 0.04657936096191406, 0.048226356506347656, 0.04987335205078125, 0.051520347595214844, 0.05316734313964844, 0.05481433868408203, 0.056461334228515625, 0.05810832977294922, 0.05975532531738281, 0.061402320861816406, 0.06304931640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 8.0, 6.0, 8.0, 11.0, 16.0, 18.0, 28.0, 45.0, 66.0, 88.0, 133.0, 187.0, 289.0, 433.0, 689.0, 1326.0, 2681.0, 7499.0, 29396.0, 126525.0, 417563.0, 338172.0, 90917.0, 21400.0, 5962.0, 2089.0, 1130.0, 621.0, 397.0, 270.0, 180.0, 106.0, 88.0, 55.0, 42.0, 31.0, 20.0, 19.0, 16.0, 6.0, 4.0, 2.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1881103515625, -0.1823902130126953, -0.17667007446289062, -0.17094993591308594, -0.16522979736328125, -0.15950965881347656, -0.15378952026367188, -0.1480693817138672, -0.1423492431640625, -0.1366291046142578, -0.13090896606445312, -0.12518882751464844, -0.11946868896484375, -0.11374855041503906, -0.10802841186523438, -0.10230827331542969, -0.096588134765625, -0.09086799621582031, -0.08514785766601562, -0.07942771911621094, -0.07370758056640625, -0.06798744201660156, -0.062267303466796875, -0.05654716491699219, -0.0508270263671875, -0.04510688781738281, -0.039386749267578125, -0.03366661071777344, -0.02794647216796875, -0.022226333618164062, -0.016506195068359375, -0.010786056518554688, -0.00506591796875, 0.0006542205810546875, 0.006374359130859375, 0.012094497680664062, 0.01781463623046875, 0.023534774780273438, 0.029254913330078125, 0.03497505187988281, 0.0406951904296875, 0.04641532897949219, 0.052135467529296875, 0.05785560607910156, 0.06357574462890625, 0.06929588317871094, 0.07501602172851562, 0.08073616027832031, 0.086456298828125, 0.09217643737792969, 0.09789657592773438, 0.10361671447753906, 0.10933685302734375, 0.11505699157714844, 0.12077713012695312, 0.1264972686767578, 0.1322174072265625, 0.1379375457763672, 0.14365768432617188, 0.14937782287597656, 0.15509796142578125, 0.16081809997558594, 0.16653823852539062, 0.1722583770751953, 0.177978515625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 9.0, 7.0, 9.0, 11.0, 22.0, 22.0, 23.0, 29.0, 31.0, 35.0, 47.0, 52.0, 47.0, 51.0, 55.0, 68.0, 54.0, 49.0, 48.0, 40.0, 43.0, 49.0, 37.0, 23.0, 25.0, 20.0, 29.0, 18.0, 15.0, 17.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20166015625, -0.19617843627929688, -0.19069671630859375, -0.18521499633789062, -0.1797332763671875, -0.17425155639648438, -0.16876983642578125, -0.16328811645507812, -0.157806396484375, -0.15232467651367188, -0.14684295654296875, -0.14136123657226562, -0.1358795166015625, -0.13039779663085938, -0.12491607666015625, -0.11943435668945312, -0.11395263671875, -0.10847091674804688, -0.10298919677734375, -0.09750747680664062, -0.0920257568359375, -0.08654403686523438, -0.08106231689453125, -0.07558059692382812, -0.070098876953125, -0.06461715698242188, -0.05913543701171875, -0.053653717041015625, -0.0481719970703125, -0.042690277099609375, -0.03720855712890625, -0.031726837158203125, -0.0262451171875, -0.020763397216796875, -0.01528167724609375, -0.009799957275390625, -0.0043182373046875, 0.001163482666015625, 0.00664520263671875, 0.012126922607421875, 0.017608642578125, 0.023090362548828125, 0.02857208251953125, 0.034053802490234375, 0.0395355224609375, 0.045017242431640625, 0.05049896240234375, 0.055980682373046875, 0.06146240234375, 0.06694412231445312, 0.07242584228515625, 0.07790756225585938, 0.0833892822265625, 0.08887100219726562, 0.09435272216796875, 0.09983444213867188, 0.105316162109375, 0.11079788208007812, 0.11627960205078125, 0.12176132202148438, 0.1272430419921875, 0.13272476196289062, 0.13820648193359375, 0.14368820190429688, 0.149169921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 12.0, 13.0, 26.0, 30.0, 34.0, 50.0, 75.0, 112.0, 193.0, 305.0, 556.0, 1117.0, 2218.0, 5114.0, 13822.0, 42803.0, 174779.0, 525355.0, 206670.0, 49318.0, 15289.0, 5687.0, 2306.0, 1109.0, 596.0, 356.0, 197.0, 126.0, 73.0, 55.0, 46.0, 21.0, 24.0, 14.0, 10.0, 7.0, 7.0, 3.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.1038818359375, -0.10103988647460938, -0.09819793701171875, -0.09535598754882812, -0.0925140380859375, -0.08967208862304688, -0.08683013916015625, -0.08398818969726562, -0.081146240234375, -0.07830429077148438, -0.07546234130859375, -0.07262039184570312, -0.0697784423828125, -0.06693649291992188, -0.06409454345703125, -0.061252593994140625, -0.05841064453125, -0.055568695068359375, -0.05272674560546875, -0.049884796142578125, -0.0470428466796875, -0.044200897216796875, -0.04135894775390625, -0.038516998291015625, -0.035675048828125, -0.032833099365234375, -0.02999114990234375, -0.027149200439453125, -0.0243072509765625, -0.021465301513671875, -0.01862335205078125, -0.015781402587890625, -0.012939453125, -0.010097503662109375, -0.00725555419921875, -0.004413604736328125, -0.0015716552734375, 0.001270294189453125, 0.00411224365234375, 0.006954193115234375, 0.009796142578125, 0.012638092041015625, 0.01548004150390625, 0.018321990966796875, 0.0211639404296875, 0.024005889892578125, 0.02684783935546875, 0.029689788818359375, 0.03253173828125, 0.035373687744140625, 0.03821563720703125, 0.041057586669921875, 0.0438995361328125, 0.046741485595703125, 0.04958343505859375, 0.052425384521484375, 0.055267333984375, 0.058109283447265625, 0.06095123291015625, 0.06379318237304688, 0.0666351318359375, 0.06947708129882812, 0.07231903076171875, 0.07516098022460938, 0.0780029296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 9.0, 7.0, 10.0, 16.0, 16.0, 41.0, 59.0, 69.0, 81.0, 104.0, 106.0, 105.0, 90.0, 82.0, 60.0, 46.0, 26.0, 25.0, 16.0, 17.0, 6.0, 3.0, 3.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.512901306152344e-05, -9.159371256828308e-05, -8.805841207504272e-05, -8.452311158180237e-05, -8.098781108856201e-05, -7.745251059532166e-05, -7.39172101020813e-05, -7.038190960884094e-05, -6.684660911560059e-05, -6.331130862236023e-05, -5.977600812911987e-05, -5.6240707635879517e-05, -5.270540714263916e-05, -4.9170106649398804e-05, -4.563480615615845e-05, -4.209950566291809e-05, -3.8564205169677734e-05, -3.502890467643738e-05, -3.149360418319702e-05, -2.7958303689956665e-05, -2.442300319671631e-05, -2.0887702703475952e-05, -1.7352402210235596e-05, -1.381710171699524e-05, -1.0281801223754883e-05, -6.746500730514526e-06, -3.21120023727417e-06, 3.241002559661865e-07, 3.859400749206543e-06, 7.394701242446899e-06, 1.0930001735687256e-05, 1.4465302228927612e-05, 1.800060272216797e-05, 2.1535903215408325e-05, 2.507120370864868e-05, 2.8606504201889038e-05, 3.2141804695129395e-05, 3.567710518836975e-05, 3.921240568161011e-05, 4.2747706174850464e-05, 4.628300666809082e-05, 4.981830716133118e-05, 5.335360765457153e-05, 5.688890814781189e-05, 6.0424208641052246e-05, 6.39595091342926e-05, 6.749480962753296e-05, 7.103011012077332e-05, 7.456541061401367e-05, 7.810071110725403e-05, 8.163601160049438e-05, 8.517131209373474e-05, 8.87066125869751e-05, 9.224191308021545e-05, 9.577721357345581e-05, 9.931251406669617e-05, 0.00010284781455993652, 0.00010638311505317688, 0.00010991841554641724, 0.00011345371603965759, 0.00011698901653289795, 0.0001205243170261383, 0.00012405961751937866, 0.00012759491801261902, 0.00013113021850585938]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 9.0, 13.0, 16.0, 27.0, 46.0, 50.0, 77.0, 96.0, 159.0, 266.0, 556.0, 1032.0, 2601.0, 7397.0, 29020.0, 159586.0, 658606.0, 149375.0, 27313.0, 7423.0, 2547.0, 1069.0, 464.0, 312.0, 165.0, 101.0, 64.0, 39.0, 32.0, 19.0, 21.0, 22.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09288597106933594, -0.08909225463867188, -0.08529853820800781, -0.08150482177734375, -0.07771110534667969, -0.07391738891601562, -0.07012367248535156, -0.0663299560546875, -0.06253623962402344, -0.058742523193359375, -0.05494880676269531, -0.05115509033203125, -0.04736137390136719, -0.043567657470703125, -0.03977394104003906, -0.035980224609375, -0.03218650817871094, -0.028392791748046875, -0.024599075317382812, -0.02080535888671875, -0.017011642456054688, -0.013217926025390625, -0.009424209594726562, -0.0056304931640625, -0.0018367767333984375, 0.001956939697265625, 0.0057506561279296875, 0.00954437255859375, 0.013338088989257812, 0.017131805419921875, 0.020925521850585938, 0.02471923828125, 0.028512954711914062, 0.032306671142578125, 0.03610038757324219, 0.03989410400390625, 0.04368782043457031, 0.047481536865234375, 0.05127525329589844, 0.0550689697265625, 0.05886268615722656, 0.06265640258789062, 0.06645011901855469, 0.07024383544921875, 0.07403755187988281, 0.07783126831054688, 0.08162498474121094, 0.085418701171875, 0.08921241760253906, 0.09300613403320312, 0.09679985046386719, 0.10059356689453125, 0.10438728332519531, 0.10818099975585938, 0.11197471618652344, 0.1157684326171875, 0.11956214904785156, 0.12335586547851562, 0.1271495819091797, 0.13094329833984375, 0.1347370147705078, 0.13853073120117188, 0.14232444763183594, 0.1461181640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 7.0, 6.0, 5.0, 11.0, 13.0, 15.0, 23.0, 29.0, 49.0, 58.0, 71.0, 87.0, 101.0, 88.0, 86.0, 69.0, 68.0, 58.0, 34.0, 22.0, 19.0, 15.0, 17.0, 7.0, 3.0, 1.0, 9.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07745361328125, -0.07526493072509766, -0.07307624816894531, -0.07088756561279297, -0.06869888305664062, -0.06651020050048828, -0.06432151794433594, -0.062132835388183594, -0.05994415283203125, -0.057755470275878906, -0.05556678771972656, -0.05337810516357422, -0.051189422607421875, -0.04900074005126953, -0.04681205749511719, -0.044623374938964844, -0.0424346923828125, -0.040246009826660156, -0.03805732727050781, -0.03586864471435547, -0.033679962158203125, -0.03149127960205078, -0.029302597045898438, -0.027113914489746094, -0.02492523193359375, -0.022736549377441406, -0.020547866821289062, -0.01835918426513672, -0.016170501708984375, -0.013981819152832031, -0.011793136596679688, -0.009604454040527344, -0.007415771484375, -0.005227088928222656, -0.0030384063720703125, -0.0008497238159179688, 0.001338958740234375, 0.0035276412963867188, 0.0057163238525390625, 0.007905006408691406, 0.01009368896484375, 0.012282371520996094, 0.014471054077148438, 0.01665973663330078, 0.018848419189453125, 0.02103710174560547, 0.023225784301757812, 0.025414466857910156, 0.0276031494140625, 0.029791831970214844, 0.03198051452636719, 0.03416919708251953, 0.036357879638671875, 0.03854656219482422, 0.04073524475097656, 0.042923927307128906, 0.04511260986328125, 0.047301292419433594, 0.04948997497558594, 0.05167865753173828, 0.053867340087890625, 0.05605602264404297, 0.05824470520019531, 0.060433387756347656, 0.0626220703125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 15.0, 21.0, 52.0, 110.0, 158.0, 146.0, 140.0, 130.0, 112.0, 44.0, 35.0, 20.0, 9.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.777843713760376, -0.7365291118621826, -0.6952145099639893, -0.6538999676704407, -0.6125853657722473, -0.571270763874054, -0.5299562215805054, -0.488641619682312, -0.44732701778411865, -0.4060124158859253, -0.3646978437900543, -0.32338327169418335, -0.28206866979599, -0.24075408279895782, -0.19943949580192566, -0.1581249237060547, -0.11681032180786133, -0.07549573481082916, -0.034181147813797, 0.0071334391832351685, 0.048448026180267334, 0.0897626131772995, 0.13107720017433167, 0.17239177227020264, 0.213706374168396, 0.25502097606658936, 0.2963355481624603, 0.3376501202583313, 0.37896472215652466, 0.420279324054718, 0.461593896150589, 0.50290846824646, 0.5442229509353638, 0.5855375528335571, 0.6268521547317505, 0.6681666970252991, 0.7094812989234924, 0.7507959008216858, 0.7921104431152344, 0.8334250450134277, 0.8747396469116211, 0.9160542488098145, 0.9573688507080078, 0.9986833930015564, 1.0399980545043945, 1.0813125371932983, 1.1226271390914917, 1.163941740989685, 1.2052563428878784, 1.2465709447860718, 1.2878855466842651, 1.3292001485824585, 1.3705146312713623, 1.4118292331695557, 1.453143835067749, 1.4944584369659424, 1.5357730388641357, 1.577087640762329, 1.6184022426605225, 1.6597168445587158, 1.7010314464569092, 1.742345929145813, 1.7836605310440063, 1.8249751329421997, 1.866289734840393]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 7.0, 6.0, 6.0, 6.0, 9.0, 11.0, 14.0, 17.0, 14.0, 17.0, 20.0, 27.0, 24.0, 31.0, 25.0, 37.0, 24.0, 32.0, 42.0, 46.0, 38.0, 42.0, 39.0, 37.0, 36.0, 28.0, 38.0, 34.0, 38.0, 30.0, 31.0, 20.0, 31.0, 23.0, 23.0, 19.0, 15.0, 10.0, 7.0, 5.0, 12.0, 4.0, 2.0, 8.0, 1.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6271832585334778, -0.6067649126052856, -0.5863465666770935, -0.5659282207489014, -0.545509934425354, -0.5250915884971619, -0.5046732425689697, -0.4842548966407776, -0.46383655071258545, -0.4434182047843933, -0.42299985885620117, -0.4025815427303314, -0.3821631968021393, -0.36174485087394714, -0.3413265347480774, -0.32090818881988525, -0.3004898428916931, -0.280071496963501, -0.25965315103530884, -0.2392348349094391, -0.21881648898124695, -0.1983981430530548, -0.17797981202602386, -0.15756148099899292, -0.13714313507080078, -0.11672479659318924, -0.0963064581155777, -0.07588811963796616, -0.055469781160354614, -0.03505144268274307, -0.01463310420513153, 0.005785226821899414, 0.026203513145446777, 0.04662185162305832, 0.06704019010066986, 0.0874585285782814, 0.10787686705589294, 0.12829521298408508, 0.14871354401111603, 0.16913187503814697, 0.1895502209663391, 0.20996856689453125, 0.2303868979215622, 0.25080522894859314, 0.2712235748767853, 0.2916419208049774, 0.31206023693084717, 0.3324785828590393, 0.35289692878723145, 0.3733152747154236, 0.3937336206436157, 0.4141519367694855, 0.4345702826976776, 0.45498862862586975, 0.4754069447517395, 0.49582529067993164, 0.5162436366081238, 0.5366619825363159, 0.5570803284645081, 0.5774986743927002, 0.5979169607162476, 0.6183353066444397, 0.6387536525726318, 0.659171998500824, 0.6795903444290161]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 9.0, 19.0, 20.0, 29.0, 41.0, 56.0, 93.0, 139.0, 246.0, 433.0, 785.0, 1491.0, 2827.0, 6349.0, 15883.0, 51751.0, 312419.0, 3559417.0, 181304.0, 37758.0, 12545.0, 5182.0, 2433.0, 1252.0, 693.0, 398.0, 247.0, 143.0, 77.0, 63.0, 44.0, 27.0, 33.0, 15.0, 7.0, 5.0, 7.0, 8.0, 7.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.1744384765625, -0.1690521240234375, -0.163665771484375, -0.1582794189453125, -0.15289306640625, -0.1475067138671875, -0.142120361328125, -0.1367340087890625, -0.13134765625, -0.1259613037109375, -0.120574951171875, -0.1151885986328125, -0.10980224609375, -0.1044158935546875, -0.099029541015625, -0.0936431884765625, -0.0882568359375, -0.0828704833984375, -0.077484130859375, -0.0720977783203125, -0.06671142578125, -0.0613250732421875, -0.055938720703125, -0.0505523681640625, -0.045166015625, -0.0397796630859375, -0.034393310546875, -0.0290069580078125, -0.02362060546875, -0.0182342529296875, -0.012847900390625, -0.0074615478515625, -0.0020751953125, 0.0033111572265625, 0.008697509765625, 0.0140838623046875, 0.01947021484375, 0.0248565673828125, 0.030242919921875, 0.0356292724609375, 0.041015625, 0.0464019775390625, 0.051788330078125, 0.0571746826171875, 0.06256103515625, 0.0679473876953125, 0.073333740234375, 0.0787200927734375, 0.0841064453125, 0.0894927978515625, 0.094879150390625, 0.1002655029296875, 0.10565185546875, 0.1110382080078125, 0.116424560546875, 0.1218109130859375, 0.127197265625, 0.1325836181640625, 0.137969970703125, 0.1433563232421875, 0.14874267578125, 0.1541290283203125, 0.159515380859375, 0.1649017333984375, 0.1702880859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 9.0, 8.0, 8.0, 14.0, 23.0, 35.0, 46.0, 52.0, 59.0, 86.0, 89.0, 103.0, 83.0, 79.0, 75.0, 79.0, 41.0, 40.0, 26.0, 17.0, 19.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0416259765625, -0.040076255798339844, -0.03852653503417969, -0.03697681427001953, -0.035427093505859375, -0.03387737274169922, -0.03232765197753906, -0.030777931213378906, -0.02922821044921875, -0.027678489685058594, -0.026128768920898438, -0.02457904815673828, -0.023029327392578125, -0.02147960662841797, -0.019929885864257812, -0.018380165100097656, -0.0168304443359375, -0.015280723571777344, -0.013731002807617188, -0.012181282043457031, -0.010631561279296875, -0.009081840515136719, -0.0075321197509765625, -0.005982398986816406, -0.00443267822265625, -0.0028829574584960938, -0.0013332366943359375, 0.00021648406982421875, 0.001766204833984375, 0.0033159255981445312, 0.0048656463623046875, 0.006415367126464844, 0.007965087890625, 0.009514808654785156, 0.011064529418945312, 0.012614250183105469, 0.014163970947265625, 0.01571369171142578, 0.017263412475585938, 0.018813133239746094, 0.02036285400390625, 0.021912574768066406, 0.023462295532226562, 0.02501201629638672, 0.026561737060546875, 0.02811145782470703, 0.029661178588867188, 0.031210899353027344, 0.0327606201171875, 0.034310340881347656, 0.03586006164550781, 0.03740978240966797, 0.038959503173828125, 0.04050922393798828, 0.04205894470214844, 0.043608665466308594, 0.04515838623046875, 0.046708106994628906, 0.04825782775878906, 0.04980754852294922, 0.051357269287109375, 0.05290699005126953, 0.05445671081542969, 0.056006431579589844, 0.05755615234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 8.0, 22.0, 50.0, 75.0, 124.0, 195.0, 374.0, 726.0, 1705.0, 4503.0, 15803.0, 83074.0, 1302964.0, 2653488.0, 103694.0, 18889.0, 5015.0, 1815.0, 772.0, 401.0, 233.0, 134.0, 64.0, 50.0, 41.0, 20.0, 10.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.224609375, -0.217376708984375, -0.21014404296875, -0.202911376953125, -0.1956787109375, -0.188446044921875, -0.18121337890625, -0.173980712890625, -0.166748046875, -0.159515380859375, -0.15228271484375, -0.145050048828125, -0.1378173828125, -0.130584716796875, -0.12335205078125, -0.116119384765625, -0.10888671875, -0.101654052734375, -0.09442138671875, -0.087188720703125, -0.0799560546875, -0.072723388671875, -0.06549072265625, -0.058258056640625, -0.051025390625, -0.043792724609375, -0.03656005859375, -0.029327392578125, -0.0220947265625, -0.014862060546875, -0.00762939453125, -0.000396728515625, 0.0068359375, 0.014068603515625, 0.02130126953125, 0.028533935546875, 0.0357666015625, 0.042999267578125, 0.05023193359375, 0.057464599609375, 0.064697265625, 0.071929931640625, 0.07916259765625, 0.086395263671875, 0.0936279296875, 0.100860595703125, 0.10809326171875, 0.115325927734375, 0.12255859375, 0.129791259765625, 0.13702392578125, 0.144256591796875, 0.1514892578125, 0.158721923828125, 0.16595458984375, 0.173187255859375, 0.180419921875, 0.187652587890625, 0.19488525390625, 0.202117919921875, 0.2093505859375, 0.216583251953125, 0.22381591796875, 0.231048583984375, 0.23828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 4.0, 2.0, 7.0, 6.0, 11.0, 24.0, 19.0, 20.0, 23.0, 67.0, 79.0, 146.0, 285.0, 617.0, 1590.0, 515.0, 243.0, 137.0, 75.0, 64.0, 41.0, 30.0, 15.0, 9.0, 13.0, 8.0, 5.0, 11.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05377197265625, -0.052001953125, -0.05023193359375, -0.0484619140625, -0.04669189453125, -0.044921875, -0.04315185546875, -0.0413818359375, -0.03961181640625, -0.037841796875, -0.03607177734375, -0.0343017578125, -0.03253173828125, -0.03076171875, -0.02899169921875, -0.0272216796875, -0.02545166015625, -0.023681640625, -0.02191162109375, -0.0201416015625, -0.01837158203125, -0.0166015625, -0.01483154296875, -0.0130615234375, -0.01129150390625, -0.009521484375, -0.00775146484375, -0.0059814453125, -0.00421142578125, -0.00244140625, -0.00067138671875, 0.0010986328125, 0.00286865234375, 0.004638671875, 0.00640869140625, 0.0081787109375, 0.00994873046875, 0.01171875, 0.01348876953125, 0.0152587890625, 0.01702880859375, 0.018798828125, 0.02056884765625, 0.0223388671875, 0.02410888671875, 0.02587890625, 0.02764892578125, 0.0294189453125, 0.03118896484375, 0.032958984375, 0.03472900390625, 0.0364990234375, 0.03826904296875, 0.0400390625, 0.04180908203125, 0.0435791015625, 0.04534912109375, 0.047119140625, 0.04888916015625, 0.0506591796875, 0.05242919921875, 0.05419921875, 0.05596923828125, 0.0577392578125, 0.05950927734375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 17.0, 65.0, 145.0, 281.0, 233.0, 153.0, 57.0, 33.0, 12.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4061968922615051, -0.38357627391815186, -0.3609556555747986, -0.3383350372314453, -0.31571441888809204, -0.29309380054473877, -0.2704732120037079, -0.24785259366035461, -0.22523197531700134, -0.20261135697364807, -0.1799907386302948, -0.15737013518810272, -0.13474951684474945, -0.11212889850139618, -0.0895082950592041, -0.06688767671585083, -0.04426705837249756, -0.021646443754434586, 0.0009741708636283875, 0.023594781756401062, 0.046215400099754333, 0.0688360184431076, 0.09145662188529968, 0.11407724022865295, 0.13669785857200623, 0.1593184769153595, 0.18193909525871277, 0.20455969870090485, 0.22718031704425812, 0.2498009353876114, 0.27242153882980347, 0.29504215717315674, 0.3176628351211548, 0.34028345346450806, 0.36290407180786133, 0.3855246901512146, 0.40814530849456787, 0.43076592683792114, 0.453386515378952, 0.4760071337223053, 0.49862775206565857, 0.5212483406066895, 0.5438689589500427, 0.566489577293396, 0.5891101956367493, 0.6117308139801025, 0.6343514323234558, 0.6569720506668091, 0.6795926690101624, 0.7022132873535156, 0.7248339056968689, 0.7474545240402222, 0.7700751423835754, 0.7926957607269287, 0.8153163194656372, 0.8379369974136353, 0.8605575561523438, 0.883178174495697, 0.9057987928390503, 0.9284194111824036, 0.9510400295257568, 0.9736606478691101, 0.9962812662124634, 1.0189018249511719, 1.04152250289917]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 8.0, 2.0, 5.0, 9.0, 15.0, 10.0, 9.0, 13.0, 22.0, 20.0, 18.0, 38.0, 23.0, 22.0, 34.0, 28.0, 28.0, 37.0, 29.0, 38.0, 35.0, 34.0, 45.0, 45.0, 45.0, 37.0, 29.0, 35.0, 29.0, 26.0, 32.0, 26.0, 26.0, 23.0, 22.0, 17.0, 16.0, 16.0, 11.0, 8.0, 13.0, 1.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.16365522146224976, -0.15868541598320007, -0.1537156105041504, -0.14874579012393951, -0.14377598464488983, -0.13880617916584015, -0.13383637368679047, -0.12886656820774078, -0.1238967552781105, -0.11892694979906082, -0.11395713686943054, -0.10898733139038086, -0.10401752591133118, -0.0990477129817009, -0.09407790750265121, -0.08910809457302094, -0.08413828909397125, -0.07916848361492157, -0.07419867068529129, -0.06922886520624161, -0.06425905227661133, -0.059289246797561646, -0.05431944131851196, -0.04934963211417198, -0.044379822909832, -0.03941001370549202, -0.03444020450115204, -0.029470399022102356, -0.024500589817762375, -0.019530780613422394, -0.014560973271727562, -0.00959116593003273, -0.004621356725692749, 0.00034845154732465744, 0.005318259820342064, 0.01028806809335947, 0.015257876366376877, 0.020227685570716858, 0.02519749291241169, 0.03016730025410652, 0.0351371094584465, 0.040106918662786484, 0.045076727867126465, 0.05004653334617615, 0.05501634255051613, 0.05998615175485611, 0.06495595723390579, 0.06992577016353607, 0.07489557564258575, 0.07986538112163544, 0.08483519405126572, 0.0898049995303154, 0.09477481245994568, 0.09974461793899536, 0.10471442341804504, 0.10968422889709473, 0.114654041826725, 0.11962384730577469, 0.12459366023540497, 0.12956346571445465, 0.13453327119350433, 0.1395030915737152, 0.1444728970527649, 0.14944270253181458, 0.15441250801086426]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 8.0, 10.0, 13.0, 24.0, 25.0, 54.0, 72.0, 124.0, 215.0, 352.0, 711.0, 1406.0, 2971.0, 6940.0, 18393.0, 55577.0, 176340.0, 412769.0, 249793.0, 79768.0, 26002.0, 9506.0, 3782.0, 1730.0, 854.0, 422.0, 271.0, 153.0, 115.0, 48.0, 45.0, 21.0, 11.0, 11.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1422119140625, -0.1375732421875, -0.1329345703125, -0.1282958984375, -0.1236572265625, -0.1190185546875, -0.1143798828125, -0.1097412109375, -0.1051025390625, -0.1004638671875, -0.0958251953125, -0.0911865234375, -0.0865478515625, -0.0819091796875, -0.0772705078125, -0.0726318359375, -0.0679931640625, -0.0633544921875, -0.0587158203125, -0.0540771484375, -0.0494384765625, -0.0447998046875, -0.0401611328125, -0.0355224609375, -0.0308837890625, -0.0262451171875, -0.0216064453125, -0.0169677734375, -0.0123291015625, -0.0076904296875, -0.0030517578125, 0.0015869140625, 0.0062255859375, 0.0108642578125, 0.0155029296875, 0.0201416015625, 0.0247802734375, 0.0294189453125, 0.0340576171875, 0.0386962890625, 0.0433349609375, 0.0479736328125, 0.0526123046875, 0.0572509765625, 0.0618896484375, 0.0665283203125, 0.0711669921875, 0.0758056640625, 0.0804443359375, 0.0850830078125, 0.0897216796875, 0.0943603515625, 0.0989990234375, 0.1036376953125, 0.1082763671875, 0.1129150390625, 0.1175537109375, 0.1221923828125, 0.1268310546875, 0.1314697265625, 0.1361083984375, 0.1407470703125, 0.1453857421875, 0.1500244140625, 0.1546630859375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 7.0, 11.0, 15.0, 16.0, 40.0, 37.0, 65.0, 67.0, 76.0, 102.0, 91.0, 91.0, 89.0, 56.0, 59.0, 47.0, 42.0, 32.0, 22.0, 15.0, 7.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04156494140625, -0.040015220642089844, -0.03846549987792969, -0.03691577911376953, -0.035366058349609375, -0.03381633758544922, -0.03226661682128906, -0.030716896057128906, -0.02916717529296875, -0.027617454528808594, -0.026067733764648438, -0.02451801300048828, -0.022968292236328125, -0.02141857147216797, -0.019868850708007812, -0.018319129943847656, -0.0167694091796875, -0.015219688415527344, -0.013669967651367188, -0.012120246887207031, -0.010570526123046875, -0.009020805358886719, -0.0074710845947265625, -0.005921363830566406, -0.00437164306640625, -0.0028219223022460938, -0.0012722015380859375, 0.00027751922607421875, 0.001827239990234375, 0.0033769607543945312, 0.0049266815185546875, 0.006476402282714844, 0.008026123046875, 0.009575843811035156, 0.011125564575195312, 0.012675285339355469, 0.014225006103515625, 0.01577472686767578, 0.017324447631835938, 0.018874168395996094, 0.02042388916015625, 0.021973609924316406, 0.023523330688476562, 0.02507305145263672, 0.026622772216796875, 0.02817249298095703, 0.029722213745117188, 0.031271934509277344, 0.0328216552734375, 0.034371376037597656, 0.03592109680175781, 0.03747081756591797, 0.039020538330078125, 0.04057025909423828, 0.04211997985839844, 0.043669700622558594, 0.04521942138671875, 0.046769142150878906, 0.04831886291503906, 0.04986858367919922, 0.051418304443359375, 0.05296802520751953, 0.05451774597167969, 0.056067466735839844, 0.0576171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 24.0, 29.0, 35.0, 48.0, 81.0, 117.0, 180.0, 261.0, 448.0, 698.0, 1331.0, 3320.0, 11368.0, 59290.0, 315145.0, 501621.0, 122916.0, 22055.0, 5270.0, 1920.0, 947.0, 534.0, 309.0, 180.0, 132.0, 88.0, 52.0, 39.0, 29.0, 17.0, 12.0, 13.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18115234375, -0.1751556396484375, -0.169158935546875, -0.1631622314453125, -0.15716552734375, -0.1511688232421875, -0.145172119140625, -0.1391754150390625, -0.1331787109375, -0.1271820068359375, -0.121185302734375, -0.1151885986328125, -0.10919189453125, -0.1031951904296875, -0.097198486328125, -0.0912017822265625, -0.085205078125, -0.0792083740234375, -0.073211669921875, -0.0672149658203125, -0.06121826171875, -0.0552215576171875, -0.049224853515625, -0.0432281494140625, -0.0372314453125, -0.0312347412109375, -0.025238037109375, -0.0192413330078125, -0.01324462890625, -0.0072479248046875, -0.001251220703125, 0.0047454833984375, 0.0107421875, 0.0167388916015625, 0.022735595703125, 0.0287322998046875, 0.03472900390625, 0.0407257080078125, 0.046722412109375, 0.0527191162109375, 0.0587158203125, 0.0647125244140625, 0.070709228515625, 0.0767059326171875, 0.08270263671875, 0.0886993408203125, 0.094696044921875, 0.1006927490234375, 0.106689453125, 0.1126861572265625, 0.118682861328125, 0.1246795654296875, 0.13067626953125, 0.1366729736328125, 0.142669677734375, 0.1486663818359375, 0.1546630859375, 0.1606597900390625, 0.166656494140625, 0.1726531982421875, 0.17864990234375, 0.1846466064453125, 0.190643310546875, 0.1966400146484375, 0.20263671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 2.0, 7.0, 6.0, 9.0, 12.0, 16.0, 27.0, 26.0, 22.0, 28.0, 16.0, 23.0, 31.0, 36.0, 47.0, 48.0, 49.0, 49.0, 42.0, 43.0, 46.0, 43.0, 39.0, 46.0, 42.0, 22.0, 29.0, 31.0, 34.0, 24.0, 21.0, 21.0, 11.0, 9.0, 6.0, 8.0, 6.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.135498046875, -0.1314382553100586, -0.1273784637451172, -0.12331867218017578, -0.11925888061523438, -0.11519908905029297, -0.11113929748535156, -0.10707950592041016, -0.10301971435546875, -0.09895992279052734, -0.09490013122558594, -0.09084033966064453, -0.08678054809570312, -0.08272075653076172, -0.07866096496582031, -0.0746011734008789, -0.0705413818359375, -0.0664815902709961, -0.06242179870605469, -0.05836200714111328, -0.054302215576171875, -0.05024242401123047, -0.04618263244628906, -0.042122840881347656, -0.03806304931640625, -0.034003257751464844, -0.029943466186523438, -0.02588367462158203, -0.021823883056640625, -0.01776409149169922, -0.013704299926757812, -0.009644508361816406, -0.005584716796875, -0.0015249252319335938, 0.0025348663330078125, 0.006594657897949219, 0.010654449462890625, 0.014714241027832031, 0.018774032592773438, 0.022833824157714844, 0.02689361572265625, 0.030953407287597656, 0.03501319885253906, 0.03907299041748047, 0.043132781982421875, 0.04719257354736328, 0.05125236511230469, 0.055312156677246094, 0.0593719482421875, 0.0634317398071289, 0.06749153137207031, 0.07155132293701172, 0.07561111450195312, 0.07967090606689453, 0.08373069763183594, 0.08779048919677734, 0.09185028076171875, 0.09591007232666016, 0.09996986389160156, 0.10402965545654297, 0.10808944702148438, 0.11214923858642578, 0.11620903015136719, 0.1202688217163086, 0.12432861328125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 4.0, 4.0, 5.0, 10.0, 16.0, 22.0, 41.0, 103.0, 262.0, 687.0, 2217.0, 8971.0, 48120.0, 452600.0, 472541.0, 50159.0, 9263.0, 2299.0, 759.0, 259.0, 98.0, 56.0, 31.0, 18.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.103759765625, -0.09961128234863281, -0.09546279907226562, -0.09131431579589844, -0.08716583251953125, -0.08301734924316406, -0.07886886596679688, -0.07472038269042969, -0.0705718994140625, -0.06642341613769531, -0.062274932861328125, -0.05812644958496094, -0.05397796630859375, -0.04982948303222656, -0.045680999755859375, -0.04153251647949219, -0.037384033203125, -0.03323554992675781, -0.029087066650390625, -0.024938583374023438, -0.02079010009765625, -0.016641616821289062, -0.012493133544921875, -0.008344650268554688, -0.0041961669921875, -4.76837158203125e-05, 0.004100799560546875, 0.008249282836914062, 0.01239776611328125, 0.016546249389648438, 0.020694732666015625, 0.024843215942382812, 0.02899169921875, 0.03314018249511719, 0.037288665771484375, 0.04143714904785156, 0.04558563232421875, 0.04973411560058594, 0.053882598876953125, 0.05803108215332031, 0.0621795654296875, 0.06632804870605469, 0.07047653198242188, 0.07462501525878906, 0.07877349853515625, 0.08292198181152344, 0.08707046508789062, 0.09121894836425781, 0.095367431640625, 0.09951591491699219, 0.10366439819335938, 0.10781288146972656, 0.11196136474609375, 0.11610984802246094, 0.12025833129882812, 0.12440681457519531, 0.1285552978515625, 0.1327037811279297, 0.13685226440429688, 0.14100074768066406, 0.14514923095703125, 0.14929771423339844, 0.15344619750976562, 0.1575946807861328, 0.1617431640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 3.0, 4.0, 13.0, 7.0, 7.0, 12.0, 17.0, 25.0, 17.0, 25.0, 35.0, 53.0, 63.0, 58.0, 66.0, 77.0, 78.0, 73.0, 57.0, 48.0, 60.0, 38.0, 40.0, 19.0, 23.0, 20.0, 14.0, 6.0, 15.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.529424667358398e-05, -8.270237594842911e-05, -8.011050522327423e-05, -7.751863449811935e-05, -7.492676377296448e-05, -7.23348930478096e-05, -6.974302232265472e-05, -6.715115159749985e-05, -6.455928087234497e-05, -6.19674101471901e-05, -5.937553942203522e-05, -5.678366869688034e-05, -5.4191797971725464e-05, -5.159992724657059e-05, -4.900805652141571e-05, -4.6416185796260834e-05, -4.382431507110596e-05, -4.123244434595108e-05, -3.8640573620796204e-05, -3.604870289564133e-05, -3.345683217048645e-05, -3.0864961445331573e-05, -2.8273090720176697e-05, -2.568121999502182e-05, -2.3089349269866943e-05, -2.0497478544712067e-05, -1.790560781955719e-05, -1.5313737094402313e-05, -1.2721866369247437e-05, -1.012999564409256e-05, -7.538124918937683e-06, -4.946254193782806e-06, -2.3543834686279297e-06, 2.3748725652694702e-07, 2.8293579816818237e-06, 5.4212287068367004e-06, 8.013099431991577e-06, 1.0604970157146454e-05, 1.319684088230133e-05, 1.5788711607456207e-05, 1.8380582332611084e-05, 2.097245305776596e-05, 2.3564323782920837e-05, 2.6156194508075714e-05, 2.874806523323059e-05, 3.133993595838547e-05, 3.3931806683540344e-05, 3.652367740869522e-05, 3.91155481338501e-05, 4.1707418859004974e-05, 4.429928958415985e-05, 4.689116030931473e-05, 4.9483031034469604e-05, 5.207490175962448e-05, 5.466677248477936e-05, 5.7258643209934235e-05, 5.985051393508911e-05, 6.244238466024399e-05, 6.503425538539886e-05, 6.762612611055374e-05, 7.021799683570862e-05, 7.28098675608635e-05, 7.540173828601837e-05, 7.799360901117325e-05, 8.058547973632812e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 9.0, 24.0, 33.0, 37.0, 47.0, 93.0, 132.0, 245.0, 461.0, 1056.0, 2847.0, 8872.0, 40139.0, 320006.0, 578183.0, 75284.0, 14221.0, 3979.0, 1498.0, 620.0, 325.0, 167.0, 85.0, 64.0, 44.0, 21.0, 20.0, 12.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10693359375, -0.10326766967773438, -0.09960174560546875, -0.09593582153320312, -0.0922698974609375, -0.08860397338867188, -0.08493804931640625, -0.08127212524414062, -0.077606201171875, -0.07394027709960938, -0.07027435302734375, -0.06660842895507812, -0.0629425048828125, -0.059276580810546875, -0.05561065673828125, -0.051944732666015625, -0.04827880859375, -0.044612884521484375, -0.04094696044921875, -0.037281036376953125, -0.0336151123046875, -0.029949188232421875, -0.02628326416015625, -0.022617340087890625, -0.018951416015625, -0.015285491943359375, -0.01161956787109375, -0.007953643798828125, -0.0042877197265625, -0.000621795654296875, 0.00304412841796875, 0.006710052490234375, 0.0103759765625, 0.014041900634765625, 0.01770782470703125, 0.021373748779296875, 0.0250396728515625, 0.028705596923828125, 0.03237152099609375, 0.036037445068359375, 0.039703369140625, 0.043369293212890625, 0.04703521728515625, 0.050701141357421875, 0.0543670654296875, 0.058032989501953125, 0.06169891357421875, 0.06536483764648438, 0.06903076171875, 0.07269668579101562, 0.07636260986328125, 0.08002853393554688, 0.0836944580078125, 0.08736038208007812, 0.09102630615234375, 0.09469223022460938, 0.098358154296875, 0.10202407836914062, 0.10569000244140625, 0.10935592651367188, 0.1130218505859375, 0.11668777465820312, 0.12035369873046875, 0.12401962280273438, 0.127685546875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 6.0, 8.0, 8.0, 12.0, 14.0, 25.0, 37.0, 55.0, 69.0, 84.0, 110.0, 104.0, 124.0, 87.0, 64.0, 64.0, 39.0, 23.0, 11.0, 12.0, 13.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06494140625, -0.062483787536621094, -0.06002616882324219, -0.05756855010986328, -0.055110931396484375, -0.05265331268310547, -0.05019569396972656, -0.047738075256347656, -0.04528045654296875, -0.042822837829589844, -0.04036521911621094, -0.03790760040283203, -0.035449981689453125, -0.03299236297607422, -0.030534744262695312, -0.028077125549316406, -0.0256195068359375, -0.023161888122558594, -0.020704269409179688, -0.01824665069580078, -0.015789031982421875, -0.013331413269042969, -0.010873794555664062, -0.008416175842285156, -0.00595855712890625, -0.0035009384155273438, -0.0010433197021484375, 0.0014142990112304688, 0.003871917724609375, 0.006329536437988281, 0.008787155151367188, 0.011244773864746094, 0.013702392578125, 0.016160011291503906, 0.018617630004882812, 0.02107524871826172, 0.023532867431640625, 0.02599048614501953, 0.028448104858398438, 0.030905723571777344, 0.03336334228515625, 0.035820960998535156, 0.03827857971191406, 0.04073619842529297, 0.043193817138671875, 0.04565143585205078, 0.04810905456542969, 0.050566673278808594, 0.0530242919921875, 0.055481910705566406, 0.05793952941894531, 0.06039714813232422, 0.06285476684570312, 0.06531238555908203, 0.06777000427246094, 0.07022762298583984, 0.07268524169921875, 0.07514286041259766, 0.07760047912597656, 0.08005809783935547, 0.08251571655273438, 0.08497333526611328, 0.08743095397949219, 0.0898885726928711, 0.09234619140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 11.0, 47.0, 148.0, 230.0, 271.0, 170.0, 85.0, 24.0, 10.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0983920097351074, -1.0309560298919678, -0.9635199308395386, -0.8960839509963989, -0.8286479115486145, -0.7612118721008301, -0.6937758922576904, -0.626339852809906, -0.5589038133621216, -0.49146777391433716, -0.4240317642688751, -0.3565957546234131, -0.28915971517562866, -0.22172367572784424, -0.1542876660823822, -0.08685165643692017, -0.019415616989135742, 0.04802040755748749, 0.11545643210411072, 0.18289245665073395, 0.2503284811973572, 0.3177645206451416, 0.38520053029060364, 0.4526365399360657, 0.5200725793838501, 0.5875086188316345, 0.654944658279419, 0.7223806381225586, 0.789816677570343, 0.8572527170181274, 0.9246886968612671, 0.9921247363090515, 1.059560775756836, 1.1269967555999756, 1.1944328546524048, 1.2618688344955444, 1.3293049335479736, 1.3967409133911133, 1.464176893234253, 1.5316128730773926, 1.5990489721298218, 1.6664849519729614, 1.7339210510253906, 1.8013570308685303, 1.86879301071167, 1.9362291097640991, 2.0036652088165283, 2.071101188659668, 2.1385371685028076, 2.2059731483459473, 2.273409128189087, 2.3408453464508057, 2.4082813262939453, 2.475717306137085, 2.5431532859802246, 2.6105892658233643, 2.678025245666504, 2.7454612255096436, 2.812897205352783, 2.880333423614502, 2.9477694034576416, 3.0152053833007812, 3.082641363143921, 3.1500773429870605, 3.2175135612487793]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 8.0, 14.0, 13.0, 18.0, 24.0, 30.0, 22.0, 38.0, 39.0, 60.0, 49.0, 52.0, 63.0, 58.0, 59.0, 70.0, 63.0, 50.0, 39.0, 49.0, 34.0, 38.0, 18.0, 21.0, 17.0, 13.0, 12.0, 4.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0601372718811035, -1.0322436094284058, -1.004349946975708, -0.9764561653137207, -0.948562502861023, -0.9206688404083252, -0.8927751183509827, -0.8648813962936401, -0.8369877338409424, -0.8090940713882446, -0.7812003493309021, -0.7533066272735596, -0.7254129648208618, -0.6975193023681641, -0.6696255803108215, -0.641731858253479, -0.6138381958007812, -0.5859445333480835, -0.558050811290741, -0.5301570892333984, -0.5022634267807007, -0.47436973452568054, -0.4464760422706604, -0.41858235001564026, -0.3906886577606201, -0.3627949655056, -0.33490127325057983, -0.3070075809955597, -0.27911388874053955, -0.2512201964855194, -0.22332650423049927, -0.19543281197547913, -0.1675390601158142, -0.13964536786079407, -0.11175167560577393, -0.08385798335075378, -0.05596429109573364, -0.0280705988407135, -0.00017690658569335938, 0.027716785669326782, 0.055610477924346924, 0.08350417017936707, 0.11139786243438721, 0.13929155468940735, 0.1671852469444275, 0.19507893919944763, 0.22297263145446777, 0.2508663237094879, 0.27876001596450806, 0.3066537082195282, 0.33454740047454834, 0.3624410927295685, 0.3903347849845886, 0.41822847723960876, 0.4461221694946289, 0.47401586174964905, 0.5019095540046692, 0.5298032760620117, 0.5576969385147095, 0.5855906009674072, 0.6134843230247498, 0.6413780450820923, 0.66927170753479, 0.6971653699874878, 0.7250590920448303]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 8.0, 8.0, 11.0, 18.0, 15.0, 32.0, 67.0, 87.0, 190.0, 292.0, 513.0, 1064.0, 2070.0, 4820.0, 12212.0, 36979.0, 162584.0, 3032135.0, 808167.0, 92017.0, 24793.0, 8718.0, 3775.0, 1637.0, 901.0, 457.0, 255.0, 171.0, 106.0, 67.0, 34.0, 26.0, 22.0, 15.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.164306640625, -0.15914535522460938, -0.15398406982421875, -0.14882278442382812, -0.1436614990234375, -0.13850021362304688, -0.13333892822265625, -0.12817764282226562, -0.123016357421875, -0.11785507202148438, -0.11269378662109375, -0.10753250122070312, -0.1023712158203125, -0.09720993041992188, -0.09204864501953125, -0.08688735961914062, -0.08172607421875, -0.07656478881835938, -0.07140350341796875, -0.06624221801757812, -0.0610809326171875, -0.055919647216796875, -0.05075836181640625, -0.045597076416015625, -0.040435791015625, -0.035274505615234375, -0.03011322021484375, -0.024951934814453125, -0.0197906494140625, -0.014629364013671875, -0.00946807861328125, -0.004306793212890625, 0.0008544921875, 0.006015777587890625, 0.01117706298828125, 0.016338348388671875, 0.0214996337890625, 0.026660919189453125, 0.03182220458984375, 0.036983489990234375, 0.042144775390625, 0.047306060791015625, 0.05246734619140625, 0.057628631591796875, 0.0627899169921875, 0.06795120239257812, 0.07311248779296875, 0.07827377319335938, 0.08343505859375, 0.08859634399414062, 0.09375762939453125, 0.09891891479492188, 0.1040802001953125, 0.10924148559570312, 0.11440277099609375, 0.11956405639648438, 0.124725341796875, 0.12988662719726562, 0.13504791259765625, 0.14020919799804688, 0.1453704833984375, 0.15053176879882812, 0.15569305419921875, 0.16085433959960938, 0.166015625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 9.0, 14.0, 22.0, 28.0, 40.0, 52.0, 73.0, 87.0, 106.0, 85.0, 93.0, 68.0, 77.0, 66.0, 43.0, 33.0, 31.0, 15.0, 20.0, 11.0, 10.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0452880859375, -0.043773651123046875, -0.04225921630859375, -0.040744781494140625, -0.0392303466796875, -0.037715911865234375, -0.03620147705078125, -0.034687042236328125, -0.033172607421875, -0.031658172607421875, -0.03014373779296875, -0.028629302978515625, -0.0271148681640625, -0.025600433349609375, -0.02408599853515625, -0.022571563720703125, -0.02105712890625, -0.019542694091796875, -0.01802825927734375, -0.016513824462890625, -0.0149993896484375, -0.013484954833984375, -0.01197052001953125, -0.010456085205078125, -0.008941650390625, -0.007427215576171875, -0.00591278076171875, -0.004398345947265625, -0.0028839111328125, -0.001369476318359375, 0.00014495849609375, 0.001659393310546875, 0.003173828125, 0.004688262939453125, 0.00620269775390625, 0.007717132568359375, 0.0092315673828125, 0.010746002197265625, 0.01226043701171875, 0.013774871826171875, 0.015289306640625, 0.016803741455078125, 0.01831817626953125, 0.019832611083984375, 0.0213470458984375, 0.022861480712890625, 0.02437591552734375, 0.025890350341796875, 0.02740478515625, 0.028919219970703125, 0.03043365478515625, 0.031948089599609375, 0.0334625244140625, 0.034976959228515625, 0.03649139404296875, 0.038005828857421875, 0.039520263671875, 0.041034698486328125, 0.04254913330078125, 0.044063568115234375, 0.0455780029296875, 0.047092437744140625, 0.04860687255859375, 0.050121307373046875, 0.0516357421875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 6.0, 4.0, 9.0, 5.0, 13.0, 14.0, 9.0, 33.0, 33.0, 59.0, 95.0, 137.0, 241.0, 435.0, 818.0, 1636.0, 3674.0, 8841.0, 24660.0, 79790.0, 355200.0, 2772875.0, 751955.0, 132669.0, 38043.0, 13334.0, 5114.0, 2193.0, 1023.0, 598.0, 261.0, 195.0, 100.0, 67.0, 43.0, 32.0, 17.0, 14.0, 9.0, 7.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.138916015625, -0.13479232788085938, -0.13066864013671875, -0.12654495239257812, -0.1224212646484375, -0.11829757690429688, -0.11417388916015625, -0.11005020141601562, -0.105926513671875, -0.10180282592773438, -0.09767913818359375, -0.09355545043945312, -0.0894317626953125, -0.08530807495117188, -0.08118438720703125, -0.07706069946289062, -0.07293701171875, -0.06881332397460938, -0.06468963623046875, -0.060565948486328125, -0.0564422607421875, -0.052318572998046875, -0.04819488525390625, -0.044071197509765625, -0.039947509765625, -0.035823822021484375, -0.03170013427734375, -0.027576446533203125, -0.0234527587890625, -0.019329071044921875, -0.01520538330078125, -0.011081695556640625, -0.0069580078125, -0.002834320068359375, 0.00128936767578125, 0.005413055419921875, 0.0095367431640625, 0.013660430908203125, 0.01778411865234375, 0.021907806396484375, 0.026031494140625, 0.030155181884765625, 0.03427886962890625, 0.038402557373046875, 0.0425262451171875, 0.046649932861328125, 0.05077362060546875, 0.054897308349609375, 0.05902099609375, 0.06314468383789062, 0.06726837158203125, 0.07139205932617188, 0.0755157470703125, 0.07963943481445312, 0.08376312255859375, 0.08788681030273438, 0.092010498046875, 0.09613418579101562, 0.10025787353515625, 0.10438156127929688, 0.1085052490234375, 0.11262893676757812, 0.11675262451171875, 0.12087631225585938, 0.125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 0.0, 8.0, 8.0, 9.0, 15.0, 19.0, 24.0, 32.0, 37.0, 55.0, 88.0, 117.0, 181.0, 273.0, 515.0, 922.0, 693.0, 346.0, 221.0, 139.0, 79.0, 71.0, 47.0, 37.0, 30.0, 25.0, 16.0, 22.0, 5.0, 6.0, 6.0, 8.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047088623046875, -0.04532766342163086, -0.04356670379638672, -0.04180574417114258, -0.04004478454589844, -0.0382838249206543, -0.036522865295410156, -0.034761905670166016, -0.033000946044921875, -0.031239986419677734, -0.029479026794433594, -0.027718067169189453, -0.025957107543945312, -0.024196147918701172, -0.02243518829345703, -0.02067422866821289, -0.01891326904296875, -0.01715230941772461, -0.015391349792480469, -0.013630390167236328, -0.011869430541992188, -0.010108470916748047, -0.008347511291503906, -0.006586551666259766, -0.004825592041015625, -0.0030646324157714844, -0.0013036727905273438, 0.0004572868347167969, 0.0022182464599609375, 0.003979206085205078, 0.005740165710449219, 0.007501125335693359, 0.0092620849609375, 0.01102304458618164, 0.012784004211425781, 0.014544963836669922, 0.016305923461914062, 0.018066883087158203, 0.019827842712402344, 0.021588802337646484, 0.023349761962890625, 0.025110721588134766, 0.026871681213378906, 0.028632640838623047, 0.030393600463867188, 0.03215456008911133, 0.03391551971435547, 0.03567647933959961, 0.03743743896484375, 0.03919839859008789, 0.04095935821533203, 0.04272031784057617, 0.04448127746582031, 0.04624223709106445, 0.048003196716308594, 0.049764156341552734, 0.051525115966796875, 0.053286075592041016, 0.055047035217285156, 0.0568079948425293, 0.05856895446777344, 0.06032991409301758, 0.06209087371826172, 0.06385183334350586, 0.06561279296875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 10.0, 25.0, 32.0, 72.0, 141.0, 190.0, 194.0, 157.0, 94.0, 39.0, 25.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5548077821731567, -0.5319732427597046, -0.5091387629508972, -0.48630422353744507, -0.4634696841239929, -0.44063517451286316, -0.4178006649017334, -0.39496612548828125, -0.3721315860748291, -0.34929707646369934, -0.3264625370502472, -0.30362802743911743, -0.2807934880256653, -0.2579589784145355, -0.23512445390224457, -0.2122899293899536, -0.18945541977882385, -0.1666208952665329, -0.14378637075424194, -0.12095185369253159, -0.09811732918024063, -0.07528280466794968, -0.05244828760623932, -0.029613763093948364, -0.00677923858165741, 0.016055284067988396, 0.0388898067176342, 0.06172432750463486, 0.08455885201692581, 0.10739337652921677, 0.13022789359092712, 0.15306241810321808, 0.17589694261550903, 0.1987314671278, 0.22156599164009094, 0.2444005012512207, 0.26723504066467285, 0.2900695502758026, 0.3129040598869324, 0.3357385993003845, 0.35857313871383667, 0.38140764832496643, 0.4042421877384186, 0.42707669734954834, 0.4499112367630005, 0.47274574637413025, 0.49558025598526, 0.5184147953987122, 0.5412492752075195, 0.5640838146209717, 0.586918294429779, 0.6097528338432312, 0.6325873732566833, 0.6554219126701355, 0.6782563924789429, 0.701090931892395, 0.7239254713058472, 0.7467600107192993, 0.7695944905281067, 0.7924290299415588, 0.815263569355011, 0.8380981087684631, 0.8609325885772705, 0.8837671279907227, 0.9066016674041748]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 9.0, 10.0, 8.0, 11.0, 12.0, 17.0, 16.0, 29.0, 33.0, 19.0, 24.0, 27.0, 28.0, 32.0, 30.0, 41.0, 31.0, 42.0, 39.0, 44.0, 35.0, 36.0, 37.0, 44.0, 45.0, 37.0, 32.0, 34.0, 30.0, 23.0, 21.0, 24.0, 15.0, 13.0, 18.0, 8.0, 9.0, 8.0, 5.0, 6.0, 1.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0], "bins": [-0.23109257221221924, -0.22414252161979675, -0.21719247102737427, -0.21024242043495178, -0.2032923549413681, -0.19634230434894562, -0.18939225375652313, -0.18244220316410065, -0.17549213767051697, -0.16854208707809448, -0.161592036485672, -0.1546419858932495, -0.14769192039966583, -0.14074186980724335, -0.13379181921482086, -0.12684176862239838, -0.11989171802997589, -0.1129416674375534, -0.10599160939455032, -0.09904155880212784, -0.09209150075912476, -0.08514145016670227, -0.07819139957427979, -0.0712413489818573, -0.06429129093885422, -0.057341236621141434, -0.05039118230342865, -0.043441131711006165, -0.03649107739329338, -0.029541023075580597, -0.02259097248315811, -0.015640918165445328, -0.008690863847732544, -0.0017408104613423347, 0.0052092429250478745, 0.012159295380115509, 0.019109349697828293, 0.026059404015541077, 0.03300945460796356, 0.039959508925676346, 0.04690956324338913, 0.05385961756110191, 0.0608096718788147, 0.06775972247123718, 0.07470977306365967, 0.08165983110666275, 0.08860988169908524, 0.09555993974208832, 0.1025099903345108, 0.10946004092693329, 0.11641009896993637, 0.12336014956235886, 0.13031020760536194, 0.13726025819778442, 0.1442103087902069, 0.1511603593826294, 0.15811040997505188, 0.16506046056747437, 0.17201051115989685, 0.17896056175231934, 0.18591062724590302, 0.1928606778383255, 0.19981072843074799, 0.20676077902317047, 0.21371084451675415]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 15.0, 14.0, 33.0, 44.0, 74.0, 125.0, 164.0, 369.0, 666.0, 1460.0, 3597.0, 9832.0, 31016.0, 107243.0, 443507.0, 331702.0, 81494.0, 24110.0, 7751.0, 2820.0, 1170.0, 598.0, 279.0, 183.0, 107.0, 68.0, 42.0, 28.0, 14.0, 14.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1884765625, -0.18217086791992188, -0.17586517333984375, -0.16955947875976562, -0.1632537841796875, -0.15694808959960938, -0.15064239501953125, -0.14433670043945312, -0.138031005859375, -0.13172531127929688, -0.12541961669921875, -0.11911392211914062, -0.1128082275390625, -0.10650253295898438, -0.10019683837890625, -0.09389114379882812, -0.08758544921875, -0.08127975463867188, -0.07497406005859375, -0.06866836547851562, -0.0623626708984375, -0.056056976318359375, -0.04975128173828125, -0.043445587158203125, -0.037139892578125, -0.030834197998046875, -0.02452850341796875, -0.018222808837890625, -0.0119171142578125, -0.005611419677734375, 0.00069427490234375, 0.006999969482421875, 0.0133056640625, 0.019611358642578125, 0.02591705322265625, 0.032222747802734375, 0.0385284423828125, 0.044834136962890625, 0.05113983154296875, 0.057445526123046875, 0.063751220703125, 0.07005691528320312, 0.07636260986328125, 0.08266830444335938, 0.0889739990234375, 0.09527969360351562, 0.10158538818359375, 0.10789108276367188, 0.11419677734375, 0.12050247192382812, 0.12680816650390625, 0.13311386108398438, 0.1394195556640625, 0.14572525024414062, 0.15203094482421875, 0.15833663940429688, 0.164642333984375, 0.17094802856445312, 0.17725372314453125, 0.18355941772460938, 0.1898651123046875, 0.19617080688476562, 0.20247650146484375, 0.20878219604492188, 0.215087890625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 4.0, 18.0, 17.0, 31.0, 32.0, 49.0, 61.0, 89.0, 109.0, 102.0, 78.0, 87.0, 93.0, 52.0, 51.0, 36.0, 32.0, 17.0, 17.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046875, -0.04526042938232422, -0.04364585876464844, -0.042031288146972656, -0.040416717529296875, -0.038802146911621094, -0.03718757629394531, -0.03557300567626953, -0.03395843505859375, -0.03234386444091797, -0.030729293823242188, -0.029114723205566406, -0.027500152587890625, -0.025885581970214844, -0.024271011352539062, -0.02265644073486328, -0.0210418701171875, -0.01942729949951172, -0.017812728881835938, -0.016198158264160156, -0.014583587646484375, -0.012969017028808594, -0.011354446411132812, -0.009739875793457031, -0.00812530517578125, -0.006510734558105469, -0.0048961639404296875, -0.0032815933227539062, -0.001667022705078125, -5.245208740234375e-05, 0.0015621185302734375, 0.0031766891479492188, 0.004791259765625, 0.006405830383300781, 0.008020401000976562, 0.009634971618652344, 0.011249542236328125, 0.012864112854003906, 0.014478683471679688, 0.01609325408935547, 0.01770782470703125, 0.01932239532470703, 0.020936965942382812, 0.022551536560058594, 0.024166107177734375, 0.025780677795410156, 0.027395248413085938, 0.02900981903076172, 0.0306243896484375, 0.03223896026611328, 0.03385353088378906, 0.035468101501464844, 0.037082672119140625, 0.038697242736816406, 0.04031181335449219, 0.04192638397216797, 0.04354095458984375, 0.04515552520751953, 0.04677009582519531, 0.048384666442871094, 0.049999237060546875, 0.051613807678222656, 0.05322837829589844, 0.05484294891357422, 0.05645751953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 11.0, 9.0, 24.0, 23.0, 38.0, 55.0, 86.0, 125.0, 193.0, 340.0, 638.0, 1272.0, 2972.0, 8603.0, 30731.0, 127662.0, 511101.0, 276997.0, 62555.0, 16154.0, 5006.0, 1892.0, 857.0, 464.0, 300.0, 166.0, 86.0, 76.0, 33.0, 31.0, 20.0, 13.0, 9.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1824951171875, -0.1769237518310547, -0.17135238647460938, -0.16578102111816406, -0.16020965576171875, -0.15463829040527344, -0.14906692504882812, -0.1434955596923828, -0.1379241943359375, -0.1323528289794922, -0.12678146362304688, -0.12121009826660156, -0.11563873291015625, -0.11006736755371094, -0.10449600219726562, -0.09892463684082031, -0.093353271484375, -0.08778190612792969, -0.08221054077148438, -0.07663917541503906, -0.07106781005859375, -0.06549644470214844, -0.059925079345703125, -0.05435371398925781, -0.0487823486328125, -0.04321098327636719, -0.037639617919921875, -0.03206825256347656, -0.02649688720703125, -0.020925521850585938, -0.015354156494140625, -0.009782791137695312, -0.00421142578125, 0.0013599395751953125, 0.006931304931640625, 0.012502670288085938, 0.01807403564453125, 0.023645401000976562, 0.029216766357421875, 0.03478813171386719, 0.0403594970703125, 0.04593086242675781, 0.051502227783203125, 0.05707359313964844, 0.06264495849609375, 0.06821632385253906, 0.07378768920898438, 0.07935905456542969, 0.084930419921875, 0.09050178527832031, 0.09607315063476562, 0.10164451599121094, 0.10721588134765625, 0.11278724670410156, 0.11835861206054688, 0.12392997741699219, 0.1295013427734375, 0.1350727081298828, 0.14064407348632812, 0.14621543884277344, 0.15178680419921875, 0.15735816955566406, 0.16292953491210938, 0.1685009002685547, 0.174072265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 7.0, 14.0, 12.0, 16.0, 17.0, 13.0, 24.0, 23.0, 25.0, 32.0, 36.0, 45.0, 42.0, 36.0, 41.0, 35.0, 54.0, 51.0, 51.0, 35.0, 48.0, 52.0, 36.0, 29.0, 30.0, 23.0, 26.0, 23.0, 14.0, 19.0, 13.0, 14.0, 18.0, 9.0, 8.0, 7.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.131103515625, -0.1270771026611328, -0.12305068969726562, -0.11902427673339844, -0.11499786376953125, -0.11097145080566406, -0.10694503784179688, -0.10291862487792969, -0.0988922119140625, -0.09486579895019531, -0.09083938598632812, -0.08681297302246094, -0.08278656005859375, -0.07876014709472656, -0.07473373413085938, -0.07070732116699219, -0.066680908203125, -0.06265449523925781, -0.058628082275390625, -0.05460166931152344, -0.05057525634765625, -0.04654884338378906, -0.042522430419921875, -0.03849601745605469, -0.0344696044921875, -0.030443191528320312, -0.026416778564453125, -0.022390365600585938, -0.01836395263671875, -0.014337539672851562, -0.010311126708984375, -0.0062847137451171875, -0.00225830078125, 0.0017681121826171875, 0.005794525146484375, 0.009820938110351562, 0.01384735107421875, 0.017873764038085938, 0.021900177001953125, 0.025926589965820312, 0.0299530029296875, 0.03397941589355469, 0.038005828857421875, 0.04203224182128906, 0.04605865478515625, 0.05008506774902344, 0.054111480712890625, 0.05813789367675781, 0.062164306640625, 0.06619071960449219, 0.07021713256835938, 0.07424354553222656, 0.07826995849609375, 0.08229637145996094, 0.08632278442382812, 0.09034919738769531, 0.0943756103515625, 0.09840202331542969, 0.10242843627929688, 0.10645484924316406, 0.11048126220703125, 0.11450767517089844, 0.11853408813476562, 0.12256050109863281, 0.1265869140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 12.0, 2.0, 9.0, 14.0, 22.0, 21.0, 52.0, 79.0, 118.0, 208.0, 359.0, 612.0, 1288.0, 3015.0, 7819.0, 23608.0, 94066.0, 489736.0, 335278.0, 63990.0, 17509.0, 6039.0, 2381.0, 1021.0, 583.0, 298.0, 147.0, 95.0, 61.0, 42.0, 17.0, 17.0, 12.0, 10.0, 6.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11175537109375, -0.10835552215576172, -0.10495567321777344, -0.10155582427978516, -0.09815597534179688, -0.0947561264038086, -0.09135627746582031, -0.08795642852783203, -0.08455657958984375, -0.08115673065185547, -0.07775688171386719, -0.0743570327758789, -0.07095718383789062, -0.06755733489990234, -0.06415748596191406, -0.06075763702392578, -0.0573577880859375, -0.05395793914794922, -0.05055809020996094, -0.047158241271972656, -0.043758392333984375, -0.040358543395996094, -0.03695869445800781, -0.03355884552001953, -0.03015899658203125, -0.02675914764404297, -0.023359298706054688, -0.019959449768066406, -0.016559600830078125, -0.013159751892089844, -0.009759902954101562, -0.006360054016113281, -0.002960205078125, 0.00043964385986328125, 0.0038394927978515625, 0.007239341735839844, 0.010639190673828125, 0.014039039611816406, 0.017438888549804688, 0.02083873748779297, 0.02423858642578125, 0.02763843536376953, 0.031038284301757812, 0.034438133239746094, 0.037837982177734375, 0.041237831115722656, 0.04463768005371094, 0.04803752899169922, 0.0514373779296875, 0.05483722686767578, 0.05823707580566406, 0.061636924743652344, 0.06503677368164062, 0.0684366226196289, 0.07183647155761719, 0.07523632049560547, 0.07863616943359375, 0.08203601837158203, 0.08543586730957031, 0.0888357162475586, 0.09223556518554688, 0.09563541412353516, 0.09903526306152344, 0.10243511199951172, 0.1058349609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 10.0, 16.0, 22.0, 21.0, 29.0, 35.0, 43.0, 39.0, 57.0, 55.0, 79.0, 96.0, 86.0, 72.0, 59.0, 50.0, 45.0, 30.0, 34.0, 23.0, 16.0, 20.0, 13.0, 6.0, 9.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.189678192138672e-05, -7.906835526227951e-05, -7.62399286031723e-05, -7.34115019440651e-05, -7.058307528495789e-05, -6.775464862585068e-05, -6.492622196674347e-05, -6.209779530763626e-05, -5.926936864852905e-05, -5.6440941989421844e-05, -5.3612515330314636e-05, -5.078408867120743e-05, -4.795566201210022e-05, -4.512723535299301e-05, -4.22988086938858e-05, -3.9470382034778595e-05, -3.664195537567139e-05, -3.381352871656418e-05, -3.098510205745697e-05, -2.8156675398349762e-05, -2.5328248739242554e-05, -2.2499822080135345e-05, -1.9671395421028137e-05, -1.684296876192093e-05, -1.401454210281372e-05, -1.1186115443706512e-05, -8.357688784599304e-06, -5.529262125492096e-06, -2.7008354663848877e-06, 1.2759119272232056e-07, 2.956017851829529e-06, 5.784444510936737e-06, 8.612871170043945e-06, 1.1441297829151154e-05, 1.4269724488258362e-05, 1.709815114736557e-05, 1.992657780647278e-05, 2.2755004465579987e-05, 2.5583431124687195e-05, 2.8411857783794403e-05, 3.124028444290161e-05, 3.406871110200882e-05, 3.689713776111603e-05, 3.9725564420223236e-05, 4.2553991079330444e-05, 4.538241773843765e-05, 4.821084439754486e-05, 5.103927105665207e-05, 5.386769771575928e-05, 5.6696124374866486e-05, 5.9524551033973694e-05, 6.23529776930809e-05, 6.518140435218811e-05, 6.800983101129532e-05, 7.083825767040253e-05, 7.366668432950974e-05, 7.649511098861694e-05, 7.932353764772415e-05, 8.215196430683136e-05, 8.498039096593857e-05, 8.780881762504578e-05, 9.063724428415298e-05, 9.346567094326019e-05, 9.62940976023674e-05, 9.912252426147461e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 7.0, 8.0, 3.0, 14.0, 23.0, 23.0, 32.0, 53.0, 69.0, 121.0, 174.0, 282.0, 492.0, 934.0, 2063.0, 4792.0, 12981.0, 43507.0, 193557.0, 573737.0, 159208.0, 36922.0, 11416.0, 4227.0, 1771.0, 894.0, 476.0, 271.0, 163.0, 109.0, 57.0, 50.0, 34.0, 21.0, 15.0, 12.0, 10.0, 7.0, 7.0, 3.0, 6.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.07875251770019531, -0.07565689086914062, -0.07256126403808594, -0.06946563720703125, -0.06637001037597656, -0.06327438354492188, -0.06017875671386719, -0.0570831298828125, -0.05398750305175781, -0.050891876220703125, -0.04779624938964844, -0.04470062255859375, -0.04160499572753906, -0.038509368896484375, -0.03541374206542969, -0.032318115234375, -0.029222488403320312, -0.026126861572265625, -0.023031234741210938, -0.01993560791015625, -0.016839981079101562, -0.013744354248046875, -0.010648727416992188, -0.0075531005859375, -0.0044574737548828125, -0.001361846923828125, 0.0017337799072265625, 0.00482940673828125, 0.007925033569335938, 0.011020660400390625, 0.014116287231445312, 0.0172119140625, 0.020307540893554688, 0.023403167724609375, 0.026498794555664062, 0.02959442138671875, 0.03269004821777344, 0.035785675048828125, 0.03888130187988281, 0.0419769287109375, 0.04507255554199219, 0.048168182373046875, 0.05126380920410156, 0.05435943603515625, 0.05745506286621094, 0.060550689697265625, 0.06364631652832031, 0.066741943359375, 0.06983757019042969, 0.07293319702148438, 0.07602882385253906, 0.07912445068359375, 0.08222007751464844, 0.08531570434570312, 0.08841133117675781, 0.0915069580078125, 0.09460258483886719, 0.09769821166992188, 0.10079383850097656, 0.10388946533203125, 0.10698509216308594, 0.11008071899414062, 0.11317634582519531, 0.11627197265625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 7.0, 5.0, 17.0, 10.0, 15.0, 19.0, 27.0, 36.0, 36.0, 44.0, 62.0, 78.0, 105.0, 89.0, 88.0, 79.0, 51.0, 40.0, 41.0, 28.0, 25.0, 18.0, 17.0, 10.0, 11.0, 11.0, 6.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06231689453125, -0.060210227966308594, -0.05810356140136719, -0.05599689483642578, -0.053890228271484375, -0.05178356170654297, -0.04967689514160156, -0.047570228576660156, -0.04546356201171875, -0.043356895446777344, -0.04125022888183594, -0.03914356231689453, -0.037036895751953125, -0.03493022918701172, -0.03282356262207031, -0.030716896057128906, -0.0286102294921875, -0.026503562927246094, -0.024396896362304688, -0.02229022979736328, -0.020183563232421875, -0.01807689666748047, -0.015970230102539062, -0.013863563537597656, -0.01175689697265625, -0.009650230407714844, -0.0075435638427734375, -0.005436897277832031, -0.003330230712890625, -0.0012235641479492188, 0.0008831024169921875, 0.0029897689819335938, 0.005096435546875, 0.007203102111816406, 0.009309768676757812, 0.011416435241699219, 0.013523101806640625, 0.01562976837158203, 0.017736434936523438, 0.019843101501464844, 0.02194976806640625, 0.024056434631347656, 0.026163101196289062, 0.02826976776123047, 0.030376434326171875, 0.03248310089111328, 0.03458976745605469, 0.036696434020996094, 0.0388031005859375, 0.040909767150878906, 0.04301643371582031, 0.04512310028076172, 0.047229766845703125, 0.04933643341064453, 0.05144309997558594, 0.053549766540527344, 0.05565643310546875, 0.057763099670410156, 0.05986976623535156, 0.06197643280029297, 0.06408309936523438, 0.06618976593017578, 0.06829643249511719, 0.0704030990600586, 0.072509765625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 8.0, 6.0, 17.0, 19.0, 38.0, 50.0, 97.0, 122.0, 129.0, 122.0, 133.0, 88.0, 88.0, 35.0, 22.0, 9.0, 13.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5888552665710449, -0.5526053309440613, -0.5163554549217224, -0.48010551929473877, -0.4438556134700775, -0.40760570764541626, -0.3713557720184326, -0.33510586619377136, -0.2988559603691101, -0.26260605454444885, -0.2263561338186264, -0.19010621309280396, -0.1538563072681427, -0.11760640144348145, -0.081356480717659, -0.04510655999183655, -0.008856654167175293, 0.02739325910806656, 0.06364317238330841, 0.09989308565855026, 0.13614299893379211, 0.17239290475845337, 0.20864282548427582, 0.24489274621009827, 0.2811426520347595, 0.3173925578594208, 0.35364246368408203, 0.3898923993110657, 0.42614230513572693, 0.4623922109603882, 0.4986421465873718, 0.5348920822143555, 0.5711419582366943, 0.607391893863678, 0.6436417698860168, 0.6798917055130005, 0.7161415815353394, 0.752391517162323, 0.7886414527893066, 0.8248913288116455, 0.8611412644386292, 0.8973912000656128, 0.9336410760879517, 0.9698910117149353, 1.006140947341919, 1.0423908233642578, 1.0786406993865967, 1.114890694618225, 1.151140570640564, 1.1873904466629028, 1.2236404418945312, 1.2598903179168701, 1.296140193939209, 1.3323900699615479, 1.3686400651931763, 1.4048899412155151, 1.4411399364471436, 1.4773898124694824, 1.5136398077011108, 1.5498896837234497, 1.5861395597457886, 1.622389554977417, 1.6586394309997559, 1.6948893070220947, 1.7311391830444336]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 9.0, 4.0, 7.0, 12.0, 14.0, 16.0, 18.0, 16.0, 24.0, 34.0, 35.0, 34.0, 47.0, 34.0, 43.0, 47.0, 44.0, 47.0, 47.0, 50.0, 52.0, 41.0, 35.0, 43.0, 36.0, 36.0, 30.0, 31.0, 22.0, 20.0, 17.0, 14.0, 10.0, 12.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7124967575073242, -0.6862809062004089, -0.6600650548934937, -0.6338492631912231, -0.6076334118843079, -0.5814175605773926, -0.5552017688751221, -0.5289859175682068, -0.5027700662612915, -0.4765542149543762, -0.4503383934497833, -0.42412257194519043, -0.39790672063827515, -0.37169086933135986, -0.34547504782676697, -0.3192592263221741, -0.2930433750152588, -0.2668275237083435, -0.2406117022037506, -0.21439586579799652, -0.18818002939224243, -0.16196419298648834, -0.13574835658073425, -0.10953252017498016, -0.08331668376922607, -0.057100847363471985, -0.030885010957717896, -0.004669174551963806, 0.021546661853790283, 0.04776249825954437, 0.07397833466529846, 0.10019417107105255, 0.12640994787216187, 0.15262578427791595, 0.17884162068367004, 0.20505745708942413, 0.23127329349517822, 0.2574891448020935, 0.2837049663066864, 0.3099207878112793, 0.3361366391181946, 0.36235249042510986, 0.38856831192970276, 0.41478413343429565, 0.44099998474121094, 0.4672158360481262, 0.4934316575527191, 0.519647479057312, 0.5458633303642273, 0.5720791816711426, 0.5982949733734131, 0.6245108246803284, 0.6507266759872437, 0.6769425272941589, 0.7031583786010742, 0.7293741703033447, 0.75559002161026, 0.7818058729171753, 0.8080216646194458, 0.8342375159263611, 0.8604533672332764, 0.8866692185401917, 0.9128850698471069, 0.9391008615493774, 0.9653167128562927]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 9.0, 3.0, 4.0, 3.0, 14.0, 17.0, 17.0, 39.0, 60.0, 85.0, 122.0, 206.0, 382.0, 609.0, 1221.0, 2438.0, 5267.0, 13525.0, 42526.0, 199647.0, 3392947.0, 434695.0, 67255.0, 19272.0, 7111.0, 3194.0, 1533.0, 849.0, 494.0, 280.0, 178.0, 85.0, 60.0, 36.0, 43.0, 22.0, 16.0, 11.0, 6.0, 2.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.14788818359375, -0.14306640625, -0.13824462890625, -0.1334228515625, -0.12860107421875, -0.123779296875, -0.11895751953125, -0.1141357421875, -0.10931396484375, -0.1044921875, -0.09967041015625, -0.0948486328125, -0.09002685546875, -0.085205078125, -0.08038330078125, -0.0755615234375, -0.07073974609375, -0.06591796875, -0.06109619140625, -0.0562744140625, -0.05145263671875, -0.046630859375, -0.04180908203125, -0.0369873046875, -0.03216552734375, -0.02734375, -0.02252197265625, -0.0177001953125, -0.01287841796875, -0.008056640625, -0.00323486328125, 0.0015869140625, 0.00640869140625, 0.01123046875, 0.01605224609375, 0.0208740234375, 0.02569580078125, 0.030517578125, 0.03533935546875, 0.0401611328125, 0.04498291015625, 0.0498046875, 0.05462646484375, 0.0594482421875, 0.06427001953125, 0.069091796875, 0.07391357421875, 0.0787353515625, 0.08355712890625, 0.08837890625, 0.09320068359375, 0.0980224609375, 0.10284423828125, 0.107666015625, 0.11248779296875, 0.1173095703125, 0.12213134765625, 0.126953125, 0.13177490234375, 0.1365966796875, 0.14141845703125, 0.146240234375, 0.15106201171875, 0.1558837890625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 10.0, 12.0, 20.0, 16.0, 36.0, 52.0, 51.0, 76.0, 76.0, 99.0, 93.0, 69.0, 78.0, 75.0, 59.0, 51.0, 31.0, 31.0, 18.0, 19.0, 4.0, 9.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05194091796875, -0.050345420837402344, -0.04874992370605469, -0.04715442657470703, -0.045558929443359375, -0.04396343231201172, -0.04236793518066406, -0.040772438049316406, -0.03917694091796875, -0.037581443786621094, -0.03598594665527344, -0.03439044952392578, -0.032794952392578125, -0.03119945526123047, -0.029603958129882812, -0.028008460998535156, -0.0264129638671875, -0.024817466735839844, -0.023221969604492188, -0.02162647247314453, -0.020030975341796875, -0.01843547821044922, -0.016839981079101562, -0.015244483947753906, -0.01364898681640625, -0.012053489685058594, -0.010457992553710938, -0.008862495422363281, -0.007266998291015625, -0.005671501159667969, -0.0040760040283203125, -0.0024805068969726562, -0.000885009765625, 0.0007104873657226562, 0.0023059844970703125, 0.0039014816284179688, 0.005496978759765625, 0.007092475891113281, 0.008687973022460938, 0.010283470153808594, 0.01187896728515625, 0.013474464416503906, 0.015069961547851562, 0.01666545867919922, 0.018260955810546875, 0.01985645294189453, 0.021451950073242188, 0.023047447204589844, 0.0246429443359375, 0.026238441467285156, 0.027833938598632812, 0.02942943572998047, 0.031024932861328125, 0.03262042999267578, 0.03421592712402344, 0.035811424255371094, 0.03740692138671875, 0.039002418518066406, 0.04059791564941406, 0.04219341278076172, 0.043788909912109375, 0.04538440704345703, 0.04697990417480469, 0.048575401306152344, 0.0501708984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 7.0, 4.0, 9.0, 11.0, 10.0, 21.0, 28.0, 46.0, 72.0, 93.0, 184.0, 342.0, 685.0, 1639.0, 3952.0, 11387.0, 39201.0, 175362.0, 2923299.0, 893931.0, 104108.0, 26256.0, 8107.0, 2994.0, 1213.0, 560.0, 306.0, 170.0, 88.0, 75.0, 34.0, 21.0, 18.0, 16.0, 10.0, 5.0, 9.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1719970703125, -0.1658191680908203, -0.15964126586914062, -0.15346336364746094, -0.14728546142578125, -0.14110755920410156, -0.13492965698242188, -0.1287517547607422, -0.1225738525390625, -0.11639595031738281, -0.11021804809570312, -0.10404014587402344, -0.09786224365234375, -0.09168434143066406, -0.08550643920898438, -0.07932853698730469, -0.073150634765625, -0.06697273254394531, -0.060794830322265625, -0.05461692810058594, -0.04843902587890625, -0.04226112365722656, -0.036083221435546875, -0.029905319213867188, -0.0237274169921875, -0.017549514770507812, -0.011371612548828125, -0.0051937103271484375, 0.00098419189453125, 0.0071620941162109375, 0.013339996337890625, 0.019517898559570312, 0.02569580078125, 0.03187370300292969, 0.038051605224609375, 0.04422950744628906, 0.05040740966796875, 0.05658531188964844, 0.06276321411132812, 0.06894111633300781, 0.0751190185546875, 0.08129692077636719, 0.08747482299804688, 0.09365272521972656, 0.09983062744140625, 0.10600852966308594, 0.11218643188476562, 0.11836433410644531, 0.124542236328125, 0.1307201385498047, 0.13689804077148438, 0.14307594299316406, 0.14925384521484375, 0.15543174743652344, 0.16160964965820312, 0.1677875518798828, 0.1739654541015625, 0.1801433563232422, 0.18632125854492188, 0.19249916076660156, 0.19867706298828125, 0.20485496520996094, 0.21103286743164062, 0.2172107696533203, 0.223388671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 7.0, 11.0, 13.0, 15.0, 18.0, 35.0, 47.0, 48.0, 91.0, 172.0, 276.0, 690.0, 1403.0, 531.0, 250.0, 145.0, 87.0, 66.0, 43.0, 29.0, 30.0, 17.0, 15.0, 7.0, 5.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049591064453125, -0.047274112701416016, -0.04495716094970703, -0.04264020919799805, -0.04032325744628906, -0.03800630569458008, -0.035689353942871094, -0.03337240219116211, -0.031055450439453125, -0.02873849868774414, -0.026421546936035156, -0.024104595184326172, -0.021787643432617188, -0.019470691680908203, -0.01715373992919922, -0.014836788177490234, -0.01251983642578125, -0.010202884674072266, -0.007885932922363281, -0.005568981170654297, -0.0032520294189453125, -0.0009350776672363281, 0.0013818740844726562, 0.0036988258361816406, 0.006015777587890625, 0.00833272933959961, 0.010649681091308594, 0.012966632843017578, 0.015283584594726562, 0.017600536346435547, 0.01991748809814453, 0.022234439849853516, 0.0245513916015625, 0.026868343353271484, 0.02918529510498047, 0.03150224685668945, 0.03381919860839844, 0.03613615036010742, 0.038453102111816406, 0.04077005386352539, 0.043087005615234375, 0.04540395736694336, 0.047720909118652344, 0.05003786087036133, 0.05235481262207031, 0.0546717643737793, 0.05698871612548828, 0.059305667877197266, 0.06162261962890625, 0.06393957138061523, 0.06625652313232422, 0.0685734748840332, 0.07089042663574219, 0.07320737838745117, 0.07552433013916016, 0.07784128189086914, 0.08015823364257812, 0.08247518539428711, 0.0847921371459961, 0.08710908889770508, 0.08942604064941406, 0.09174299240112305, 0.09405994415283203, 0.09637689590454102, 0.09869384765625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 15.0, 21.0, 42.0, 66.0, 97.0, 147.0, 142.0, 158.0, 127.0, 86.0, 53.0, 26.0, 18.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3175918459892273, -0.29725760221481323, -0.27692335844039917, -0.2565890848636627, -0.23625484108924866, -0.2159205973148346, -0.19558633863925934, -0.17525207996368408, -0.15491783618927002, -0.13458359241485596, -0.1142493337392807, -0.09391508251428604, -0.07358083128929138, -0.05324658006429672, -0.03291232883930206, -0.012578070163726807, 0.007756173610687256, 0.028090424835681915, 0.048424676060676575, 0.06875892728567123, 0.0890931785106659, 0.10942742973566055, 0.1297616809606552, 0.15009593963623047, 0.17043018341064453, 0.1907644271850586, 0.21109868586063385, 0.2314329445362091, 0.25176718831062317, 0.27210143208503723, 0.2924357056617737, 0.31276994943618774, 0.3331042528152466, 0.35343849658966064, 0.3737727403640747, 0.39410701394081116, 0.4144412577152252, 0.4347755014896393, 0.45510977506637573, 0.4754440188407898, 0.49577826261520386, 0.5161125063896179, 0.536446750164032, 0.556780993938446, 0.5771152973175049, 0.597449541091919, 0.617783784866333, 0.6381180286407471, 0.6584522724151611, 0.6787865161895752, 0.6991207599639893, 0.7194550037384033, 0.7397892475128174, 0.7601235508918762, 0.7804577946662903, 0.8007920384407043, 0.8211262822151184, 0.8414605259895325, 0.8617947697639465, 0.8821290135383606, 0.9024633169174194, 0.9227975606918335, 0.9431318044662476, 0.9634660482406616, 0.9838002920150757]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 10.0, 8.0, 12.0, 17.0, 12.0, 25.0, 32.0, 35.0, 38.0, 30.0, 32.0, 41.0, 36.0, 40.0, 54.0, 50.0, 32.0, 57.0, 46.0, 40.0, 49.0, 36.0, 48.0, 45.0, 25.0, 23.0, 27.0, 17.0, 19.0, 16.0, 12.0, 9.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.3442193269729614, -0.33554336428642273, -0.32686740159988403, -0.3181914687156677, -0.30951550602912903, -0.30083954334259033, -0.292163610458374, -0.2834876477718353, -0.27481168508529663, -0.26613572239875793, -0.25745975971221924, -0.24878382682800293, -0.24010786414146423, -0.23143190145492554, -0.22275595366954803, -0.21408000588417053, -0.20540404319763184, -0.19672808051109314, -0.18805213272571564, -0.17937618494033813, -0.17070022225379944, -0.16202425956726074, -0.15334831178188324, -0.14467236399650574, -0.13599640130996704, -0.12732043862342834, -0.11864449083805084, -0.10996853560209274, -0.10129258036613464, -0.09261662513017654, -0.08394066989421844, -0.07526471465826035, -0.06658875942230225, -0.05791280418634415, -0.04923684895038605, -0.04056089371442795, -0.03188493847846985, -0.02320898324251175, -0.01453302800655365, -0.0058570727705955505, 0.002818882465362549, 0.011494837701320648, 0.020170792937278748, 0.028846748173236847, 0.037522703409194946, 0.046198658645153046, 0.054874613881111145, 0.06355056911706924, 0.07222652435302734, 0.08090247958898544, 0.08957843482494354, 0.09825439006090164, 0.10693034529685974, 0.11560630053281784, 0.12428225576877594, 0.13295820355415344, 0.14163416624069214, 0.15031012892723083, 0.15898607671260834, 0.16766202449798584, 0.17633798718452454, 0.18501394987106323, 0.19368989765644073, 0.20236584544181824, 0.21104180812835693]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 7.0, 7.0, 5.0, 28.0, 29.0, 35.0, 51.0, 72.0, 111.0, 158.0, 261.0, 394.0, 642.0, 1113.0, 2057.0, 3755.0, 7232.0, 13841.0, 26361.0, 52453.0, 104190.0, 218777.0, 302925.0, 155556.0, 77121.0, 39264.0, 19695.0, 10126.0, 5343.0, 2887.0, 1604.0, 929.0, 571.0, 324.0, 201.0, 127.0, 95.0, 58.0, 39.0, 34.0, 19.0, 23.0, 6.0, 6.0, 10.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1070556640625, -0.10339927673339844, -0.09974288940429688, -0.09608650207519531, -0.09243011474609375, -0.08877372741699219, -0.08511734008789062, -0.08146095275878906, -0.0778045654296875, -0.07414817810058594, -0.07049179077148438, -0.06683540344238281, -0.06317901611328125, -0.05952262878417969, -0.055866241455078125, -0.05220985412597656, -0.048553466796875, -0.04489707946777344, -0.041240692138671875, -0.03758430480957031, -0.03392791748046875, -0.030271530151367188, -0.026615142822265625, -0.022958755493164062, -0.0193023681640625, -0.015645980834960938, -0.011989593505859375, -0.008333206176757812, -0.00467681884765625, -0.0010204315185546875, 0.002635955810546875, 0.0062923431396484375, 0.00994873046875, 0.013605117797851562, 0.017261505126953125, 0.020917892456054688, 0.02457427978515625, 0.028230667114257812, 0.031887054443359375, 0.03554344177246094, 0.0391998291015625, 0.04285621643066406, 0.046512603759765625, 0.05016899108886719, 0.05382537841796875, 0.05748176574707031, 0.061138153076171875, 0.06479454040527344, 0.068450927734375, 0.07210731506347656, 0.07576370239257812, 0.07942008972167969, 0.08307647705078125, 0.08673286437988281, 0.09038925170898438, 0.09404563903808594, 0.0977020263671875, 0.10135841369628906, 0.10501480102539062, 0.10867118835449219, 0.11232757568359375, 0.11598396301269531, 0.11964035034179688, 0.12329673767089844, 0.126953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 8.0, 10.0, 11.0, 20.0, 23.0, 33.0, 52.0, 54.0, 63.0, 63.0, 72.0, 65.0, 80.0, 86.0, 71.0, 71.0, 53.0, 40.0, 30.0, 25.0, 21.0, 16.0, 13.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0484619140625, -0.046901702880859375, -0.04534149169921875, -0.043781280517578125, -0.0422210693359375, -0.040660858154296875, -0.03910064697265625, -0.037540435791015625, -0.035980224609375, -0.034420013427734375, -0.03285980224609375, -0.031299591064453125, -0.0297393798828125, -0.028179168701171875, -0.02661895751953125, -0.025058746337890625, -0.02349853515625, -0.021938323974609375, -0.02037811279296875, -0.018817901611328125, -0.0172576904296875, -0.015697479248046875, -0.01413726806640625, -0.012577056884765625, -0.011016845703125, -0.009456634521484375, -0.00789642333984375, -0.006336212158203125, -0.0047760009765625, -0.003215789794921875, -0.00165557861328125, -9.5367431640625e-05, 0.00146484375, 0.003025054931640625, 0.00458526611328125, 0.006145477294921875, 0.0077056884765625, 0.009265899658203125, 0.01082611083984375, 0.012386322021484375, 0.013946533203125, 0.015506744384765625, 0.01706695556640625, 0.018627166748046875, 0.0201873779296875, 0.021747589111328125, 0.02330780029296875, 0.024868011474609375, 0.02642822265625, 0.027988433837890625, 0.02954864501953125, 0.031108856201171875, 0.0326690673828125, 0.034229278564453125, 0.03578948974609375, 0.037349700927734375, 0.038909912109375, 0.040470123291015625, 0.04203033447265625, 0.043590545654296875, 0.0451507568359375, 0.046710968017578125, 0.04827117919921875, 0.049831390380859375, 0.0513916015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 6.0, 8.0, 8.0, 28.0, 20.0, 31.0, 34.0, 66.0, 71.0, 122.0, 167.0, 238.0, 337.0, 502.0, 837.0, 1442.0, 3538.0, 12658.0, 56414.0, 255253.0, 529308.0, 143181.0, 31100.0, 7432.0, 2409.0, 1186.0, 635.0, 437.0, 325.0, 211.0, 164.0, 111.0, 88.0, 58.0, 39.0, 28.0, 26.0, 15.0, 7.0, 6.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2066650390625, -0.20046043395996094, -0.19425582885742188, -0.1880512237548828, -0.18184661865234375, -0.1756420135498047, -0.16943740844726562, -0.16323280334472656, -0.1570281982421875, -0.15082359313964844, -0.14461898803710938, -0.1384143829345703, -0.13220977783203125, -0.1260051727294922, -0.11980056762695312, -0.11359596252441406, -0.107391357421875, -0.10118675231933594, -0.09498214721679688, -0.08877754211425781, -0.08257293701171875, -0.07636833190917969, -0.07016372680664062, -0.06395912170410156, -0.0577545166015625, -0.05154991149902344, -0.045345306396484375, -0.03914070129394531, -0.03293609619140625, -0.026731491088867188, -0.020526885986328125, -0.014322280883789062, -0.00811767578125, -0.0019130706787109375, 0.004291534423828125, 0.010496139526367188, 0.01670074462890625, 0.022905349731445312, 0.029109954833984375, 0.03531455993652344, 0.0415191650390625, 0.04772377014160156, 0.053928375244140625, 0.06013298034667969, 0.06633758544921875, 0.07254219055175781, 0.07874679565429688, 0.08495140075683594, 0.091156005859375, 0.09736061096191406, 0.10356521606445312, 0.10976982116699219, 0.11597442626953125, 0.12217903137207031, 0.12838363647460938, 0.13458824157714844, 0.1407928466796875, 0.14699745178222656, 0.15320205688476562, 0.1594066619873047, 0.16561126708984375, 0.1718158721923828, 0.17802047729492188, 0.18422508239746094, 0.1904296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 7.0, 4.0, 9.0, 9.0, 20.0, 19.0, 18.0, 25.0, 37.0, 29.0, 42.0, 35.0, 44.0, 64.0, 44.0, 56.0, 45.0, 61.0, 56.0, 60.0, 45.0, 29.0, 31.0, 36.0, 31.0, 27.0, 22.0, 15.0, 13.0, 20.0, 13.0, 8.0, 9.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.18798828125, -0.18281173706054688, -0.17763519287109375, -0.17245864868164062, -0.1672821044921875, -0.16210556030273438, -0.15692901611328125, -0.15175247192382812, -0.146575927734375, -0.14139938354492188, -0.13622283935546875, -0.13104629516601562, -0.1258697509765625, -0.12069320678710938, -0.11551666259765625, -0.11034011840820312, -0.10516357421875, -0.09998703002929688, -0.09481048583984375, -0.08963394165039062, -0.0844573974609375, -0.07928085327148438, -0.07410430908203125, -0.06892776489257812, -0.063751220703125, -0.058574676513671875, -0.05339813232421875, -0.048221588134765625, -0.0430450439453125, -0.037868499755859375, -0.03269195556640625, -0.027515411376953125, -0.0223388671875, -0.017162322998046875, -0.01198577880859375, -0.006809234619140625, -0.0016326904296875, 0.003543853759765625, 0.00872039794921875, 0.013896942138671875, 0.019073486328125, 0.024250030517578125, 0.02942657470703125, 0.034603118896484375, 0.0397796630859375, 0.044956207275390625, 0.05013275146484375, 0.055309295654296875, 0.06048583984375, 0.06566238403320312, 0.07083892822265625, 0.07601547241210938, 0.0811920166015625, 0.08636856079101562, 0.09154510498046875, 0.09672164916992188, 0.101898193359375, 0.10707473754882812, 0.11225128173828125, 0.11742782592773438, 0.1226043701171875, 0.12778091430664062, 0.13295745849609375, 0.13813400268554688, 0.143310546875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 9.0, 9.0, 22.0, 23.0, 28.0, 47.0, 43.0, 76.0, 107.0, 168.0, 253.0, 381.0, 701.0, 1302.0, 3296.0, 12837.0, 148238.0, 810505.0, 57947.0, 7511.0, 2283.0, 1107.0, 596.0, 358.0, 221.0, 142.0, 79.0, 75.0, 52.0, 26.0, 17.0, 21.0, 21.0, 10.0, 5.0, 7.0, 1.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2490234375, -0.24053573608398438, -0.23204803466796875, -0.22356033325195312, -0.2150726318359375, -0.20658493041992188, -0.19809722900390625, -0.18960952758789062, -0.181121826171875, -0.17263412475585938, -0.16414642333984375, -0.15565872192382812, -0.1471710205078125, -0.13868331909179688, -0.13019561767578125, -0.12170791625976562, -0.11322021484375, -0.10473251342773438, -0.09624481201171875, -0.08775711059570312, -0.0792694091796875, -0.07078170776367188, -0.06229400634765625, -0.053806304931640625, -0.045318603515625, -0.036830902099609375, -0.02834320068359375, -0.019855499267578125, -0.0113677978515625, -0.002880096435546875, 0.00560760498046875, 0.014095306396484375, 0.0225830078125, 0.031070709228515625, 0.03955841064453125, 0.048046112060546875, 0.0565338134765625, 0.06502151489257812, 0.07350921630859375, 0.08199691772460938, 0.090484619140625, 0.09897232055664062, 0.10746002197265625, 0.11594772338867188, 0.1244354248046875, 0.13292312622070312, 0.14141082763671875, 0.14989852905273438, 0.15838623046875, 0.16687393188476562, 0.17536163330078125, 0.18384933471679688, 0.1923370361328125, 0.20082473754882812, 0.20931243896484375, 0.21780014038085938, 0.226287841796875, 0.23477554321289062, 0.24326324462890625, 0.2517509460449219, 0.2602386474609375, 0.2687263488769531, 0.27721405029296875, 0.2857017517089844, 0.294189453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 13.0, 12.0, 20.0, 35.0, 31.0, 40.0, 54.0, 65.0, 86.0, 93.0, 97.0, 93.0, 75.0, 57.0, 52.0, 51.0, 36.0, 25.0, 16.0, 13.0, 9.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00011366605758666992, -0.00011036824434995651, -0.0001070704311132431, -0.0001037726178765297, -0.00010047480463981628, -9.717699140310287e-05, -9.387917816638947e-05, -9.058136492967606e-05, -8.728355169296265e-05, -8.398573845624924e-05, -8.068792521953583e-05, -7.739011198282242e-05, -7.409229874610901e-05, -7.07944855093956e-05, -6.749667227268219e-05, -6.419885903596878e-05, -6.090104579925537e-05, -5.760323256254196e-05, -5.430541932582855e-05, -5.100760608911514e-05, -4.7709792852401733e-05, -4.4411979615688324e-05, -4.1114166378974915e-05, -3.7816353142261505e-05, -3.4518539905548096e-05, -3.1220726668834686e-05, -2.7922913432121277e-05, -2.4625100195407867e-05, -2.1327286958694458e-05, -1.802947372198105e-05, -1.473166048526764e-05, -1.143384724855423e-05, -8.13603401184082e-06, -4.838220775127411e-06, -1.5404075384140015e-06, 1.757405698299408e-06, 5.055218935012817e-06, 8.353032171726227e-06, 1.1650845408439636e-05, 1.4948658645153046e-05, 1.8246471881866455e-05, 2.1544285118579865e-05, 2.4842098355293274e-05, 2.8139911592006683e-05, 3.143772482872009e-05, 3.47355380654335e-05, 3.803335130214691e-05, 4.133116453886032e-05, 4.462897777557373e-05, 4.792679101228714e-05, 5.122460424900055e-05, 5.452241748571396e-05, 5.782023072242737e-05, 6.111804395914078e-05, 6.441585719585419e-05, 6.77136704325676e-05, 7.1011483669281e-05, 7.430929690599442e-05, 7.760711014270782e-05, 8.090492337942123e-05, 8.420273661613464e-05, 8.750054985284805e-05, 9.079836308956146e-05, 9.409617632627487e-05, 9.739398956298828e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 7.0, 13.0, 17.0, 28.0, 33.0, 69.0, 100.0, 215.0, 402.0, 963.0, 2348.0, 7991.0, 65313.0, 854538.0, 101672.0, 10066.0, 2750.0, 1014.0, 427.0, 242.0, 124.0, 76.0, 39.0, 30.0, 16.0, 10.0, 8.0, 6.0, 5.0, 7.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.28466796875, -0.2759284973144531, -0.26718902587890625, -0.2584495544433594, -0.2497100830078125, -0.24097061157226562, -0.23223114013671875, -0.22349166870117188, -0.214752197265625, -0.20601272583007812, -0.19727325439453125, -0.18853378295898438, -0.1797943115234375, -0.17105484008789062, -0.16231536865234375, -0.15357589721679688, -0.14483642578125, -0.13609695434570312, -0.12735748291015625, -0.11861801147460938, -0.1098785400390625, -0.10113906860351562, -0.09239959716796875, -0.08366012573242188, -0.074920654296875, -0.06618118286132812, -0.05744171142578125, -0.048702239990234375, -0.0399627685546875, -0.031223297119140625, -0.02248382568359375, -0.013744354248046875, -0.0050048828125, 0.003734588623046875, 0.01247406005859375, 0.021213531494140625, 0.0299530029296875, 0.038692474365234375, 0.04743194580078125, 0.056171417236328125, 0.064910888671875, 0.07365036010742188, 0.08238983154296875, 0.09112930297851562, 0.0998687744140625, 0.10860824584960938, 0.11734771728515625, 0.12608718872070312, 0.13482666015625, 0.14356613159179688, 0.15230560302734375, 0.16104507446289062, 0.1697845458984375, 0.17852401733398438, 0.18726348876953125, 0.19600296020507812, 0.204742431640625, 0.21348190307617188, 0.22222137451171875, 0.23096084594726562, 0.2397003173828125, 0.24843978881835938, 0.25717926025390625, 0.2659187316894531, 0.274658203125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 10.0, 13.0, 29.0, 33.0, 49.0, 63.0, 81.0, 131.0, 136.0, 129.0, 108.0, 65.0, 45.0, 21.0, 18.0, 15.0, 6.0, 3.0, 2.0, 9.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1107177734375, -0.10668182373046875, -0.1026458740234375, -0.09860992431640625, -0.094573974609375, -0.09053802490234375, -0.0865020751953125, -0.08246612548828125, -0.07843017578125, -0.07439422607421875, -0.0703582763671875, -0.06632232666015625, -0.062286376953125, -0.05825042724609375, -0.0542144775390625, -0.05017852783203125, -0.046142578125, -0.04210662841796875, -0.0380706787109375, -0.03403472900390625, -0.029998779296875, -0.02596282958984375, -0.0219268798828125, -0.01789093017578125, -0.01385498046875, -0.00981903076171875, -0.0057830810546875, -0.00174713134765625, 0.002288818359375, 0.00632476806640625, 0.0103607177734375, 0.01439666748046875, 0.0184326171875, 0.02246856689453125, 0.0265045166015625, 0.03054046630859375, 0.034576416015625, 0.03861236572265625, 0.0426483154296875, 0.04668426513671875, 0.05072021484375, 0.05475616455078125, 0.0587921142578125, 0.06282806396484375, 0.066864013671875, 0.07089996337890625, 0.0749359130859375, 0.07897186279296875, 0.0830078125, 0.08704376220703125, 0.0910797119140625, 0.09511566162109375, 0.099151611328125, 0.10318756103515625, 0.1072235107421875, 0.11125946044921875, 0.11529541015625, 0.11933135986328125, 0.1233673095703125, 0.12740325927734375, 0.131439208984375, 0.13547515869140625, 0.1395111083984375, 0.14354705810546875, 0.1475830078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 6.0, 16.0, 22.0, 47.0, 62.0, 111.0, 122.0, 146.0, 134.0, 112.0, 94.0, 51.0, 30.0, 16.0, 12.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4575613737106323, -1.4084463119506836, -1.3593312501907349, -1.3102161884307861, -1.261101245880127, -1.2119861841201782, -1.1628711223602295, -1.1137560606002808, -1.064640998840332, -1.0155259370803833, -0.9664108753204346, -0.9172958731651306, -0.8681808114051819, -0.8190657496452332, -0.7699507474899292, -0.7208356857299805, -0.6717206239700317, -0.622605562210083, -0.5734905004501343, -0.5243754982948303, -0.4752604365348816, -0.42614537477493286, -0.3770303428173065, -0.3279153108596802, -0.27880024909973145, -0.2296852022409439, -0.18057015538215637, -0.13145510852336884, -0.0823400616645813, -0.03322501480579376, 0.015890032052993774, 0.06500506401062012, 0.1141200065612793, 0.16323505342006683, 0.21235010027885437, 0.2614651322364807, 0.31058019399642944, 0.3596952557563782, 0.4088102877140045, 0.45792531967163086, 0.5070403814315796, 0.5561554431915283, 0.605270504951477, 0.654385507106781, 0.7035005688667297, 0.7526156306266785, 0.8017306327819824, 0.8508456945419312, 0.8999607563018799, 0.9490758180618286, 0.9981908798217773, 1.047305941581726, 1.0964210033416748, 1.145535945892334, 1.1946510076522827, 1.2437660694122314, 1.2928811311721802, 1.341996192932129, 1.3911112546920776, 1.4402263164520264, 1.4893412590026855, 1.5384563207626343, 1.587571382522583, 1.6366864442825317, 1.6858015060424805]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 3.0, 9.0, 6.0, 14.0, 7.0, 17.0, 15.0, 25.0, 35.0, 22.0, 31.0, 40.0, 50.0, 41.0, 44.0, 43.0, 48.0, 43.0, 33.0, 62.0, 37.0, 44.0, 37.0, 31.0, 31.0, 29.0, 30.0, 23.0, 24.0, 22.0, 20.0, 12.0, 14.0, 5.0, 8.0, 5.0, 8.0, 6.0, 0.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.7968870997428894, -0.7721466422080994, -0.7474061846733093, -0.7226657271385193, -0.6979252696037292, -0.6731848120689392, -0.6484442949295044, -0.6237038373947144, -0.5989633798599243, -0.5742229223251343, -0.5494824647903442, -0.5247420072555542, -0.5000015497207642, -0.4752610921859741, -0.4505206048488617, -0.42578014731407166, -0.401039719581604, -0.37629926204681396, -0.3515588045120239, -0.3268183469772339, -0.30207788944244385, -0.2773374319076538, -0.2525969445705414, -0.22785648703575134, -0.2031160295009613, -0.17837557196617126, -0.15363511443138123, -0.12889464199543, -0.10415418446063995, -0.07941372692584991, -0.05467325448989868, -0.029932796955108643, -0.005192279815673828, 0.01954818144440651, 0.04428864270448685, 0.06902910768985748, 0.09376956522464752, 0.11851002275943756, 0.1432504951953888, 0.16799095273017883, 0.19273141026496887, 0.2174718677997589, 0.24221232533454895, 0.2669528126716614, 0.2916932702064514, 0.31643372774124146, 0.3411741852760315, 0.36591464281082153, 0.3906551003456116, 0.4153955578804016, 0.44013601541519165, 0.4648764729499817, 0.48961693048477173, 0.5143573880195618, 0.5390979051589966, 0.5638383626937866, 0.5885788202285767, 0.6133192777633667, 0.6380597352981567, 0.6628001928329468, 0.6875406503677368, 0.7122811079025269, 0.7370215654373169, 0.7617620229721069, 0.786502480506897]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 17.0, 26.0, 29.0, 58.0, 87.0, 152.0, 251.0, 487.0, 795.0, 1475.0, 2772.0, 6032.0, 13171.0, 32216.0, 99163.0, 560890.0, 3123383.0, 249719.0, 61665.0, 22536.0, 9453.0, 4613.0, 2309.0, 1199.0, 700.0, 401.0, 255.0, 153.0, 88.0, 56.0, 41.0, 24.0, 15.0, 17.0, 10.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12347412109375, -0.11895275115966797, -0.11443138122558594, -0.1099100112915039, -0.10538864135742188, -0.10086727142333984, -0.09634590148925781, -0.09182453155517578, -0.08730316162109375, -0.08278179168701172, -0.07826042175292969, -0.07373905181884766, -0.06921768188476562, -0.0646963119506836, -0.06017494201660156, -0.05565357208251953, -0.0511322021484375, -0.04661083221435547, -0.04208946228027344, -0.037568092346191406, -0.033046722412109375, -0.028525352478027344, -0.024003982543945312, -0.01948261260986328, -0.01496124267578125, -0.010439872741699219, -0.0059185028076171875, -0.0013971328735351562, 0.003124237060546875, 0.007645606994628906, 0.012166976928710938, 0.01668834686279297, 0.021209716796875, 0.02573108673095703, 0.030252456665039062, 0.034773826599121094, 0.039295196533203125, 0.043816566467285156, 0.04833793640136719, 0.05285930633544922, 0.05738067626953125, 0.06190204620361328, 0.06642341613769531, 0.07094478607177734, 0.07546615600585938, 0.0799875259399414, 0.08450889587402344, 0.08903026580810547, 0.0935516357421875, 0.09807300567626953, 0.10259437561035156, 0.1071157455444336, 0.11163711547851562, 0.11615848541259766, 0.12067985534667969, 0.12520122528076172, 0.12972259521484375, 0.13424396514892578, 0.1387653350830078, 0.14328670501708984, 0.14780807495117188, 0.1523294448852539, 0.15685081481933594, 0.16137218475341797, 0.1658935546875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 6.0, 4.0, 8.0, 7.0, 25.0, 16.0, 32.0, 34.0, 41.0, 58.0, 62.0, 68.0, 78.0, 74.0, 78.0, 80.0, 62.0, 47.0, 54.0, 36.0, 39.0, 21.0, 21.0, 13.0, 12.0, 6.0, 6.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045074462890625, -0.04356813430786133, -0.042061805725097656, -0.040555477142333984, -0.03904914855957031, -0.03754281997680664, -0.03603649139404297, -0.0345301628112793, -0.033023834228515625, -0.03151750564575195, -0.03001117706298828, -0.02850484848022461, -0.026998519897460938, -0.025492191314697266, -0.023985862731933594, -0.022479534149169922, -0.02097320556640625, -0.019466876983642578, -0.017960548400878906, -0.016454219818115234, -0.014947891235351562, -0.01344156265258789, -0.011935234069824219, -0.010428905487060547, -0.008922576904296875, -0.007416248321533203, -0.005909919738769531, -0.004403591156005859, -0.0028972625732421875, -0.0013909339904785156, 0.00011539459228515625, 0.0016217231750488281, 0.0031280517578125, 0.004634380340576172, 0.006140708923339844, 0.007647037506103516, 0.009153366088867188, 0.01065969467163086, 0.012166023254394531, 0.013672351837158203, 0.015178680419921875, 0.016685009002685547, 0.01819133758544922, 0.01969766616821289, 0.021203994750976562, 0.022710323333740234, 0.024216651916503906, 0.025722980499267578, 0.02722930908203125, 0.028735637664794922, 0.030241966247558594, 0.031748294830322266, 0.03325462341308594, 0.03476095199584961, 0.03626728057861328, 0.03777360916137695, 0.039279937744140625, 0.0407862663269043, 0.04229259490966797, 0.04379892349243164, 0.04530525207519531, 0.046811580657958984, 0.048317909240722656, 0.04982423782348633, 0.05133056640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 7.0, 3.0, 10.0, 9.0, 18.0, 29.0, 43.0, 48.0, 94.0, 143.0, 205.0, 326.0, 596.0, 1030.0, 2002.0, 3921.0, 8172.0, 18689.0, 45940.0, 134926.0, 598820.0, 2773088.0, 427433.0, 108982.0, 38877.0, 16027.0, 7246.0, 3444.0, 1752.0, 954.0, 512.0, 321.0, 170.0, 131.0, 99.0, 64.0, 42.0, 43.0, 20.0, 15.0, 13.0, 7.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.15576171875, -0.15148353576660156, -0.14720535278320312, -0.1429271697998047, -0.13864898681640625, -0.1343708038330078, -0.13009262084960938, -0.12581443786621094, -0.1215362548828125, -0.11725807189941406, -0.11297988891601562, -0.10870170593261719, -0.10442352294921875, -0.10014533996582031, -0.09586715698242188, -0.09158897399902344, -0.087310791015625, -0.08303260803222656, -0.07875442504882812, -0.07447624206542969, -0.07019805908203125, -0.06591987609863281, -0.061641693115234375, -0.05736351013183594, -0.0530853271484375, -0.04880714416503906, -0.044528961181640625, -0.04025077819824219, -0.03597259521484375, -0.03169441223144531, -0.027416229248046875, -0.023138046264648438, -0.01885986328125, -0.014581680297851562, -0.010303497314453125, -0.0060253143310546875, -0.00174713134765625, 0.0025310516357421875, 0.006809234619140625, 0.011087417602539062, 0.0153656005859375, 0.019643783569335938, 0.023921966552734375, 0.028200149536132812, 0.03247833251953125, 0.03675651550292969, 0.041034698486328125, 0.04531288146972656, 0.049591064453125, 0.05386924743652344, 0.058147430419921875, 0.06242561340332031, 0.06670379638671875, 0.07098197937011719, 0.07526016235351562, 0.07953834533691406, 0.0838165283203125, 0.08809471130371094, 0.09237289428710938, 0.09665107727050781, 0.10092926025390625, 0.10520744323730469, 0.10948562622070312, 0.11376380920410156, 0.1180419921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 10.0, 11.0, 23.0, 27.0, 45.0, 64.0, 90.0, 154.0, 283.0, 570.0, 1387.0, 660.0, 292.0, 174.0, 82.0, 65.0, 41.0, 23.0, 18.0, 17.0, 6.0, 12.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078857421875, -0.07564735412597656, -0.07243728637695312, -0.06922721862792969, -0.06601715087890625, -0.06280708312988281, -0.059597015380859375, -0.05638694763183594, -0.0531768798828125, -0.04996681213378906, -0.046756744384765625, -0.04354667663574219, -0.04033660888671875, -0.03712654113769531, -0.033916473388671875, -0.030706405639648438, -0.027496337890625, -0.024286270141601562, -0.021076202392578125, -0.017866134643554688, -0.01465606689453125, -0.011445999145507812, -0.008235931396484375, -0.0050258636474609375, -0.0018157958984375, 0.0013942718505859375, 0.004604339599609375, 0.007814407348632812, 0.01102447509765625, 0.014234542846679688, 0.017444610595703125, 0.020654678344726562, 0.02386474609375, 0.027074813842773438, 0.030284881591796875, 0.03349494934082031, 0.03670501708984375, 0.03991508483886719, 0.043125152587890625, 0.04633522033691406, 0.0495452880859375, 0.05275535583496094, 0.055965423583984375, 0.05917549133300781, 0.06238555908203125, 0.06559562683105469, 0.06880569458007812, 0.07201576232910156, 0.075225830078125, 0.07843589782714844, 0.08164596557617188, 0.08485603332519531, 0.08806610107421875, 0.09127616882324219, 0.09448623657226562, 0.09769630432128906, 0.1009063720703125, 0.10411643981933594, 0.10732650756835938, 0.11053657531738281, 0.11374664306640625, 0.11695671081542969, 0.12016677856445312, 0.12337684631347656, 0.1265869140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 10.0, 8.0, 17.0, 20.0, 30.0, 44.0, 56.0, 72.0, 94.0, 100.0, 115.0, 82.0, 78.0, 86.0, 61.0, 46.0, 29.0, 22.0, 12.0, 6.0, 9.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.33861249685287476, -0.32289037108421326, -0.30716824531555176, -0.29144614934921265, -0.27572402358055115, -0.26000189781188965, -0.24427978694438934, -0.22855767607688904, -0.21283555030822754, -0.19711342453956604, -0.18139131367206573, -0.16566920280456543, -0.14994707703590393, -0.13422495126724243, -0.11850284039974213, -0.10278072208166122, -0.08705860376358032, -0.07133648544549942, -0.05561436712741852, -0.039892248809337616, -0.024170130491256714, -0.008448012173175812, 0.00727410614490509, 0.022996224462985992, 0.038718342781066895, 0.0544404610991478, 0.0701625794172287, 0.0858846977353096, 0.1016068160533905, 0.1173289343714714, 0.1330510526895523, 0.1487731635570526, 0.16449522972106934, 0.18021735548973083, 0.19593946635723114, 0.21166157722473145, 0.22738370299339294, 0.24310582876205444, 0.25882792472839355, 0.27455005049705505, 0.29027217626571655, 0.30599430203437805, 0.32171642780303955, 0.33743852376937866, 0.35316064953804016, 0.36888277530670166, 0.38460487127304077, 0.40032699704170227, 0.41604912281036377, 0.43177124857902527, 0.44749337434768677, 0.4632154703140259, 0.4789375960826874, 0.4946597218513489, 0.510381817817688, 0.5261039733886719, 0.541826069355011, 0.5575481653213501, 0.573270320892334, 0.5889924168586731, 0.6047145128250122, 0.6204366683959961, 0.6361587643623352, 0.6518809199333191, 0.6676030158996582]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 9.0, 5.0, 9.0, 10.0, 12.0, 15.0, 20.0, 20.0, 26.0, 23.0, 28.0, 30.0, 37.0, 27.0, 56.0, 31.0, 46.0, 48.0, 37.0, 37.0, 40.0, 38.0, 39.0, 45.0, 36.0, 32.0, 28.0, 42.0, 26.0, 21.0, 22.0, 15.0, 15.0, 16.0, 9.0, 14.0, 7.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2956008315086365, -0.28671133518218994, -0.2778218388557434, -0.2689323425292969, -0.26004284620285034, -0.2511533498764038, -0.24226383864879608, -0.23337434232234955, -0.22448483109474182, -0.2155953347682953, -0.20670583844184875, -0.19781634211540222, -0.1889268308877945, -0.18003733456134796, -0.17114783823490143, -0.1622583419084549, -0.15336884558200836, -0.14447934925556183, -0.1355898529291153, -0.12670034170150757, -0.11781084537506104, -0.1089213490486145, -0.10003185272216797, -0.09114235639572144, -0.0822528526186943, -0.07336335629224777, -0.06447385251522064, -0.05558435618877411, -0.04669485613703728, -0.037805356085300446, -0.028915859758853912, -0.02002635970711708, -0.011136859655380249, -0.002247360534965992, 0.006642138585448265, 0.015531636774539948, 0.02442113682627678, 0.03331063687801361, 0.042200133204460144, 0.051089633256196976, 0.05997913330793381, 0.06886862963438034, 0.07775813341140747, 0.086647629737854, 0.09553712606430054, 0.10442662984132767, 0.1133161261677742, 0.12220562994480133, 0.13109512627124786, 0.1399846225976944, 0.14887411892414093, 0.15776363015174866, 0.1666531264781952, 0.17554262280464172, 0.18443211913108826, 0.1933216154575348, 0.20221111178398132, 0.21110060811042786, 0.2199901044368744, 0.22887960076332092, 0.23776911199092865, 0.24665860831737518, 0.2555481195449829, 0.26443761587142944, 0.273327112197876]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 10.0, 13.0, 22.0, 26.0, 51.0, 98.0, 166.0, 328.0, 581.0, 1060.0, 2170.0, 4510.0, 10126.0, 23692.0, 59477.0, 222221.0, 553883.0, 103168.0, 37974.0, 15869.0, 6649.0, 3098.0, 1567.0, 828.0, 402.0, 239.0, 139.0, 80.0, 35.0, 23.0, 18.0, 14.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1964111328125, -0.1905059814453125, -0.184600830078125, -0.1786956787109375, -0.17279052734375, -0.1668853759765625, -0.160980224609375, -0.1550750732421875, -0.149169921875, -0.1432647705078125, -0.137359619140625, -0.1314544677734375, -0.12554931640625, -0.1196441650390625, -0.113739013671875, -0.1078338623046875, -0.1019287109375, -0.0960235595703125, -0.090118408203125, -0.0842132568359375, -0.07830810546875, -0.0724029541015625, -0.066497802734375, -0.0605926513671875, -0.0546875, -0.0487823486328125, -0.042877197265625, -0.0369720458984375, -0.03106689453125, -0.0251617431640625, -0.019256591796875, -0.0133514404296875, -0.0074462890625, -0.0015411376953125, 0.004364013671875, 0.0102691650390625, 0.01617431640625, 0.0220794677734375, 0.027984619140625, 0.0338897705078125, 0.039794921875, 0.0457000732421875, 0.051605224609375, 0.0575103759765625, 0.06341552734375, 0.0693206787109375, 0.075225830078125, 0.0811309814453125, 0.0870361328125, 0.0929412841796875, 0.098846435546875, 0.1047515869140625, 0.11065673828125, 0.1165618896484375, 0.122467041015625, 0.1283721923828125, 0.13427734375, 0.1401824951171875, 0.146087646484375, 0.1519927978515625, 0.15789794921875, 0.1638031005859375, 0.169708251953125, 0.1756134033203125, 0.1815185546875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 8.0, 10.0, 17.0, 16.0, 25.0, 38.0, 51.0, 44.0, 47.0, 72.0, 71.0, 65.0, 72.0, 78.0, 70.0, 60.0, 55.0, 50.0, 28.0, 34.0, 25.0, 17.0, 16.0, 11.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045806884765625, -0.0442500114440918, -0.042693138122558594, -0.04113626480102539, -0.03957939147949219, -0.038022518157958984, -0.03646564483642578, -0.03490877151489258, -0.033351898193359375, -0.03179502487182617, -0.03023815155029297, -0.028681278228759766, -0.027124404907226562, -0.02556753158569336, -0.024010658264160156, -0.022453784942626953, -0.02089691162109375, -0.019340038299560547, -0.017783164978027344, -0.01622629165649414, -0.014669418334960938, -0.013112545013427734, -0.011555671691894531, -0.009998798370361328, -0.008441925048828125, -0.006885051727294922, -0.005328178405761719, -0.0037713050842285156, -0.0022144317626953125, -0.0006575584411621094, 0.0008993148803710938, 0.002456188201904297, 0.0040130615234375, 0.005569934844970703, 0.007126808166503906, 0.00868368148803711, 0.010240554809570312, 0.011797428131103516, 0.013354301452636719, 0.014911174774169922, 0.016468048095703125, 0.018024921417236328, 0.01958179473876953, 0.021138668060302734, 0.022695541381835938, 0.02425241470336914, 0.025809288024902344, 0.027366161346435547, 0.02892303466796875, 0.030479907989501953, 0.032036781311035156, 0.03359365463256836, 0.03515052795410156, 0.036707401275634766, 0.03826427459716797, 0.03982114791870117, 0.041378021240234375, 0.04293489456176758, 0.04449176788330078, 0.046048641204833984, 0.04760551452636719, 0.04916238784790039, 0.050719261169433594, 0.0522761344909668, 0.0538330078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 7.0, 6.0, 6.0, 5.0, 8.0, 15.0, 20.0, 26.0, 28.0, 45.0, 57.0, 79.0, 107.0, 164.0, 226.0, 371.0, 553.0, 1028.0, 2020.0, 5173.0, 16474.0, 59668.0, 366292.0, 496195.0, 69648.0, 19203.0, 5942.0, 2280.0, 1055.0, 592.0, 369.0, 240.0, 177.0, 145.0, 78.0, 65.0, 59.0, 38.0, 22.0, 20.0, 23.0, 8.0, 11.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2120361328125, -0.20520973205566406, -0.19838333129882812, -0.1915569305419922, -0.18473052978515625, -0.1779041290283203, -0.17107772827148438, -0.16425132751464844, -0.1574249267578125, -0.15059852600097656, -0.14377212524414062, -0.1369457244873047, -0.13011932373046875, -0.12329292297363281, -0.11646652221679688, -0.10964012145996094, -0.102813720703125, -0.09598731994628906, -0.08916091918945312, -0.08233451843261719, -0.07550811767578125, -0.06868171691894531, -0.061855316162109375, -0.05502891540527344, -0.0482025146484375, -0.04137611389160156, -0.034549713134765625, -0.027723312377929688, -0.02089691162109375, -0.014070510864257812, -0.007244110107421875, -0.0004177093505859375, 0.00640869140625, 0.013235092163085938, 0.020061492919921875, 0.026887893676757812, 0.03371429443359375, 0.04054069519042969, 0.047367095947265625, 0.05419349670410156, 0.0610198974609375, 0.06784629821777344, 0.07467269897460938, 0.08149909973144531, 0.08832550048828125, 0.09515190124511719, 0.10197830200195312, 0.10880470275878906, 0.115631103515625, 0.12245750427246094, 0.12928390502929688, 0.1361103057861328, 0.14293670654296875, 0.1497631072998047, 0.15658950805664062, 0.16341590881347656, 0.1702423095703125, 0.17706871032714844, 0.18389511108398438, 0.1907215118408203, 0.19754791259765625, 0.2043743133544922, 0.21120071411132812, 0.21802711486816406, 0.224853515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 2.0, 5.0, 7.0, 6.0, 14.0, 20.0, 32.0, 31.0, 31.0, 42.0, 32.0, 50.0, 49.0, 51.0, 56.0, 49.0, 60.0, 45.0, 64.0, 46.0, 54.0, 44.0, 32.0, 28.0, 33.0, 20.0, 25.0, 11.0, 12.0, 10.0, 10.0, 8.0, 5.0, 3.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178955078125, -0.17360305786132812, -0.16825103759765625, -0.16289901733398438, -0.1575469970703125, -0.15219497680664062, -0.14684295654296875, -0.14149093627929688, -0.136138916015625, -0.13078689575195312, -0.12543487548828125, -0.12008285522460938, -0.1147308349609375, -0.10937881469726562, -0.10402679443359375, -0.09867477416992188, -0.09332275390625, -0.08797073364257812, -0.08261871337890625, -0.07726669311523438, -0.0719146728515625, -0.06656265258789062, -0.06121063232421875, -0.055858612060546875, -0.050506591796875, -0.045154571533203125, -0.03980255126953125, -0.034450531005859375, -0.0290985107421875, -0.023746490478515625, -0.01839447021484375, -0.013042449951171875, -0.0076904296875, -0.002338409423828125, 0.00301361083984375, 0.008365631103515625, 0.0137176513671875, 0.019069671630859375, 0.02442169189453125, 0.029773712158203125, 0.035125732421875, 0.040477752685546875, 0.04582977294921875, 0.051181793212890625, 0.0565338134765625, 0.061885833740234375, 0.06723785400390625, 0.07258987426757812, 0.07794189453125, 0.08329391479492188, 0.08864593505859375, 0.09399795532226562, 0.0993499755859375, 0.10470199584960938, 0.11005401611328125, 0.11540603637695312, 0.120758056640625, 0.12611007690429688, 0.13146209716796875, 0.13681411743164062, 0.1421661376953125, 0.14751815795898438, 0.15287017822265625, 0.15822219848632812, 0.16357421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 12.0, 17.0, 30.0, 47.0, 63.0, 95.0, 169.0, 361.0, 803.0, 1894.0, 5187.0, 16760.0, 69768.0, 765689.0, 146754.0, 27920.0, 8096.0, 2778.0, 1092.0, 454.0, 241.0, 134.0, 72.0, 39.0, 29.0, 15.0, 12.0, 10.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2314453125, -0.22589397430419922, -0.22034263610839844, -0.21479129791259766, -0.20923995971679688, -0.2036886215209961, -0.1981372833251953, -0.19258594512939453, -0.18703460693359375, -0.18148326873779297, -0.1759319305419922, -0.1703805923461914, -0.16482925415039062, -0.15927791595458984, -0.15372657775878906, -0.14817523956298828, -0.1426239013671875, -0.13707256317138672, -0.13152122497558594, -0.12596988677978516, -0.12041854858398438, -0.1148672103881836, -0.10931587219238281, -0.10376453399658203, -0.09821319580078125, -0.09266185760498047, -0.08711051940917969, -0.0815591812133789, -0.07600784301757812, -0.07045650482177734, -0.06490516662597656, -0.05935382843017578, -0.053802490234375, -0.04825115203857422, -0.04269981384277344, -0.037148475646972656, -0.031597137451171875, -0.026045799255371094, -0.020494461059570312, -0.014943122863769531, -0.00939178466796875, -0.0038404464721679688, 0.0017108917236328125, 0.007262229919433594, 0.012813568115234375, 0.018364906311035156, 0.023916244506835938, 0.02946758270263672, 0.0350189208984375, 0.04057025909423828, 0.04612159729003906, 0.051672935485839844, 0.057224273681640625, 0.0627756118774414, 0.06832695007324219, 0.07387828826904297, 0.07942962646484375, 0.08498096466064453, 0.09053230285644531, 0.0960836410522461, 0.10163497924804688, 0.10718631744384766, 0.11273765563964844, 0.11828899383544922, 0.12384033203125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 4.0, 13.0, 10.0, 11.0, 35.0, 61.0, 98.0, 124.0, 173.0, 165.0, 124.0, 64.0, 43.0, 20.0, 20.0, 9.0, 10.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002090930938720703, -0.000202864408493042, -0.00019663572311401367, -0.00019040703773498535, -0.00018417835235595703, -0.0001779496669769287, -0.0001717209815979004, -0.00016549229621887207, -0.00015926361083984375, -0.00015303492546081543, -0.0001468062400817871, -0.0001405775547027588, -0.00013434886932373047, -0.00012812018394470215, -0.00012189149856567383, -0.00011566281318664551, -0.00010943412780761719, -0.00010320544242858887, -9.697675704956055e-05, -9.074807167053223e-05, -8.45193862915039e-05, -7.829070091247559e-05, -7.206201553344727e-05, -6.583333015441895e-05, -5.9604644775390625e-05, -5.3375959396362305e-05, -4.7147274017333984e-05, -4.0918588638305664e-05, -3.4689903259277344e-05, -2.8461217880249023e-05, -2.2232532501220703e-05, -1.6003847122192383e-05, -9.775161743164062e-06, -3.546476364135742e-06, 2.682209014892578e-06, 8.910894393920898e-06, 1.5139579772949219e-05, 2.136826515197754e-05, 2.759695053100586e-05, 3.382563591003418e-05, 4.00543212890625e-05, 4.628300666809082e-05, 5.251169204711914e-05, 5.874037742614746e-05, 6.496906280517578e-05, 7.11977481842041e-05, 7.742643356323242e-05, 8.365511894226074e-05, 8.988380432128906e-05, 9.611248970031738e-05, 0.0001023411750793457, 0.00010856986045837402, 0.00011479854583740234, 0.00012102723121643066, 0.00012725591659545898, 0.0001334846019744873, 0.00013971328735351562, 0.00014594197273254395, 0.00015217065811157227, 0.00015839934349060059, 0.0001646280288696289, 0.00017085671424865723, 0.00017708539962768555, 0.00018331408500671387, 0.0001895427703857422]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 6.0, 10.0, 12.0, 18.0, 26.0, 35.0, 43.0, 75.0, 95.0, 174.0, 268.0, 492.0, 1030.0, 2726.0, 8729.0, 36977.0, 381072.0, 557356.0, 43695.0, 10181.0, 3041.0, 1158.0, 546.0, 274.0, 160.0, 92.0, 62.0, 45.0, 35.0, 24.0, 23.0, 15.0, 14.0, 12.0, 7.0, 5.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1773681640625, -0.17215919494628906, -0.16695022583007812, -0.1617412567138672, -0.15653228759765625, -0.1513233184814453, -0.14611434936523438, -0.14090538024902344, -0.1356964111328125, -0.13048744201660156, -0.12527847290039062, -0.12006950378417969, -0.11486053466796875, -0.10965156555175781, -0.10444259643554688, -0.09923362731933594, -0.094024658203125, -0.08881568908691406, -0.08360671997070312, -0.07839775085449219, -0.07318878173828125, -0.06797981262207031, -0.06277084350585938, -0.05756187438964844, -0.0523529052734375, -0.04714393615722656, -0.041934967041015625, -0.03672599792480469, -0.03151702880859375, -0.026308059692382812, -0.021099090576171875, -0.015890121459960938, -0.01068115234375, -0.0054721832275390625, -0.000263214111328125, 0.0049457550048828125, 0.01015472412109375, 0.015363693237304688, 0.020572662353515625, 0.025781631469726562, 0.0309906005859375, 0.03619956970214844, 0.041408538818359375, 0.04661750793457031, 0.05182647705078125, 0.05703544616699219, 0.062244415283203125, 0.06745338439941406, 0.072662353515625, 0.07787132263183594, 0.08308029174804688, 0.08828926086425781, 0.09349822998046875, 0.09870719909667969, 0.10391616821289062, 0.10912513732910156, 0.1143341064453125, 0.11954307556152344, 0.12475204467773438, 0.1299610137939453, 0.13516998291015625, 0.1403789520263672, 0.14558792114257812, 0.15079689025878906, 0.156005859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 7.0, 8.0, 4.0, 5.0, 6.0, 4.0, 7.0, 15.0, 15.0, 23.0, 51.0, 63.0, 161.0, 239.0, 183.0, 69.0, 41.0, 20.0, 23.0, 13.0, 10.0, 12.0, 7.0, 4.0, 4.0, 8.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11566162109375, -0.1118783950805664, -0.10809516906738281, -0.10431194305419922, -0.10052871704101562, -0.09674549102783203, -0.09296226501464844, -0.08917903900146484, -0.08539581298828125, -0.08161258697509766, -0.07782936096191406, -0.07404613494873047, -0.07026290893554688, -0.06647968292236328, -0.06269645690917969, -0.058913230895996094, -0.0551300048828125, -0.051346778869628906, -0.04756355285644531, -0.04378032684326172, -0.039997100830078125, -0.03621387481689453, -0.03243064880371094, -0.028647422790527344, -0.02486419677734375, -0.021080970764160156, -0.017297744750976562, -0.013514518737792969, -0.009731292724609375, -0.005948066711425781, -0.0021648406982421875, 0.0016183853149414062, 0.005401611328125, 0.009184837341308594, 0.012968063354492188, 0.01675128936767578, 0.020534515380859375, 0.02431774139404297, 0.028100967407226562, 0.031884193420410156, 0.03566741943359375, 0.039450645446777344, 0.04323387145996094, 0.04701709747314453, 0.050800323486328125, 0.05458354949951172, 0.05836677551269531, 0.062150001525878906, 0.0659332275390625, 0.0697164535522461, 0.07349967956542969, 0.07728290557861328, 0.08106613159179688, 0.08484935760498047, 0.08863258361816406, 0.09241580963134766, 0.09619903564453125, 0.09998226165771484, 0.10376548767089844, 0.10754871368408203, 0.11133193969726562, 0.11511516571044922, 0.11889839172363281, 0.1226816177368164, 0.12646484375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 13.0, 32.0, 52.0, 110.0, 168.0, 207.0, 173.0, 120.0, 64.0, 37.0, 16.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2968658208847046, -1.227510929107666, -1.1581560373306274, -1.0888011455535889, -1.0194463729858398, -0.9500914216041565, -0.8807365894317627, -0.8113816976547241, -0.7420268058776855, -0.672671914100647, -0.6033170223236084, -0.5339621901512146, -0.464607298374176, -0.39525240659713745, -0.32589754462242126, -0.2565426826477051, -0.1871877908706665, -0.11783291399478912, -0.04847803711891174, 0.020876839756965637, 0.09023171663284302, 0.1595866084098816, 0.22894147038459778, 0.29829633235931396, 0.36765122413635254, 0.4370061159133911, 0.5063610076904297, 0.5757158398628235, 0.6450707316398621, 0.7144256234169006, 0.7837804555892944, 0.853135347366333, 0.9224903583526611, 0.9918452501296997, 1.0612001419067383, 1.1305550336837769, 1.1999099254608154, 1.2692646980285645, 1.338619589805603, 1.4079744815826416, 1.4773293733596802, 1.5466842651367188, 1.6160391569137573, 1.685394048690796, 1.754748821258545, 1.824103832244873, 1.893458604812622, 1.9628134965896606, 2.032168388366699, 2.1015231609344482, 2.1708781719207764, 2.2402329444885254, 2.3095879554748535, 2.3789427280426025, 2.4482977390289307, 2.5176525115966797, 2.587007522583008, 2.656362295150757, 2.725717306137085, 2.795072078704834, 2.864427089691162, 2.933781862258911, 3.0031368732452393, 3.0724916458129883, 3.1418464183807373]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 8.0, 6.0, 9.0, 13.0, 13.0, 12.0, 11.0, 7.0, 18.0, 20.0, 17.0, 23.0, 30.0, 33.0, 35.0, 35.0, 41.0, 35.0, 29.0, 35.0, 32.0, 39.0, 45.0, 50.0, 28.0, 42.0, 34.0, 32.0, 35.0, 26.0, 14.0, 28.0, 18.0, 16.0, 23.0, 14.0, 15.0, 13.0, 11.0, 12.0, 12.0, 3.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6337169408798218, -0.613333523273468, -0.592950165271759, -0.5725667476654053, -0.5521833896636963, -0.5317999720573425, -0.5114165544509888, -0.4910331666469574, -0.470649778842926, -0.45026639103889465, -0.4298830032348633, -0.4094995856285095, -0.38911619782447815, -0.3687328100204468, -0.348349392414093, -0.32796600461006165, -0.3075826168060303, -0.2871992290019989, -0.26681584119796753, -0.24643242359161377, -0.2260490357875824, -0.20566564798355103, -0.18528224527835846, -0.1648988425731659, -0.14451545476913452, -0.12413205951452255, -0.10374866425991058, -0.08336526900529861, -0.06298187375068665, -0.042598478496074677, -0.022215083241462708, -0.0018316805362701416, 0.018551647663116455, 0.038935042917728424, 0.05931843817234039, 0.07970183342695236, 0.10008522868156433, 0.1204686239361763, 0.14085201919078827, 0.16123542189598083, 0.1816188097000122, 0.20200219750404358, 0.22238560020923615, 0.2427690029144287, 0.2631523907184601, 0.28353577852249146, 0.3039191961288452, 0.3243025839328766, 0.34468597173690796, 0.36506935954093933, 0.3854527473449707, 0.40583616495132446, 0.42621955275535583, 0.4466029405593872, 0.46698635816574097, 0.48736974596977234, 0.5077531337738037, 0.5281365513801575, 0.5485199093818665, 0.5689033269882202, 0.5892866849899292, 0.609670102596283, 0.6300535202026367, 0.6504368782043457, 0.6708202958106995]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 9.0, 3.0, 11.0, 22.0, 29.0, 26.0, 57.0, 108.0, 172.0, 285.0, 495.0, 972.0, 1772.0, 3513.0, 7853.0, 18569.0, 49749.0, 182878.0, 3003684.0, 753231.0, 109783.0, 34524.0, 13873.0, 6129.0, 2840.0, 1570.0, 856.0, 463.0, 293.0, 154.0, 132.0, 75.0, 55.0, 36.0, 22.0, 15.0, 14.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1458740234375, -0.14098358154296875, -0.1360931396484375, -0.13120269775390625, -0.126312255859375, -0.12142181396484375, -0.1165313720703125, -0.11164093017578125, -0.10675048828125, -0.10186004638671875, -0.0969696044921875, -0.09207916259765625, -0.087188720703125, -0.08229827880859375, -0.0774078369140625, -0.07251739501953125, -0.067626953125, -0.06273651123046875, -0.0578460693359375, -0.05295562744140625, -0.048065185546875, -0.04317474365234375, -0.0382843017578125, -0.03339385986328125, -0.02850341796875, -0.02361297607421875, -0.0187225341796875, -0.01383209228515625, -0.008941650390625, -0.00405120849609375, 0.0008392333984375, 0.00572967529296875, 0.0106201171875, 0.01551055908203125, 0.0204010009765625, 0.02529144287109375, 0.030181884765625, 0.03507232666015625, 0.0399627685546875, 0.04485321044921875, 0.04974365234375, 0.05463409423828125, 0.0595245361328125, 0.06441497802734375, 0.069305419921875, 0.07419586181640625, 0.0790863037109375, 0.08397674560546875, 0.0888671875, 0.09375762939453125, 0.0986480712890625, 0.10353851318359375, 0.108428955078125, 0.11331939697265625, 0.1182098388671875, 0.12310028076171875, 0.12799072265625, 0.13288116455078125, 0.1377716064453125, 0.14266204833984375, 0.147552490234375, 0.15244293212890625, 0.1573333740234375, 0.16222381591796875, 0.1671142578125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 6.0, 11.0, 11.0, 16.0, 22.0, 19.0, 28.0, 35.0, 45.0, 53.0, 62.0, 52.0, 70.0, 62.0, 78.0, 63.0, 66.0, 58.0, 49.0, 46.0, 32.0, 25.0, 23.0, 13.0, 13.0, 12.0, 13.0, 5.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04876708984375, -0.04724264144897461, -0.04571819305419922, -0.04419374465942383, -0.04266929626464844, -0.04114484786987305, -0.039620399475097656, -0.038095951080322266, -0.036571502685546875, -0.035047054290771484, -0.033522605895996094, -0.0319981575012207, -0.030473709106445312, -0.028949260711669922, -0.02742481231689453, -0.02590036392211914, -0.02437591552734375, -0.02285146713256836, -0.02132701873779297, -0.019802570343017578, -0.018278121948242188, -0.016753673553466797, -0.015229225158691406, -0.013704776763916016, -0.012180328369140625, -0.010655879974365234, -0.009131431579589844, -0.007606983184814453, -0.0060825347900390625, -0.004558086395263672, -0.0030336380004882812, -0.0015091896057128906, 1.52587890625e-05, 0.0015397071838378906, 0.0030641555786132812, 0.004588603973388672, 0.0061130523681640625, 0.007637500762939453, 0.009161949157714844, 0.010686397552490234, 0.012210845947265625, 0.013735294342041016, 0.015259742736816406, 0.016784191131591797, 0.018308639526367188, 0.019833087921142578, 0.02135753631591797, 0.02288198471069336, 0.02440643310546875, 0.02593088150024414, 0.02745532989501953, 0.028979778289794922, 0.030504226684570312, 0.0320286750793457, 0.033553123474121094, 0.035077571868896484, 0.036602020263671875, 0.038126468658447266, 0.039650917053222656, 0.04117536544799805, 0.04269981384277344, 0.04422426223754883, 0.04574871063232422, 0.04727315902709961, 0.048797607421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 11.0, 6.0, 9.0, 14.0, 18.0, 22.0, 32.0, 44.0, 76.0, 104.0, 169.0, 226.0, 373.0, 641.0, 1013.0, 1905.0, 3397.0, 7079.0, 15147.0, 35458.0, 98032.0, 412957.0, 2965374.0, 473701.0, 107494.0, 38430.0, 16246.0, 7703.0, 3778.0, 1964.0, 1099.0, 649.0, 395.0, 268.0, 163.0, 97.0, 56.0, 44.0, 26.0, 19.0, 7.0, 8.0, 9.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1346435546875, -0.13008499145507812, -0.12552642822265625, -0.12096786499023438, -0.1164093017578125, -0.11185073852539062, -0.10729217529296875, -0.10273361206054688, -0.098175048828125, -0.09361648559570312, -0.08905792236328125, -0.08449935913085938, -0.0799407958984375, -0.07538223266601562, -0.07082366943359375, -0.06626510620117188, -0.06170654296875, -0.057147979736328125, -0.05258941650390625, -0.048030853271484375, -0.0434722900390625, -0.038913726806640625, -0.03435516357421875, -0.029796600341796875, -0.025238037109375, -0.020679473876953125, -0.01612091064453125, -0.011562347412109375, -0.0070037841796875, -0.002445220947265625, 0.00211334228515625, 0.006671905517578125, 0.01123046875, 0.015789031982421875, 0.02034759521484375, 0.024906158447265625, 0.0294647216796875, 0.034023284912109375, 0.03858184814453125, 0.043140411376953125, 0.047698974609375, 0.052257537841796875, 0.05681610107421875, 0.061374664306640625, 0.0659332275390625, 0.07049179077148438, 0.07505035400390625, 0.07960891723632812, 0.08416748046875, 0.08872604370117188, 0.09328460693359375, 0.09784317016601562, 0.1024017333984375, 0.10696029663085938, 0.11151885986328125, 0.11607742309570312, 0.120635986328125, 0.12519454956054688, 0.12975311279296875, 0.13431167602539062, 0.1388702392578125, 0.14342880249023438, 0.14798736572265625, 0.15254592895507812, 0.1571044921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 3.0, 12.0, 5.0, 13.0, 22.0, 23.0, 42.0, 53.0, 66.0, 97.0, 155.0, 276.0, 560.0, 1342.0, 584.0, 277.0, 165.0, 98.0, 71.0, 47.0, 34.0, 22.0, 22.0, 14.0, 15.0, 14.0, 9.0, 5.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06536865234375, -0.06307601928710938, -0.06078338623046875, -0.058490753173828125, -0.0561981201171875, -0.053905487060546875, -0.05161285400390625, -0.049320220947265625, -0.047027587890625, -0.044734954833984375, -0.04244232177734375, -0.040149688720703125, -0.0378570556640625, -0.035564422607421875, -0.03327178955078125, -0.030979156494140625, -0.0286865234375, -0.026393890380859375, -0.02410125732421875, -0.021808624267578125, -0.0195159912109375, -0.017223358154296875, -0.01493072509765625, -0.012638092041015625, -0.010345458984375, -0.008052825927734375, -0.00576019287109375, -0.003467559814453125, -0.0011749267578125, 0.001117706298828125, 0.00341033935546875, 0.005702972412109375, 0.00799560546875, 0.010288238525390625, 0.01258087158203125, 0.014873504638671875, 0.0171661376953125, 0.019458770751953125, 0.02175140380859375, 0.024044036865234375, 0.026336669921875, 0.028629302978515625, 0.03092193603515625, 0.033214569091796875, 0.0355072021484375, 0.037799835205078125, 0.04009246826171875, 0.042385101318359375, 0.044677734375, 0.046970367431640625, 0.04926300048828125, 0.051555633544921875, 0.0538482666015625, 0.056140899658203125, 0.05843353271484375, 0.060726165771484375, 0.063018798828125, 0.06531143188476562, 0.06760406494140625, 0.06989669799804688, 0.0721893310546875, 0.07448196411132812, 0.07677459716796875, 0.07906723022460938, 0.08135986328125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 8.0, 15.0, 37.0, 97.0, 212.0, 238.0, 213.0, 110.0, 47.0, 18.0, 9.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.186853289604187, -1.1517101526260376, -1.1165670156478882, -1.0814238786697388, -1.0462807416915894, -1.01113760471344, -0.9759945273399353, -0.9408513903617859, -0.9057082533836365, -0.8705651164054871, -0.8354219794273376, -0.8002788424491882, -0.7651357650756836, -0.7299926280975342, -0.6948494911193848, -0.6597063541412354, -0.6245632171630859, -0.5894200801849365, -0.5542769432067871, -0.5191338062286377, -0.48399069905281067, -0.44884756207466125, -0.41370445489883423, -0.3785613179206848, -0.3434181809425354, -0.308275043964386, -0.2731319069862366, -0.23798879981040955, -0.20284566283226013, -0.16770252585411072, -0.1325594037771225, -0.09741628170013428, -0.06227302551269531, -0.027129895985126495, 0.008013233542442322, 0.04315636307001114, 0.07829949259757996, 0.11344262957572937, 0.1485857516527176, 0.1837288737297058, 0.21887201070785522, 0.25401514768600464, 0.28915828466415405, 0.3243013918399811, 0.3594445288181305, 0.3945876657962799, 0.42973077297210693, 0.46487390995025635, 0.5000170469284058, 0.5351601839065552, 0.5703033208847046, 0.605446457862854, 0.6405895948410034, 0.6757327318191528, 0.7108758091926575, 0.7460189461708069, 0.7811620831489563, 0.8163052201271057, 0.8514483571052551, 0.8865914940834045, 0.9217345714569092, 0.9568777084350586, 0.992020845413208, 1.0271639823913574, 1.0623071193695068]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 4.0, 5.0, 6.0, 6.0, 7.0, 13.0, 12.0, 22.0, 14.0, 14.0, 26.0, 25.0, 22.0, 20.0, 40.0, 31.0, 29.0, 42.0, 51.0, 37.0, 38.0, 25.0, 39.0, 33.0, 35.0, 33.0, 37.0, 31.0, 23.0, 25.0, 32.0, 30.0, 20.0, 28.0, 22.0, 19.0, 16.0, 16.0, 17.0, 2.0, 14.0, 9.0, 8.0, 3.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.22011446952819824, -0.21283075213432312, -0.205547034740448, -0.19826331734657288, -0.19097959995269775, -0.18369588255882263, -0.1764121651649475, -0.1691284477710724, -0.16184473037719727, -0.15456101298332214, -0.14727729558944702, -0.1399935781955719, -0.13270986080169678, -0.12542614340782166, -0.11814243346452713, -0.11085871607065201, -0.10357500612735748, -0.09629128873348236, -0.08900757133960724, -0.08172385394573212, -0.074440136551857, -0.06715641915798187, -0.05987270921468735, -0.052588991820812225, -0.0453052744269371, -0.03802155703306198, -0.03073784150183201, -0.023454125970602036, -0.016170408576726913, -0.008886691182851791, -0.0016029775142669678, 0.005680739879608154, 0.012964457273483276, 0.0202481746673584, 0.02753189019858837, 0.034815605729818344, 0.042099323123693466, 0.04938304051756859, 0.05666675418615341, 0.06395047158002853, 0.07123418897390366, 0.07851790636777878, 0.0858016237616539, 0.09308533370494843, 0.10036905109882355, 0.10765276849269867, 0.11493648588657379, 0.12222020328044891, 0.12950392067432404, 0.13678763806819916, 0.14407135546207428, 0.1513550728559494, 0.15863879024982452, 0.16592250764369965, 0.17320621013641357, 0.1804899275302887, 0.18777364492416382, 0.19505736231803894, 0.20234107971191406, 0.20962479710578918, 0.2169085144996643, 0.22419223189353943, 0.23147594928741455, 0.23875966668128967, 0.2460433840751648]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 6.0, 21.0, 30.0, 32.0, 59.0, 96.0, 142.0, 265.0, 493.0, 993.0, 2166.0, 4796.0, 10639.0, 23124.0, 50998.0, 209346.0, 555652.0, 117588.0, 38564.0, 18054.0, 8251.0, 3744.0, 1736.0, 810.0, 400.0, 196.0, 141.0, 65.0, 34.0, 30.0, 18.0, 22.0, 9.0, 5.0, 5.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1737060546875, -0.1690540313720703, -0.16440200805664062, -0.15974998474121094, -0.15509796142578125, -0.15044593811035156, -0.14579391479492188, -0.1411418914794922, -0.1364898681640625, -0.1318378448486328, -0.12718582153320312, -0.12253379821777344, -0.11788177490234375, -0.11322975158691406, -0.10857772827148438, -0.10392570495605469, -0.099273681640625, -0.09462165832519531, -0.08996963500976562, -0.08531761169433594, -0.08066558837890625, -0.07601356506347656, -0.07136154174804688, -0.06670951843261719, -0.0620574951171875, -0.05740547180175781, -0.052753448486328125, -0.04810142517089844, -0.04344940185546875, -0.03879737854003906, -0.034145355224609375, -0.029493331909179688, -0.02484130859375, -0.020189285278320312, -0.015537261962890625, -0.010885238647460938, -0.00623321533203125, -0.0015811920166015625, 0.003070831298828125, 0.0077228546142578125, 0.0123748779296875, 0.017026901245117188, 0.021678924560546875, 0.026330947875976562, 0.03098297119140625, 0.03563499450683594, 0.040287017822265625, 0.04493904113769531, 0.049591064453125, 0.05424308776855469, 0.058895111083984375, 0.06354713439941406, 0.06819915771484375, 0.07285118103027344, 0.07750320434570312, 0.08215522766113281, 0.0868072509765625, 0.09145927429199219, 0.09611129760742188, 0.10076332092285156, 0.10541534423828125, 0.11006736755371094, 0.11471939086914062, 0.11937141418457031, 0.1240234375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 8.0, 5.0, 10.0, 10.0, 25.0, 29.0, 34.0, 28.0, 43.0, 49.0, 57.0, 52.0, 73.0, 49.0, 63.0, 51.0, 55.0, 55.0, 50.0, 39.0, 47.0, 42.0, 27.0, 20.0, 16.0, 9.0, 20.0, 9.0, 6.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050140380859375, -0.04868936538696289, -0.04723834991455078, -0.04578733444213867, -0.04433631896972656, -0.04288530349731445, -0.041434288024902344, -0.039983272552490234, -0.038532257080078125, -0.037081241607666016, -0.035630226135253906, -0.0341792106628418, -0.03272819519042969, -0.03127717971801758, -0.02982616424560547, -0.02837514877319336, -0.02692413330078125, -0.02547311782836914, -0.02402210235595703, -0.022571086883544922, -0.021120071411132812, -0.019669055938720703, -0.018218040466308594, -0.016767024993896484, -0.015316009521484375, -0.013864994049072266, -0.012413978576660156, -0.010962963104248047, -0.009511947631835938, -0.008060932159423828, -0.006609916687011719, -0.005158901214599609, -0.0037078857421875, -0.0022568702697753906, -0.0008058547973632812, 0.0006451606750488281, 0.0020961761474609375, 0.003547191619873047, 0.004998207092285156, 0.006449222564697266, 0.007900238037109375, 0.009351253509521484, 0.010802268981933594, 0.012253284454345703, 0.013704299926757812, 0.015155315399169922, 0.01660633087158203, 0.01805734634399414, 0.01950836181640625, 0.02095937728881836, 0.02241039276123047, 0.023861408233642578, 0.025312423706054688, 0.026763439178466797, 0.028214454650878906, 0.029665470123291016, 0.031116485595703125, 0.032567501068115234, 0.034018516540527344, 0.03546953201293945, 0.03692054748535156, 0.03837156295776367, 0.03982257843017578, 0.04127359390258789, 0.042724609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 9.0, 7.0, 10.0, 15.0, 24.0, 33.0, 25.0, 38.0, 71.0, 98.0, 149.0, 253.0, 418.0, 804.0, 1689.0, 3916.0, 9263.0, 22523.0, 53123.0, 368232.0, 486036.0, 58696.0, 24552.0, 10353.0, 4213.0, 1874.0, 863.0, 481.0, 265.0, 149.0, 93.0, 80.0, 44.0, 37.0, 33.0, 21.0, 15.0, 12.0, 9.0, 6.0, 5.0, 5.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.191162109375, -0.1855487823486328, -0.17993545532226562, -0.17432212829589844, -0.16870880126953125, -0.16309547424316406, -0.15748214721679688, -0.1518688201904297, -0.1462554931640625, -0.1406421661376953, -0.13502883911132812, -0.12941551208496094, -0.12380218505859375, -0.11818885803222656, -0.11257553100585938, -0.10696220397949219, -0.101348876953125, -0.09573554992675781, -0.09012222290039062, -0.08450889587402344, -0.07889556884765625, -0.07328224182128906, -0.06766891479492188, -0.06205558776855469, -0.0564422607421875, -0.05082893371582031, -0.045215606689453125, -0.03960227966308594, -0.03398895263671875, -0.028375625610351562, -0.022762298583984375, -0.017148971557617188, -0.01153564453125, -0.0059223175048828125, -0.000308990478515625, 0.0053043365478515625, 0.01091766357421875, 0.016530990600585938, 0.022144317626953125, 0.027757644653320312, 0.0333709716796875, 0.03898429870605469, 0.044597625732421875, 0.05021095275878906, 0.05582427978515625, 0.06143760681152344, 0.06705093383789062, 0.07266426086425781, 0.078277587890625, 0.08389091491699219, 0.08950424194335938, 0.09511756896972656, 0.10073089599609375, 0.10634422302246094, 0.11195755004882812, 0.11757087707519531, 0.1231842041015625, 0.1287975311279297, 0.13441085815429688, 0.14002418518066406, 0.14563751220703125, 0.15125083923339844, 0.15686416625976562, 0.1624774932861328, 0.1680908203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 8.0, 5.0, 4.0, 12.0, 15.0, 8.0, 10.0, 18.0, 20.0, 26.0, 33.0, 33.0, 47.0, 48.0, 40.0, 49.0, 42.0, 67.0, 56.0, 66.0, 58.0, 59.0, 44.0, 39.0, 37.0, 24.0, 23.0, 32.0, 17.0, 9.0, 10.0, 12.0, 10.0, 11.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.181396484375, -0.17522239685058594, -0.16904830932617188, -0.1628742218017578, -0.15670013427734375, -0.1505260467529297, -0.14435195922851562, -0.13817787170410156, -0.1320037841796875, -0.12582969665527344, -0.11965560913085938, -0.11348152160644531, -0.10730743408203125, -0.10113334655761719, -0.09495925903320312, -0.08878517150878906, -0.082611083984375, -0.07643699645996094, -0.07026290893554688, -0.06408882141113281, -0.05791473388671875, -0.05174064636230469, -0.045566558837890625, -0.03939247131347656, -0.0332183837890625, -0.027044296264648438, -0.020870208740234375, -0.014696121215820312, -0.00852203369140625, -0.0023479461669921875, 0.003826141357421875, 0.010000228881835938, 0.01617431640625, 0.022348403930664062, 0.028522491455078125, 0.03469657897949219, 0.04087066650390625, 0.04704475402832031, 0.053218841552734375, 0.05939292907714844, 0.0655670166015625, 0.07174110412597656, 0.07791519165039062, 0.08408927917480469, 0.09026336669921875, 0.09643745422363281, 0.10261154174804688, 0.10878562927246094, 0.114959716796875, 0.12113380432128906, 0.12730789184570312, 0.1334819793701172, 0.13965606689453125, 0.1458301544189453, 0.15200424194335938, 0.15817832946777344, 0.1643524169921875, 0.17052650451660156, 0.17670059204101562, 0.1828746795654297, 0.18904876708984375, 0.1952228546142578, 0.20139694213867188, 0.20757102966308594, 0.2137451171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 3.0, 6.0, 4.0, 9.0, 7.0, 16.0, 17.0, 25.0, 41.0, 65.0, 90.0, 127.0, 236.0, 373.0, 679.0, 1327.0, 2921.0, 6301.0, 15024.0, 38731.0, 181980.0, 694308.0, 64904.0, 23644.0, 9472.0, 4108.0, 1890.0, 907.0, 505.0, 327.0, 177.0, 116.0, 63.0, 45.0, 24.0, 28.0, 21.0, 7.0, 7.0, 9.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.10955810546875, -0.10581111907958984, -0.10206413269042969, -0.09831714630126953, -0.09457015991210938, -0.09082317352294922, -0.08707618713378906, -0.0833292007446289, -0.07958221435546875, -0.0758352279663086, -0.07208824157714844, -0.06834125518798828, -0.06459426879882812, -0.06084728240966797, -0.05710029602050781, -0.053353309631347656, -0.0496063232421875, -0.045859336853027344, -0.04211235046386719, -0.03836536407470703, -0.034618377685546875, -0.03087139129638672, -0.027124404907226562, -0.023377418518066406, -0.01963043212890625, -0.015883445739746094, -0.012136459350585938, -0.008389472961425781, -0.004642486572265625, -0.0008955001831054688, 0.0028514862060546875, 0.006598472595214844, 0.010345458984375, 0.014092445373535156, 0.017839431762695312, 0.02158641815185547, 0.025333404541015625, 0.02908039093017578, 0.03282737731933594, 0.036574363708496094, 0.04032135009765625, 0.044068336486816406, 0.04781532287597656, 0.05156230926513672, 0.055309295654296875, 0.05905628204345703, 0.06280326843261719, 0.06655025482177734, 0.0702972412109375, 0.07404422760009766, 0.07779121398925781, 0.08153820037841797, 0.08528518676757812, 0.08903217315673828, 0.09277915954589844, 0.0965261459350586, 0.10027313232421875, 0.1040201187133789, 0.10776710510253906, 0.11151409149169922, 0.11526107788085938, 0.11900806427001953, 0.12275505065917969, 0.12650203704833984, 0.1302490234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 6.0, 6.0, 8.0, 10.0, 8.0, 19.0, 35.0, 34.0, 46.0, 59.0, 62.0, 75.0, 85.0, 110.0, 82.0, 86.0, 67.0, 56.0, 46.0, 27.0, 23.0, 16.0, 11.0, 4.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.903575897216797e-05, -7.579661905765533e-05, -7.25574791431427e-05, -6.931833922863007e-05, -6.607919931411743e-05, -6.28400593996048e-05, -5.960091948509216e-05, -5.636177957057953e-05, -5.3122639656066895e-05, -4.988349974155426e-05, -4.6644359827041626e-05, -4.340521991252899e-05, -4.016607999801636e-05, -3.692694008350372e-05, -3.368780016899109e-05, -3.0448660254478455e-05, -2.720952033996582e-05, -2.3970380425453186e-05, -2.0731240510940552e-05, -1.7492100596427917e-05, -1.4252960681915283e-05, -1.1013820767402649e-05, -7.774680852890015e-06, -4.53554093837738e-06, -1.296401023864746e-06, 1.942738890647888e-06, 5.1818788051605225e-06, 8.421018719673157e-06, 1.1660158634185791e-05, 1.4899298548698425e-05, 1.813843846321106e-05, 2.1377578377723694e-05, 2.4616718292236328e-05, 2.7855858206748962e-05, 3.10949981212616e-05, 3.433413803577423e-05, 3.7573277950286865e-05, 4.08124178647995e-05, 4.4051557779312134e-05, 4.729069769382477e-05, 5.05298376083374e-05, 5.376897752285004e-05, 5.700811743736267e-05, 6.0247257351875305e-05, 6.348639726638794e-05, 6.672553718090057e-05, 6.996467709541321e-05, 7.320381700992584e-05, 7.644295692443848e-05, 7.968209683895111e-05, 8.292123675346375e-05, 8.616037666797638e-05, 8.939951658248901e-05, 9.263865649700165e-05, 9.587779641151428e-05, 9.911693632602692e-05, 0.00010235607624053955, 0.00010559521615505219, 0.00010883435606956482, 0.00011207349598407745, 0.00011531263589859009, 0.00011855177581310272, 0.00012179091572761536, 0.000125030055642128, 0.00012826919555664062]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 9.0, 11.0, 19.0, 49.0, 78.0, 138.0, 257.0, 674.0, 1788.0, 6105.0, 25007.0, 193308.0, 761639.0, 45007.0, 10051.0, 2749.0, 875.0, 385.0, 161.0, 95.0, 43.0, 35.0, 15.0, 16.0, 14.0, 6.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1688232421875, -0.1626129150390625, -0.156402587890625, -0.1501922607421875, -0.14398193359375, -0.1377716064453125, -0.131561279296875, -0.1253509521484375, -0.119140625, -0.1129302978515625, -0.106719970703125, -0.1005096435546875, -0.09429931640625, -0.0880889892578125, -0.081878662109375, -0.0756683349609375, -0.0694580078125, -0.0632476806640625, -0.057037353515625, -0.0508270263671875, -0.04461669921875, -0.0384063720703125, -0.032196044921875, -0.0259857177734375, -0.019775390625, -0.0135650634765625, -0.007354736328125, -0.0011444091796875, 0.00506591796875, 0.0112762451171875, 0.017486572265625, 0.0236968994140625, 0.0299072265625, 0.0361175537109375, 0.042327880859375, 0.0485382080078125, 0.05474853515625, 0.0609588623046875, 0.067169189453125, 0.0733795166015625, 0.07958984375, 0.0858001708984375, 0.092010498046875, 0.0982208251953125, 0.10443115234375, 0.1106414794921875, 0.116851806640625, 0.1230621337890625, 0.1292724609375, 0.1354827880859375, 0.141693115234375, 0.1479034423828125, 0.15411376953125, 0.1603240966796875, 0.166534423828125, 0.1727447509765625, 0.178955078125, 0.1851654052734375, 0.191375732421875, 0.1975860595703125, 0.20379638671875, 0.2100067138671875, 0.216217041015625, 0.2224273681640625, 0.2286376953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 6.0, 10.0, 10.0, 10.0, 19.0, 20.0, 28.0, 41.0, 95.0, 204.0, 268.0, 116.0, 48.0, 33.0, 22.0, 18.0, 13.0, 4.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12445068359375, -0.1200418472290039, -0.11563301086425781, -0.11122417449951172, -0.10681533813476562, -0.10240650177001953, -0.09799766540527344, -0.09358882904052734, -0.08917999267578125, -0.08477115631103516, -0.08036231994628906, -0.07595348358154297, -0.07154464721679688, -0.06713581085205078, -0.06272697448730469, -0.058318138122558594, -0.0539093017578125, -0.049500465393066406, -0.04509162902832031, -0.04068279266357422, -0.036273956298828125, -0.03186511993408203, -0.027456283569335938, -0.023047447204589844, -0.01863861083984375, -0.014229774475097656, -0.009820938110351562, -0.005412101745605469, -0.001003265380859375, 0.0034055709838867188, 0.007814407348632812, 0.012223243713378906, 0.016632080078125, 0.021040916442871094, 0.025449752807617188, 0.02985858917236328, 0.034267425537109375, 0.03867626190185547, 0.04308509826660156, 0.047493934631347656, 0.05190277099609375, 0.056311607360839844, 0.06072044372558594, 0.06512928009033203, 0.06953811645507812, 0.07394695281982422, 0.07835578918457031, 0.0827646255493164, 0.0871734619140625, 0.0915822982788086, 0.09599113464355469, 0.10039997100830078, 0.10480880737304688, 0.10921764373779297, 0.11362648010253906, 0.11803531646728516, 0.12244415283203125, 0.12685298919677734, 0.13126182556152344, 0.13567066192626953, 0.14007949829101562, 0.14448833465576172, 0.1488971710205078, 0.1533060073852539, 0.15771484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 16.0, 24.0, 46.0, 68.0, 109.0, 151.0, 162.0, 153.0, 111.0, 72.0, 37.0, 24.0, 19.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6694378852844238, -1.613257646560669, -1.5570772886276245, -1.50089693069458, -1.4447166919708252, -1.3885364532470703, -1.3323560953140259, -1.2761757373809814, -1.2199954986572266, -1.1638152599334717, -1.1076349020004272, -1.0514545440673828, -0.9952743053436279, -0.9390940070152283, -0.8829137086868286, -0.826733410358429, -0.7705531120300293, -0.7143728137016296, -0.65819251537323, -0.6020122170448303, -0.5458319187164307, -0.489651620388031, -0.43347132205963135, -0.3772910237312317, -0.32111072540283203, -0.2649304270744324, -0.20875012874603271, -0.15256983041763306, -0.0963895320892334, -0.04020923376083374, 0.015971064567565918, 0.07215136289596558, 0.12833166122436523, 0.1845119595527649, 0.24069225788116455, 0.2968725562095642, 0.35305285453796387, 0.4092331528663635, 0.4654134511947632, 0.5215937495231628, 0.5777740478515625, 0.6339543461799622, 0.6901346445083618, 0.7463149428367615, 0.8024952411651611, 0.8586755394935608, 0.9148558378219604, 0.9710361361503601, 1.0272164344787598, 1.0833966732025146, 1.139577031135559, 1.1957573890686035, 1.2519376277923584, 1.3081178665161133, 1.3642982244491577, 1.4204785823822021, 1.476658821105957, 1.532839059829712, 1.5890194177627563, 1.6451997756958008, 1.7013800144195557, 1.7575602531433105, 1.813740611076355, 1.8699209690093994, 1.9261012077331543]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 5.0, 6.0, 11.0, 8.0, 12.0, 16.0, 13.0, 14.0, 25.0, 13.0, 30.0, 34.0, 26.0, 42.0, 47.0, 28.0, 48.0, 44.0, 38.0, 39.0, 36.0, 37.0, 32.0, 37.0, 43.0, 34.0, 32.0, 38.0, 37.0, 28.0, 23.0, 14.0, 14.0, 12.0, 16.0, 8.0, 7.0, 7.0, 5.0, 5.0, 9.0, 7.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6811830997467041, -0.6585243344306946, -0.6358655691146851, -0.6132067441940308, -0.5905479788780212, -0.5678892135620117, -0.5452304482460022, -0.5225716829299927, -0.4999128580093384, -0.47725409269332886, -0.45459529757499695, -0.4319365322589874, -0.4092777371406555, -0.386618971824646, -0.3639602065086365, -0.34130141139030457, -0.31864264607429504, -0.2959838807582855, -0.2733250856399536, -0.2506663203239441, -0.22800752520561218, -0.20534875988960266, -0.18268997967243195, -0.16003119945526123, -0.13737241923809052, -0.1147136390209198, -0.09205485880374908, -0.06939608603715897, -0.04673730581998825, -0.024078525602817535, -0.001419752836227417, 0.0212390273809433, 0.043897807598114014, 0.06655658781528473, 0.08921536803245544, 0.11187414079904556, 0.13453292846679688, 0.1571916937828064, 0.1798504739999771, 0.20250925421714783, 0.22516803443431854, 0.24782681465148926, 0.2704855799674988, 0.2931443750858307, 0.3158031404018402, 0.3384619355201721, 0.36112070083618164, 0.38377946615219116, 0.40643826127052307, 0.4290970265865326, 0.4517558217048645, 0.474414587020874, 0.49707338213920593, 0.5197321772575378, 0.5423909425735474, 0.5650497078895569, 0.5877084732055664, 0.6103672385215759, 0.6330260038375854, 0.6556848287582397, 0.6783435940742493, 0.7010023593902588, 0.7236611247062683, 0.7463198900222778, 0.7689787149429321]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 9.0, 7.0, 5.0, 10.0, 12.0, 25.0, 41.0, 61.0, 84.0, 150.0, 220.0, 419.0, 705.0, 1297.0, 2507.0, 5485.0, 12456.0, 32201.0, 102577.0, 647832.0, 3116068.0, 189085.0, 50267.0, 18040.0, 7606.0, 3413.0, 1641.0, 826.0, 486.0, 279.0, 155.0, 114.0, 60.0, 45.0, 32.0, 21.0, 15.0, 10.0, 6.0, 3.0, 1.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17919921875, -0.17284584045410156, -0.16649246215820312, -0.1601390838623047, -0.15378570556640625, -0.1474323272705078, -0.14107894897460938, -0.13472557067871094, -0.1283721923828125, -0.12201881408691406, -0.11566543579101562, -0.10931205749511719, -0.10295867919921875, -0.09660530090332031, -0.09025192260742188, -0.08389854431152344, -0.077545166015625, -0.07119178771972656, -0.06483840942382812, -0.05848503112792969, -0.05213165283203125, -0.04577827453613281, -0.039424896240234375, -0.03307151794433594, -0.0267181396484375, -0.020364761352539062, -0.014011383056640625, -0.0076580047607421875, -0.00130462646484375, 0.0050487518310546875, 0.011402130126953125, 0.017755508422851562, 0.02410888671875, 0.030462265014648438, 0.036815643310546875, 0.04316902160644531, 0.04952239990234375, 0.05587577819824219, 0.062229156494140625, 0.06858253479003906, 0.0749359130859375, 0.08128929138183594, 0.08764266967773438, 0.09399604797363281, 0.10034942626953125, 0.10670280456542969, 0.11305618286132812, 0.11940956115722656, 0.125762939453125, 0.13211631774902344, 0.13846969604492188, 0.1448230743408203, 0.15117645263671875, 0.1575298309326172, 0.16388320922851562, 0.17023658752441406, 0.1765899658203125, 0.18294334411621094, 0.18929672241210938, 0.1956501007080078, 0.20200347900390625, 0.2083568572998047, 0.21471023559570312, 0.22106361389160156, 0.2274169921875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 1.0, 4.0, 9.0, 8.0, 14.0, 34.0, 29.0, 20.0, 33.0, 33.0, 40.0, 52.0, 49.0, 44.0, 67.0, 64.0, 50.0, 50.0, 70.0, 45.0, 54.0, 49.0, 27.0, 39.0, 30.0, 18.0, 19.0, 10.0, 6.0, 5.0, 6.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05169677734375, -0.05021381378173828, -0.04873085021972656, -0.047247886657714844, -0.045764923095703125, -0.044281959533691406, -0.04279899597167969, -0.04131603240966797, -0.03983306884765625, -0.03835010528564453, -0.03686714172363281, -0.035384178161621094, -0.033901214599609375, -0.032418251037597656, -0.030935287475585938, -0.02945232391357422, -0.0279693603515625, -0.02648639678955078, -0.025003433227539062, -0.023520469665527344, -0.022037506103515625, -0.020554542541503906, -0.019071578979492188, -0.01758861541748047, -0.01610565185546875, -0.014622688293457031, -0.013139724731445312, -0.011656761169433594, -0.010173797607421875, -0.008690834045410156, -0.0072078704833984375, -0.005724906921386719, -0.004241943359375, -0.0027589797973632812, -0.0012760162353515625, 0.00020694732666015625, 0.001689910888671875, 0.0031728744506835938, 0.0046558380126953125, 0.006138801574707031, 0.00762176513671875, 0.009104728698730469, 0.010587692260742188, 0.012070655822753906, 0.013553619384765625, 0.015036582946777344, 0.016519546508789062, 0.01800251007080078, 0.0194854736328125, 0.02096843719482422, 0.022451400756835938, 0.023934364318847656, 0.025417327880859375, 0.026900291442871094, 0.028383255004882812, 0.02986621856689453, 0.03134918212890625, 0.03283214569091797, 0.03431510925292969, 0.035798072814941406, 0.037281036376953125, 0.038763999938964844, 0.04024696350097656, 0.04172992706298828, 0.043212890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 8.0, 9.0, 10.0, 16.0, 13.0, 26.0, 44.0, 51.0, 85.0, 138.0, 182.0, 357.0, 541.0, 997.0, 1836.0, 3720.0, 8046.0, 18878.0, 54172.0, 206317.0, 2921042.0, 792066.0, 121942.0, 36944.0, 14187.0, 6116.0, 2859.0, 1525.0, 869.0, 478.0, 286.0, 156.0, 115.0, 75.0, 65.0, 32.0, 18.0, 13.0, 14.0, 9.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.25, -0.2423839569091797, -0.23476791381835938, -0.22715187072753906, -0.21953582763671875, -0.21191978454589844, -0.20430374145507812, -0.1966876983642578, -0.1890716552734375, -0.1814556121826172, -0.17383956909179688, -0.16622352600097656, -0.15860748291015625, -0.15099143981933594, -0.14337539672851562, -0.1357593536376953, -0.128143310546875, -0.12052726745605469, -0.11291122436523438, -0.10529518127441406, -0.09767913818359375, -0.09006309509277344, -0.08244705200195312, -0.07483100891113281, -0.0672149658203125, -0.05959892272949219, -0.051982879638671875, -0.04436683654785156, -0.03675079345703125, -0.029134750366210938, -0.021518707275390625, -0.013902664184570312, -0.00628662109375, 0.0013294219970703125, 0.008945465087890625, 0.016561508178710938, 0.02417755126953125, 0.03179359436035156, 0.039409637451171875, 0.04702568054199219, 0.0546417236328125, 0.06225776672363281, 0.06987380981445312, 0.07748985290527344, 0.08510589599609375, 0.09272193908691406, 0.10033798217773438, 0.10795402526855469, 0.115570068359375, 0.12318611145019531, 0.13080215454101562, 0.13841819763183594, 0.14603424072265625, 0.15365028381347656, 0.16126632690429688, 0.1688823699951172, 0.1764984130859375, 0.1841144561767578, 0.19173049926757812, 0.19934654235839844, 0.20696258544921875, 0.21457862854003906, 0.22219467163085938, 0.2298107147216797, 0.2374267578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 6.0, 7.0, 13.0, 22.0, 26.0, 49.0, 61.0, 105.0, 181.0, 310.0, 924.0, 1484.0, 348.0, 180.0, 119.0, 62.0, 45.0, 33.0, 18.0, 17.0, 13.0, 15.0, 7.0, 4.0, 2.0, 1.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1365966796875, -0.13291549682617188, -0.12923431396484375, -0.12555313110351562, -0.1218719482421875, -0.11819076538085938, -0.11450958251953125, -0.11082839965820312, -0.107147216796875, -0.10346603393554688, -0.09978485107421875, -0.09610366821289062, -0.0924224853515625, -0.08874130249023438, -0.08506011962890625, -0.08137893676757812, -0.07769775390625, -0.07401657104492188, -0.07033538818359375, -0.06665420532226562, -0.0629730224609375, -0.059291839599609375, -0.05561065673828125, -0.051929473876953125, -0.048248291015625, -0.044567108154296875, -0.04088592529296875, -0.037204742431640625, -0.0335235595703125, -0.029842376708984375, -0.02616119384765625, -0.022480010986328125, -0.018798828125, -0.015117645263671875, -0.01143646240234375, -0.007755279541015625, -0.0040740966796875, -0.000392913818359375, 0.00328826904296875, 0.006969451904296875, 0.010650634765625, 0.014331817626953125, 0.01801300048828125, 0.021694183349609375, 0.0253753662109375, 0.029056549072265625, 0.03273773193359375, 0.036418914794921875, 0.04010009765625, 0.043781280517578125, 0.04746246337890625, 0.051143646240234375, 0.0548248291015625, 0.058506011962890625, 0.06218719482421875, 0.06586837768554688, 0.069549560546875, 0.07323074340820312, 0.07691192626953125, 0.08059310913085938, 0.0842742919921875, 0.08795547485351562, 0.09163665771484375, 0.09531784057617188, 0.0989990234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 21.0, 32.0, 64.0, 101.0, 110.0, 144.0, 143.0, 115.0, 100.0, 68.0, 41.0, 25.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9159307479858398, -0.8875405788421631, -0.8591504693031311, -0.8307603001594543, -0.8023701906204224, -0.7739800214767456, -0.7455899119377136, -0.7171997427940369, -0.6888096332550049, -0.6604194641113281, -0.6320293545722961, -0.6036391854286194, -0.5752490758895874, -0.5468589067459106, -0.5184687972068787, -0.4900786280632019, -0.46168848872184753, -0.43329834938049316, -0.4049082100391388, -0.3765180706977844, -0.34812793135643005, -0.3197377920150757, -0.2913476228713989, -0.26295751333236694, -0.23456735908985138, -0.206177219748497, -0.17778708040714264, -0.14939692616462708, -0.1210067942738533, -0.09261664748191833, -0.06422650814056396, -0.035836368799209595, -0.007446229457855225, 0.020943911746144295, 0.049334052950143814, 0.07772419601678848, 0.10611433535814285, 0.13450448215007782, 0.1628946214914322, 0.19128476083278656, 0.21967490017414093, 0.2480650395154953, 0.27645519375801086, 0.30484533309936523, 0.3332354724407196, 0.361625611782074, 0.39001575112342834, 0.4184058904647827, 0.4467960298061371, 0.47518616914749146, 0.5035763382911682, 0.5319664478302002, 0.560356616973877, 0.5887467265129089, 0.6171368956565857, 0.6455270051956177, 0.6739171743392944, 0.7023073434829712, 0.7306974530220032, 0.7590876221656799, 0.7874777317047119, 0.8158679008483887, 0.8442580103874207, 0.8726481795310974, 0.9010382890701294]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 3.0, 4.0, 3.0, 9.0, 4.0, 6.0, 9.0, 10.0, 15.0, 19.0, 19.0, 30.0, 24.0, 30.0, 24.0, 34.0, 45.0, 41.0, 43.0, 32.0, 45.0, 24.0, 51.0, 58.0, 42.0, 42.0, 35.0, 38.0, 40.0, 32.0, 35.0, 30.0, 16.0, 15.0, 16.0, 14.0, 11.0, 13.0, 9.0, 8.0, 7.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.33580803871154785, -0.3247198462486267, -0.31363165378570557, -0.30254343152046204, -0.2914552390575409, -0.28036704659461975, -0.2692788243293762, -0.2581906318664551, -0.24710243940353394, -0.2360142469406128, -0.22492603957653046, -0.21383783221244812, -0.20274963974952698, -0.19166144728660583, -0.1805732399225235, -0.16948503255844116, -0.15839684009552002, -0.14730864763259888, -0.13622044026851654, -0.1251322329044342, -0.11404404044151306, -0.10295584052801132, -0.09186764061450958, -0.08077944070100784, -0.0696912407875061, -0.058603040874004364, -0.047514840960502625, -0.036426641047000885, -0.025338441133499146, -0.014250241219997406, -0.0031620413064956665, 0.007926158607006073, 0.019014358520507812, 0.030102558434009552, 0.04119075834751129, 0.05227895826101303, 0.06336715817451477, 0.07445535808801651, 0.08554355800151825, 0.09663175791501999, 0.10771995782852173, 0.11880815774202347, 0.1298963576555252, 0.14098456501960754, 0.1520727574825287, 0.16316094994544983, 0.17424915730953217, 0.1853373646736145, 0.19642555713653564, 0.2075137495994568, 0.21860195696353912, 0.22969016432762146, 0.2407783567905426, 0.25186654925346375, 0.2629547715187073, 0.2740429639816284, 0.28513115644454956, 0.2962193489074707, 0.30730754137039185, 0.3183957636356354, 0.3294839560985565, 0.34057214856147766, 0.3516603708267212, 0.36274856328964233, 0.3738367557525635]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 9.0, 8.0, 14.0, 18.0, 21.0, 32.0, 53.0, 80.0, 127.0, 181.0, 328.0, 539.0, 938.0, 1753.0, 3229.0, 6028.0, 11405.0, 21016.0, 39181.0, 69437.0, 124418.0, 244205.0, 245380.0, 124887.0, 69977.0, 39148.0, 21332.0, 11461.0, 6215.0, 3103.0, 1700.0, 914.0, 530.0, 324.0, 174.0, 128.0, 89.0, 48.0, 41.0, 28.0, 17.0, 16.0, 12.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.1279296875, -0.12416744232177734, -0.12040519714355469, -0.11664295196533203, -0.11288070678710938, -0.10911846160888672, -0.10535621643066406, -0.1015939712524414, -0.09783172607421875, -0.0940694808959961, -0.09030723571777344, -0.08654499053955078, -0.08278274536132812, -0.07902050018310547, -0.07525825500488281, -0.07149600982666016, -0.0677337646484375, -0.06397151947021484, -0.06020927429199219, -0.05644702911376953, -0.052684783935546875, -0.04892253875732422, -0.04516029357910156, -0.041398048400878906, -0.03763580322265625, -0.033873558044433594, -0.030111312866210938, -0.02634906768798828, -0.022586822509765625, -0.01882457733154297, -0.015062332153320312, -0.011300086975097656, -0.007537841796875, -0.0037755966186523438, -1.33514404296875e-05, 0.0037488937377929688, 0.007511138916015625, 0.011273384094238281, 0.015035629272460938, 0.018797874450683594, 0.02256011962890625, 0.026322364807128906, 0.030084609985351562, 0.03384685516357422, 0.037609100341796875, 0.04137134552001953, 0.04513359069824219, 0.048895835876464844, 0.0526580810546875, 0.056420326232910156, 0.06018257141113281, 0.06394481658935547, 0.06770706176757812, 0.07146930694580078, 0.07523155212402344, 0.0789937973022461, 0.08275604248046875, 0.0865182876586914, 0.09028053283691406, 0.09404277801513672, 0.09780502319335938, 0.10156726837158203, 0.10532951354980469, 0.10909175872802734, 0.11285400390625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 11.0, 13.0, 11.0, 15.0, 13.0, 18.0, 29.0, 32.0, 35.0, 36.0, 31.0, 41.0, 40.0, 53.0, 57.0, 43.0, 55.0, 66.0, 50.0, 43.0, 46.0, 36.0, 29.0, 26.0, 29.0, 27.0, 27.0, 11.0, 13.0, 14.0, 10.0, 4.0, 6.0, 6.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0511474609375, -0.04968118667602539, -0.04821491241455078, -0.04674863815307617, -0.04528236389160156, -0.04381608963012695, -0.042349815368652344, -0.040883541107177734, -0.039417266845703125, -0.037950992584228516, -0.036484718322753906, -0.0350184440612793, -0.03355216979980469, -0.03208589553833008, -0.03061962127685547, -0.02915334701538086, -0.02768707275390625, -0.02622079849243164, -0.02475452423095703, -0.023288249969482422, -0.021821975708007812, -0.020355701446533203, -0.018889427185058594, -0.017423152923583984, -0.015956878662109375, -0.014490604400634766, -0.013024330139160156, -0.011558055877685547, -0.010091781616210938, -0.008625507354736328, -0.007159233093261719, -0.005692958831787109, -0.0042266845703125, -0.0027604103088378906, -0.0012941360473632812, 0.00017213821411132812, 0.0016384124755859375, 0.003104686737060547, 0.004570960998535156, 0.006037235260009766, 0.007503509521484375, 0.008969783782958984, 0.010436058044433594, 0.011902332305908203, 0.013368606567382812, 0.014834880828857422, 0.01630115509033203, 0.01776742935180664, 0.01923370361328125, 0.02069997787475586, 0.02216625213623047, 0.023632526397705078, 0.025098800659179688, 0.026565074920654297, 0.028031349182128906, 0.029497623443603516, 0.030963897705078125, 0.032430171966552734, 0.033896446228027344, 0.03536272048950195, 0.03682899475097656, 0.03829526901245117, 0.03976154327392578, 0.04122781753540039, 0.042694091796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 9.0, 29.0, 25.0, 25.0, 41.0, 54.0, 87.0, 108.0, 161.0, 235.0, 311.0, 473.0, 833.0, 1602.0, 4506.0, 20114.0, 109364.0, 605977.0, 244796.0, 45561.0, 8749.0, 2484.0, 1075.0, 612.0, 401.0, 268.0, 171.0, 133.0, 92.0, 62.0, 55.0, 31.0, 28.0, 11.0, 14.0, 11.0, 8.0, 4.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.315673828125, -0.3057289123535156, -0.29578399658203125, -0.2858390808105469, -0.2758941650390625, -0.2659492492675781, -0.25600433349609375, -0.24605941772460938, -0.236114501953125, -0.22616958618164062, -0.21622467041015625, -0.20627975463867188, -0.1963348388671875, -0.18638992309570312, -0.17644500732421875, -0.16650009155273438, -0.15655517578125, -0.14661026000976562, -0.13666534423828125, -0.12672042846679688, -0.1167755126953125, -0.10683059692382812, -0.09688568115234375, -0.08694076538085938, -0.076995849609375, -0.06705093383789062, -0.05710601806640625, -0.047161102294921875, -0.0372161865234375, -0.027271270751953125, -0.01732635498046875, -0.007381439208984375, 0.0025634765625, 0.012508392333984375, 0.02245330810546875, 0.032398223876953125, 0.0423431396484375, 0.052288055419921875, 0.06223297119140625, 0.07217788696289062, 0.082122802734375, 0.09206771850585938, 0.10201263427734375, 0.11195755004882812, 0.1219024658203125, 0.13184738159179688, 0.14179229736328125, 0.15173721313476562, 0.16168212890625, 0.17162704467773438, 0.18157196044921875, 0.19151687622070312, 0.2014617919921875, 0.21140670776367188, 0.22135162353515625, 0.23129653930664062, 0.241241455078125, 0.2511863708496094, 0.26113128662109375, 0.2710762023925781, 0.2810211181640625, 0.2909660339355469, 0.30091094970703125, 0.3108558654785156, 0.32080078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 9.0, 9.0, 9.0, 19.0, 16.0, 19.0, 24.0, 28.0, 25.0, 32.0, 49.0, 41.0, 46.0, 46.0, 59.0, 43.0, 57.0, 58.0, 46.0, 58.0, 54.0, 33.0, 28.0, 28.0, 23.0, 18.0, 22.0, 18.0, 16.0, 10.0, 6.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.253662109375, -0.2463550567626953, -0.23904800415039062, -0.23174095153808594, -0.22443389892578125, -0.21712684631347656, -0.20981979370117188, -0.2025127410888672, -0.1952056884765625, -0.1878986358642578, -0.18059158325195312, -0.17328453063964844, -0.16597747802734375, -0.15867042541503906, -0.15136337280273438, -0.1440563201904297, -0.136749267578125, -0.1294422149658203, -0.12213516235351562, -0.11482810974121094, -0.10752105712890625, -0.10021400451660156, -0.09290695190429688, -0.08559989929199219, -0.0782928466796875, -0.07098579406738281, -0.06367874145507812, -0.05637168884277344, -0.04906463623046875, -0.04175758361816406, -0.034450531005859375, -0.027143478393554688, -0.01983642578125, -0.012529373168945312, -0.005222320556640625, 0.0020847320556640625, 0.00939178466796875, 0.016698837280273438, 0.024005889892578125, 0.03131294250488281, 0.0386199951171875, 0.04592704772949219, 0.053234100341796875, 0.06054115295410156, 0.06784820556640625, 0.07515525817871094, 0.08246231079101562, 0.08976936340332031, 0.097076416015625, 0.10438346862792969, 0.11169052124023438, 0.11899757385253906, 0.12630462646484375, 0.13361167907714844, 0.14091873168945312, 0.1482257843017578, 0.1555328369140625, 0.1628398895263672, 0.17014694213867188, 0.17745399475097656, 0.18476104736328125, 0.19206809997558594, 0.19937515258789062, 0.2066822052001953, 0.2139892578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 6.0, 5.0, 6.0, 10.0, 22.0, 17.0, 22.0, 48.0, 77.0, 131.0, 180.0, 324.0, 627.0, 1199.0, 2640.0, 6579.0, 20433.0, 84140.0, 476590.0, 355924.0, 71258.0, 17546.0, 5820.0, 2329.0, 1183.0, 591.0, 322.0, 180.0, 127.0, 76.0, 37.0, 30.0, 29.0, 12.0, 7.0, 7.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1700439453125, -0.1647205352783203, -0.15939712524414062, -0.15407371520996094, -0.14875030517578125, -0.14342689514160156, -0.13810348510742188, -0.1327800750732422, -0.1274566650390625, -0.12213325500488281, -0.11680984497070312, -0.11148643493652344, -0.10616302490234375, -0.10083961486816406, -0.09551620483398438, -0.09019279479980469, -0.084869384765625, -0.07954597473144531, -0.07422256469726562, -0.06889915466308594, -0.06357574462890625, -0.05825233459472656, -0.052928924560546875, -0.04760551452636719, -0.0422821044921875, -0.03695869445800781, -0.031635284423828125, -0.026311874389648438, -0.02098846435546875, -0.015665054321289062, -0.010341644287109375, -0.0050182342529296875, 0.00030517578125, 0.0056285858154296875, 0.010951995849609375, 0.016275405883789062, 0.02159881591796875, 0.026922225952148438, 0.032245635986328125, 0.03756904602050781, 0.0428924560546875, 0.04821586608886719, 0.053539276123046875, 0.05886268615722656, 0.06418609619140625, 0.06950950622558594, 0.07483291625976562, 0.08015632629394531, 0.085479736328125, 0.09080314636230469, 0.09612655639648438, 0.10144996643066406, 0.10677337646484375, 0.11209678649902344, 0.11742019653320312, 0.12274360656738281, 0.1280670166015625, 0.1333904266357422, 0.13871383666992188, 0.14403724670410156, 0.14936065673828125, 0.15468406677246094, 0.16000747680664062, 0.1653308868408203, 0.170654296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 1.0, 2.0, 5.0, 4.0, 12.0, 13.0, 22.0, 20.0, 29.0, 33.0, 56.0, 73.0, 89.0, 98.0, 108.0, 102.0, 78.0, 80.0, 44.0, 28.0, 32.0, 19.0, 18.0, 12.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.177757263183594e-05, -7.812492549419403e-05, -7.447227835655212e-05, -7.081963121891022e-05, -6.716698408126831e-05, -6.35143369436264e-05, -5.98616898059845e-05, -5.620904266834259e-05, -5.2556395530700684e-05, -4.890374839305878e-05, -4.525110125541687e-05, -4.159845411777496e-05, -3.794580698013306e-05, -3.429315984249115e-05, -3.064051270484924e-05, -2.6987865567207336e-05, -2.333521842956543e-05, -1.9682571291923523e-05, -1.6029924154281616e-05, -1.237727701663971e-05, -8.724629878997803e-06, -5.071982741355896e-06, -1.4193356037139893e-06, 2.2333115339279175e-06, 5.885958671569824e-06, 9.538605809211731e-06, 1.3191252946853638e-05, 1.6843900084495544e-05, 2.049654722213745e-05, 2.4149194359779358e-05, 2.7801841497421265e-05, 3.145448863506317e-05, 3.510713577270508e-05, 3.8759782910346985e-05, 4.241243004798889e-05, 4.60650771856308e-05, 4.9717724323272705e-05, 5.337037146091461e-05, 5.702301859855652e-05, 6.0675665736198425e-05, 6.432831287384033e-05, 6.798096001148224e-05, 7.163360714912415e-05, 7.528625428676605e-05, 7.893890142440796e-05, 8.259154856204987e-05, 8.624419569969177e-05, 8.989684283733368e-05, 9.354948997497559e-05, 9.720213711261749e-05, 0.0001008547842502594, 0.0001045074313879013, 0.00010816007852554321, 0.00011181272566318512, 0.00011546537280082703, 0.00011911801993846893, 0.00012277066707611084, 0.00012642331421375275, 0.00013007596135139465, 0.00013372860848903656, 0.00013738125562667847, 0.00014103390276432037, 0.00014468654990196228, 0.0001483391970396042, 0.0001519918441772461]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 10.0, 3.0, 19.0, 20.0, 31.0, 62.0, 70.0, 122.0, 179.0, 336.0, 617.0, 1425.0, 3948.0, 16633.0, 106360.0, 676025.0, 204504.0, 28449.0, 5963.0, 1938.0, 811.0, 417.0, 234.0, 119.0, 78.0, 58.0, 41.0, 15.0, 10.0, 12.0, 9.0, 3.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2337646484375, -0.2266063690185547, -0.21944808959960938, -0.21228981018066406, -0.20513153076171875, -0.19797325134277344, -0.19081497192382812, -0.1836566925048828, -0.1764984130859375, -0.1693401336669922, -0.16218185424804688, -0.15502357482910156, -0.14786529541015625, -0.14070701599121094, -0.13354873657226562, -0.1263904571533203, -0.119232177734375, -0.11207389831542969, -0.10491561889648438, -0.09775733947753906, -0.09059906005859375, -0.08344078063964844, -0.07628250122070312, -0.06912422180175781, -0.0619659423828125, -0.05480766296386719, -0.047649383544921875, -0.04049110412597656, -0.03333282470703125, -0.026174545288085938, -0.019016265869140625, -0.011857986450195312, -0.00469970703125, 0.0024585723876953125, 0.009616851806640625, 0.016775131225585938, 0.02393341064453125, 0.031091690063476562, 0.038249969482421875, 0.04540824890136719, 0.0525665283203125, 0.05972480773925781, 0.06688308715820312, 0.07404136657714844, 0.08119964599609375, 0.08835792541503906, 0.09551620483398438, 0.10267448425292969, 0.109832763671875, 0.11699104309082031, 0.12414932250976562, 0.13130760192871094, 0.13846588134765625, 0.14562416076660156, 0.15278244018554688, 0.1599407196044922, 0.1670989990234375, 0.1742572784423828, 0.18141555786132812, 0.18857383728027344, 0.19573211669921875, 0.20289039611816406, 0.21004867553710938, 0.2172069549560547, 0.224365234375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 4.0, 4.0, 7.0, 9.0, 14.0, 13.0, 21.0, 21.0, 19.0, 20.0, 25.0, 54.0, 54.0, 80.0, 84.0, 97.0, 85.0, 77.0, 64.0, 45.0, 32.0, 34.0, 25.0, 23.0, 21.0, 15.0, 8.0, 12.0, 7.0, 3.0, 6.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1300048828125, -0.12613773345947266, -0.12227058410644531, -0.11840343475341797, -0.11453628540039062, -0.11066913604736328, -0.10680198669433594, -0.1029348373413086, -0.09906768798828125, -0.0952005386352539, -0.09133338928222656, -0.08746623992919922, -0.08359909057617188, -0.07973194122314453, -0.07586479187011719, -0.07199764251708984, -0.0681304931640625, -0.06426334381103516, -0.06039619445800781, -0.05652904510498047, -0.052661895751953125, -0.04879474639892578, -0.04492759704589844, -0.041060447692871094, -0.03719329833984375, -0.033326148986816406, -0.029458999633789062, -0.02559185028076172, -0.021724700927734375, -0.01785755157470703, -0.013990402221679688, -0.010123252868652344, -0.006256103515625, -0.0023889541625976562, 0.0014781951904296875, 0.005345344543457031, 0.009212493896484375, 0.013079643249511719, 0.016946792602539062, 0.020813941955566406, 0.02468109130859375, 0.028548240661621094, 0.03241539001464844, 0.03628253936767578, 0.040149688720703125, 0.04401683807373047, 0.04788398742675781, 0.051751136779785156, 0.0556182861328125, 0.059485435485839844, 0.06335258483886719, 0.06721973419189453, 0.07108688354492188, 0.07495403289794922, 0.07882118225097656, 0.0826883316040039, 0.08655548095703125, 0.0904226303100586, 0.09428977966308594, 0.09815692901611328, 0.10202407836914062, 0.10589122772216797, 0.10975837707519531, 0.11362552642822266, 0.11749267578125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 17.0, 61.0, 104.0, 174.0, 193.0, 195.0, 133.0, 70.0, 35.0, 10.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.692439556121826, -4.590233325958252, -4.4880266189575195, -4.385820388793945, -4.283614158630371, -4.181407451629639, -4.0792012214660645, -3.976994752883911, -3.874788284301758, -3.7725818157196045, -3.670375347137451, -3.568169116973877, -3.4659626483917236, -3.3637561798095703, -3.261549949645996, -3.1593434810638428, -3.0571370124816895, -2.954930543899536, -2.852724075317383, -2.7505178451538086, -2.6483113765716553, -2.546104907989502, -2.4438986778259277, -2.3416922092437744, -2.239485740661621, -2.1372792720794678, -2.0350728034973145, -1.9328665733337402, -1.830660104751587, -1.7284536361694336, -1.6262472867965698, -1.524040937423706, -1.4218345880508423, -1.3196282386779785, -1.2174217700958252, -1.1152153015136719, -1.013008952140808, -0.9108025431632996, -0.808596134185791, -0.7063897252082825, -0.6041833162307739, -0.5019769072532654, -0.39977049827575684, -0.2975640892982483, -0.19535768032073975, -0.0931512713432312, 0.009055137634277344, 0.11126154661178589, 0.21346795558929443, 0.315674364566803, 0.4178807735443115, 0.5200871825218201, 0.6222935914993286, 0.7245000004768372, 0.8267064094543457, 0.9289128184318542, 1.0311192274093628, 1.1333255767822266, 1.2355320453643799, 1.3377385139465332, 1.439944863319397, 1.5421512126922607, 1.644357681274414, 1.7465641498565674, 1.8487704992294312]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 3.0, 1.0, 8.0, 8.0, 8.0, 6.0, 12.0, 13.0, 9.0, 23.0, 25.0, 20.0, 28.0, 23.0, 34.0, 42.0, 42.0, 42.0, 51.0, 50.0, 41.0, 58.0, 41.0, 42.0, 39.0, 40.0, 32.0, 40.0, 43.0, 35.0, 29.0, 20.0, 21.0, 12.0, 14.0, 12.0, 8.0, 5.0, 12.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1537410020828247, -1.1154236793518066, -1.0771063566207886, -1.0387890338897705, -1.0004717111587524, -0.9621543884277344, -0.9238371253013611, -0.885519802570343, -0.847202479839325, -0.8088851571083069, -0.7705678343772888, -0.7322505116462708, -0.6939332485198975, -0.6556159257888794, -0.6172986030578613, -0.5789812803268433, -0.5406639575958252, -0.5023466348648071, -0.46402931213378906, -0.4257120192050934, -0.3873946964740753, -0.34907737374305725, -0.3107600808143616, -0.2724427580833435, -0.23412543535232544, -0.19580811262130737, -0.1574908047914505, -0.11917348951101303, -0.08085617423057556, -0.042538851499557495, -0.0042215436697006226, 0.03409576416015625, 0.07241296768188477, 0.11073028296232224, 0.1490475982427597, 0.18736490607261658, 0.22568222880363464, 0.2639995515346527, 0.3023168444633484, 0.34063416719436646, 0.3789514899253845, 0.4172688126564026, 0.45558613538742065, 0.49390342831611633, 0.532220721244812, 0.5705380439758301, 0.6088553667068481, 0.6471726894378662, 0.6854900121688843, 0.7238073348999023, 0.7621246576309204, 0.8004419803619385, 0.8387593030929565, 0.8770766258239746, 0.9153938889503479, 0.953711211681366, 0.992028534412384, 1.0303457975387573, 1.0686631202697754, 1.1069804430007935, 1.1452977657318115, 1.1836150884628296, 1.2219324111938477, 1.2602497339248657, 1.2985670566558838]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 12.0, 10.0, 25.0, 44.0, 54.0, 75.0, 102.0, 161.0, 280.0, 466.0, 835.0, 1509.0, 3048.0, 6090.0, 14360.0, 36824.0, 122517.0, 795855.0, 2900838.0, 218077.0, 56658.0, 19975.0, 8243.0, 3715.0, 1953.0, 978.0, 600.0, 337.0, 196.0, 133.0, 93.0, 61.0, 37.0, 33.0, 18.0, 22.0, 5.0, 6.0, 3.0, 10.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20751953125, -0.20064544677734375, -0.1937713623046875, -0.18689727783203125, -0.180023193359375, -0.17314910888671875, -0.1662750244140625, -0.15940093994140625, -0.15252685546875, -0.14565277099609375, -0.1387786865234375, -0.13190460205078125, -0.125030517578125, -0.11815643310546875, -0.1112823486328125, -0.10440826416015625, -0.0975341796875, -0.09066009521484375, -0.0837860107421875, -0.07691192626953125, -0.070037841796875, -0.06316375732421875, -0.0562896728515625, -0.04941558837890625, -0.04254150390625, -0.03566741943359375, -0.0287933349609375, -0.02191925048828125, -0.015045166015625, -0.00817108154296875, -0.0012969970703125, 0.00557708740234375, 0.012451171875, 0.01932525634765625, 0.0261993408203125, 0.03307342529296875, 0.039947509765625, 0.04682159423828125, 0.0536956787109375, 0.06056976318359375, 0.06744384765625, 0.07431793212890625, 0.0811920166015625, 0.08806610107421875, 0.094940185546875, 0.10181427001953125, 0.1086883544921875, 0.11556243896484375, 0.1224365234375, 0.12931060791015625, 0.1361846923828125, 0.14305877685546875, 0.149932861328125, 0.15680694580078125, 0.1636810302734375, 0.17055511474609375, 0.17742919921875, 0.18430328369140625, 0.1911773681640625, 0.19805145263671875, 0.204925537109375, 0.21179962158203125, 0.2186737060546875, 0.22554779052734375, 0.232421875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 4.0, 10.0, 11.0, 11.0, 16.0, 14.0, 16.0, 22.0, 19.0, 30.0, 33.0, 27.0, 33.0, 32.0, 35.0, 42.0, 41.0, 35.0, 41.0, 53.0, 30.0, 48.0, 38.0, 39.0, 42.0, 39.0, 33.0, 39.0, 26.0, 18.0, 17.0, 13.0, 20.0, 11.0, 12.0, 10.0, 11.0, 6.0, 9.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.046966552734375, -0.04559326171875, -0.044219970703125, -0.0428466796875, -0.041473388671875, -0.04010009765625, -0.038726806640625, -0.037353515625, -0.035980224609375, -0.03460693359375, -0.033233642578125, -0.0318603515625, -0.030487060546875, -0.02911376953125, -0.027740478515625, -0.0263671875, -0.024993896484375, -0.02362060546875, -0.022247314453125, -0.0208740234375, -0.019500732421875, -0.01812744140625, -0.016754150390625, -0.015380859375, -0.014007568359375, -0.01263427734375, -0.011260986328125, -0.0098876953125, -0.008514404296875, -0.00714111328125, -0.005767822265625, -0.00439453125, -0.003021240234375, -0.00164794921875, -0.000274658203125, 0.0010986328125, 0.002471923828125, 0.00384521484375, 0.005218505859375, 0.006591796875, 0.007965087890625, 0.00933837890625, 0.010711669921875, 0.0120849609375, 0.013458251953125, 0.01483154296875, 0.016204833984375, 0.017578125, 0.018951416015625, 0.02032470703125, 0.021697998046875, 0.0230712890625, 0.024444580078125, 0.02581787109375, 0.027191162109375, 0.028564453125, 0.029937744140625, 0.03131103515625, 0.032684326171875, 0.0340576171875, 0.035430908203125, 0.03680419921875, 0.038177490234375, 0.03955078125, 0.040924072265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 8.0, 13.0, 20.0, 23.0, 29.0, 39.0, 58.0, 85.0, 112.0, 160.0, 238.0, 341.0, 499.0, 831.0, 1289.0, 2094.0, 3852.0, 7056.0, 14072.0, 30398.0, 73995.0, 218197.0, 1228211.0, 2186493.0, 269643.0, 87062.0, 35223.0, 15843.0, 7788.0, 4311.0, 2273.0, 1400.0, 862.0, 537.0, 388.0, 247.0, 176.0, 120.0, 96.0, 47.0, 37.0, 23.0, 26.0, 22.0, 10.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0], "bins": [-0.2239990234375, -0.21722793579101562, -0.21045684814453125, -0.20368576049804688, -0.1969146728515625, -0.19014358520507812, -0.18337249755859375, -0.17660140991210938, -0.169830322265625, -0.16305923461914062, -0.15628814697265625, -0.14951705932617188, -0.1427459716796875, -0.13597488403320312, -0.12920379638671875, -0.12243270874023438, -0.11566162109375, -0.10889053344726562, -0.10211944580078125, -0.09534835815429688, -0.0885772705078125, -0.08180618286132812, -0.07503509521484375, -0.06826400756835938, -0.061492919921875, -0.054721832275390625, -0.04795074462890625, -0.041179656982421875, -0.0344085693359375, -0.027637481689453125, -0.02086639404296875, -0.014095306396484375, -0.00732421875, -0.000553131103515625, 0.00621795654296875, 0.012989044189453125, 0.0197601318359375, 0.026531219482421875, 0.03330230712890625, 0.040073394775390625, 0.046844482421875, 0.053615570068359375, 0.06038665771484375, 0.06715774536132812, 0.0739288330078125, 0.08069992065429688, 0.08747100830078125, 0.09424209594726562, 0.10101318359375, 0.10778427124023438, 0.11455535888671875, 0.12132644653320312, 0.1280975341796875, 0.13486862182617188, 0.14163970947265625, 0.14841079711914062, 0.155181884765625, 0.16195297241210938, 0.16872406005859375, 0.17549514770507812, 0.1822662353515625, 0.18903732299804688, 0.19580841064453125, 0.20257949829101562, 0.2093505859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 5.0, 5.0, 6.0, 19.0, 5.0, 23.0, 24.0, 29.0, 46.0, 67.0, 104.0, 128.0, 223.0, 381.0, 837.0, 1059.0, 354.0, 241.0, 126.0, 110.0, 78.0, 49.0, 32.0, 33.0, 17.0, 8.0, 16.0, 10.0, 9.0, 6.0, 1.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1441650390625, -0.1398029327392578, -0.13544082641601562, -0.13107872009277344, -0.12671661376953125, -0.12235450744628906, -0.11799240112304688, -0.11363029479980469, -0.1092681884765625, -0.10490608215332031, -0.10054397583007812, -0.09618186950683594, -0.09181976318359375, -0.08745765686035156, -0.08309555053710938, -0.07873344421386719, -0.074371337890625, -0.07000923156738281, -0.06564712524414062, -0.06128501892089844, -0.05692291259765625, -0.05256080627441406, -0.048198699951171875, -0.04383659362792969, -0.0394744873046875, -0.03511238098144531, -0.030750274658203125, -0.026388168334960938, -0.02202606201171875, -0.017663955688476562, -0.013301849365234375, -0.008939743041992188, -0.00457763671875, -0.0002155303955078125, 0.004146575927734375, 0.008508682250976562, 0.01287078857421875, 0.017232894897460938, 0.021595001220703125, 0.025957107543945312, 0.0303192138671875, 0.03468132019042969, 0.039043426513671875, 0.04340553283691406, 0.04776763916015625, 0.05212974548339844, 0.056491851806640625, 0.06085395812988281, 0.065216064453125, 0.06957817077636719, 0.07394027709960938, 0.07830238342285156, 0.08266448974609375, 0.08702659606933594, 0.09138870239257812, 0.09575080871582031, 0.1001129150390625, 0.10447502136230469, 0.10883712768554688, 0.11319923400878906, 0.11756134033203125, 0.12192344665527344, 0.12628555297851562, 0.1306476593017578, 0.135009765625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 12.0, 21.0, 32.0, 56.0, 104.0, 145.0, 160.0, 145.0, 123.0, 88.0, 42.0, 38.0, 19.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.285744547843933, -1.2390635013580322, -1.1923824548721313, -1.1457014083862305, -1.0990204811096191, -1.0523394346237183, -1.0056583881378174, -0.9589773416519165, -0.9122962951660156, -0.8656152486801147, -0.8189342021942139, -0.7722532153129578, -0.7255721688270569, -0.678891122341156, -0.6322101354598999, -0.585529088973999, -0.5388480424880981, -0.49216699600219727, -0.4454859793186188, -0.3988049626350403, -0.3521239161491394, -0.3054428696632385, -0.25876185297966003, -0.21208083629608154, -0.16539978981018066, -0.11871875822544098, -0.0720377266407013, -0.02535669505596161, 0.021324336528778076, 0.06800536811351776, 0.11468639969825745, 0.16136741638183594, 0.20804858207702637, 0.25472962856292725, 0.30141064524650574, 0.34809166193008423, 0.3947727084159851, 0.441453754901886, 0.4881347715854645, 0.534815788269043, 0.5814968347549438, 0.6281778812408447, 0.6748589277267456, 0.7215399146080017, 0.7682209610939026, 0.8149020075798035, 0.8615829944610596, 0.9082640409469604, 0.9549450874328613, 1.0016261339187622, 1.048307180404663, 1.094988226890564, 1.1416692733764648, 1.1883502006530762, 1.235031247138977, 1.281712293624878, 1.3283933401107788, 1.3750743865966797, 1.4217554330825806, 1.4684364795684814, 1.5151174068450928, 1.5617984533309937, 1.6084794998168945, 1.6551605463027954, 1.7018415927886963]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 4.0, 8.0, 10.0, 16.0, 18.0, 23.0, 25.0, 25.0, 23.0, 23.0, 30.0, 33.0, 41.0, 40.0, 40.0, 34.0, 44.0, 31.0, 39.0, 33.0, 33.0, 32.0, 34.0, 37.0, 30.0, 28.0, 23.0, 26.0, 19.0, 27.0, 25.0, 16.0, 17.0, 15.0, 16.0, 8.0, 7.0, 9.0, 11.0, 8.0, 9.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.4640202522277832, -0.449476957321167, -0.4349336326122284, -0.4203903377056122, -0.40584704279899597, -0.3913037180900574, -0.37676042318344116, -0.36221712827682495, -0.34767383337020874, -0.33313053846359253, -0.31858721375465393, -0.3040439188480377, -0.2895006239414215, -0.2749572992324829, -0.2604140043258667, -0.2458707094192505, -0.2313273847103119, -0.21678407490253448, -0.20224077999591827, -0.18769747018814087, -0.17315417528152466, -0.15861086547374725, -0.14406755566596985, -0.12952426075935364, -0.11498095095157623, -0.10043764859437943, -0.08589434623718262, -0.07135103642940521, -0.056807734072208405, -0.0422644317150116, -0.027721121907234192, -0.013177819550037384, 0.0013654828071594238, 0.01590878702700138, 0.030452091246843338, 0.044995397329330444, 0.05953869968652725, 0.07408200204372406, 0.08862531185150146, 0.10316861420869827, 0.11771191656589508, 0.13225522637367249, 0.1467985212802887, 0.1613418310880661, 0.1758851408958435, 0.19042843580245972, 0.20497174561023712, 0.21951505541801453, 0.23405835032463074, 0.24860166013240814, 0.26314496994018555, 0.27768826484680176, 0.29223155975341797, 0.3067748546600342, 0.3213181793689728, 0.335861474275589, 0.3504047989845276, 0.3649480938911438, 0.3794914186000824, 0.3940347135066986, 0.4085780084133148, 0.4231213331222534, 0.43766462802886963, 0.45220792293548584, 0.46675121784210205]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 7.0, 3.0, 10.0, 12.0, 15.0, 17.0, 33.0, 46.0, 53.0, 94.0, 135.0, 212.0, 316.0, 487.0, 770.0, 1330.0, 2167.0, 3886.0, 6420.0, 10918.0, 18418.0, 31756.0, 53653.0, 88780.0, 135925.0, 179940.0, 176671.0, 130271.0, 83673.0, 50498.0, 29663.0, 17404.0, 10225.0, 5889.0, 3427.0, 2006.0, 1224.0, 798.0, 466.0, 309.0, 210.0, 118.0, 94.0, 61.0, 34.0, 36.0, 22.0, 17.0, 6.0, 12.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.11029052734375, -0.10694217681884766, -0.10359382629394531, -0.10024547576904297, -0.09689712524414062, -0.09354877471923828, -0.09020042419433594, -0.0868520736694336, -0.08350372314453125, -0.0801553726196289, -0.07680702209472656, -0.07345867156982422, -0.07011032104492188, -0.06676197052001953, -0.06341361999511719, -0.060065269470214844, -0.0567169189453125, -0.053368568420410156, -0.05002021789550781, -0.04667186737060547, -0.043323516845703125, -0.03997516632080078, -0.03662681579589844, -0.033278465270996094, -0.02993011474609375, -0.026581764221191406, -0.023233413696289062, -0.01988506317138672, -0.016536712646484375, -0.013188362121582031, -0.009840011596679688, -0.006491661071777344, -0.003143310546875, 0.00020503997802734375, 0.0035533905029296875, 0.006901741027832031, 0.010250091552734375, 0.013598442077636719, 0.016946792602539062, 0.020295143127441406, 0.02364349365234375, 0.026991844177246094, 0.030340194702148438, 0.03368854522705078, 0.037036895751953125, 0.04038524627685547, 0.04373359680175781, 0.047081947326660156, 0.0504302978515625, 0.053778648376464844, 0.05712699890136719, 0.06047534942626953, 0.06382369995117188, 0.06717205047607422, 0.07052040100097656, 0.0738687515258789, 0.07721710205078125, 0.0805654525756836, 0.08391380310058594, 0.08726215362548828, 0.09061050415039062, 0.09395885467529297, 0.09730720520019531, 0.10065555572509766, 0.10400390625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 5.0, 8.0, 5.0, 16.0, 17.0, 7.0, 15.0, 20.0, 30.0, 21.0, 19.0, 27.0, 31.0, 30.0, 36.0, 36.0, 36.0, 44.0, 40.0, 56.0, 51.0, 46.0, 39.0, 32.0, 44.0, 26.0, 31.0, 26.0, 26.0, 24.0, 21.0, 17.0, 18.0, 7.0, 16.0, 17.0, 10.0, 13.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.046844482421875, -0.045360565185546875, -0.04387664794921875, -0.042392730712890625, -0.0409088134765625, -0.039424896240234375, -0.03794097900390625, -0.036457061767578125, -0.03497314453125, -0.033489227294921875, -0.03200531005859375, -0.030521392822265625, -0.0290374755859375, -0.027553558349609375, -0.02606964111328125, -0.024585723876953125, -0.023101806640625, -0.021617889404296875, -0.02013397216796875, -0.018650054931640625, -0.0171661376953125, -0.015682220458984375, -0.01419830322265625, -0.012714385986328125, -0.01123046875, -0.009746551513671875, -0.00826263427734375, -0.006778717041015625, -0.0052947998046875, -0.003810882568359375, -0.00232696533203125, -0.000843048095703125, 0.000640869140625, 0.002124786376953125, 0.00360870361328125, 0.005092620849609375, 0.0065765380859375, 0.008060455322265625, 0.00954437255859375, 0.011028289794921875, 0.01251220703125, 0.013996124267578125, 0.01548004150390625, 0.016963958740234375, 0.0184478759765625, 0.019931793212890625, 0.02141571044921875, 0.022899627685546875, 0.024383544921875, 0.025867462158203125, 0.02735137939453125, 0.028835296630859375, 0.0303192138671875, 0.031803131103515625, 0.03328704833984375, 0.034770965576171875, 0.0362548828125, 0.037738800048828125, 0.03922271728515625, 0.040706634521484375, 0.0421905517578125, 0.043674468994140625, 0.04515838623046875, 0.046642303466796875, 0.048126220703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 6.0, 9.0, 18.0, 21.0, 18.0, 30.0, 45.0, 69.0, 82.0, 126.0, 158.0, 255.0, 353.0, 543.0, 957.0, 1945.0, 6638.0, 32432.0, 197431.0, 589654.0, 177483.0, 29631.0, 6091.0, 1927.0, 878.0, 523.0, 336.0, 246.0, 181.0, 141.0, 76.0, 68.0, 41.0, 31.0, 24.0, 30.0, 14.0, 11.0, 8.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34326171875, -0.3319969177246094, -0.32073211669921875, -0.3094673156738281, -0.2982025146484375, -0.2869377136230469, -0.27567291259765625, -0.2644081115722656, -0.253143310546875, -0.24187850952148438, -0.23061370849609375, -0.21934890747070312, -0.2080841064453125, -0.19681930541992188, -0.18555450439453125, -0.17428970336914062, -0.16302490234375, -0.15176010131835938, -0.14049530029296875, -0.12923049926757812, -0.1179656982421875, -0.10670089721679688, -0.09543609619140625, -0.08417129516601562, -0.072906494140625, -0.061641693115234375, -0.05037689208984375, -0.039112091064453125, -0.0278472900390625, -0.016582489013671875, -0.00531768798828125, 0.005947113037109375, 0.0172119140625, 0.028476715087890625, 0.03974151611328125, 0.051006317138671875, 0.0622711181640625, 0.07353591918945312, 0.08480072021484375, 0.09606552124023438, 0.107330322265625, 0.11859512329101562, 0.12985992431640625, 0.14112472534179688, 0.1523895263671875, 0.16365432739257812, 0.17491912841796875, 0.18618392944335938, 0.19744873046875, 0.20871353149414062, 0.21997833251953125, 0.23124313354492188, 0.2425079345703125, 0.2537727355957031, 0.26503753662109375, 0.2763023376464844, 0.287567138671875, 0.2988319396972656, 0.31009674072265625, 0.3213615417480469, 0.3326263427734375, 0.3438911437988281, 0.35515594482421875, 0.3664207458496094, 0.377685546875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 4.0, 5.0, 4.0, 10.0, 11.0, 17.0, 13.0, 8.0, 17.0, 14.0, 19.0, 15.0, 25.0, 34.0, 35.0, 27.0, 32.0, 32.0, 47.0, 64.0, 34.0, 37.0, 41.0, 40.0, 36.0, 32.0, 37.0, 41.0, 35.0, 35.0, 23.0, 19.0, 31.0, 20.0, 20.0, 9.0, 16.0, 10.0, 5.0, 7.0, 6.0, 5.0, 4.0, 0.0, 4.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.259765625, -0.25160980224609375, -0.2434539794921875, -0.23529815673828125, -0.227142333984375, -0.21898651123046875, -0.2108306884765625, -0.20267486572265625, -0.19451904296875, -0.18636322021484375, -0.1782073974609375, -0.17005157470703125, -0.161895751953125, -0.15373992919921875, -0.1455841064453125, -0.13742828369140625, -0.1292724609375, -0.12111663818359375, -0.1129608154296875, -0.10480499267578125, -0.096649169921875, -0.08849334716796875, -0.0803375244140625, -0.07218170166015625, -0.06402587890625, -0.05587005615234375, -0.0477142333984375, -0.03955841064453125, -0.031402587890625, -0.02324676513671875, -0.0150909423828125, -0.00693511962890625, 0.001220703125, 0.00937652587890625, 0.0175323486328125, 0.02568817138671875, 0.033843994140625, 0.04199981689453125, 0.0501556396484375, 0.05831146240234375, 0.06646728515625, 0.07462310791015625, 0.0827789306640625, 0.09093475341796875, 0.099090576171875, 0.10724639892578125, 0.1154022216796875, 0.12355804443359375, 0.1317138671875, 0.13986968994140625, 0.1480255126953125, 0.15618133544921875, 0.164337158203125, 0.17249298095703125, 0.1806488037109375, 0.18880462646484375, 0.19696044921875, 0.20511627197265625, 0.2132720947265625, 0.22142791748046875, 0.229583740234375, 0.23773956298828125, 0.2458953857421875, 0.25405120849609375, 0.26220703125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 8.0, 5.0, 6.0, 10.0, 14.0, 19.0, 29.0, 47.0, 51.0, 99.0, 138.0, 278.0, 472.0, 910.0, 2102.0, 4925.0, 14174.0, 50733.0, 235469.0, 520473.0, 163395.0, 36662.0, 11077.0, 3899.0, 1678.0, 830.0, 410.0, 211.0, 128.0, 101.0, 64.0, 47.0, 19.0, 22.0, 24.0, 11.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2061767578125, -0.20000076293945312, -0.19382476806640625, -0.18764877319335938, -0.1814727783203125, -0.17529678344726562, -0.16912078857421875, -0.16294479370117188, -0.156768798828125, -0.15059280395507812, -0.14441680908203125, -0.13824081420898438, -0.1320648193359375, -0.12588882446289062, -0.11971282958984375, -0.11353683471679688, -0.10736083984375, -0.10118484497070312, -0.09500885009765625, -0.08883285522460938, -0.0826568603515625, -0.07648086547851562, -0.07030487060546875, -0.06412887573242188, -0.057952880859375, -0.051776885986328125, -0.04560089111328125, -0.039424896240234375, -0.0332489013671875, -0.027072906494140625, -0.02089691162109375, -0.014720916748046875, -0.008544921875, -0.002368927001953125, 0.00380706787109375, 0.009983062744140625, 0.0161590576171875, 0.022335052490234375, 0.02851104736328125, 0.034687042236328125, 0.040863037109375, 0.047039031982421875, 0.05321502685546875, 0.059391021728515625, 0.0655670166015625, 0.07174301147460938, 0.07791900634765625, 0.08409500122070312, 0.09027099609375, 0.09644699096679688, 0.10262298583984375, 0.10879898071289062, 0.1149749755859375, 0.12115097045898438, 0.12732696533203125, 0.13350296020507812, 0.139678955078125, 0.14585494995117188, 0.15203094482421875, 0.15820693969726562, 0.1643829345703125, 0.17055892944335938, 0.17673492431640625, 0.18291091918945312, 0.1890869140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 11.0, 11.0, 22.0, 22.0, 22.0, 30.0, 36.0, 45.0, 47.0, 69.0, 68.0, 101.0, 75.0, 65.0, 74.0, 59.0, 58.0, 36.0, 31.0, 27.0, 14.0, 12.0, 18.0, 6.0, 4.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00013530254364013672, -0.00013203732669353485, -0.00012877210974693298, -0.00012550689280033112, -0.00012224167585372925, -0.00011897645890712738, -0.00011571124196052551, -0.00011244602501392365, -0.00010918080806732178, -0.00010591559112071991, -0.00010265037417411804, -9.938515722751617e-05, -9.61199402809143e-05, -9.285472333431244e-05, -8.958950638771057e-05, -8.63242894411087e-05, -8.305907249450684e-05, -7.979385554790497e-05, -7.65286386013031e-05, -7.326342165470123e-05, -6.999820470809937e-05, -6.67329877614975e-05, -6.346777081489563e-05, -6.020255386829376e-05, -5.6937336921691895e-05, -5.367211997509003e-05, -5.040690302848816e-05, -4.714168608188629e-05, -4.3876469135284424e-05, -4.0611252188682556e-05, -3.734603524208069e-05, -3.408081829547882e-05, -3.081560134887695e-05, -2.7550384402275085e-05, -2.4285167455673218e-05, -2.101995050907135e-05, -1.7754733562469482e-05, -1.4489516615867615e-05, -1.1224299669265747e-05, -7.95908272266388e-06, -4.693865776062012e-06, -1.428648829460144e-06, 1.8365681171417236e-06, 5.101785063743591e-06, 8.367002010345459e-06, 1.1632218956947327e-05, 1.4897435903549194e-05, 1.8162652850151062e-05, 2.142786979675293e-05, 2.4693086743354797e-05, 2.7958303689956665e-05, 3.122352063655853e-05, 3.44887375831604e-05, 3.775395452976227e-05, 4.1019171476364136e-05, 4.4284388422966003e-05, 4.754960536956787e-05, 5.081482231616974e-05, 5.4080039262771606e-05, 5.7345256209373474e-05, 6.061047315597534e-05, 6.387569010257721e-05, 6.714090704917908e-05, 7.040612399578094e-05, 7.367134094238281e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 17.0, 21.0, 39.0, 60.0, 121.0, 212.0, 454.0, 977.0, 2808.0, 10327.0, 67183.0, 585954.0, 335503.0, 34893.0, 6425.0, 2028.0, 740.0, 377.0, 164.0, 86.0, 67.0, 30.0, 17.0, 20.0, 10.0, 5.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276611328125, -0.26702117919921875, -0.2574310302734375, -0.24784088134765625, -0.238250732421875, -0.22866058349609375, -0.2190704345703125, -0.20948028564453125, -0.19989013671875, -0.19029998779296875, -0.1807098388671875, -0.17111968994140625, -0.161529541015625, -0.15193939208984375, -0.1423492431640625, -0.13275909423828125, -0.1231689453125, -0.11357879638671875, -0.1039886474609375, -0.09439849853515625, -0.084808349609375, -0.07521820068359375, -0.0656280517578125, -0.05603790283203125, -0.04644775390625, -0.03685760498046875, -0.0272674560546875, -0.01767730712890625, -0.008087158203125, 0.00150299072265625, 0.0110931396484375, 0.02068328857421875, 0.0302734375, 0.03986358642578125, 0.0494537353515625, 0.05904388427734375, 0.068634033203125, 0.07822418212890625, 0.0878143310546875, 0.09740447998046875, 0.10699462890625, 0.11658477783203125, 0.1261749267578125, 0.13576507568359375, 0.145355224609375, 0.15494537353515625, 0.1645355224609375, 0.17412567138671875, 0.1837158203125, 0.19330596923828125, 0.2028961181640625, 0.21248626708984375, 0.222076416015625, 0.23166656494140625, 0.2412567138671875, 0.25084686279296875, 0.26043701171875, 0.27002716064453125, 0.2796173095703125, 0.28920745849609375, 0.298797607421875, 0.30838775634765625, 0.3179779052734375, 0.32756805419921875, 0.337158203125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 7.0, 10.0, 13.0, 12.0, 14.0, 38.0, 37.0, 32.0, 50.0, 58.0, 54.0, 65.0, 72.0, 79.0, 78.0, 62.0, 47.0, 42.0, 38.0, 37.0, 40.0, 22.0, 19.0, 19.0, 9.0, 7.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.142578125, -0.13773155212402344, -0.13288497924804688, -0.1280384063720703, -0.12319183349609375, -0.11834526062011719, -0.11349868774414062, -0.10865211486816406, -0.1038055419921875, -0.09895896911621094, -0.09411239624023438, -0.08926582336425781, -0.08441925048828125, -0.07957267761230469, -0.07472610473632812, -0.06987953186035156, -0.065032958984375, -0.06018638610839844, -0.055339813232421875, -0.05049324035644531, -0.04564666748046875, -0.04080009460449219, -0.035953521728515625, -0.031106948852539062, -0.0262603759765625, -0.021413803100585938, -0.016567230224609375, -0.011720657348632812, -0.00687408447265625, -0.0020275115966796875, 0.002819061279296875, 0.0076656341552734375, 0.01251220703125, 0.017358779907226562, 0.022205352783203125, 0.027051925659179688, 0.03189849853515625, 0.03674507141113281, 0.041591644287109375, 0.04643821716308594, 0.0512847900390625, 0.05613136291503906, 0.060977935791015625, 0.06582450866699219, 0.07067108154296875, 0.07551765441894531, 0.08036422729492188, 0.08521080017089844, 0.090057373046875, 0.09490394592285156, 0.09975051879882812, 0.10459709167480469, 0.10944366455078125, 0.11429023742675781, 0.11913681030273438, 0.12398338317871094, 0.1288299560546875, 0.13367652893066406, 0.13852310180664062, 0.1433696746826172, 0.14821624755859375, 0.1530628204345703, 0.15790939331054688, 0.16275596618652344, 0.1676025390625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 15.0, 34.0, 66.0, 89.0, 147.0, 153.0, 151.0, 114.0, 104.0, 54.0, 33.0, 21.0, 9.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.354488372802734, -4.259562015533447, -4.164635181427002, -4.069708824157715, -3.9747822284698486, -3.8798556327819824, -3.7849292755126953, -3.690002679824829, -3.595076084136963, -3.5001494884490967, -3.4052228927612305, -3.3102965354919434, -3.215369939804077, -3.120443344116211, -3.025516986846924, -2.9305903911590576, -2.8356637954711914, -2.740737199783325, -2.645810604095459, -2.550884246826172, -2.4559576511383057, -2.3610310554504395, -2.2661046981811523, -2.171178102493286, -2.07625150680542, -1.9813249111175537, -1.886398434638977, -1.7914719581604004, -1.6965453624725342, -1.601618766784668, -1.5066922903060913, -1.4117658138275146, -1.3168392181396484, -1.2219126224517822, -1.1269861459732056, -1.032059669494629, -0.9371330738067627, -0.8422065377235413, -0.7472800016403198, -0.6523534655570984, -0.557426929473877, -0.4625003933906555, -0.3675738573074341, -0.27264732122421265, -0.1777207851409912, -0.08279424905776978, 0.01213228702545166, 0.1070588231086731, 0.20198535919189453, 0.29691189527511597, 0.3918384313583374, 0.48676496744155884, 0.5816915035247803, 0.6766180396080017, 0.7715445756912231, 0.8664711117744446, 0.961397647857666, 1.0563242435455322, 1.1512507200241089, 1.2461771965026855, 1.3411037921905518, 1.436030387878418, 1.5309568643569946, 1.6258833408355713, 1.7208099365234375]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 7.0, 2.0, 5.0, 6.0, 8.0, 11.0, 8.0, 16.0, 19.0, 14.0, 16.0, 22.0, 19.0, 34.0, 33.0, 31.0, 42.0, 45.0, 40.0, 37.0, 35.0, 41.0, 49.0, 43.0, 52.0, 45.0, 49.0, 17.0, 42.0, 39.0, 30.0, 23.0, 30.0, 21.0, 14.0, 8.0, 19.0, 11.0, 6.0, 9.0, 1.0, 7.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.801051139831543, -1.7524038553237915, -1.70375657081604, -1.6551092863082886, -1.606462001800537, -1.5578147172927856, -1.5091674327850342, -1.4605201482772827, -1.4118728637695312, -1.3632255792617798, -1.3145782947540283, -1.2659310102462769, -1.2172837257385254, -1.168636441230774, -1.1199891567230225, -1.071341872215271, -1.0226945877075195, -0.9740473031997681, -0.9254000186920166, -0.8767527341842651, -0.8281054496765137, -0.7794581651687622, -0.7308108806610107, -0.6821635961532593, -0.6335163116455078, -0.5848690271377563, -0.5362217426300049, -0.4875744581222534, -0.43892717361450195, -0.3902798891067505, -0.341632604598999, -0.29298532009124756, -0.2443380355834961, -0.19569075107574463, -0.14704346656799316, -0.0983961820602417, -0.049748897552490234, -0.0011016130447387695, 0.047545671463012695, 0.09619295597076416, 0.14484024047851562, 0.1934875249862671, 0.24213480949401855, 0.29078209400177, 0.3394293785095215, 0.38807666301727295, 0.4367239475250244, 0.4853712320327759, 0.5340185165405273, 0.5826658010482788, 0.6313130855560303, 0.6799603700637817, 0.7286076545715332, 0.7772549390792847, 0.8259022235870361, 0.8745495080947876, 0.9231967926025391, 0.9718440771102905, 1.020491361618042, 1.0691386461257935, 1.117785930633545, 1.1664332151412964, 1.2150804996490479, 1.2637277841567993, 1.3123750686645508]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 15.0, 12.0, 17.0, 26.0, 34.0, 35.0, 58.0, 86.0, 111.0, 175.0, 232.0, 352.0, 514.0, 856.0, 1501.0, 2784.0, 6055.0, 16555.0, 73295.0, 3850210.0, 195044.0, 28645.0, 8953.0, 3733.0, 1930.0, 1070.0, 674.0, 410.0, 274.0, 185.0, 102.0, 84.0, 63.0, 53.0, 25.0, 23.0, 19.0, 13.0, 17.0, 6.0, 10.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.345947265625, -0.3353691101074219, -0.32479095458984375, -0.3142127990722656, -0.3036346435546875, -0.2930564880371094, -0.28247833251953125, -0.2719001770019531, -0.261322021484375, -0.2507438659667969, -0.24016571044921875, -0.22958755493164062, -0.2190093994140625, -0.20843124389648438, -0.19785308837890625, -0.18727493286132812, -0.17669677734375, -0.16611862182617188, -0.15554046630859375, -0.14496231079101562, -0.1343841552734375, -0.12380599975585938, -0.11322784423828125, -0.10264968872070312, -0.092071533203125, -0.08149337768554688, -0.07091522216796875, -0.060337066650390625, -0.0497589111328125, -0.039180755615234375, -0.02860260009765625, -0.018024444580078125, -0.0074462890625, 0.003131866455078125, 0.01371002197265625, 0.024288177490234375, 0.0348663330078125, 0.045444488525390625, 0.05602264404296875, 0.06660079956054688, 0.077178955078125, 0.08775711059570312, 0.09833526611328125, 0.10891342163085938, 0.1194915771484375, 0.13006973266601562, 0.14064788818359375, 0.15122604370117188, 0.16180419921875, 0.17238235473632812, 0.18296051025390625, 0.19353866577148438, 0.2041168212890625, 0.21469497680664062, 0.22527313232421875, 0.23585128784179688, 0.246429443359375, 0.2570075988769531, 0.26758575439453125, 0.2781639099121094, 0.2887420654296875, 0.2993202209472656, 0.30989837646484375, 0.3204765319824219, 0.3310546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 1.0, 4.0, 3.0, 7.0, 10.0, 6.0, 12.0, 9.0, 26.0, 17.0, 17.0, 23.0, 33.0, 26.0, 27.0, 37.0, 38.0, 40.0, 38.0, 47.0, 48.0, 37.0, 35.0, 45.0, 40.0, 43.0, 38.0, 40.0, 34.0, 26.0, 38.0, 25.0, 27.0, 16.0, 15.0, 15.0, 9.0, 10.0, 11.0, 5.0, 4.0, 2.0, 5.0, 5.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.056732177734375, -0.05499982833862305, -0.053267478942871094, -0.05153512954711914, -0.04980278015136719, -0.048070430755615234, -0.04633808135986328, -0.04460573196411133, -0.042873382568359375, -0.04114103317260742, -0.03940868377685547, -0.037676334381103516, -0.03594398498535156, -0.03421163558959961, -0.032479286193847656, -0.030746936798095703, -0.02901458740234375, -0.027282238006591797, -0.025549888610839844, -0.02381753921508789, -0.022085189819335938, -0.020352840423583984, -0.01862049102783203, -0.016888141632080078, -0.015155792236328125, -0.013423442840576172, -0.011691093444824219, -0.009958744049072266, -0.008226394653320312, -0.006494045257568359, -0.004761695861816406, -0.003029346466064453, -0.0012969970703125, 0.0004353523254394531, 0.0021677017211914062, 0.0039000511169433594, 0.0056324005126953125, 0.007364749908447266, 0.009097099304199219, 0.010829448699951172, 0.012561798095703125, 0.014294147491455078, 0.01602649688720703, 0.017758846282958984, 0.019491195678710938, 0.02122354507446289, 0.022955894470214844, 0.024688243865966797, 0.02642059326171875, 0.028152942657470703, 0.029885292053222656, 0.03161764144897461, 0.03334999084472656, 0.035082340240478516, 0.03681468963623047, 0.03854703903198242, 0.040279388427734375, 0.04201173782348633, 0.04374408721923828, 0.045476436614990234, 0.04720878601074219, 0.04894113540649414, 0.050673484802246094, 0.05240583419799805, 0.05413818359375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 5.0, 7.0, 7.0, 7.0, 15.0, 9.0, 11.0, 22.0, 25.0, 14.0, 39.0, 39.0, 69.0, 68.0, 101.0, 112.0, 147.0, 209.0, 299.0, 476.0, 907.0, 2626.0, 14169.0, 3333964.0, 822629.0, 13377.0, 2454.0, 876.0, 481.0, 274.0, 205.0, 127.0, 103.0, 97.0, 74.0, 54.0, 42.0, 34.0, 32.0, 20.0, 14.0, 10.0, 16.0, 5.0, 5.0, 0.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1728515625, -1.1361846923828125, -1.099517822265625, -1.0628509521484375, -1.02618408203125, -0.9895172119140625, -0.952850341796875, -0.9161834716796875, -0.8795166015625, -0.8428497314453125, -0.806182861328125, -0.7695159912109375, -0.73284912109375, -0.6961822509765625, -0.659515380859375, -0.6228485107421875, -0.586181640625, -0.5495147705078125, -0.512847900390625, -0.4761810302734375, -0.43951416015625, -0.4028472900390625, -0.366180419921875, -0.3295135498046875, -0.2928466796875, -0.2561798095703125, -0.219512939453125, -0.1828460693359375, -0.14617919921875, -0.1095123291015625, -0.072845458984375, -0.0361785888671875, 0.00048828125, 0.0371551513671875, 0.073822021484375, 0.1104888916015625, 0.14715576171875, 0.1838226318359375, 0.220489501953125, 0.2571563720703125, 0.2938232421875, 0.3304901123046875, 0.367156982421875, 0.4038238525390625, 0.44049072265625, 0.4771575927734375, 0.513824462890625, 0.5504913330078125, 0.587158203125, 0.6238250732421875, 0.660491943359375, 0.6971588134765625, 0.73382568359375, 0.7704925537109375, 0.807159423828125, 0.8438262939453125, 0.8804931640625, 0.9171600341796875, 0.953826904296875, 0.9904937744140625, 1.02716064453125, 1.0638275146484375, 1.100494384765625, 1.1371612548828125, 1.173828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 18.0, 55.0, 145.0, 3531.0, 215.0, 75.0, 14.0, 7.0, 5.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324951171875, -0.31607818603515625, -0.3072052001953125, -0.29833221435546875, -0.289459228515625, -0.28058624267578125, -0.2717132568359375, -0.26284027099609375, -0.25396728515625, -0.24509429931640625, -0.2362213134765625, -0.22734832763671875, -0.218475341796875, -0.20960235595703125, -0.2007293701171875, -0.19185638427734375, -0.1829833984375, -0.17411041259765625, -0.1652374267578125, -0.15636444091796875, -0.147491455078125, -0.13861846923828125, -0.1297454833984375, -0.12087249755859375, -0.11199951171875, -0.10312652587890625, -0.0942535400390625, -0.08538055419921875, -0.076507568359375, -0.06763458251953125, -0.0587615966796875, -0.04988861083984375, -0.041015625, -0.03214263916015625, -0.0232696533203125, -0.01439666748046875, -0.005523681640625, 0.00334930419921875, 0.0122222900390625, 0.02109527587890625, 0.02996826171875, 0.03884124755859375, 0.0477142333984375, 0.05658721923828125, 0.065460205078125, 0.07433319091796875, 0.0832061767578125, 0.09207916259765625, 0.1009521484375, 0.10982513427734375, 0.1186981201171875, 0.12757110595703125, 0.136444091796875, 0.14531707763671875, 0.1541900634765625, 0.16306304931640625, 0.17193603515625, 0.18080902099609375, 0.1896820068359375, 0.19855499267578125, 0.207427978515625, 0.21630096435546875, 0.2251739501953125, 0.23404693603515625, 0.242919921875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 5.0, 14.0, 11.0, 15.0, 12.0, 30.0, 32.0, 27.0, 41.0, 60.0, 49.0, 55.0, 60.0, 73.0, 84.0, 72.0, 81.0, 59.0, 51.0, 44.0, 38.0, 21.0, 14.0, 15.0, 11.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.4650503396987915, -0.45184797048568726, -0.438645601272583, -0.42544323205947876, -0.4122408628463745, -0.39903849363327026, -0.385836124420166, -0.37263375520706177, -0.3594313859939575, -0.34622901678085327, -0.333026647567749, -0.3198242783546448, -0.3066219091415405, -0.2934195399284363, -0.28021717071533203, -0.2670148015022278, -0.2538124620914459, -0.24061009287834167, -0.22740772366523743, -0.21420535445213318, -0.20100298523902893, -0.18780061602592468, -0.17459826171398163, -0.16139589250087738, -0.14819352328777313, -0.13499115407466888, -0.12178878486156464, -0.10858642309904099, -0.09538405388593674, -0.08218168467283249, -0.06897932291030884, -0.05577695369720459, -0.04257461428642273, -0.02937224693596363, -0.016169879585504532, -0.0029675140976905823, 0.010234855115413666, 0.023437224328517914, 0.036639586091041565, 0.04984195530414581, 0.06304432451725006, 0.07624669373035431, 0.08944906294345856, 0.10265142470598221, 0.11585379391908646, 0.1290561556816101, 0.14225852489471436, 0.1554608941078186, 0.16866326332092285, 0.1818656325340271, 0.19506800174713135, 0.2082703709602356, 0.22147274017333984, 0.2346751093864441, 0.24787746369838715, 0.2610798478126526, 0.27428221702575684, 0.2874845862388611, 0.30068695545196533, 0.3138893246650696, 0.32709169387817383, 0.3402940630912781, 0.3534964323043823, 0.3666988015174866, 0.37990114092826843]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 5.0, 7.0, 6.0, 5.0, 3.0, 17.0, 17.0, 17.0, 28.0, 13.0, 26.0, 29.0, 22.0, 41.0, 22.0, 43.0, 35.0, 28.0, 37.0, 52.0, 49.0, 31.0, 45.0, 36.0, 33.0, 27.0, 28.0, 36.0, 28.0, 31.0, 30.0, 23.0, 21.0, 21.0, 18.0, 13.0, 14.0, 11.0, 5.0, 10.0, 5.0, 1.0, 5.0, 6.0, 4.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.28381919860839844, -0.27472493052482605, -0.2656306326389313, -0.2565363645553589, -0.2474420815706253, -0.23834779858589172, -0.22925351560115814, -0.22015923261642456, -0.21106496453285217, -0.2019706815481186, -0.192876398563385, -0.18378213047981262, -0.17468784749507904, -0.16559356451034546, -0.15649928152561188, -0.1474049985408783, -0.13831071555614471, -0.12921643257141113, -0.12012215703725815, -0.11102787405252457, -0.10193359851837158, -0.092839315533638, -0.08374503254890442, -0.07465075701475143, -0.06555647403001785, -0.05646219477057457, -0.04736791551113129, -0.038273632526397705, -0.029179353266954422, -0.02008507400751114, -0.010990791022777557, -0.0018965154886245728, 0.007197767496109009, 0.016292046755552292, 0.025386327877640724, 0.034480608999729156, 0.04357488825917244, 0.05266916751861572, 0.061763450503349304, 0.07085772603750229, 0.07995200902223587, 0.08904629200696945, 0.09814056754112244, 0.10723485052585602, 0.1163291335105896, 0.125423401594162, 0.13451769948005676, 0.14361196756362915, 0.15270625054836273, 0.1618005335330963, 0.1708948165178299, 0.17998909950256348, 0.18908336758613586, 0.19817765057086945, 0.20727193355560303, 0.21636620163917542, 0.2254604995250702, 0.23455478250980377, 0.24364906549453735, 0.25274333357810974, 0.2618376314640045, 0.2709318995475769, 0.2800261974334717, 0.28912046551704407, 0.29821473360061646]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 10.0, 11.0, 10.0, 23.0, 29.0, 38.0, 55.0, 90.0, 120.0, 190.0, 280.0, 428.0, 767.0, 1364.0, 2317.0, 4051.0, 7461.0, 14587.0, 28149.0, 53559.0, 100001.0, 169833.0, 220350.0, 189426.0, 118408.0, 64776.0, 33957.0, 17533.0, 9174.0, 4849.0, 2663.0, 1553.0, 900.0, 522.0, 317.0, 219.0, 145.0, 117.0, 65.0, 54.0, 45.0, 25.0, 11.0, 12.0, 15.0, 10.0, 9.0, 12.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.169677734375, -0.16463470458984375, -0.1595916748046875, -0.15454864501953125, -0.149505615234375, -0.14446258544921875, -0.1394195556640625, -0.13437652587890625, -0.12933349609375, -0.12429046630859375, -0.1192474365234375, -0.11420440673828125, -0.109161376953125, -0.10411834716796875, -0.0990753173828125, -0.09403228759765625, -0.0889892578125, -0.08394622802734375, -0.0789031982421875, -0.07386016845703125, -0.068817138671875, -0.06377410888671875, -0.0587310791015625, -0.05368804931640625, -0.04864501953125, -0.04360198974609375, -0.0385589599609375, -0.03351593017578125, -0.028472900390625, -0.02342987060546875, -0.0183868408203125, -0.01334381103515625, -0.00830078125, -0.00325775146484375, 0.0017852783203125, 0.00682830810546875, 0.011871337890625, 0.01691436767578125, 0.0219573974609375, 0.02700042724609375, 0.03204345703125, 0.03708648681640625, 0.0421295166015625, 0.04717254638671875, 0.052215576171875, 0.05725860595703125, 0.0623016357421875, 0.06734466552734375, 0.0723876953125, 0.07743072509765625, 0.0824737548828125, 0.08751678466796875, 0.092559814453125, 0.09760284423828125, 0.1026458740234375, 0.10768890380859375, 0.11273193359375, 0.11777496337890625, 0.1228179931640625, 0.12786102294921875, 0.132904052734375, 0.13794708251953125, 0.1429901123046875, 0.14803314208984375, 0.153076171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 8.0, 9.0, 4.0, 17.0, 14.0, 17.0, 20.0, 32.0, 30.0, 18.0, 18.0, 30.0, 29.0, 42.0, 30.0, 33.0, 38.0, 41.0, 39.0, 40.0, 29.0, 35.0, 37.0, 45.0, 43.0, 39.0, 37.0, 35.0, 18.0, 20.0, 20.0, 19.0, 13.0, 10.0, 8.0, 10.0, 14.0, 11.0, 7.0, 5.0, 7.0, 5.0, 5.0, 3.0, 5.0, 2.0, 2.0], "bins": [-0.0733642578125, -0.07134199142456055, -0.0693197250366211, -0.06729745864868164, -0.06527519226074219, -0.06325292587280273, -0.06123065948486328, -0.05920839309692383, -0.057186126708984375, -0.05516386032104492, -0.05314159393310547, -0.051119327545166016, -0.04909706115722656, -0.04707479476928711, -0.045052528381347656, -0.0430302619934082, -0.04100799560546875, -0.0389857292175293, -0.036963462829589844, -0.03494119644165039, -0.03291893005371094, -0.030896663665771484, -0.02887439727783203, -0.026852130889892578, -0.024829864501953125, -0.022807598114013672, -0.02078533172607422, -0.018763065338134766, -0.016740798950195312, -0.01471853256225586, -0.012696266174316406, -0.010673999786376953, -0.0086517333984375, -0.006629467010498047, -0.004607200622558594, -0.0025849342346191406, -0.0005626678466796875, 0.0014595985412597656, 0.0034818649291992188, 0.005504131317138672, 0.007526397705078125, 0.009548664093017578, 0.011570930480957031, 0.013593196868896484, 0.015615463256835938, 0.01763772964477539, 0.019659996032714844, 0.021682262420654297, 0.02370452880859375, 0.025726795196533203, 0.027749061584472656, 0.02977132797241211, 0.03179359436035156, 0.033815860748291016, 0.03583812713623047, 0.03786039352416992, 0.039882659912109375, 0.04190492630004883, 0.04392719268798828, 0.045949459075927734, 0.04797172546386719, 0.04999399185180664, 0.052016258239746094, 0.05403852462768555, 0.056060791015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 14.0, 10.0, 23.0, 16.0, 22.0, 37.0, 61.0, 81.0, 99.0, 170.0, 255.0, 334.0, 541.0, 926.0, 1659.0, 3547.0, 10626.0, 46415.0, 263549.0, 559475.0, 124649.0, 23907.0, 6330.0, 2476.0, 1233.0, 692.0, 458.0, 286.0, 205.0, 121.0, 86.0, 77.0, 51.0, 34.0, 22.0, 17.0, 11.0, 8.0, 10.0, 2.0, 5.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4501953125, -0.4362525939941406, -0.42230987548828125, -0.4083671569824219, -0.3944244384765625, -0.3804817199707031, -0.36653900146484375, -0.3525962829589844, -0.338653564453125, -0.3247108459472656, -0.31076812744140625, -0.2968254089355469, -0.2828826904296875, -0.2689399719238281, -0.25499725341796875, -0.24105453491210938, -0.22711181640625, -0.21316909790039062, -0.19922637939453125, -0.18528366088867188, -0.1713409423828125, -0.15739822387695312, -0.14345550537109375, -0.12951278686523438, -0.115570068359375, -0.10162734985351562, -0.08768463134765625, -0.07374191284179688, -0.0597991943359375, -0.045856475830078125, -0.03191375732421875, -0.017971038818359375, -0.0040283203125, 0.009914398193359375, 0.02385711669921875, 0.037799835205078125, 0.0517425537109375, 0.06568527221679688, 0.07962799072265625, 0.09357070922851562, 0.107513427734375, 0.12145614624023438, 0.13539886474609375, 0.14934158325195312, 0.1632843017578125, 0.17722702026367188, 0.19116973876953125, 0.20511245727539062, 0.21905517578125, 0.23299789428710938, 0.24694061279296875, 0.2608833312988281, 0.2748260498046875, 0.2887687683105469, 0.30271148681640625, 0.3166542053222656, 0.330596923828125, 0.3445396423339844, 0.35848236083984375, 0.3724250793457031, 0.3863677978515625, 0.4003105163574219, 0.41425323486328125, 0.4281959533691406, 0.442138671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 13.0, 9.0, 16.0, 11.0, 21.0, 19.0, 27.0, 19.0, 24.0, 33.0, 25.0, 40.0, 40.0, 44.0, 42.0, 45.0, 46.0, 41.0, 43.0, 44.0, 46.0, 33.0, 47.0, 32.0, 31.0, 34.0, 25.0, 22.0, 24.0, 17.0, 13.0, 9.0, 15.0, 12.0, 4.0, 3.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4150390625, -0.40302276611328125, -0.3910064697265625, -0.37899017333984375, -0.366973876953125, -0.35495758056640625, -0.3429412841796875, -0.33092498779296875, -0.31890869140625, -0.30689239501953125, -0.2948760986328125, -0.28285980224609375, -0.270843505859375, -0.25882720947265625, -0.2468109130859375, -0.23479461669921875, -0.2227783203125, -0.21076202392578125, -0.1987457275390625, -0.18672943115234375, -0.174713134765625, -0.16269683837890625, -0.1506805419921875, -0.13866424560546875, -0.12664794921875, -0.11463165283203125, -0.1026153564453125, -0.09059906005859375, -0.078582763671875, -0.06656646728515625, -0.0545501708984375, -0.04253387451171875, -0.030517578125, -0.01850128173828125, -0.0064849853515625, 0.00553131103515625, 0.017547607421875, 0.02956390380859375, 0.0415802001953125, 0.05359649658203125, 0.06561279296875, 0.07762908935546875, 0.0896453857421875, 0.10166168212890625, 0.113677978515625, 0.12569427490234375, 0.1377105712890625, 0.14972686767578125, 0.1617431640625, 0.17375946044921875, 0.1857757568359375, 0.19779205322265625, 0.209808349609375, 0.22182464599609375, 0.2338409423828125, 0.24585723876953125, 0.25787353515625, 0.26988983154296875, 0.2819061279296875, 0.29392242431640625, 0.305938720703125, 0.31795501708984375, 0.3299713134765625, 0.34198760986328125, 0.35400390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 8.0, 16.0, 16.0, 40.0, 79.0, 129.0, 262.0, 596.0, 1731.0, 6582.0, 45207.0, 715720.0, 254011.0, 18593.0, 3598.0, 1086.0, 406.0, 213.0, 109.0, 58.0, 30.0, 21.0, 11.0, 8.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6103515625, -0.5953903198242188, -0.5804290771484375, -0.5654678344726562, -0.550506591796875, -0.5355453491210938, -0.5205841064453125, -0.5056228637695312, -0.49066162109375, -0.47570037841796875, -0.4607391357421875, -0.44577789306640625, -0.430816650390625, -0.41585540771484375, -0.4008941650390625, -0.38593292236328125, -0.3709716796875, -0.35601043701171875, -0.3410491943359375, -0.32608795166015625, -0.311126708984375, -0.29616546630859375, -0.2812042236328125, -0.26624298095703125, -0.25128173828125, -0.23632049560546875, -0.2213592529296875, -0.20639801025390625, -0.191436767578125, -0.17647552490234375, -0.1615142822265625, -0.14655303955078125, -0.131591796875, -0.11663055419921875, -0.1016693115234375, -0.08670806884765625, -0.071746826171875, -0.05678558349609375, -0.0418243408203125, -0.02686309814453125, -0.01190185546875, 0.00305938720703125, 0.0180206298828125, 0.03298187255859375, 0.047943115234375, 0.06290435791015625, 0.0778656005859375, 0.09282684326171875, 0.1077880859375, 0.12274932861328125, 0.1377105712890625, 0.15267181396484375, 0.167633056640625, 0.18259429931640625, 0.1975555419921875, 0.21251678466796875, 0.22747802734375, 0.24243927001953125, 0.2574005126953125, 0.27236175537109375, 0.287322998046875, 0.30228424072265625, 0.3172454833984375, 0.33220672607421875, 0.34716796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 11.0, 12.0, 30.0, 27.0, 35.0, 45.0, 68.0, 65.0, 58.0, 95.0, 106.0, 79.0, 76.0, 68.0, 49.0, 45.0, 38.0, 27.0, 19.0, 10.0, 16.0, 7.0, 6.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012576580047607422, -0.00012165307998657227, -0.00011754035949707031, -0.00011342763900756836, -0.0001093149185180664, -0.00010520219802856445, -0.0001010894775390625, -9.697675704956055e-05, -9.28640365600586e-05, -8.875131607055664e-05, -8.463859558105469e-05, -8.052587509155273e-05, -7.641315460205078e-05, -7.230043411254883e-05, -6.818771362304688e-05, -6.407499313354492e-05, -5.996227264404297e-05, -5.5849552154541016e-05, -5.173683166503906e-05, -4.762411117553711e-05, -4.3511390686035156e-05, -3.93986701965332e-05, -3.528594970703125e-05, -3.11732292175293e-05, -2.7060508728027344e-05, -2.294778823852539e-05, -1.8835067749023438e-05, -1.4722347259521484e-05, -1.0609626770019531e-05, -6.496906280517578e-06, -2.384185791015625e-06, 1.7285346984863281e-06, 5.841255187988281e-06, 9.953975677490234e-06, 1.4066696166992188e-05, 1.817941665649414e-05, 2.2292137145996094e-05, 2.6404857635498047e-05, 3.0517578125e-05, 3.463029861450195e-05, 3.8743019104003906e-05, 4.285573959350586e-05, 4.696846008300781e-05, 5.1081180572509766e-05, 5.519390106201172e-05, 5.930662155151367e-05, 6.341934204101562e-05, 6.753206253051758e-05, 7.164478302001953e-05, 7.575750350952148e-05, 7.987022399902344e-05, 8.398294448852539e-05, 8.809566497802734e-05, 9.22083854675293e-05, 9.632110595703125e-05, 0.0001004338264465332, 0.00010454654693603516, 0.00010865926742553711, 0.00011277198791503906, 0.00011688470840454102, 0.00012099742889404297, 0.00012511014938354492, 0.00012922286987304688, 0.00013333559036254883, 0.00013744831085205078]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 14.0, 9.0, 17.0, 28.0, 41.0, 55.0, 97.0, 128.0, 232.0, 459.0, 852.0, 2045.0, 5383.0, 18964.0, 121191.0, 683998.0, 179083.0, 24665.0, 6528.0, 2471.0, 1014.0, 518.0, 277.0, 153.0, 99.0, 84.0, 35.0, 32.0, 16.0, 10.0, 8.0, 9.0, 4.0, 7.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.30615234375, -0.296142578125, -0.2861328125, -0.276123046875, -0.26611328125, -0.256103515625, -0.24609375, -0.236083984375, -0.22607421875, -0.216064453125, -0.2060546875, -0.196044921875, -0.18603515625, -0.176025390625, -0.166015625, -0.156005859375, -0.14599609375, -0.135986328125, -0.1259765625, -0.115966796875, -0.10595703125, -0.095947265625, -0.0859375, -0.075927734375, -0.06591796875, -0.055908203125, -0.0458984375, -0.035888671875, -0.02587890625, -0.015869140625, -0.005859375, 0.004150390625, 0.01416015625, 0.024169921875, 0.0341796875, 0.044189453125, 0.05419921875, 0.064208984375, 0.07421875, 0.084228515625, 0.09423828125, 0.104248046875, 0.1142578125, 0.124267578125, 0.13427734375, 0.144287109375, 0.154296875, 0.164306640625, 0.17431640625, 0.184326171875, 0.1943359375, 0.204345703125, 0.21435546875, 0.224365234375, 0.234375, 0.244384765625, 0.25439453125, 0.264404296875, 0.2744140625, 0.284423828125, 0.29443359375, 0.304443359375, 0.314453125, 0.324462890625, 0.33447265625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 10.0, 6.0, 17.0, 25.0, 40.0, 69.0, 78.0, 90.0, 119.0, 116.0, 109.0, 103.0, 60.0, 45.0, 24.0, 30.0, 11.0, 11.0, 5.0, 6.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2083740234375, -0.1985607147216797, -0.18874740600585938, -0.17893409729003906, -0.16912078857421875, -0.15930747985839844, -0.14949417114257812, -0.1396808624267578, -0.1298675537109375, -0.12005424499511719, -0.11024093627929688, -0.10042762756347656, -0.09061431884765625, -0.08080101013183594, -0.07098770141601562, -0.06117439270019531, -0.051361083984375, -0.04154777526855469, -0.031734466552734375, -0.021921157836914062, -0.01210784912109375, -0.0022945404052734375, 0.007518768310546875, 0.017332077026367188, 0.0271453857421875, 0.03695869445800781, 0.046772003173828125, 0.05658531188964844, 0.06639862060546875, 0.07621192932128906, 0.08602523803710938, 0.09583854675292969, 0.10565185546875, 0.11546516418457031, 0.12527847290039062, 0.13509178161621094, 0.14490509033203125, 0.15471839904785156, 0.16453170776367188, 0.1743450164794922, 0.1841583251953125, 0.1939716339111328, 0.20378494262695312, 0.21359825134277344, 0.22341156005859375, 0.23322486877441406, 0.24303817749023438, 0.2528514862060547, 0.262664794921875, 0.2724781036376953, 0.2822914123535156, 0.29210472106933594, 0.30191802978515625, 0.31173133850097656, 0.3215446472167969, 0.3313579559326172, 0.3411712646484375, 0.3509845733642578, 0.3607978820800781, 0.37061119079589844, 0.38042449951171875, 0.39023780822753906, 0.4000511169433594, 0.4098644256591797, 0.419677734375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 20.0, 17.0, 38.0, 42.0, 82.0, 110.0, 156.0, 132.0, 110.0, 107.0, 74.0, 50.0, 26.0, 14.0, 8.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.134925603866577, -3.011815071105957, -2.888704299926758, -2.7655935287475586, -2.6424829959869385, -2.5193724632263184, -2.396261692047119, -2.27315092086792, -2.1500403881073, -2.0269298553466797, -1.9038190841674805, -1.7807084321975708, -1.6575977802276611, -1.5344871282577515, -1.4113764762878418, -1.2882658243179321, -1.1651551723480225, -1.0420445203781128, -0.9189338684082031, -0.7958232164382935, -0.6727125644683838, -0.5496019124984741, -0.42649126052856445, -0.3033806085586548, -0.18026995658874512, -0.05715930461883545, 0.06595134735107422, 0.1890619993209839, 0.31217265129089355, 0.4352833032608032, 0.5583939552307129, 0.6815046072006226, 0.8046150207519531, 0.9277256727218628, 1.0508363246917725, 1.1739469766616821, 1.2970576286315918, 1.4201682806015015, 1.5432789325714111, 1.6663895845413208, 1.7895002365112305, 1.9126108884811401, 2.03572154045105, 2.15883207321167, 2.281942844390869, 2.4050536155700684, 2.5281641483306885, 2.6512746810913086, 2.774385452270508, 2.897496223449707, 3.020606756210327, 3.1437172889709473, 3.2668280601501465, 3.3899388313293457, 3.513049364089966, 3.636159896850586, 3.759270668029785, 3.8823814392089844, 4.005492210388184, 4.128602504730225, 4.251713275909424, 4.374824047088623, 4.497934341430664, 4.621045112609863, 4.7441558837890625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 13.0, 6.0, 11.0, 18.0, 14.0, 26.0, 18.0, 27.0, 27.0, 28.0, 23.0, 44.0, 49.0, 30.0, 41.0, 46.0, 48.0, 56.0, 47.0, 42.0, 38.0, 33.0, 33.0, 24.0, 39.0, 24.0, 29.0, 27.0, 21.0, 21.0, 12.0, 11.0, 9.0, 10.0, 10.0, 7.0, 4.0, 4.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.234001636505127, -2.169093370437622, -2.104184865951538, -2.039276599884033, -1.9743683338165283, -1.9094599485397339, -1.8445515632629395, -1.7796432971954346, -1.7147350311279297, -1.6498266458511353, -1.5849183797836304, -1.520009994506836, -1.455101728439331, -1.3901933431625366, -1.3252849578857422, -1.2603766918182373, -1.1954683065414429, -1.1305599212646484, -1.0656516551971436, -1.0007432699203491, -0.9358350038528442, -0.8709266185760498, -0.8060182929039001, -0.7411099672317505, -0.6762016415596008, -0.6112933158874512, -0.5463849902153015, -0.48147663474082947, -0.4165683090686798, -0.35165998339653015, -0.2867516279220581, -0.22184330224990845, -0.1569349765777588, -0.09202664345502853, -0.02711831033229828, 0.03779003024101257, 0.10269835591316223, 0.1676066815853119, 0.23251503705978394, 0.2974233627319336, 0.36233168840408325, 0.4272400140762329, 0.49214833974838257, 0.5570566654205322, 0.6219650506973267, 0.6868733167648315, 0.751781702041626, 0.8166900277137756, 0.8815983533859253, 0.946506679058075, 1.0114150047302246, 1.076323390007019, 1.141231656074524, 1.2061400413513184, 1.2710483074188232, 1.3359566926956177, 1.400865077972412, 1.4657734632492065, 1.5306817293167114, 1.5955901145935059, 1.6604983806610107, 1.7254067659378052, 1.7903151512145996, 1.8552234172821045, 1.9201316833496094]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 8.0, 8.0, 5.0, 22.0, 39.0, 51.0, 87.0, 171.0, 435.0, 1005.0, 2822.0, 10909.0, 143555.0, 4002162.0, 25521.0, 4897.0, 1538.0, 539.0, 245.0, 112.0, 59.0, 30.0, 22.0, 10.0, 11.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.798828125, -0.771484375, -0.744140625, -0.716796875, -0.689453125, -0.662109375, -0.634765625, -0.607421875, -0.580078125, -0.552734375, -0.525390625, -0.498046875, -0.470703125, -0.443359375, -0.416015625, -0.388671875, -0.361328125, -0.333984375, -0.306640625, -0.279296875, -0.251953125, -0.224609375, -0.197265625, -0.169921875, -0.142578125, -0.115234375, -0.087890625, -0.060546875, -0.033203125, -0.005859375, 0.021484375, 0.048828125, 0.076171875, 0.103515625, 0.130859375, 0.158203125, 0.185546875, 0.212890625, 0.240234375, 0.267578125, 0.294921875, 0.322265625, 0.349609375, 0.376953125, 0.404296875, 0.431640625, 0.458984375, 0.486328125, 0.513671875, 0.541015625, 0.568359375, 0.595703125, 0.623046875, 0.650390625, 0.677734375, 0.705078125, 0.732421875, 0.759765625, 0.787109375, 0.814453125, 0.841796875, 0.869140625, 0.896484375, 0.923828125, 0.951171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 9.0, 4.0, 8.0, 4.0, 10.0, 10.0, 20.0, 24.0, 23.0, 25.0, 33.0, 47.0, 38.0, 46.0, 48.0, 54.0, 50.0, 55.0, 56.0, 56.0, 53.0, 46.0, 43.0, 41.0, 32.0, 29.0, 29.0, 16.0, 18.0, 15.0, 12.0, 13.0, 8.0, 9.0, 7.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09398174285888672, -0.09128379821777344, -0.08858585357666016, -0.08588790893554688, -0.0831899642944336, -0.08049201965332031, -0.07779407501220703, -0.07509613037109375, -0.07239818572998047, -0.06970024108886719, -0.0670022964477539, -0.06430435180664062, -0.061606407165527344, -0.05890846252441406, -0.05621051788330078, -0.0535125732421875, -0.05081462860107422, -0.04811668395996094, -0.045418739318847656, -0.042720794677734375, -0.040022850036621094, -0.03732490539550781, -0.03462696075439453, -0.03192901611328125, -0.02923107147216797, -0.026533126831054688, -0.023835182189941406, -0.021137237548828125, -0.018439292907714844, -0.015741348266601562, -0.013043403625488281, -0.010345458984375, -0.007647514343261719, -0.0049495697021484375, -0.0022516250610351562, 0.000446319580078125, 0.0031442642211914062, 0.0058422088623046875, 0.008540153503417969, 0.01123809814453125, 0.013936042785644531, 0.016633987426757812, 0.019331932067871094, 0.022029876708984375, 0.024727821350097656, 0.027425765991210938, 0.03012371063232422, 0.0328216552734375, 0.03551959991455078, 0.03821754455566406, 0.040915489196777344, 0.043613433837890625, 0.046311378479003906, 0.04900932312011719, 0.05170726776123047, 0.05440521240234375, 0.05710315704345703, 0.05980110168457031, 0.062499046325683594, 0.06519699096679688, 0.06789493560791016, 0.07059288024902344, 0.07329082489013672, 0.07598876953125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 10.0, 10.0, 12.0, 14.0, 24.0, 30.0, 43.0, 89.0, 135.0, 214.0, 482.0, 1041.0, 2784.0, 9438.0, 64253.0, 4044680.0, 57224.0, 9078.0, 2623.0, 1007.0, 490.0, 208.0, 119.0, 70.0, 43.0, 31.0, 26.0, 16.0, 13.0, 17.0, 3.0, 10.0, 8.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.4541015625, -1.4163131713867188, -1.3785247802734375, -1.3407363891601562, -1.302947998046875, -1.2651596069335938, -1.2273712158203125, -1.1895828247070312, -1.15179443359375, -1.1140060424804688, -1.0762176513671875, -1.0384292602539062, -1.000640869140625, -0.9628524780273438, -0.9250640869140625, -0.8872756958007812, -0.8494873046875, -0.8116989135742188, -0.7739105224609375, -0.7361221313476562, -0.698333740234375, -0.6605453491210938, -0.6227569580078125, -0.5849685668945312, -0.54718017578125, -0.5093917846679688, -0.4716033935546875, -0.43381500244140625, -0.396026611328125, -0.35823822021484375, -0.3204498291015625, -0.28266143798828125, -0.244873046875, -0.20708465576171875, -0.1692962646484375, -0.13150787353515625, -0.093719482421875, -0.05593109130859375, -0.0181427001953125, 0.01964569091796875, 0.05743408203125, 0.09522247314453125, 0.1330108642578125, 0.17079925537109375, 0.208587646484375, 0.24637603759765625, 0.2841644287109375, 0.32195281982421875, 0.3597412109375, 0.39752960205078125, 0.4353179931640625, 0.47310638427734375, 0.510894775390625, 0.5486831665039062, 0.5864715576171875, 0.6242599487304688, 0.66204833984375, 0.6998367309570312, 0.7376251220703125, 0.7754135131835938, 0.813201904296875, 0.8509902954101562, 0.8887786865234375, 0.9265670776367188, 0.96435546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 18.0, 15.0, 23.0, 74.0, 235.0, 3250.0, 300.0, 63.0, 24.0, 30.0, 11.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.36962890625, -0.3613319396972656, -0.35303497314453125, -0.3447380065917969, -0.3364410400390625, -0.3281440734863281, -0.31984710693359375, -0.3115501403808594, -0.303253173828125, -0.2949562072753906, -0.28665924072265625, -0.2783622741699219, -0.2700653076171875, -0.2617683410644531, -0.25347137451171875, -0.24517440795898438, -0.23687744140625, -0.22858047485351562, -0.22028350830078125, -0.21198654174804688, -0.2036895751953125, -0.19539260864257812, -0.18709564208984375, -0.17879867553710938, -0.170501708984375, -0.16220474243164062, -0.15390777587890625, -0.14561080932617188, -0.1373138427734375, -0.12901687622070312, -0.12071990966796875, -0.11242294311523438, -0.1041259765625, -0.09582901000976562, -0.08753204345703125, -0.07923507690429688, -0.0709381103515625, -0.06264114379882812, -0.05434417724609375, -0.046047210693359375, -0.037750244140625, -0.029453277587890625, -0.02115631103515625, -0.012859344482421875, -0.0045623779296875, 0.003734588623046875, 0.01203155517578125, 0.020328521728515625, 0.02862548828125, 0.036922454833984375, 0.04521942138671875, 0.053516387939453125, 0.0618133544921875, 0.07011032104492188, 0.07840728759765625, 0.08670425415039062, 0.095001220703125, 0.10329818725585938, 0.11159515380859375, 0.11989212036132812, 0.1281890869140625, 0.13648605346679688, 0.14478302001953125, 0.15307998657226562, 0.161376953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 10.0, 26.0, 25.0, 26.0, 37.0, 45.0, 60.0, 59.0, 75.0, 56.0, 76.0, 79.0, 66.0, 76.0, 55.0, 41.0, 30.0, 35.0, 27.0, 21.0, 24.0, 18.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5710350275039673, -0.5541232228279114, -0.5372114181518555, -0.5202996730804443, -0.5033878684043884, -0.4864760637283325, -0.469564288854599, -0.4526525139808655, -0.43574070930480957, -0.41882890462875366, -0.40191712975502014, -0.3850053548812866, -0.3680935502052307, -0.3511817455291748, -0.3342699706554413, -0.31735819578170776, -0.30044639110565186, -0.28353458642959595, -0.2666228115558624, -0.2497110217809677, -0.232799232006073, -0.21588744223117828, -0.19897565245628357, -0.18206386268138885, -0.16515207290649414, -0.14824028313159943, -0.1313284933567047, -0.11441670358181, -0.09750491380691528, -0.08059312403202057, -0.06368133425712585, -0.04676954448223114, -0.0298578143119812, -0.012946024537086487, 0.0039657652378082275, 0.020877555012702942, 0.037789344787597656, 0.05470113456249237, 0.07161292433738708, 0.0885247141122818, 0.10543650388717651, 0.12234829366207123, 0.13926008343696594, 0.15617187321186066, 0.17308366298675537, 0.18999545276165009, 0.2069072425365448, 0.22381903231143951, 0.24073082208633423, 0.25764262676239014, 0.27455440163612366, 0.2914661765098572, 0.3083779811859131, 0.325289785861969, 0.3422015607357025, 0.35911333560943604, 0.37602514028549194, 0.39293694496154785, 0.40984871983528137, 0.4267604947090149, 0.4436722993850708, 0.4605841040611267, 0.47749587893486023, 0.49440765380859375, 0.5113194584846497]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 4.0, 4.0, 1.0, 6.0, 4.0, 4.0, 8.0, 9.0, 3.0, 9.0, 10.0, 11.0, 18.0, 15.0, 17.0, 23.0, 29.0, 23.0, 29.0, 24.0, 34.0, 27.0, 44.0, 32.0, 37.0, 43.0, 43.0, 43.0, 39.0, 55.0, 41.0, 36.0, 25.0, 19.0, 22.0, 28.0, 26.0, 29.0, 26.0, 25.0, 16.0, 10.0, 11.0, 8.0, 7.0, 7.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3184284567832947, -0.3076654076576233, -0.2969023287296295, -0.28613927960395813, -0.27537623047828674, -0.26461315155029297, -0.2538501024246216, -0.243087038397789, -0.23232397437095642, -0.22156091034412384, -0.21079786121845245, -0.20003479719161987, -0.1892717331647873, -0.1785086691379547, -0.16774562001228333, -0.15698255598545074, -0.14621950685977936, -0.13545644283294678, -0.1246933862566948, -0.11393032968044281, -0.10316726565361023, -0.09240420907735825, -0.08164115250110626, -0.07087808847427368, -0.0601150318980217, -0.049351971596479416, -0.038588911294937134, -0.02782585471868515, -0.017062794417142868, -0.006299734115600586, 0.004463322460651398, 0.015226386487483978, 0.025989443063735962, 0.036752503365278244, 0.047515563666820526, 0.05827862024307251, 0.06904168426990509, 0.07980474084615707, 0.09056779742240906, 0.10133086144924164, 0.11209391802549362, 0.1228569746017456, 0.13362003862857819, 0.14438310265541077, 0.15514615178108215, 0.16590921580791473, 0.17667227983474731, 0.1874353289604187, 0.19819839298725128, 0.20896145701408386, 0.21972450613975525, 0.23048757016658783, 0.2412506341934204, 0.2520136833190918, 0.2627767324447632, 0.27353981137275696, 0.28430286049842834, 0.29506590962409973, 0.3058289885520935, 0.3165920376777649, 0.3273550868034363, 0.33811816573143005, 0.34888121485710144, 0.3596442937850952, 0.3704073429107666]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 8.0, 8.0, 18.0, 22.0, 29.0, 39.0, 49.0, 90.0, 131.0, 185.0, 288.0, 422.0, 747.0, 1145.0, 1834.0, 3222.0, 5519.0, 10593.0, 19899.0, 40067.0, 80268.0, 162332.0, 258843.0, 221296.0, 119874.0, 58793.0, 29133.0, 14767.0, 7928.0, 4456.0, 2516.0, 1484.0, 898.0, 567.0, 354.0, 241.0, 163.0, 116.0, 59.0, 37.0, 28.0, 23.0, 18.0, 17.0, 8.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.171630859375, -0.16586685180664062, -0.16010284423828125, -0.15433883666992188, -0.1485748291015625, -0.14281082153320312, -0.13704681396484375, -0.13128280639648438, -0.125518798828125, -0.11975479125976562, -0.11399078369140625, -0.10822677612304688, -0.1024627685546875, -0.09669876098632812, -0.09093475341796875, -0.08517074584960938, -0.07940673828125, -0.07364273071289062, -0.06787872314453125, -0.062114715576171875, -0.0563507080078125, -0.050586700439453125, -0.04482269287109375, -0.039058685302734375, -0.033294677734375, -0.027530670166015625, -0.02176666259765625, -0.016002655029296875, -0.0102386474609375, -0.004474639892578125, 0.00128936767578125, 0.007053375244140625, 0.0128173828125, 0.018581390380859375, 0.02434539794921875, 0.030109405517578125, 0.0358734130859375, 0.041637420654296875, 0.04740142822265625, 0.053165435791015625, 0.058929443359375, 0.06469345092773438, 0.07045745849609375, 0.07622146606445312, 0.0819854736328125, 0.08774948120117188, 0.09351348876953125, 0.09927749633789062, 0.10504150390625, 0.11080551147460938, 0.11656951904296875, 0.12233352661132812, 0.1280975341796875, 0.13386154174804688, 0.13962554931640625, 0.14538955688476562, 0.151153564453125, 0.15691757202148438, 0.16268157958984375, 0.16844558715820312, 0.1742095947265625, 0.17997360229492188, 0.18573760986328125, 0.19150161743164062, 0.197265625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 9.0, 4.0, 15.0, 8.0, 7.0, 18.0, 12.0, 27.0, 21.0, 28.0, 32.0, 41.0, 46.0, 51.0, 33.0, 51.0, 53.0, 51.0, 58.0, 49.0, 50.0, 42.0, 44.0, 34.0, 34.0, 20.0, 25.0, 18.0, 22.0, 24.0, 14.0, 13.0, 5.0, 9.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0985107421875, -0.09549903869628906, -0.09248733520507812, -0.08947563171386719, -0.08646392822265625, -0.08345222473144531, -0.08044052124023438, -0.07742881774902344, -0.0744171142578125, -0.07140541076660156, -0.06839370727539062, -0.06538200378417969, -0.06237030029296875, -0.05935859680175781, -0.056346893310546875, -0.05333518981933594, -0.050323486328125, -0.04731178283691406, -0.044300079345703125, -0.04128837585449219, -0.03827667236328125, -0.03526496887207031, -0.032253265380859375, -0.029241561889648438, -0.0262298583984375, -0.023218154907226562, -0.020206451416015625, -0.017194747924804688, -0.01418304443359375, -0.011171340942382812, -0.008159637451171875, -0.0051479339599609375, -0.00213623046875, 0.0008754730224609375, 0.003887176513671875, 0.0068988800048828125, 0.00991058349609375, 0.012922286987304688, 0.015933990478515625, 0.018945693969726562, 0.0219573974609375, 0.024969100952148438, 0.027980804443359375, 0.030992507934570312, 0.03400421142578125, 0.03701591491699219, 0.040027618408203125, 0.04303932189941406, 0.046051025390625, 0.04906272888183594, 0.052074432373046875, 0.05508613586425781, 0.05809783935546875, 0.06110954284667969, 0.06412124633789062, 0.06713294982910156, 0.0701446533203125, 0.07315635681152344, 0.07616806030273438, 0.07917976379394531, 0.08219146728515625, 0.08520317077636719, 0.08821487426757812, 0.09122657775878906, 0.09423828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 4.0, 12.0, 12.0, 14.0, 18.0, 36.0, 66.0, 116.0, 175.0, 373.0, 700.0, 1530.0, 5793.0, 49294.0, 798592.0, 175836.0, 11633.0, 2411.0, 912.0, 456.0, 244.0, 122.0, 71.0, 47.0, 27.0, 17.0, 11.0, 12.0, 6.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.552734375, -0.526031494140625, -0.49932861328125, -0.472625732421875, -0.4459228515625, -0.419219970703125, -0.39251708984375, -0.365814208984375, -0.339111328125, -0.312408447265625, -0.28570556640625, -0.259002685546875, -0.2322998046875, -0.205596923828125, -0.17889404296875, -0.152191162109375, -0.12548828125, -0.098785400390625, -0.07208251953125, -0.045379638671875, -0.0186767578125, 0.008026123046875, 0.03472900390625, 0.061431884765625, 0.088134765625, 0.114837646484375, 0.14154052734375, 0.168243408203125, 0.1949462890625, 0.221649169921875, 0.24835205078125, 0.275054931640625, 0.3017578125, 0.328460693359375, 0.35516357421875, 0.381866455078125, 0.4085693359375, 0.435272216796875, 0.46197509765625, 0.488677978515625, 0.515380859375, 0.542083740234375, 0.56878662109375, 0.595489501953125, 0.6221923828125, 0.648895263671875, 0.67559814453125, 0.702301025390625, 0.72900390625, 0.755706787109375, 0.78240966796875, 0.809112548828125, 0.8358154296875, 0.862518310546875, 0.88922119140625, 0.915924072265625, 0.942626953125, 0.969329833984375, 0.99603271484375, 1.022735595703125, 1.0494384765625, 1.076141357421875, 1.10284423828125, 1.129547119140625, 1.15625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 9.0, 9.0, 19.0, 11.0, 15.0, 22.0, 22.0, 29.0, 38.0, 24.0, 23.0, 32.0, 35.0, 43.0, 57.0, 56.0, 48.0, 41.0, 44.0, 22.0, 37.0, 43.0, 42.0, 40.0, 34.0, 22.0, 25.0, 32.0, 19.0, 26.0, 17.0, 7.0, 17.0, 9.0, 9.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39404296875, -0.379669189453125, -0.36529541015625, -0.350921630859375, -0.3365478515625, -0.322174072265625, -0.30780029296875, -0.293426513671875, -0.279052734375, -0.264678955078125, -0.25030517578125, -0.235931396484375, -0.2215576171875, -0.207183837890625, -0.19281005859375, -0.178436279296875, -0.1640625, -0.149688720703125, -0.13531494140625, -0.120941162109375, -0.1065673828125, -0.092193603515625, -0.07781982421875, -0.063446044921875, -0.049072265625, -0.034698486328125, -0.02032470703125, -0.005950927734375, 0.0084228515625, 0.022796630859375, 0.03717041015625, 0.051544189453125, 0.06591796875, 0.080291748046875, 0.09466552734375, 0.109039306640625, 0.1234130859375, 0.137786865234375, 0.15216064453125, 0.166534423828125, 0.180908203125, 0.195281982421875, 0.20965576171875, 0.224029541015625, 0.2384033203125, 0.252777099609375, 0.26715087890625, 0.281524658203125, 0.2958984375, 0.310272216796875, 0.32464599609375, 0.339019775390625, 0.3533935546875, 0.367767333984375, 0.38214111328125, 0.396514892578125, 0.410888671875, 0.425262451171875, 0.43963623046875, 0.454010009765625, 0.4683837890625, 0.482757568359375, 0.49713134765625, 0.511505126953125, 0.52587890625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 8.0, 13.0, 19.0, 32.0, 42.0, 73.0, 126.0, 190.0, 354.0, 857.0, 2157.0, 7496.0, 47215.0, 598421.0, 354192.0, 28581.0, 5531.0, 1785.0, 663.0, 341.0, 177.0, 103.0, 56.0, 46.0, 24.0, 8.0, 7.0, 10.0, 7.0, 5.0, 3.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264892578125, -0.25331878662109375, -0.2417449951171875, -0.23017120361328125, -0.218597412109375, -0.20702362060546875, -0.1954498291015625, -0.18387603759765625, -0.17230224609375, -0.16072845458984375, -0.1491546630859375, -0.13758087158203125, -0.126007080078125, -0.11443328857421875, -0.1028594970703125, -0.09128570556640625, -0.0797119140625, -0.06813812255859375, -0.0565643310546875, -0.04499053955078125, -0.033416748046875, -0.02184295654296875, -0.0102691650390625, 0.00130462646484375, 0.01287841796875, 0.02445220947265625, 0.0360260009765625, 0.04759979248046875, 0.059173583984375, 0.07074737548828125, 0.0823211669921875, 0.09389495849609375, 0.10546875, 0.11704254150390625, 0.1286163330078125, 0.14019012451171875, 0.151763916015625, 0.16333770751953125, 0.1749114990234375, 0.18648529052734375, 0.19805908203125, 0.20963287353515625, 0.2212066650390625, 0.23278045654296875, 0.244354248046875, 0.25592803955078125, 0.2675018310546875, 0.27907562255859375, 0.2906494140625, 0.30222320556640625, 0.3137969970703125, 0.32537078857421875, 0.336944580078125, 0.34851837158203125, 0.3600921630859375, 0.37166595458984375, 0.38323974609375, 0.39481353759765625, 0.4063873291015625, 0.41796112060546875, 0.429534912109375, 0.44110870361328125, 0.4526824951171875, 0.46425628662109375, 0.475830078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 4.0, 10.0, 14.0, 18.0, 22.0, 21.0, 33.0, 43.0, 46.0, 48.0, 66.0, 82.0, 89.0, 91.0, 60.0, 70.0, 60.0, 40.0, 38.0, 19.0, 31.0, 16.0, 16.0, 13.0, 14.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.79304313659668e-05, -9.486079216003418e-05, -9.179115295410156e-05, -8.872151374816895e-05, -8.565187454223633e-05, -8.258223533630371e-05, -7.95125961303711e-05, -7.644295692443848e-05, -7.337331771850586e-05, -7.030367851257324e-05, -6.723403930664062e-05, -6.416440010070801e-05, -6.109476089477539e-05, -5.8025121688842773e-05, -5.4955482482910156e-05, -5.188584327697754e-05, -4.881620407104492e-05, -4.5746564865112305e-05, -4.267692565917969e-05, -3.960728645324707e-05, -3.653764724731445e-05, -3.3468008041381836e-05, -3.039836883544922e-05, -2.73287296295166e-05, -2.4259090423583984e-05, -2.1189451217651367e-05, -1.811981201171875e-05, -1.5050172805786133e-05, -1.1980533599853516e-05, -8.910894393920898e-06, -5.841255187988281e-06, -2.771615982055664e-06, 2.980232238769531e-07, 3.3676624298095703e-06, 6.4373016357421875e-06, 9.506940841674805e-06, 1.2576580047607422e-05, 1.564621925354004e-05, 1.8715858459472656e-05, 2.1785497665405273e-05, 2.485513687133789e-05, 2.7924776077270508e-05, 3.0994415283203125e-05, 3.406405448913574e-05, 3.713369369506836e-05, 4.0203332901000977e-05, 4.3272972106933594e-05, 4.634261131286621e-05, 4.941225051879883e-05, 5.2481889724731445e-05, 5.555152893066406e-05, 5.862116813659668e-05, 6.16908073425293e-05, 6.476044654846191e-05, 6.783008575439453e-05, 7.089972496032715e-05, 7.396936416625977e-05, 7.703900337219238e-05, 8.0108642578125e-05, 8.317828178405762e-05, 8.624792098999023e-05, 8.931756019592285e-05, 9.238719940185547e-05, 9.545683860778809e-05, 9.85264778137207e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 4.0, 8.0, 8.0, 13.0, 9.0, 32.0, 22.0, 60.0, 93.0, 123.0, 207.0, 315.0, 559.0, 1062.0, 2216.0, 5828.0, 23379.0, 155656.0, 636744.0, 184233.0, 26743.0, 6576.0, 2254.0, 1041.0, 548.0, 296.0, 170.0, 114.0, 80.0, 44.0, 33.0, 22.0, 19.0, 13.0, 7.0, 5.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.267333984375, -0.25885772705078125, -0.2503814697265625, -0.24190521240234375, -0.233428955078125, -0.22495269775390625, -0.2164764404296875, -0.20800018310546875, -0.19952392578125, -0.19104766845703125, -0.1825714111328125, -0.17409515380859375, -0.165618896484375, -0.15714263916015625, -0.1486663818359375, -0.14019012451171875, -0.1317138671875, -0.12323760986328125, -0.1147613525390625, -0.10628509521484375, -0.097808837890625, -0.08933258056640625, -0.0808563232421875, -0.07238006591796875, -0.06390380859375, -0.05542755126953125, -0.0469512939453125, -0.03847503662109375, -0.029998779296875, -0.02152252197265625, -0.0130462646484375, -0.00457000732421875, 0.00390625, 0.01238250732421875, 0.0208587646484375, 0.02933502197265625, 0.037811279296875, 0.04628753662109375, 0.0547637939453125, 0.06324005126953125, 0.07171630859375, 0.08019256591796875, 0.0886688232421875, 0.09714508056640625, 0.105621337890625, 0.11409759521484375, 0.1225738525390625, 0.13105010986328125, 0.1395263671875, 0.14800262451171875, 0.1564788818359375, 0.16495513916015625, 0.173431396484375, 0.18190765380859375, 0.1903839111328125, 0.19886016845703125, 0.20733642578125, 0.21581268310546875, 0.2242889404296875, 0.23276519775390625, 0.241241455078125, 0.24971771240234375, 0.2581939697265625, 0.26667022705078125, 0.275146484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 9.0, 19.0, 12.0, 10.0, 21.0, 26.0, 30.0, 33.0, 54.0, 62.0, 73.0, 73.0, 89.0, 83.0, 73.0, 67.0, 62.0, 46.0, 44.0, 25.0, 23.0, 15.0, 16.0, 10.0, 13.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18017578125, -0.17345809936523438, -0.16674041748046875, -0.16002273559570312, -0.1533050537109375, -0.14658737182617188, -0.13986968994140625, -0.13315200805664062, -0.126434326171875, -0.11971664428710938, -0.11299896240234375, -0.10628128051757812, -0.0995635986328125, -0.09284591674804688, -0.08612823486328125, -0.07941055297851562, -0.07269287109375, -0.06597518920898438, -0.05925750732421875, -0.052539825439453125, -0.0458221435546875, -0.039104461669921875, -0.03238677978515625, -0.025669097900390625, -0.018951416015625, -0.012233734130859375, -0.00551605224609375, 0.001201629638671875, 0.0079193115234375, 0.014636993408203125, 0.02135467529296875, 0.028072357177734375, 0.0347900390625, 0.041507720947265625, 0.04822540283203125, 0.054943084716796875, 0.0616607666015625, 0.06837844848632812, 0.07509613037109375, 0.08181381225585938, 0.088531494140625, 0.09524917602539062, 0.10196685791015625, 0.10868453979492188, 0.1154022216796875, 0.12211990356445312, 0.12883758544921875, 0.13555526733398438, 0.14227294921875, 0.14899063110351562, 0.15570831298828125, 0.16242599487304688, 0.1691436767578125, 0.17586135864257812, 0.18257904052734375, 0.18929672241210938, 0.196014404296875, 0.20273208618164062, 0.20944976806640625, 0.21616744995117188, 0.2228851318359375, 0.22960281372070312, 0.23632049560546875, 0.24303817749023438, 0.249755859375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 16.0, 23.0, 42.0, 78.0, 114.0, 178.0, 176.0, 149.0, 106.0, 58.0, 28.0, 17.0, 11.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5629000663757324, -3.409046173095703, -3.255192279815674, -3.1013383865356445, -2.9474844932556152, -2.793630599975586, -2.6397764682769775, -2.4859225749969482, -2.332068681716919, -2.1782147884368896, -2.0243608951568604, -1.8705068826675415, -1.7166529893875122, -1.562799096107483, -1.408945083618164, -1.2550911903381348, -1.1012372970581055, -0.9473834037780762, -0.7935294508934021, -0.639675498008728, -0.48582160472869873, -0.33196771144866943, -0.17811375856399536, -0.02425980567932129, 0.129594087600708, 0.2834480106830597, 0.4373019337654114, 0.5911558866500854, 0.7450097799301147, 0.898863673210144, 1.052717685699463, 1.2065715789794922, 1.3604249954223633, 1.5142788887023926, 1.6681327819824219, 1.8219867944717407, 1.97584068775177, 2.1296944618225098, 2.283548593521118, 2.4374024868011475, 2.5912563800811768, 2.745110273361206, 2.8989641666412354, 3.0528180599212646, 3.206672191619873, 3.3605260848999023, 3.5143799781799316, 3.668233871459961, 3.8220877647399902, 3.9759416580200195, 4.129795551300049, 4.283649444580078, 4.437503337860107, 4.591357231140137, 4.745211124420166, 4.899065017700195, 5.052919387817383, 5.206773281097412, 5.360627174377441, 5.514481067657471, 5.6683349609375, 5.822188854217529, 5.976042747497559, 6.129897117614746, 6.283750534057617]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 11.0, 12.0, 12.0, 9.0, 15.0, 20.0, 19.0, 28.0, 29.0, 39.0, 48.0, 46.0, 51.0, 61.0, 64.0, 59.0, 55.0, 47.0, 39.0, 39.0, 41.0, 28.0, 37.0, 30.0, 32.0, 19.0, 31.0, 9.0, 9.0, 10.0, 9.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6403796672821045, -2.564349412918091, -2.488319158554077, -2.4122889041900635, -2.3362584114074707, -2.260228157043457, -2.1841979026794434, -2.1081676483154297, -2.032137393951416, -1.9561071395874023, -1.8800768852233887, -1.8040465116500854, -1.7280162572860718, -1.651986002922058, -1.5759556293487549, -1.4999253749847412, -1.4238951206207275, -1.3478648662567139, -1.2718346118927002, -1.195804238319397, -1.1197739839553833, -1.0437437295913696, -0.9677134156227112, -0.8916831016540527, -0.8156528472900391, -0.7396225929260254, -0.6635922789573669, -0.5875619649887085, -0.5115317106246948, -0.43550142645835876, -0.3594711422920227, -0.28344082832336426, -0.20741057395935059, -0.13138028979301453, -0.05535000562667847, 0.020680278539657593, 0.09671056270599365, 0.1727408468723297, 0.24877113103866577, 0.3248014450073242, 0.4008316993713379, 0.47686198353767395, 0.55289226770401, 0.6289225816726685, 0.7049528360366821, 0.7809830904006958, 0.8570134043693542, 0.9330437183380127, 1.0090739727020264, 1.08510422706604, 1.1611344814300537, 1.237164855003357, 1.3131951093673706, 1.3892253637313843, 1.4652557373046875, 1.5412859916687012, 1.6173162460327148, 1.6933465003967285, 1.7693767547607422, 1.8454071283340454, 1.921437382698059, 1.9974676370620728, 2.073498010635376, 2.1495282649993896, 2.2255585193634033]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 5.0, 7.0, 8.0, 13.0, 15.0, 24.0, 40.0, 53.0, 90.0, 193.0, 329.0, 630.0, 1515.0, 3994.0, 22896.0, 4124936.0, 31536.0, 4775.0, 1661.0, 728.0, 378.0, 154.0, 116.0, 70.0, 41.0, 17.0, 24.0, 8.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.005859375, -0.9739837646484375, -0.942108154296875, -0.9102325439453125, -0.87835693359375, -0.8464813232421875, -0.814605712890625, -0.7827301025390625, -0.7508544921875, -0.7189788818359375, -0.687103271484375, -0.6552276611328125, -0.62335205078125, -0.5914764404296875, -0.559600830078125, -0.5277252197265625, -0.495849609375, -0.4639739990234375, -0.432098388671875, -0.4002227783203125, -0.36834716796875, -0.3364715576171875, -0.304595947265625, -0.2727203369140625, -0.2408447265625, -0.2089691162109375, -0.177093505859375, -0.1452178955078125, -0.11334228515625, -0.0814666748046875, -0.049591064453125, -0.0177154541015625, 0.01416015625, 0.0460357666015625, 0.077911376953125, 0.1097869873046875, 0.14166259765625, 0.1735382080078125, 0.205413818359375, 0.2372894287109375, 0.2691650390625, 0.3010406494140625, 0.332916259765625, 0.3647918701171875, 0.39666748046875, 0.4285430908203125, 0.460418701171875, 0.4922943115234375, 0.524169921875, 0.5560455322265625, 0.587921142578125, 0.6197967529296875, 0.65167236328125, 0.6835479736328125, 0.715423583984375, 0.7472991943359375, 0.7791748046875, 0.8110504150390625, 0.842926025390625, 0.8748016357421875, 0.90667724609375, 0.9385528564453125, 0.970428466796875, 1.0023040771484375, 1.0341796875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 8.0, 6.0, 11.0, 10.0, 20.0, 23.0, 21.0, 31.0, 38.0, 40.0, 39.0, 49.0, 63.0, 54.0, 69.0, 59.0, 61.0, 53.0, 44.0, 48.0, 49.0, 40.0, 34.0, 35.0, 23.0, 19.0, 16.0, 10.0, 13.0, 8.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11761474609375, -0.11374378204345703, -0.10987281799316406, -0.1060018539428711, -0.10213088989257812, -0.09825992584228516, -0.09438896179199219, -0.09051799774169922, -0.08664703369140625, -0.08277606964111328, -0.07890510559082031, -0.07503414154052734, -0.07116317749023438, -0.0672922134399414, -0.06342124938964844, -0.05955028533935547, -0.0556793212890625, -0.05180835723876953, -0.04793739318847656, -0.044066429138183594, -0.040195465087890625, -0.036324501037597656, -0.03245353698730469, -0.02858257293701172, -0.02471160888671875, -0.02084064483642578, -0.016969680786132812, -0.013098716735839844, -0.009227752685546875, -0.005356788635253906, -0.0014858245849609375, 0.0023851394653320312, 0.006256103515625, 0.010127067565917969, 0.013998031616210938, 0.017868995666503906, 0.021739959716796875, 0.025610923767089844, 0.029481887817382812, 0.03335285186767578, 0.03722381591796875, 0.04109477996826172, 0.04496574401855469, 0.048836708068847656, 0.052707672119140625, 0.056578636169433594, 0.06044960021972656, 0.06432056427001953, 0.0681915283203125, 0.07206249237060547, 0.07593345642089844, 0.0798044204711914, 0.08367538452148438, 0.08754634857177734, 0.09141731262207031, 0.09528827667236328, 0.09915924072265625, 0.10303020477294922, 0.10690116882324219, 0.11077213287353516, 0.11464309692382812, 0.1185140609741211, 0.12238502502441406, 0.12625598907470703, 0.130126953125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 7.0, 8.0, 11.0, 36.0, 47.0, 74.0, 107.0, 149.0, 216.0, 385.0, 614.0, 1230.0, 2559.0, 7045.0, 45667.0, 4082654.0, 41526.0, 6691.0, 2400.0, 1191.0, 646.0, 363.0, 233.0, 145.0, 85.0, 71.0, 47.0, 27.0, 17.0, 9.0, 10.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8296737670898438, -0.7994842529296875, -0.7692947387695312, -0.739105224609375, -0.7089157104492188, -0.6787261962890625, -0.6485366821289062, -0.61834716796875, -0.5881576538085938, -0.5579681396484375, -0.5277786254882812, -0.497589111328125, -0.46739959716796875, -0.4372100830078125, -0.40702056884765625, -0.3768310546875, -0.34664154052734375, -0.3164520263671875, -0.28626251220703125, -0.256072998046875, -0.22588348388671875, -0.1956939697265625, -0.16550445556640625, -0.13531494140625, -0.10512542724609375, -0.0749359130859375, -0.04474639892578125, -0.014556884765625, 0.01563262939453125, 0.0458221435546875, 0.07601165771484375, 0.106201171875, 0.13639068603515625, 0.1665802001953125, 0.19676971435546875, 0.226959228515625, 0.25714874267578125, 0.2873382568359375, 0.31752777099609375, 0.34771728515625, 0.37790679931640625, 0.4080963134765625, 0.43828582763671875, 0.468475341796875, 0.49866485595703125, 0.5288543701171875, 0.5590438842773438, 0.5892333984375, 0.6194229125976562, 0.6496124267578125, 0.6798019409179688, 0.709991455078125, 0.7401809692382812, 0.7703704833984375, 0.8005599975585938, 0.83074951171875, 0.8609390258789062, 0.8911285400390625, 0.9213180541992188, 0.951507568359375, 0.9816970825195312, 1.0118865966796875, 1.0420761108398438, 1.072265625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 12.0, 22.0, 21.0, 56.0, 198.0, 3424.0, 190.0, 56.0, 31.0, 21.0, 12.0, 3.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1597900390625, -0.1543731689453125, -0.148956298828125, -0.1435394287109375, -0.13812255859375, -0.1327056884765625, -0.127288818359375, -0.1218719482421875, -0.116455078125, -0.1110382080078125, -0.105621337890625, -0.1002044677734375, -0.09478759765625, -0.0893707275390625, -0.083953857421875, -0.0785369873046875, -0.0731201171875, -0.0677032470703125, -0.062286376953125, -0.0568695068359375, -0.05145263671875, -0.0460357666015625, -0.040618896484375, -0.0352020263671875, -0.02978515625, -0.0243682861328125, -0.018951416015625, -0.0135345458984375, -0.00811767578125, -0.0027008056640625, 0.002716064453125, 0.0081329345703125, 0.0135498046875, 0.0189666748046875, 0.024383544921875, 0.0298004150390625, 0.03521728515625, 0.0406341552734375, 0.046051025390625, 0.0514678955078125, 0.056884765625, 0.0623016357421875, 0.067718505859375, 0.0731353759765625, 0.07855224609375, 0.0839691162109375, 0.089385986328125, 0.0948028564453125, 0.1002197265625, 0.1056365966796875, 0.111053466796875, 0.1164703369140625, 0.12188720703125, 0.1273040771484375, 0.132720947265625, 0.1381378173828125, 0.1435546875, 0.1489715576171875, 0.154388427734375, 0.1598052978515625, 0.16522216796875, 0.1706390380859375, 0.176055908203125, 0.1814727783203125, 0.1868896484375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 11.0, 19.0, 25.0, 28.0, 48.0, 50.0, 55.0, 91.0, 103.0, 66.0, 101.0, 99.0, 67.0, 60.0, 44.0, 34.0, 25.0, 9.0, 15.0, 11.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5061824321746826, -0.49159905314445496, -0.4770156741142273, -0.46243229508399963, -0.447848916053772, -0.4332655668258667, -0.41868215799331665, -0.4040988087654114, -0.3895154297351837, -0.37493205070495605, -0.3603486716747284, -0.34576529264450073, -0.33118191361427307, -0.3165985345840454, -0.30201518535614014, -0.2874318063259125, -0.2728484272956848, -0.25826504826545715, -0.2436816692352295, -0.22909829020500183, -0.21451492607593536, -0.1999315470457077, -0.18534816801548004, -0.17076480388641357, -0.15618139505386353, -0.14159801602363586, -0.1270146369934082, -0.11243126541376114, -0.09784789383411407, -0.08326451480388641, -0.06868113577365875, -0.05409776419401169, -0.039514392614364624, -0.02493101730942726, -0.01034764014184475, 0.0042357370257377625, 0.018819112330675125, 0.03340248763561249, 0.04798586666584015, 0.06256923824548721, 0.07715261727571487, 0.09173599630594254, 0.1063193678855896, 0.12090274691581726, 0.13548612594604492, 0.15006950497627258, 0.16465288400650024, 0.1792362481355667, 0.19381962716579437, 0.20840300619602203, 0.2229863852262497, 0.23756974935531616, 0.2521531283855438, 0.2667365074157715, 0.28131988644599915, 0.2959032654762268, 0.31048664450645447, 0.32507002353668213, 0.3396534025669098, 0.35423678159713745, 0.3688201606273651, 0.3834035396575928, 0.39798688888549805, 0.4125702679157257, 0.42715364694595337]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 7.0, 9.0, 11.0, 5.0, 10.0, 4.0, 22.0, 23.0, 11.0, 26.0, 23.0, 29.0, 24.0, 18.0, 30.0, 31.0, 34.0, 30.0, 35.0, 47.0, 44.0, 53.0, 43.0, 48.0, 33.0, 43.0, 34.0, 37.0, 24.0, 25.0, 24.0, 22.0, 24.0, 13.0, 22.0, 11.0, 21.0, 9.0, 8.0, 6.0, 6.0, 4.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2699427008628845, -0.26148009300231934, -0.25301751494407654, -0.24455492198467255, -0.23609232902526855, -0.22762973606586456, -0.21916714310646057, -0.21070455014705658, -0.2022419571876526, -0.1937793642282486, -0.1853167712688446, -0.1768541783094406, -0.16839158535003662, -0.15992899239063263, -0.15146639943122864, -0.14300380647182465, -0.13454121351242065, -0.12607862055301666, -0.11761602759361267, -0.10915343463420868, -0.10069084167480469, -0.0922282487154007, -0.0837656557559967, -0.07530306279659271, -0.06684046983718872, -0.05837787687778473, -0.04991528391838074, -0.041452690958976746, -0.032990097999572754, -0.024527505040168762, -0.01606491208076477, -0.007602319121360779, 0.0008602738380432129, 0.009322866797447205, 0.017785459756851196, 0.026248052716255188, 0.03471064567565918, 0.04317323863506317, 0.05163583159446716, 0.060098424553871155, 0.06856101751327515, 0.07702361047267914, 0.08548620343208313, 0.09394879639148712, 0.10241138935089111, 0.1108739823102951, 0.1193365752696991, 0.1277991682291031, 0.13626176118850708, 0.14472435414791107, 0.15318694710731506, 0.16164954006671906, 0.17011213302612305, 0.17857472598552704, 0.18703731894493103, 0.19549991190433502, 0.203962504863739, 0.212425097823143, 0.220887690782547, 0.229350283741951, 0.23781287670135498, 0.24627546966075897, 0.25473806262016296, 0.26320064067840576, 0.27166324853897095]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 4.0, 6.0, 9.0, 9.0, 23.0, 19.0, 46.0, 59.0, 74.0, 103.0, 184.0, 297.0, 498.0, 905.0, 1477.0, 3163.0, 6761.0, 15375.0, 36677.0, 91389.0, 233658.0, 357672.0, 179193.0, 69821.0, 28128.0, 11850.0, 5427.0, 2556.0, 1330.0, 714.0, 378.0, 255.0, 147.0, 107.0, 67.0, 61.0, 32.0, 18.0, 17.0, 14.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.2496337890625, -0.24257278442382812, -0.23551177978515625, -0.22845077514648438, -0.2213897705078125, -0.21432876586914062, -0.20726776123046875, -0.20020675659179688, -0.193145751953125, -0.18608474731445312, -0.17902374267578125, -0.17196273803710938, -0.1649017333984375, -0.15784072875976562, -0.15077972412109375, -0.14371871948242188, -0.13665771484375, -0.12959671020507812, -0.12253570556640625, -0.11547470092773438, -0.1084136962890625, -0.10135269165039062, -0.09429168701171875, -0.08723068237304688, -0.080169677734375, -0.07310867309570312, -0.06604766845703125, -0.058986663818359375, -0.0519256591796875, -0.044864654541015625, -0.03780364990234375, -0.030742645263671875, -0.023681640625, -0.016620635986328125, -0.00955963134765625, -0.002498626708984375, 0.0045623779296875, 0.011623382568359375, 0.01868438720703125, 0.025745391845703125, 0.032806396484375, 0.039867401123046875, 0.04692840576171875, 0.053989410400390625, 0.0610504150390625, 0.06811141967773438, 0.07517242431640625, 0.08223342895507812, 0.08929443359375, 0.09635543823242188, 0.10341644287109375, 0.11047744750976562, 0.1175384521484375, 0.12459945678710938, 0.13166046142578125, 0.13872146606445312, 0.145782470703125, 0.15284347534179688, 0.15990447998046875, 0.16696548461914062, 0.1740264892578125, 0.18108749389648438, 0.18814849853515625, 0.19520950317382812, 0.2022705078125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 8.0, 7.0, 6.0, 13.0, 18.0, 20.0, 20.0, 25.0, 27.0, 37.0, 54.0, 48.0, 70.0, 52.0, 58.0, 74.0, 65.0, 58.0, 44.0, 55.0, 49.0, 42.0, 24.0, 27.0, 21.0, 24.0, 18.0, 11.0, 13.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127197265625, -0.12273025512695312, -0.11826324462890625, -0.11379623413085938, -0.1093292236328125, -0.10486221313476562, -0.10039520263671875, -0.09592819213867188, -0.091461181640625, -0.08699417114257812, -0.08252716064453125, -0.07806015014648438, -0.0735931396484375, -0.06912612915039062, -0.06465911865234375, -0.060192108154296875, -0.05572509765625, -0.051258087158203125, -0.04679107666015625, -0.042324066162109375, -0.0378570556640625, -0.033390045166015625, -0.02892303466796875, -0.024456024169921875, -0.019989013671875, -0.015522003173828125, -0.01105499267578125, -0.006587982177734375, -0.0021209716796875, 0.002346038818359375, 0.00681304931640625, 0.011280059814453125, 0.0157470703125, 0.020214080810546875, 0.02468109130859375, 0.029148101806640625, 0.0336151123046875, 0.038082122802734375, 0.04254913330078125, 0.047016143798828125, 0.051483154296875, 0.055950164794921875, 0.06041717529296875, 0.06488418579101562, 0.0693511962890625, 0.07381820678710938, 0.07828521728515625, 0.08275222778320312, 0.08721923828125, 0.09168624877929688, 0.09615325927734375, 0.10062026977539062, 0.1050872802734375, 0.10955429077148438, 0.11402130126953125, 0.11848831176757812, 0.122955322265625, 0.12742233276367188, 0.13188934326171875, 0.13635635375976562, 0.1408233642578125, 0.14529037475585938, 0.14975738525390625, 0.15422439575195312, 0.15869140625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 3.0, 3.0, 7.0, 8.0, 12.0, 26.0, 23.0, 52.0, 66.0, 80.0, 103.0, 177.0, 285.0, 409.0, 666.0, 1449.0, 3992.0, 20164.0, 257502.0, 704712.0, 47629.0, 6756.0, 1944.0, 938.0, 489.0, 364.0, 224.0, 137.0, 90.0, 66.0, 45.0, 41.0, 20.0, 16.0, 12.0, 12.0, 11.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5556640625, -0.537261962890625, -0.51885986328125, -0.500457763671875, -0.4820556640625, -0.463653564453125, -0.44525146484375, -0.426849365234375, -0.408447265625, -0.390045166015625, -0.37164306640625, -0.353240966796875, -0.3348388671875, -0.316436767578125, -0.29803466796875, -0.279632568359375, -0.26123046875, -0.242828369140625, -0.22442626953125, -0.206024169921875, -0.1876220703125, -0.169219970703125, -0.15081787109375, -0.132415771484375, -0.114013671875, -0.095611572265625, -0.07720947265625, -0.058807373046875, -0.0404052734375, -0.022003173828125, -0.00360107421875, 0.014801025390625, 0.033203125, 0.051605224609375, 0.07000732421875, 0.088409423828125, 0.1068115234375, 0.125213623046875, 0.14361572265625, 0.162017822265625, 0.180419921875, 0.198822021484375, 0.21722412109375, 0.235626220703125, 0.2540283203125, 0.272430419921875, 0.29083251953125, 0.309234619140625, 0.32763671875, 0.346038818359375, 0.36444091796875, 0.382843017578125, 0.4012451171875, 0.419647216796875, 0.43804931640625, 0.456451416015625, 0.474853515625, 0.493255615234375, 0.51165771484375, 0.530059814453125, 0.5484619140625, 0.566864013671875, 0.58526611328125, 0.603668212890625, 0.6220703125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 9.0, 5.0, 18.0, 22.0, 24.0, 20.0, 19.0, 21.0, 20.0, 29.0, 39.0, 31.0, 45.0, 49.0, 50.0, 39.0, 47.0, 39.0, 35.0, 36.0, 42.0, 38.0, 41.0, 29.0, 26.0, 28.0, 28.0, 23.0, 24.0, 18.0, 24.0, 10.0, 9.0, 14.0, 4.0, 8.0, 9.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.467041015625, -0.4519615173339844, -0.43688201904296875, -0.4218025207519531, -0.4067230224609375, -0.3916435241699219, -0.37656402587890625, -0.3614845275878906, -0.346405029296875, -0.3313255310058594, -0.31624603271484375, -0.3011665344238281, -0.2860870361328125, -0.2710075378417969, -0.25592803955078125, -0.24084854125976562, -0.22576904296875, -0.21068954467773438, -0.19561004638671875, -0.18053054809570312, -0.1654510498046875, -0.15037155151367188, -0.13529205322265625, -0.12021255493164062, -0.105133056640625, -0.09005355834960938, -0.07497406005859375, -0.059894561767578125, -0.0448150634765625, -0.029735565185546875, -0.01465606689453125, 0.000423431396484375, 0.0155029296875, 0.030582427978515625, 0.04566192626953125, 0.060741424560546875, 0.0758209228515625, 0.09090042114257812, 0.10597991943359375, 0.12105941772460938, 0.136138916015625, 0.15121841430664062, 0.16629791259765625, 0.18137741088867188, 0.1964569091796875, 0.21153640747070312, 0.22661590576171875, 0.24169540405273438, 0.25677490234375, 0.2718544006347656, 0.28693389892578125, 0.3020133972167969, 0.3170928955078125, 0.3321723937988281, 0.34725189208984375, 0.3623313903808594, 0.377410888671875, 0.3924903869628906, 0.40756988525390625, 0.4226493835449219, 0.4377288818359375, 0.4528083801269531, 0.46788787841796875, 0.4829673767089844, 0.498046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 7.0, 10.0, 18.0, 25.0, 33.0, 55.0, 85.0, 139.0, 261.0, 586.0, 1374.0, 4905.0, 33725.0, 599703.0, 378347.0, 23289.0, 3742.0, 1169.0, 491.0, 239.0, 138.0, 70.0, 45.0, 22.0, 24.0, 14.0, 7.0, 7.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.336181640625, -0.3256492614746094, -0.31511688232421875, -0.3045845031738281, -0.2940521240234375, -0.2835197448730469, -0.27298736572265625, -0.2624549865722656, -0.251922607421875, -0.24139022827148438, -0.23085784912109375, -0.22032546997070312, -0.2097930908203125, -0.19926071166992188, -0.18872833251953125, -0.17819595336914062, -0.16766357421875, -0.15713119506835938, -0.14659881591796875, -0.13606643676757812, -0.1255340576171875, -0.11500167846679688, -0.10446929931640625, -0.09393692016601562, -0.083404541015625, -0.07287216186523438, -0.06233978271484375, -0.051807403564453125, -0.0412750244140625, -0.030742645263671875, -0.02021026611328125, -0.009677886962890625, 0.0008544921875, 0.011386871337890625, 0.02191925048828125, 0.032451629638671875, 0.0429840087890625, 0.053516387939453125, 0.06404876708984375, 0.07458114624023438, 0.085113525390625, 0.09564590454101562, 0.10617828369140625, 0.11671066284179688, 0.1272430419921875, 0.13777542114257812, 0.14830780029296875, 0.15884017944335938, 0.16937255859375, 0.17990493774414062, 0.19043731689453125, 0.20096969604492188, 0.2115020751953125, 0.22203445434570312, 0.23256683349609375, 0.24309921264648438, 0.253631591796875, 0.2641639709472656, 0.27469635009765625, 0.2852287292480469, 0.2957611083984375, 0.3062934875488281, 0.31682586669921875, 0.3273582458496094, 0.337890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 7.0, 7.0, 2.0, 9.0, 9.0, 13.0, 17.0, 19.0, 22.0, 26.0, 43.0, 62.0, 87.0, 109.0, 119.0, 98.0, 75.0, 47.0, 47.0, 24.0, 33.0, 27.0, 32.0, 22.0, 9.0, 9.0, 7.0, 2.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.07046890258789e-05, -7.765740156173706e-05, -7.461011409759521e-05, -7.156282663345337e-05, -6.851553916931152e-05, -6.546825170516968e-05, -6.242096424102783e-05, -5.9373676776885986e-05, -5.632638931274414e-05, -5.3279101848602295e-05, -5.023181438446045e-05, -4.7184526920318604e-05, -4.413723945617676e-05, -4.108995199203491e-05, -3.8042664527893066e-05, -3.499537706375122e-05, -3.1948089599609375e-05, -2.890080213546753e-05, -2.5853514671325684e-05, -2.2806227207183838e-05, -1.9758939743041992e-05, -1.6711652278900146e-05, -1.36643648147583e-05, -1.0617077350616455e-05, -7.569789886474609e-06, -4.522502422332764e-06, -1.475214958190918e-06, 1.5720725059509277e-06, 4.6193599700927734e-06, 7.666647434234619e-06, 1.0713934898376465e-05, 1.376122236251831e-05, 1.6808509826660156e-05, 1.9855797290802002e-05, 2.2903084754943848e-05, 2.5950372219085693e-05, 2.899765968322754e-05, 3.2044947147369385e-05, 3.509223461151123e-05, 3.8139522075653076e-05, 4.118680953979492e-05, 4.423409700393677e-05, 4.728138446807861e-05, 5.032867193222046e-05, 5.3375959396362305e-05, 5.642324686050415e-05, 5.9470534324645996e-05, 6.251782178878784e-05, 6.556510925292969e-05, 6.861239671707153e-05, 7.165968418121338e-05, 7.470697164535522e-05, 7.775425910949707e-05, 8.080154657363892e-05, 8.384883403778076e-05, 8.689612150192261e-05, 8.994340896606445e-05, 9.29906964302063e-05, 9.603798389434814e-05, 9.908527135848999e-05, 0.00010213255882263184, 0.00010517984628677368, 0.00010822713375091553, 0.00011127442121505737, 0.00011432170867919922]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 6.0, 5.0, 6.0, 5.0, 4.0, 17.0, 29.0, 45.0, 72.0, 137.0, 257.0, 529.0, 1142.0, 3095.0, 14799.0, 181382.0, 766566.0, 68621.0, 8003.0, 2154.0, 827.0, 397.0, 191.0, 97.0, 68.0, 39.0, 22.0, 8.0, 7.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.445068359375, -0.4340324401855469, -0.42299652099609375, -0.4119606018066406, -0.4009246826171875, -0.3898887634277344, -0.37885284423828125, -0.3678169250488281, -0.356781005859375, -0.3457450866699219, -0.33470916748046875, -0.3236732482910156, -0.3126373291015625, -0.3016014099121094, -0.29056549072265625, -0.2795295715332031, -0.26849365234375, -0.2574577331542969, -0.24642181396484375, -0.23538589477539062, -0.2243499755859375, -0.21331405639648438, -0.20227813720703125, -0.19124221801757812, -0.180206298828125, -0.16917037963867188, -0.15813446044921875, -0.14709854125976562, -0.1360626220703125, -0.12502670288085938, -0.11399078369140625, -0.10295486450195312, -0.0919189453125, -0.08088302612304688, -0.06984710693359375, -0.058811187744140625, -0.0477752685546875, -0.036739349365234375, -0.02570343017578125, -0.014667510986328125, -0.003631591796875, 0.007404327392578125, 0.01844024658203125, 0.029476165771484375, 0.0405120849609375, 0.051548004150390625, 0.06258392333984375, 0.07361984252929688, 0.08465576171875, 0.09569168090820312, 0.10672760009765625, 0.11776351928710938, 0.1287994384765625, 0.13983535766601562, 0.15087127685546875, 0.16190719604492188, 0.172943115234375, 0.18397903442382812, 0.19501495361328125, 0.20605087280273438, 0.2170867919921875, 0.22812271118164062, 0.23915863037109375, 0.2501945495605469, 0.26123046875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 7.0, 8.0, 15.0, 12.0, 29.0, 26.0, 21.0, 46.0, 45.0, 54.0, 56.0, 82.0, 94.0, 91.0, 79.0, 65.0, 51.0, 46.0, 32.0, 25.0, 21.0, 26.0, 20.0, 7.0, 10.0, 6.0, 4.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2149658203125, -0.20880889892578125, -0.2026519775390625, -0.19649505615234375, -0.190338134765625, -0.18418121337890625, -0.1780242919921875, -0.17186737060546875, -0.16571044921875, -0.15955352783203125, -0.1533966064453125, -0.14723968505859375, -0.141082763671875, -0.13492584228515625, -0.1287689208984375, -0.12261199951171875, -0.116455078125, -0.11029815673828125, -0.1041412353515625, -0.09798431396484375, -0.091827392578125, -0.08567047119140625, -0.0795135498046875, -0.07335662841796875, -0.06719970703125, -0.06104278564453125, -0.0548858642578125, -0.04872894287109375, -0.042572021484375, -0.03641510009765625, -0.0302581787109375, -0.02410125732421875, -0.0179443359375, -0.01178741455078125, -0.0056304931640625, 0.00052642822265625, 0.006683349609375, 0.01284027099609375, 0.0189971923828125, 0.02515411376953125, 0.03131103515625, 0.03746795654296875, 0.0436248779296875, 0.04978179931640625, 0.055938720703125, 0.06209564208984375, 0.0682525634765625, 0.07440948486328125, 0.08056640625, 0.08672332763671875, 0.0928802490234375, 0.09903717041015625, 0.105194091796875, 0.11135101318359375, 0.1175079345703125, 0.12366485595703125, 0.12982177734375, 0.13597869873046875, 0.1421356201171875, 0.14829254150390625, 0.154449462890625, 0.16060638427734375, 0.1667633056640625, 0.17292022705078125, 0.1790771484375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 10.0, 44.0, 87.0, 139.0, 194.0, 203.0, 142.0, 82.0, 53.0, 23.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.191871643066406, -5.030223369598389, -4.868575096130371, -4.706927299499512, -4.545279026031494, -4.383630752563477, -4.221982955932617, -4.0603346824646, -3.898686408996582, -3.7370381355285645, -3.575390100479126, -3.4137420654296875, -3.25209379196167, -3.0904455184936523, -2.928797483444214, -2.7671494483947754, -2.605501174926758, -2.4438529014587402, -2.2822048664093018, -2.1205568313598633, -1.9589085578918457, -1.7972604036331177, -1.6356122493743896, -1.4739640951156616, -1.3123159408569336, -1.1506677865982056, -0.9890196323394775, -0.8273714780807495, -0.6657233238220215, -0.5040751695632935, -0.34242701530456543, -0.1807788610458374, -0.019130229949951172, 0.14251792430877686, 0.3041660785675049, 0.4658142328262329, 0.6274623870849609, 0.789110541343689, 0.950758695602417, 1.112406849861145, 1.274055004119873, 1.435703158378601, 1.597351312637329, 1.7589994668960571, 1.9206476211547852, 2.0822958946228027, 2.243943929672241, 2.4055919647216797, 2.5672402381896973, 2.728888511657715, 2.8905365467071533, 3.052184581756592, 3.2138328552246094, 3.375481128692627, 3.5371291637420654, 3.698777198791504, 3.8604254722595215, 4.022073745727539, 4.183721542358398, 4.345369815826416, 4.507018089294434, 4.668666362762451, 4.830314636230469, 4.991962432861328, 5.153610706329346]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 4.0, 7.0, 9.0, 13.0, 20.0, 27.0, 28.0, 29.0, 58.0, 42.0, 50.0, 57.0, 47.0, 63.0, 50.0, 54.0, 66.0, 56.0, 57.0, 28.0, 37.0, 24.0, 23.0, 32.0, 28.0, 15.0, 13.0, 12.0, 10.0, 9.0, 6.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.012929677963257, -2.918456554412842, -2.8239834308624268, -2.7295103073120117, -2.6350371837615967, -2.5405640602111816, -2.4460911750793457, -2.3516178131103516, -2.2571449279785156, -2.1626718044281006, -2.0681986808776855, -1.9737255573272705, -1.8792524337768555, -1.7847793102264404, -1.690306305885315, -1.5958331823349, -1.5013599395751953, -1.4068868160247803, -1.3124136924743652, -1.2179405689239502, -1.1234674453735352, -1.0289943218231201, -0.9345213174819946, -0.8400481939315796, -0.7455750703811646, -0.6511019468307495, -0.5566288232803345, -0.4621557593345642, -0.36768263578414917, -0.27320951223373413, -0.17873644828796387, -0.08426332473754883, 0.01020956039428711, 0.10468266904354095, 0.1991557776927948, 0.29362887144088745, 0.3881019949913025, 0.48257511854171753, 0.5770481824874878, 0.6715213060379028, 0.7659944295883179, 0.8604675531387329, 0.954940676689148, 1.0494136810302734, 1.1438868045806885, 1.2383599281311035, 1.3328330516815186, 1.4273061752319336, 1.5217792987823486, 1.6162524223327637, 1.7107255458831787, 1.8051986694335938, 1.8996717929840088, 1.9941449165344238, 2.0886178016662598, 2.183091163635254, 2.27756404876709, 2.372037172317505, 2.46651029586792, 2.560983419418335, 2.65545654296875, 2.749929666519165, 2.84440279006958, 2.938875675201416, 3.03334903717041]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 10.0, 14.0, 11.0, 14.0, 23.0, 34.0, 39.0, 48.0, 75.0, 137.0, 176.0, 276.0, 446.0, 684.0, 1165.0, 2321.0, 4740.0, 13963.0, 69278.0, 3898357.0, 166350.0, 22636.0, 6737.0, 2852.0, 1553.0, 823.0, 510.0, 322.0, 236.0, 142.0, 109.0, 65.0, 48.0, 27.0, 15.0, 13.0, 12.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47412109375, -0.4586639404296875, -0.443206787109375, -0.4277496337890625, -0.41229248046875, -0.3968353271484375, -0.381378173828125, -0.3659210205078125, -0.3504638671875, -0.3350067138671875, -0.319549560546875, -0.3040924072265625, -0.28863525390625, -0.2731781005859375, -0.257720947265625, -0.2422637939453125, -0.226806640625, -0.2113494873046875, -0.195892333984375, -0.1804351806640625, -0.16497802734375, -0.1495208740234375, -0.134063720703125, -0.1186065673828125, -0.1031494140625, -0.0876922607421875, -0.072235107421875, -0.0567779541015625, -0.04132080078125, -0.0258636474609375, -0.010406494140625, 0.0050506591796875, 0.0205078125, 0.0359649658203125, 0.051422119140625, 0.0668792724609375, 0.08233642578125, 0.0977935791015625, 0.113250732421875, 0.1287078857421875, 0.1441650390625, 0.1596221923828125, 0.175079345703125, 0.1905364990234375, 0.20599365234375, 0.2214508056640625, 0.236907958984375, 0.2523651123046875, 0.267822265625, 0.2832794189453125, 0.298736572265625, 0.3141937255859375, 0.32965087890625, 0.3451080322265625, 0.360565185546875, 0.3760223388671875, 0.3914794921875, 0.4069366455078125, 0.422393798828125, 0.4378509521484375, 0.45330810546875, 0.4687652587890625, 0.484222412109375, 0.4996795654296875, 0.51513671875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 2.0, 4.0, 9.0, 3.0, 8.0, 17.0, 16.0, 18.0, 23.0, 23.0, 33.0, 38.0, 48.0, 48.0, 50.0, 71.0, 66.0, 67.0, 53.0, 66.0, 60.0, 54.0, 34.0, 39.0, 32.0, 29.0, 13.0, 22.0, 13.0, 11.0, 5.0, 7.0, 11.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15478515625, -0.15075111389160156, -0.14671707153320312, -0.1426830291748047, -0.13864898681640625, -0.1346149444580078, -0.13058090209960938, -0.12654685974121094, -0.1225128173828125, -0.11847877502441406, -0.11444473266601562, -0.11041069030761719, -0.10637664794921875, -0.10234260559082031, -0.09830856323242188, -0.09427452087402344, -0.090240478515625, -0.08620643615722656, -0.08217239379882812, -0.07813835144042969, -0.07410430908203125, -0.07007026672363281, -0.06603622436523438, -0.06200218200683594, -0.0579681396484375, -0.05393409729003906, -0.049900054931640625, -0.04586601257324219, -0.04183197021484375, -0.03779792785644531, -0.033763885498046875, -0.029729843139648438, -0.02569580078125, -0.021661758422851562, -0.017627716064453125, -0.013593673706054688, -0.00955963134765625, -0.0055255889892578125, -0.001491546630859375, 0.0025424957275390625, 0.0065765380859375, 0.010610580444335938, 0.014644622802734375, 0.018678665161132812, 0.02271270751953125, 0.026746749877929688, 0.030780792236328125, 0.03481483459472656, 0.038848876953125, 0.04288291931152344, 0.046916961669921875, 0.05095100402832031, 0.05498504638671875, 0.05901908874511719, 0.06305313110351562, 0.06708717346191406, 0.0711212158203125, 0.07515525817871094, 0.07918930053710938, 0.08322334289550781, 0.08725738525390625, 0.09129142761230469, 0.09532546997070312, 0.09935951232910156, 0.1033935546875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 7.0, 8.0, 6.0, 12.0, 11.0, 13.0, 20.0, 22.0, 33.0, 48.0, 69.0, 87.0, 120.0, 199.0, 361.0, 725.0, 1519.0, 4455.0, 21148.0, 3307784.0, 831421.0, 18939.0, 4131.0, 1432.0, 665.0, 388.0, 205.0, 118.0, 84.0, 62.0, 47.0, 37.0, 26.0, 18.0, 18.0, 10.0, 7.0, 2.0, 6.0, 3.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0595703125, -1.0301132202148438, -1.0006561279296875, -0.9711990356445312, -0.941741943359375, -0.9122848510742188, -0.8828277587890625, -0.8533706665039062, -0.82391357421875, -0.7944564819335938, -0.7649993896484375, -0.7355422973632812, -0.706085205078125, -0.6766281127929688, -0.6471710205078125, -0.6177139282226562, -0.5882568359375, -0.5587997436523438, -0.5293426513671875, -0.49988555908203125, -0.470428466796875, -0.44097137451171875, -0.4115142822265625, -0.38205718994140625, -0.35260009765625, -0.32314300537109375, -0.2936859130859375, -0.26422882080078125, -0.234771728515625, -0.20531463623046875, -0.1758575439453125, -0.14640045166015625, -0.116943359375, -0.08748626708984375, -0.0580291748046875, -0.02857208251953125, 0.000885009765625, 0.03034210205078125, 0.0597991943359375, 0.08925628662109375, 0.11871337890625, 0.14817047119140625, 0.1776275634765625, 0.20708465576171875, 0.236541748046875, 0.26599884033203125, 0.2954559326171875, 0.32491302490234375, 0.3543701171875, 0.38382720947265625, 0.4132843017578125, 0.44274139404296875, 0.472198486328125, 0.5016555786132812, 0.5311126708984375, 0.5605697631835938, 0.59002685546875, 0.6194839477539062, 0.6489410400390625, 0.6783981323242188, 0.707855224609375, 0.7373123168945312, 0.7667694091796875, 0.7962265014648438, 0.82568359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 12.0, 9.0, 13.0, 36.0, 87.0, 536.0, 3076.0, 183.0, 53.0, 27.0, 23.0, 8.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62060546875, -0.6062431335449219, -0.5918807983398438, -0.5775184631347656, -0.5631561279296875, -0.5487937927246094, -0.5344314575195312, -0.5200691223144531, -0.505706787109375, -0.4913444519042969, -0.47698211669921875, -0.4626197814941406, -0.4482574462890625, -0.4338951110839844, -0.41953277587890625, -0.4051704406738281, -0.39080810546875, -0.3764457702636719, -0.36208343505859375, -0.3477210998535156, -0.3333587646484375, -0.3189964294433594, -0.30463409423828125, -0.2902717590332031, -0.275909423828125, -0.2615470886230469, -0.24718475341796875, -0.23282241821289062, -0.2184600830078125, -0.20409774780273438, -0.18973541259765625, -0.17537307739257812, -0.1610107421875, -0.14664840698242188, -0.13228607177734375, -0.11792373657226562, -0.1035614013671875, -0.08919906616210938, -0.07483673095703125, -0.060474395751953125, -0.046112060546875, -0.031749725341796875, -0.01738739013671875, -0.003025054931640625, 0.0113372802734375, 0.025699615478515625, 0.04006195068359375, 0.054424285888671875, 0.06878662109375, 0.08314895629882812, 0.09751129150390625, 0.11187362670898438, 0.1262359619140625, 0.14059829711914062, 0.15496063232421875, 0.16932296752929688, 0.183685302734375, 0.19804763793945312, 0.21240997314453125, 0.22677230834960938, 0.2411346435546875, 0.2554969787597656, 0.26985931396484375, 0.2842216491699219, 0.298583984375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 5.0, 8.0, 11.0, 29.0, 42.0, 50.0, 66.0, 82.0, 69.0, 106.0, 102.0, 107.0, 71.0, 58.0, 61.0, 42.0, 27.0, 14.0, 13.0, 5.0, 5.0, 4.0, 7.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9232059717178345, -0.8934664726257324, -0.8637269139289856, -0.8339874148368835, -0.8042478561401367, -0.7745083570480347, -0.7447688579559326, -0.7150293588638306, -0.6852898001670837, -0.6555503010749817, -0.6258107423782349, -0.5960712432861328, -0.5663317441940308, -0.5365921854972839, -0.5068526864051819, -0.47711315751075745, -0.447373628616333, -0.41763409972190857, -0.38789457082748413, -0.3581550717353821, -0.32841554284095764, -0.2986760139465332, -0.26893651485443115, -0.2391969859600067, -0.20945745706558228, -0.17971792817115784, -0.1499784141778946, -0.12023889273405075, -0.09049937129020691, -0.06075984239578247, -0.031020328402519226, -0.0012808144092559814, 0.02845865488052368, 0.05819817632436752, 0.08793769776821136, 0.1176772192120552, 0.14741674065589905, 0.1771562695503235, 0.20689578354358673, 0.23663529753684998, 0.2663748264312744, 0.29611435532569885, 0.3258538842201233, 0.35559338331222534, 0.3853329122066498, 0.4150724411010742, 0.44481194019317627, 0.4745514690876007, 0.5042909979820251, 0.5340304970741272, 0.563770055770874, 0.5935095548629761, 0.6232490539550781, 0.652988612651825, 0.682728111743927, 0.7124676704406738, 0.7422071695327759, 0.7719466686248779, 0.8016862273216248, 0.8314257264137268, 0.8611652851104736, 0.8909047842025757, 0.9206442832946777, 0.9503837823867798, 0.9801233410835266]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 12.0, 10.0, 8.0, 13.0, 7.0, 23.0, 28.0, 26.0, 26.0, 25.0, 33.0, 37.0, 36.0, 51.0, 40.0, 38.0, 52.0, 55.0, 40.0, 47.0, 42.0, 49.0, 37.0, 31.0, 37.0, 33.0, 24.0, 29.0, 13.0, 20.0, 14.0, 11.0, 13.0, 9.0, 8.0, 4.0, 1.0, 5.0, 1.0, 7.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7504131197929382, -0.7291819453239441, -0.7079508304595947, -0.6867196559906006, -0.6654884815216064, -0.6442573666572571, -0.6230261921882629, -0.6017950773239136, -0.5805639028549194, -0.5593327283859253, -0.5381016135215759, -0.5168704390525818, -0.49563929438591003, -0.4744081497192383, -0.45317697525024414, -0.4319458305835724, -0.41071468591690063, -0.3894835412502289, -0.36825239658355713, -0.347021222114563, -0.32579007744789124, -0.3045589327812195, -0.28332775831222534, -0.2620966136455536, -0.24086546897888184, -0.21963432431221008, -0.19840316474437714, -0.1771720051765442, -0.15594086050987244, -0.13470971584320068, -0.11347855627536774, -0.09224739670753479, -0.07101625204086304, -0.04978509992361069, -0.028553947806358337, -0.0073227956891059875, 0.013908356428146362, 0.03513950854539871, 0.05637066066265106, 0.07760182023048401, 0.09883296489715576, 0.12006411701440811, 0.14129526913166046, 0.1625264286994934, 0.18375757336616516, 0.20498871803283691, 0.22621987760066986, 0.2474510371685028, 0.26868218183517456, 0.2899133265018463, 0.31114447116851807, 0.3323756456375122, 0.35360679030418396, 0.3748379349708557, 0.39606910943984985, 0.4173002541065216, 0.43853139877319336, 0.4597625434398651, 0.48099368810653687, 0.502224862575531, 0.5234559774398804, 0.5446871519088745, 0.5659183263778687, 0.5871495008468628, 0.6083806157112122]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 11.0, 16.0, 26.0, 39.0, 71.0, 103.0, 149.0, 269.0, 463.0, 794.0, 1437.0, 2637.0, 4963.0, 9640.0, 20112.0, 42131.0, 89385.0, 209963.0, 362416.0, 163017.0, 72860.0, 34241.0, 16373.0, 8109.0, 4161.0, 2247.0, 1268.0, 687.0, 380.0, 208.0, 143.0, 82.0, 41.0, 39.0, 20.0, 12.0, 10.0, 9.0, 5.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269775390625, -0.2608909606933594, -0.25200653076171875, -0.24312210083007812, -0.2342376708984375, -0.22535324096679688, -0.21646881103515625, -0.20758438110351562, -0.198699951171875, -0.18981552124023438, -0.18093109130859375, -0.17204666137695312, -0.1631622314453125, -0.15427780151367188, -0.14539337158203125, -0.13650894165039062, -0.12762451171875, -0.11874008178710938, -0.10985565185546875, -0.10097122192382812, -0.0920867919921875, -0.08320236206054688, -0.07431793212890625, -0.06543350219726562, -0.056549072265625, -0.047664642333984375, -0.03878021240234375, -0.029895782470703125, -0.0210113525390625, -0.012126922607421875, -0.00324249267578125, 0.005641937255859375, 0.0145263671875, 0.023410797119140625, 0.03229522705078125, 0.041179656982421875, 0.0500640869140625, 0.058948516845703125, 0.06783294677734375, 0.07671737670898438, 0.085601806640625, 0.09448623657226562, 0.10337066650390625, 0.11225509643554688, 0.1211395263671875, 0.13002395629882812, 0.13890838623046875, 0.14779281616210938, 0.15667724609375, 0.16556167602539062, 0.17444610595703125, 0.18333053588867188, 0.1922149658203125, 0.20109939575195312, 0.20998382568359375, 0.21886825561523438, 0.227752685546875, 0.23663711547851562, 0.24552154541015625, 0.2544059753417969, 0.2632904052734375, 0.2721748352050781, 0.28105926513671875, 0.2899436950683594, 0.298828125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 10.0, 5.0, 16.0, 17.0, 15.0, 13.0, 35.0, 36.0, 29.0, 46.0, 49.0, 62.0, 57.0, 58.0, 49.0, 66.0, 54.0, 62.0, 48.0, 42.0, 44.0, 38.0, 29.0, 28.0, 18.0, 24.0, 10.0, 6.0, 10.0, 8.0, 2.0, 5.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1690673828125, -0.16436004638671875, -0.1596527099609375, -0.15494537353515625, -0.150238037109375, -0.14553070068359375, -0.1408233642578125, -0.13611602783203125, -0.13140869140625, -0.12670135498046875, -0.1219940185546875, -0.11728668212890625, -0.112579345703125, -0.10787200927734375, -0.1031646728515625, -0.09845733642578125, -0.09375, -0.08904266357421875, -0.0843353271484375, -0.07962799072265625, -0.074920654296875, -0.07021331787109375, -0.0655059814453125, -0.06079864501953125, -0.05609130859375, -0.05138397216796875, -0.0466766357421875, -0.04196929931640625, -0.037261962890625, -0.03255462646484375, -0.0278472900390625, -0.02313995361328125, -0.0184326171875, -0.01372528076171875, -0.0090179443359375, -0.00431060791015625, 0.000396728515625, 0.00510406494140625, 0.0098114013671875, 0.01451873779296875, 0.01922607421875, 0.02393341064453125, 0.0286407470703125, 0.03334808349609375, 0.038055419921875, 0.04276275634765625, 0.0474700927734375, 0.05217742919921875, 0.056884765625, 0.06159210205078125, 0.0662994384765625, 0.07100677490234375, 0.075714111328125, 0.08042144775390625, 0.0851287841796875, 0.08983612060546875, 0.09454345703125, 0.09925079345703125, 0.1039581298828125, 0.10866546630859375, 0.113372802734375, 0.11808013916015625, 0.1227874755859375, 0.12749481201171875, 0.1322021484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 11.0, 5.0, 8.0, 13.0, 12.0, 27.0, 41.0, 52.0, 75.0, 171.0, 252.0, 371.0, 576.0, 1171.0, 2708.0, 9987.0, 82112.0, 796453.0, 134588.0, 13570.0, 3244.0, 1323.0, 672.0, 434.0, 234.0, 145.0, 100.0, 54.0, 43.0, 30.0, 23.0, 13.0, 7.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.91943359375, -0.8949737548828125, -0.870513916015625, -0.8460540771484375, -0.82159423828125, -0.7971343994140625, -0.772674560546875, -0.7482147216796875, -0.7237548828125, -0.6992950439453125, -0.674835205078125, -0.6503753662109375, -0.62591552734375, -0.6014556884765625, -0.576995849609375, -0.5525360107421875, -0.528076171875, -0.5036163330078125, -0.479156494140625, -0.4546966552734375, -0.43023681640625, -0.4057769775390625, -0.381317138671875, -0.3568572998046875, -0.3323974609375, -0.3079376220703125, -0.283477783203125, -0.2590179443359375, -0.23455810546875, -0.2100982666015625, -0.185638427734375, -0.1611785888671875, -0.13671875, -0.1122589111328125, -0.087799072265625, -0.0633392333984375, -0.03887939453125, -0.0144195556640625, 0.010040283203125, 0.0345001220703125, 0.0589599609375, 0.0834197998046875, 0.107879638671875, 0.1323394775390625, 0.15679931640625, 0.1812591552734375, 0.205718994140625, 0.2301788330078125, 0.254638671875, 0.2790985107421875, 0.303558349609375, 0.3280181884765625, 0.35247802734375, 0.3769378662109375, 0.401397705078125, 0.4258575439453125, 0.4503173828125, 0.4747772216796875, 0.499237060546875, 0.5236968994140625, 0.54815673828125, 0.5726165771484375, 0.597076416015625, 0.6215362548828125, 0.64599609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 10.0, 7.0, 12.0, 8.0, 8.0, 20.0, 17.0, 7.0, 22.0, 18.0, 21.0, 31.0, 35.0, 27.0, 45.0, 38.0, 49.0, 47.0, 48.0, 64.0, 43.0, 46.0, 37.0, 33.0, 41.0, 35.0, 31.0, 30.0, 36.0, 28.0, 26.0, 16.0, 9.0, 12.0, 9.0, 11.0, 10.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5634765625, -0.5464248657226562, -0.5293731689453125, -0.5123214721679688, -0.495269775390625, -0.47821807861328125, -0.4611663818359375, -0.44411468505859375, -0.42706298828125, -0.41001129150390625, -0.3929595947265625, -0.37590789794921875, -0.358856201171875, -0.34180450439453125, -0.3247528076171875, -0.30770111083984375, -0.2906494140625, -0.27359771728515625, -0.2565460205078125, -0.23949432373046875, -0.222442626953125, -0.20539093017578125, -0.1883392333984375, -0.17128753662109375, -0.15423583984375, -0.13718414306640625, -0.1201324462890625, -0.10308074951171875, -0.086029052734375, -0.06897735595703125, -0.0519256591796875, -0.03487396240234375, -0.017822265625, -0.00077056884765625, 0.0162811279296875, 0.03333282470703125, 0.050384521484375, 0.06743621826171875, 0.0844879150390625, 0.10153961181640625, 0.11859130859375, 0.13564300537109375, 0.1526947021484375, 0.16974639892578125, 0.186798095703125, 0.20384979248046875, 0.2209014892578125, 0.23795318603515625, 0.2550048828125, 0.27205657958984375, 0.2891082763671875, 0.30615997314453125, 0.323211669921875, 0.34026336669921875, 0.3573150634765625, 0.37436676025390625, 0.39141845703125, 0.40847015380859375, 0.4255218505859375, 0.44257354736328125, 0.459625244140625, 0.47667694091796875, 0.4937286376953125, 0.5107803344726562, 0.52783203125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 5.0, 7.0, 6.0, 16.0, 22.0, 21.0, 27.0, 50.0, 97.0, 144.0, 269.0, 519.0, 1214.0, 2992.0, 8965.0, 39874.0, 407808.0, 523224.0, 47595.0, 9973.0, 3194.0, 1271.0, 558.0, 297.0, 171.0, 82.0, 49.0, 36.0, 21.0, 14.0, 13.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30078125, -0.29219818115234375, -0.2836151123046875, -0.27503204345703125, -0.266448974609375, -0.25786590576171875, -0.2492828369140625, -0.24069976806640625, -0.23211669921875, -0.22353363037109375, -0.2149505615234375, -0.20636749267578125, -0.197784423828125, -0.18920135498046875, -0.1806182861328125, -0.17203521728515625, -0.1634521484375, -0.15486907958984375, -0.1462860107421875, -0.13770294189453125, -0.129119873046875, -0.12053680419921875, -0.1119537353515625, -0.10337066650390625, -0.09478759765625, -0.08620452880859375, -0.0776214599609375, -0.06903839111328125, -0.060455322265625, -0.05187225341796875, -0.0432891845703125, -0.03470611572265625, -0.026123046875, -0.01753997802734375, -0.0089569091796875, -0.00037384033203125, 0.008209228515625, 0.01679229736328125, 0.0253753662109375, 0.03395843505859375, 0.04254150390625, 0.05112457275390625, 0.0597076416015625, 0.06829071044921875, 0.076873779296875, 0.08545684814453125, 0.0940399169921875, 0.10262298583984375, 0.1112060546875, 0.11978912353515625, 0.1283721923828125, 0.13695526123046875, 0.145538330078125, 0.15412139892578125, 0.1627044677734375, 0.17128753662109375, 0.17987060546875, 0.18845367431640625, 0.1970367431640625, 0.20561981201171875, 0.214202880859375, 0.22278594970703125, 0.2313690185546875, 0.23995208740234375, 0.24853515625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 11.0, 6.0, 10.0, 15.0, 20.0, 29.0, 32.0, 42.0, 68.0, 83.0, 95.0, 139.0, 128.0, 77.0, 50.0, 46.0, 30.0, 36.0, 22.0, 14.0, 19.0, 15.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00015687942504882812, -0.00015281885862350464, -0.00014875829219818115, -0.00014469772577285767, -0.00014063715934753418, -0.0001365765929222107, -0.0001325160264968872, -0.00012845546007156372, -0.00012439489364624023, -0.00012033432722091675, -0.00011627376079559326, -0.00011221319437026978, -0.00010815262794494629, -0.0001040920615196228, -0.00010003149509429932, -9.597092866897583e-05, -9.191036224365234e-05, -8.784979581832886e-05, -8.378922939300537e-05, -7.972866296768188e-05, -7.56680965423584e-05, -7.160753011703491e-05, -6.754696369171143e-05, -6.348639726638794e-05, -5.942583084106445e-05, -5.536526441574097e-05, -5.130469799041748e-05, -4.7244131565093994e-05, -4.318356513977051e-05, -3.912299871444702e-05, -3.5062432289123535e-05, -3.100186586380005e-05, -2.6941299438476562e-05, -2.2880733013153076e-05, -1.882016658782959e-05, -1.4759600162506104e-05, -1.0699033737182617e-05, -6.638467311859131e-06, -2.5779008865356445e-06, 1.4826655387878418e-06, 5.543231964111328e-06, 9.603798389434814e-06, 1.36643648147583e-05, 1.7724931240081787e-05, 2.1785497665405273e-05, 2.584606409072876e-05, 2.9906630516052246e-05, 3.396719694137573e-05, 3.802776336669922e-05, 4.2088329792022705e-05, 4.614889621734619e-05, 5.020946264266968e-05, 5.4270029067993164e-05, 5.833059549331665e-05, 6.239116191864014e-05, 6.645172834396362e-05, 7.051229476928711e-05, 7.45728611946106e-05, 7.863342761993408e-05, 8.269399404525757e-05, 8.675456047058105e-05, 9.081512689590454e-05, 9.487569332122803e-05, 9.893625974655151e-05, 0.000102996826171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 5.0, 13.0, 16.0, 17.0, 29.0, 35.0, 64.0, 85.0, 138.0, 228.0, 460.0, 871.0, 1882.0, 4776.0, 17520.0, 116173.0, 721552.0, 153939.0, 21004.0, 5489.0, 2147.0, 858.0, 512.0, 262.0, 156.0, 112.0, 63.0, 33.0, 27.0, 21.0, 15.0, 8.0, 11.0, 9.0, 9.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2509765625, -0.24276351928710938, -0.23455047607421875, -0.22633743286132812, -0.2181243896484375, -0.20991134643554688, -0.20169830322265625, -0.19348526000976562, -0.185272216796875, -0.17705917358398438, -0.16884613037109375, -0.16063308715820312, -0.1524200439453125, -0.14420700073242188, -0.13599395751953125, -0.12778091430664062, -0.11956787109375, -0.11135482788085938, -0.10314178466796875, -0.09492874145507812, -0.0867156982421875, -0.07850265502929688, -0.07028961181640625, -0.062076568603515625, -0.053863525390625, -0.045650482177734375, -0.03743743896484375, -0.029224395751953125, -0.0210113525390625, -0.012798309326171875, -0.00458526611328125, 0.003627777099609375, 0.0118408203125, 0.020053863525390625, 0.02826690673828125, 0.036479949951171875, 0.0446929931640625, 0.052906036376953125, 0.06111907958984375, 0.06933212280273438, 0.077545166015625, 0.08575820922851562, 0.09397125244140625, 0.10218429565429688, 0.1103973388671875, 0.11861038208007812, 0.12682342529296875, 0.13503646850585938, 0.14324951171875, 0.15146255493164062, 0.15967559814453125, 0.16788864135742188, 0.1761016845703125, 0.18431472778320312, 0.19252777099609375, 0.20074081420898438, 0.208953857421875, 0.21716690063476562, 0.22537994384765625, 0.23359298706054688, 0.2418060302734375, 0.2500190734863281, 0.25823211669921875, 0.2664451599121094, 0.274658203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 8.0, 4.0, 5.0, 9.0, 6.0, 14.0, 10.0, 18.0, 33.0, 31.0, 33.0, 61.0, 56.0, 80.0, 88.0, 70.0, 68.0, 80.0, 46.0, 59.0, 48.0, 31.0, 20.0, 19.0, 24.0, 12.0, 7.0, 7.0, 11.0, 8.0, 3.0, 10.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0], "bins": [-0.205322265625, -0.1996936798095703, -0.19406509399414062, -0.18843650817871094, -0.18280792236328125, -0.17717933654785156, -0.17155075073242188, -0.1659221649169922, -0.1602935791015625, -0.1546649932861328, -0.14903640747070312, -0.14340782165527344, -0.13777923583984375, -0.13215065002441406, -0.12652206420898438, -0.12089347839355469, -0.115264892578125, -0.10963630676269531, -0.10400772094726562, -0.09837913513183594, -0.09275054931640625, -0.08712196350097656, -0.08149337768554688, -0.07586479187011719, -0.0702362060546875, -0.06460762023925781, -0.058979034423828125, -0.05335044860839844, -0.04772186279296875, -0.04209327697753906, -0.036464691162109375, -0.030836105346679688, -0.02520751953125, -0.019578933715820312, -0.013950347900390625, -0.008321762084960938, -0.00269317626953125, 0.0029354095458984375, 0.008563995361328125, 0.014192581176757812, 0.0198211669921875, 0.025449752807617188, 0.031078338623046875, 0.03670692443847656, 0.04233551025390625, 0.04796409606933594, 0.053592681884765625, 0.05922126770019531, 0.064849853515625, 0.07047843933105469, 0.07610702514648438, 0.08173561096191406, 0.08736419677734375, 0.09299278259277344, 0.09862136840820312, 0.10424995422363281, 0.1098785400390625, 0.11550712585449219, 0.12113571166992188, 0.12676429748535156, 0.13239288330078125, 0.13802146911621094, 0.14365005493164062, 0.1492786407470703, 0.1549072265625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 5.0, 10.0, 11.0, 22.0, 47.0, 72.0, 103.0, 138.0, 175.0, 151.0, 119.0, 68.0, 35.0, 19.0, 9.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.929521083831787, -4.779421806335449, -4.629322052001953, -4.479222774505615, -4.329123497009277, -4.1790242195129395, -4.028924942016602, -3.8788251876831055, -3.7287259101867676, -3.5786266326904297, -3.4285271167755127, -3.2784276008605957, -3.128328323364258, -2.97822904586792, -2.828129529953003, -2.678030014038086, -2.527930736541748, -2.37783145904541, -2.227731943130493, -2.077632427215576, -1.9275331497192383, -1.7774337530136108, -1.6273343563079834, -1.477234959602356, -1.3271355628967285, -1.177036166191101, -1.0269367694854736, -0.8768373727798462, -0.7267379760742188, -0.5766385793685913, -0.42653918266296387, -0.2764397859573364, -0.12634038925170898, 0.023759007453918457, 0.1738584041595459, 0.32395780086517334, 0.4740571975708008, 0.6241565942764282, 0.7742559909820557, 0.9243553876876831, 1.0744547843933105, 1.224554181098938, 1.3746535778045654, 1.5247529745101929, 1.6748523712158203, 1.8249517679214478, 1.9750511646270752, 2.125150680541992, 2.27524995803833, 2.425349235534668, 2.575448751449585, 2.725548267364502, 2.87564754486084, 3.0257468223571777, 3.1758463382720947, 3.3259458541870117, 3.4760451316833496, 3.6261444091796875, 3.7762439250946045, 3.9263434410095215, 4.076442718505859, 4.226541996002197, 4.376641273498535, 4.526741027832031, 4.676840305328369]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 12.0, 11.0, 17.0, 20.0, 21.0, 25.0, 30.0, 25.0, 42.0, 37.0, 48.0, 51.0, 38.0, 68.0, 61.0, 60.0, 60.0, 48.0, 72.0, 33.0, 43.0, 18.0, 26.0, 26.0, 13.0, 18.0, 14.0, 8.0, 10.0, 9.0, 6.0, 4.0, 5.0, 4.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.75789737701416, -2.66742205619812, -2.576946973800659, -2.486471652984619, -2.395996570587158, -2.305521249771118, -2.215045928955078, -2.124570846557617, -2.0340957641601562, -1.9436205625534058, -1.8531453609466553, -1.7626700401306152, -1.6721949577331543, -1.5817196369171143, -1.4912444353103638, -1.4007692337036133, -1.3102939128875732, -1.2198187112808228, -1.1293435096740723, -1.0388681888580322, -0.9483930468559265, -0.857917845249176, -0.7674425840377808, -0.6769673824310303, -0.5864921808242798, -0.4960169792175293, -0.4055417478084564, -0.31506651639938354, -0.22459131479263306, -0.13411611318588257, -0.043640851974487305, 0.046834349632263184, 0.13730931282043457, 0.22778452932834625, 0.31825974583625793, 0.4087349772453308, 0.4992101788520813, 0.5896853804588318, 0.680160641670227, 0.7706358432769775, 0.861111044883728, 0.9515862464904785, 1.042061448097229, 1.1325366497039795, 1.2230119705200195, 1.3134870529174805, 1.4039623737335205, 1.494437575340271, 1.5849127769470215, 1.675387978553772, 1.7658631801605225, 1.8563385009765625, 1.9468135833740234, 2.0372889041900635, 2.1277642250061035, 2.2182393074035645, 2.3087143898010254, 2.3991897106170654, 2.4896647930145264, 2.5801401138305664, 2.6706151962280273, 2.7610905170440674, 2.8515658378601074, 2.9420409202575684, 3.0325162410736084]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 4.0, 7.0, 5.0, 5.0, 20.0, 17.0, 14.0, 30.0, 46.0, 53.0, 76.0, 107.0, 148.0, 155.0, 248.0, 387.0, 546.0, 809.0, 1247.0, 2185.0, 3647.0, 6778.0, 14012.0, 32301.0, 95929.0, 534029.0, 2824231.0, 520138.0, 95482.0, 31880.0, 13690.0, 6572.0, 3648.0, 2086.0, 1231.0, 763.0, 527.0, 354.0, 221.0, 206.0, 129.0, 96.0, 58.0, 45.0, 30.0, 26.0, 23.0, 13.0, 13.0, 12.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.226806640625, -0.2191162109375, -0.21142578125, -0.2037353515625, -0.196044921875, -0.1883544921875, -0.1806640625, -0.1729736328125, -0.165283203125, -0.1575927734375, -0.14990234375, -0.1422119140625, -0.134521484375, -0.1268310546875, -0.119140625, -0.1114501953125, -0.103759765625, -0.0960693359375, -0.08837890625, -0.0806884765625, -0.072998046875, -0.0653076171875, -0.0576171875, -0.0499267578125, -0.042236328125, -0.0345458984375, -0.02685546875, -0.0191650390625, -0.011474609375, -0.0037841796875, 0.00390625, 0.0115966796875, 0.019287109375, 0.0269775390625, 0.03466796875, 0.0423583984375, 0.050048828125, 0.0577392578125, 0.0654296875, 0.0731201171875, 0.080810546875, 0.0885009765625, 0.09619140625, 0.1038818359375, 0.111572265625, 0.1192626953125, 0.126953125, 0.1346435546875, 0.142333984375, 0.1500244140625, 0.15771484375, 0.1654052734375, 0.173095703125, 0.1807861328125, 0.1884765625, 0.1961669921875, 0.203857421875, 0.2115478515625, 0.21923828125, 0.2269287109375, 0.234619140625, 0.2423095703125, 0.25, 0.2576904296875, 0.265380859375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 8.0, 5.0, 12.0, 8.0, 18.0, 30.0, 33.0, 28.0, 32.0, 44.0, 34.0, 49.0, 54.0, 56.0, 62.0, 53.0, 48.0, 51.0, 52.0, 44.0, 43.0, 38.0, 36.0, 31.0, 24.0, 23.0, 16.0, 9.0, 16.0, 8.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.142333984375, -0.1383228302001953, -0.13431167602539062, -0.13030052185058594, -0.12628936767578125, -0.12227821350097656, -0.11826705932617188, -0.11425590515136719, -0.1102447509765625, -0.10623359680175781, -0.10222244262695312, -0.09821128845214844, -0.09420013427734375, -0.09018898010253906, -0.08617782592773438, -0.08216667175292969, -0.078155517578125, -0.07414436340332031, -0.07013320922851562, -0.06612205505371094, -0.06211090087890625, -0.05809974670410156, -0.054088592529296875, -0.05007743835449219, -0.0460662841796875, -0.04205513000488281, -0.038043975830078125, -0.03403282165527344, -0.03002166748046875, -0.026010513305664062, -0.021999359130859375, -0.017988204956054688, -0.01397705078125, -0.009965896606445312, -0.005954742431640625, -0.0019435882568359375, 0.00206756591796875, 0.0060787200927734375, 0.010089874267578125, 0.014101028442382812, 0.0181121826171875, 0.022123336791992188, 0.026134490966796875, 0.030145645141601562, 0.03415679931640625, 0.03816795349121094, 0.042179107666015625, 0.04619026184082031, 0.050201416015625, 0.05421257019042969, 0.058223724365234375, 0.06223487854003906, 0.06624603271484375, 0.07025718688964844, 0.07426834106445312, 0.07827949523925781, 0.0822906494140625, 0.08630180358886719, 0.09031295776367188, 0.09432411193847656, 0.09833526611328125, 0.10234642028808594, 0.10635757446289062, 0.11036872863769531, 0.1143798828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 10.0, 9.0, 27.0, 27.0, 34.0, 34.0, 63.0, 92.0, 168.0, 230.0, 366.0, 604.0, 1161.0, 2121.0, 4817.0, 11066.0, 29044.0, 94476.0, 525657.0, 2965880.0, 428322.0, 83647.0, 26990.0, 10327.0, 4388.0, 2092.0, 1071.0, 570.0, 346.0, 216.0, 136.0, 72.0, 59.0, 52.0, 25.0, 19.0, 13.0, 12.0, 10.0, 5.0, 7.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.321533203125, -0.3116264343261719, -0.30171966552734375, -0.2918128967285156, -0.2819061279296875, -0.2719993591308594, -0.26209259033203125, -0.2521858215332031, -0.242279052734375, -0.23237228393554688, -0.22246551513671875, -0.21255874633789062, -0.2026519775390625, -0.19274520874023438, -0.18283843994140625, -0.17293167114257812, -0.16302490234375, -0.15311813354492188, -0.14321136474609375, -0.13330459594726562, -0.1233978271484375, -0.11349105834960938, -0.10358428955078125, -0.09367752075195312, -0.083770751953125, -0.07386398315429688, -0.06395721435546875, -0.054050445556640625, -0.0441436767578125, -0.034236907958984375, -0.02433013916015625, -0.014423370361328125, -0.0045166015625, 0.005390167236328125, 0.01529693603515625, 0.025203704833984375, 0.0351104736328125, 0.045017242431640625, 0.05492401123046875, 0.06483078002929688, 0.074737548828125, 0.08464431762695312, 0.09455108642578125, 0.10445785522460938, 0.1143646240234375, 0.12427139282226562, 0.13417816162109375, 0.14408493041992188, 0.15399169921875, 0.16389846801757812, 0.17380523681640625, 0.18371200561523438, 0.1936187744140625, 0.20352554321289062, 0.21343231201171875, 0.22333908081054688, 0.233245849609375, 0.24315261840820312, 0.25305938720703125, 0.2629661560058594, 0.2728729248046875, 0.2827796936035156, 0.29268646240234375, 0.3025932312011719, 0.3125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 4.0, 1.0, 5.0, 6.0, 9.0, 7.0, 17.0, 13.0, 24.0, 28.0, 34.0, 58.0, 76.0, 132.0, 213.0, 375.0, 699.0, 907.0, 618.0, 307.0, 167.0, 119.0, 79.0, 59.0, 28.0, 30.0, 19.0, 15.0, 12.0, 5.0, 3.0, 6.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.51171875, -0.4972572326660156, -0.48279571533203125, -0.4683341979980469, -0.4538726806640625, -0.4394111633300781, -0.42494964599609375, -0.4104881286621094, -0.396026611328125, -0.3815650939941406, -0.36710357666015625, -0.3526420593261719, -0.3381805419921875, -0.3237190246582031, -0.30925750732421875, -0.2947959899902344, -0.28033447265625, -0.2658729553222656, -0.25141143798828125, -0.23694992065429688, -0.2224884033203125, -0.20802688598632812, -0.19356536865234375, -0.17910385131835938, -0.164642333984375, -0.15018081665039062, -0.13571929931640625, -0.12125778198242188, -0.1067962646484375, -0.09233474731445312, -0.07787322998046875, -0.06341171264648438, -0.0489501953125, -0.034488677978515625, -0.02002716064453125, -0.005565643310546875, 0.0088958740234375, 0.023357391357421875, 0.03781890869140625, 0.052280426025390625, 0.066741943359375, 0.08120346069335938, 0.09566497802734375, 0.11012649536132812, 0.1245880126953125, 0.13904953002929688, 0.15351104736328125, 0.16797256469726562, 0.18243408203125, 0.19689559936523438, 0.21135711669921875, 0.22581863403320312, 0.2402801513671875, 0.2547416687011719, 0.26920318603515625, 0.2836647033691406, 0.298126220703125, 0.3125877380371094, 0.32704925537109375, 0.3415107727050781, 0.3559722900390625, 0.3704338073730469, 0.38489532470703125, 0.3993568420410156, 0.413818359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 11.0, 19.0, 41.0, 122.0, 238.0, 248.0, 165.0, 85.0, 29.0, 16.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.198184013366699, -7.004678726196289, -6.811172962188721, -6.617667198181152, -6.424161911010742, -6.230656623840332, -6.037150859832764, -5.843645095825195, -5.650139808654785, -5.456634521484375, -5.263128757476807, -5.069622993469238, -4.876117706298828, -4.682612419128418, -4.48910665512085, -4.295600891113281, -4.102095603942871, -3.908590078353882, -3.7150845527648926, -3.5215790271759033, -3.328073501586914, -3.134567975997925, -2.9410624504089355, -2.7475569248199463, -2.554051399230957, -2.3605458736419678, -2.1670403480529785, -1.9735348224639893, -1.780029296875, -1.5865237712860107, -1.3930182456970215, -1.1995127201080322, -1.0060076713562012, -0.8125021457672119, -0.6189966201782227, -0.4254910945892334, -0.23198556900024414, -0.03848004341125488, 0.15502548217773438, 0.34853100776672363, 0.5420365333557129, 0.7355420589447021, 0.9290475845336914, 1.1225531101226807, 1.31605863571167, 1.5095641613006592, 1.7030696868896484, 1.8965752124786377, 2.090080738067627, 2.283586263656616, 2.4770917892456055, 2.6705973148345947, 2.864102840423584, 3.0576083660125732, 3.2511138916015625, 3.4446194171905518, 3.638124942779541, 3.8316304683685303, 4.0251359939575195, 4.21864128112793, 4.412147045135498, 4.605652809143066, 4.799158096313477, 4.992663383483887, 5.186169147491455]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 9.0, 9.0, 11.0, 15.0, 16.0, 17.0, 27.0, 27.0, 36.0, 40.0, 45.0, 38.0, 56.0, 40.0, 43.0, 57.0, 40.0, 48.0, 54.0, 50.0, 38.0, 41.0, 29.0, 35.0, 30.0, 24.0, 17.0, 19.0, 23.0, 11.0, 7.0, 7.0, 9.0, 8.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.888577938079834, -1.8317358493804932, -1.7748937606811523, -1.718051552772522, -1.6612094640731812, -1.6043673753738403, -1.5475252866744995, -1.4906830787658691, -1.4338409900665283, -1.3769989013671875, -1.3201568126678467, -1.2633146047592163, -1.2064725160598755, -1.1496304273605347, -1.0927883386611938, -1.0359461307525635, -0.9791041016578674, -0.9222620129585266, -0.865419864654541, -0.8085777759552002, -0.7517356276512146, -0.6948935389518738, -0.6380513906478882, -0.5812093019485474, -0.5243672132492065, -0.46752509474754333, -0.4106829762458801, -0.3538408875465393, -0.2969987392425537, -0.2401566505432129, -0.18331453204154968, -0.12647241353988647, -0.06963026523590088, -0.01278815045952797, 0.04405396431684494, 0.10089607536792755, 0.15773819386959076, 0.21458029747009277, 0.271422415971756, 0.3282645344734192, 0.3851066529750824, 0.4419487714767456, 0.4987908899784088, 0.555633008480072, 0.6124750971794128, 0.6693172454833984, 0.7261593341827393, 0.7830014228820801, 0.8398435711860657, 0.8966856598854065, 0.9535278081893921, 1.010369896888733, 1.0672119855880737, 1.124054193496704, 1.180896282196045, 1.2377383708953857, 1.2945804595947266, 1.3514225482940674, 1.4082646369934082, 1.4651068449020386, 1.5219489336013794, 1.5787910223007202, 1.635633111000061, 1.6924753189086914, 1.7493174076080322]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 11.0, 11.0, 16.0, 25.0, 31.0, 65.0, 79.0, 104.0, 166.0, 252.0, 322.0, 502.0, 680.0, 1065.0, 1560.0, 2341.0, 3631.0, 5820.0, 9614.0, 16510.0, 29259.0, 57849.0, 142997.0, 381026.0, 224686.0, 79522.0, 37781.0, 20618.0, 11784.0, 7177.0, 4502.0, 2831.0, 1795.0, 1184.0, 838.0, 549.0, 412.0, 263.0, 198.0, 127.0, 97.0, 67.0, 58.0, 36.0, 23.0, 30.0, 15.0, 8.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.2406005859375, -0.23276329040527344, -0.22492599487304688, -0.2170886993408203, -0.20925140380859375, -0.2014141082763672, -0.19357681274414062, -0.18573951721191406, -0.1779022216796875, -0.17006492614746094, -0.16222763061523438, -0.1543903350830078, -0.14655303955078125, -0.1387157440185547, -0.13087844848632812, -0.12304115295410156, -0.115203857421875, -0.10736656188964844, -0.09952926635742188, -0.09169197082519531, -0.08385467529296875, -0.07601737976074219, -0.06818008422851562, -0.06034278869628906, -0.0525054931640625, -0.04466819763183594, -0.036830902099609375, -0.028993606567382812, -0.02115631103515625, -0.013319015502929688, -0.005481719970703125, 0.0023555755615234375, 0.01019287109375, 0.018030166625976562, 0.025867462158203125, 0.03370475769042969, 0.04154205322265625, 0.04937934875488281, 0.057216644287109375, 0.06505393981933594, 0.0728912353515625, 0.08072853088378906, 0.08856582641601562, 0.09640312194824219, 0.10424041748046875, 0.11207771301269531, 0.11991500854492188, 0.12775230407714844, 0.135589599609375, 0.14342689514160156, 0.15126419067382812, 0.1591014862060547, 0.16693878173828125, 0.1747760772705078, 0.18261337280273438, 0.19045066833496094, 0.1982879638671875, 0.20612525939941406, 0.21396255493164062, 0.2217998504638672, 0.22963714599609375, 0.2374744415283203, 0.24531173706054688, 0.25314903259277344, 0.260986328125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 4.0, 4.0, 16.0, 6.0, 18.0, 10.0, 20.0, 26.0, 22.0, 35.0, 28.0, 44.0, 44.0, 32.0, 40.0, 41.0, 57.0, 51.0, 33.0, 53.0, 41.0, 46.0, 31.0, 37.0, 42.0, 34.0, 24.0, 25.0, 16.0, 17.0, 16.0, 13.0, 13.0, 12.0, 4.0, 12.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11572265625, -0.1121826171875, -0.108642578125, -0.1051025390625, -0.1015625, -0.0980224609375, -0.094482421875, -0.0909423828125, -0.08740234375, -0.0838623046875, -0.080322265625, -0.0767822265625, -0.0732421875, -0.0697021484375, -0.066162109375, -0.0626220703125, -0.05908203125, -0.0555419921875, -0.052001953125, -0.0484619140625, -0.044921875, -0.0413818359375, -0.037841796875, -0.0343017578125, -0.03076171875, -0.0272216796875, -0.023681640625, -0.0201416015625, -0.0166015625, -0.0130615234375, -0.009521484375, -0.0059814453125, -0.00244140625, 0.0010986328125, 0.004638671875, 0.0081787109375, 0.01171875, 0.0152587890625, 0.018798828125, 0.0223388671875, 0.02587890625, 0.0294189453125, 0.032958984375, 0.0364990234375, 0.0400390625, 0.0435791015625, 0.047119140625, 0.0506591796875, 0.05419921875, 0.0577392578125, 0.061279296875, 0.0648193359375, 0.068359375, 0.0718994140625, 0.075439453125, 0.0789794921875, 0.08251953125, 0.0860595703125, 0.089599609375, 0.0931396484375, 0.0966796875, 0.1002197265625, 0.103759765625, 0.1072998046875, 0.11083984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 18.0, 10.0, 14.0, 15.0, 23.0, 29.0, 39.0, 73.0, 87.0, 137.0, 180.0, 298.0, 376.0, 629.0, 1124.0, 2453.0, 6134.0, 22990.0, 155878.0, 767589.0, 68691.0, 13060.0, 4170.0, 1841.0, 978.0, 552.0, 357.0, 234.0, 169.0, 111.0, 75.0, 52.0, 42.0, 29.0, 20.0, 20.0, 13.0, 10.0, 8.0, 6.0, 4.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.71875, -0.6989593505859375, -0.679168701171875, -0.6593780517578125, -0.63958740234375, -0.6197967529296875, -0.600006103515625, -0.5802154541015625, -0.5604248046875, -0.5406341552734375, -0.520843505859375, -0.5010528564453125, -0.48126220703125, -0.4614715576171875, -0.441680908203125, -0.4218902587890625, -0.402099609375, -0.3823089599609375, -0.362518310546875, -0.3427276611328125, -0.32293701171875, -0.3031463623046875, -0.283355712890625, -0.2635650634765625, -0.2437744140625, -0.2239837646484375, -0.204193115234375, -0.1844024658203125, -0.16461181640625, -0.1448211669921875, -0.125030517578125, -0.1052398681640625, -0.08544921875, -0.0656585693359375, -0.045867919921875, -0.0260772705078125, -0.00628662109375, 0.0135040283203125, 0.033294677734375, 0.0530853271484375, 0.0728759765625, 0.0926666259765625, 0.112457275390625, 0.1322479248046875, 0.15203857421875, 0.1718292236328125, 0.191619873046875, 0.2114105224609375, 0.231201171875, 0.2509918212890625, 0.270782470703125, 0.2905731201171875, 0.31036376953125, 0.3301544189453125, 0.349945068359375, 0.3697357177734375, 0.3895263671875, 0.4093170166015625, 0.429107666015625, 0.4488983154296875, 0.46868896484375, 0.4884796142578125, 0.508270263671875, 0.5280609130859375, 0.5478515625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 4.0, 3.0, 11.0, 7.0, 9.0, 4.0, 19.0, 24.0, 19.0, 16.0, 29.0, 28.0, 49.0, 37.0, 41.0, 43.0, 56.0, 53.0, 54.0, 54.0, 50.0, 49.0, 44.0, 49.0, 30.0, 29.0, 27.0, 27.0, 19.0, 25.0, 15.0, 18.0, 13.0, 10.0, 8.0, 11.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5439453125, -0.5262527465820312, -0.5085601806640625, -0.49086761474609375, -0.473175048828125, -0.45548248291015625, -0.4377899169921875, -0.42009735107421875, -0.40240478515625, -0.38471221923828125, -0.3670196533203125, -0.34932708740234375, -0.331634521484375, -0.31394195556640625, -0.2962493896484375, -0.27855682373046875, -0.2608642578125, -0.24317169189453125, -0.2254791259765625, -0.20778656005859375, -0.190093994140625, -0.17240142822265625, -0.1547088623046875, -0.13701629638671875, -0.11932373046875, -0.10163116455078125, -0.0839385986328125, -0.06624603271484375, -0.048553466796875, -0.03086090087890625, -0.0131683349609375, 0.00452423095703125, 0.022216796875, 0.03990936279296875, 0.0576019287109375, 0.07529449462890625, 0.092987060546875, 0.11067962646484375, 0.1283721923828125, 0.14606475830078125, 0.16375732421875, 0.18144989013671875, 0.1991424560546875, 0.21683502197265625, 0.234527587890625, 0.25222015380859375, 0.2699127197265625, 0.28760528564453125, 0.3052978515625, 0.32299041748046875, 0.3406829833984375, 0.35837554931640625, 0.376068115234375, 0.39376068115234375, 0.4114532470703125, 0.42914581298828125, 0.44683837890625, 0.46453094482421875, 0.4822235107421875, 0.49991607666015625, 0.517608642578125, 0.5353012084960938, 0.5529937744140625, 0.5706863403320312, 0.58837890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 7.0, 11.0, 13.0, 12.0, 19.0, 26.0, 41.0, 57.0, 87.0, 177.0, 289.0, 499.0, 1083.0, 2642.0, 7597.0, 29670.0, 195725.0, 710934.0, 75829.0, 15632.0, 4672.0, 1790.0, 777.0, 370.0, 204.0, 130.0, 81.0, 67.0, 36.0, 23.0, 11.0, 18.0, 8.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.1982555389404297, -0.19009017944335938, -0.18192481994628906, -0.17375946044921875, -0.16559410095214844, -0.15742874145507812, -0.1492633819580078, -0.1410980224609375, -0.1329326629638672, -0.12476730346679688, -0.11660194396972656, -0.10843658447265625, -0.10027122497558594, -0.09210586547851562, -0.08394050598144531, -0.075775146484375, -0.06760978698730469, -0.059444427490234375, -0.05127906799316406, -0.04311370849609375, -0.03494834899902344, -0.026782989501953125, -0.018617630004882812, -0.0104522705078125, -0.0022869110107421875, 0.005878448486328125, 0.014043807983398438, 0.02220916748046875, 0.030374526977539062, 0.038539886474609375, 0.04670524597167969, 0.05487060546875, 0.06303596496582031, 0.07120132446289062, 0.07936668395996094, 0.08753204345703125, 0.09569740295410156, 0.10386276245117188, 0.11202812194824219, 0.1201934814453125, 0.1283588409423828, 0.13652420043945312, 0.14468955993652344, 0.15285491943359375, 0.16102027893066406, 0.16918563842773438, 0.1773509979248047, 0.185516357421875, 0.1936817169189453, 0.20184707641601562, 0.21001243591308594, 0.21817779541015625, 0.22634315490722656, 0.23450851440429688, 0.2426738739013672, 0.2508392333984375, 0.2590045928955078, 0.2671699523925781, 0.27533531188964844, 0.28350067138671875, 0.29166603088378906, 0.2998313903808594, 0.3079967498779297, 0.316162109375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 10.0, 9.0, 12.0, 24.0, 34.0, 29.0, 58.0, 66.0, 107.0, 141.0, 140.0, 89.0, 74.0, 43.0, 34.0, 24.0, 15.0, 18.0, 16.0, 17.0, 10.0, 2.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00014209747314453125, -0.00013854540884494781, -0.00013499334454536438, -0.00013144128024578094, -0.0001278892159461975, -0.00012433715164661407, -0.00012078508734703064, -0.0001172330230474472, -0.00011368095874786377, -0.00011012889444828033, -0.0001065768301486969, -0.00010302476584911346, -9.947270154953003e-05, -9.59206372499466e-05, -9.236857295036316e-05, -8.881650865077972e-05, -8.526444435119629e-05, -8.171238005161285e-05, -7.816031575202942e-05, -7.460825145244598e-05, -7.105618715286255e-05, -6.750412285327911e-05, -6.395205855369568e-05, -6.0399994254112244e-05, -5.684792995452881e-05, -5.3295865654945374e-05, -4.974380135536194e-05, -4.6191737055778503e-05, -4.263967275619507e-05, -3.908760845661163e-05, -3.55355441570282e-05, -3.198347985744476e-05, -2.8431415557861328e-05, -2.4879351258277893e-05, -2.1327286958694458e-05, -1.7775222659111023e-05, -1.4223158359527588e-05, -1.0671094059944153e-05, -7.119029760360718e-06, -3.5669654607772827e-06, -1.4901161193847656e-08, 3.5371631383895874e-06, 7.0892274379730225e-06, 1.0641291737556458e-05, 1.4193356037139893e-05, 1.7745420336723328e-05, 2.1297484636306763e-05, 2.4849548935890198e-05, 2.8401613235473633e-05, 3.195367753505707e-05, 3.55057418346405e-05, 3.905780613422394e-05, 4.260987043380737e-05, 4.616193473339081e-05, 4.971399903297424e-05, 5.326606333255768e-05, 5.681812763214111e-05, 6.037019193172455e-05, 6.392225623130798e-05, 6.747432053089142e-05, 7.102638483047485e-05, 7.457844913005829e-05, 7.813051342964172e-05, 8.168257772922516e-05, 8.52346420288086e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 5.0, 4.0, 13.0, 8.0, 20.0, 34.0, 40.0, 51.0, 71.0, 101.0, 159.0, 220.0, 361.0, 537.0, 922.0, 1819.0, 3688.0, 9116.0, 30644.0, 159637.0, 679870.0, 120699.0, 25332.0, 7899.0, 3240.0, 1640.0, 888.0, 488.0, 343.0, 205.0, 122.0, 98.0, 79.0, 48.0, 41.0, 25.0, 20.0, 16.0, 13.0, 11.0, 7.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.23432350158691406, -0.22731399536132812, -0.2203044891357422, -0.21329498291015625, -0.2062854766845703, -0.19927597045898438, -0.19226646423339844, -0.1852569580078125, -0.17824745178222656, -0.17123794555664062, -0.1642284393310547, -0.15721893310546875, -0.1502094268798828, -0.14319992065429688, -0.13619041442871094, -0.129180908203125, -0.12217140197753906, -0.11516189575195312, -0.10815238952636719, -0.10114288330078125, -0.09413337707519531, -0.08712387084960938, -0.08011436462402344, -0.0731048583984375, -0.06609535217285156, -0.059085845947265625, -0.05207633972167969, -0.04506683349609375, -0.03805732727050781, -0.031047821044921875, -0.024038314819335938, -0.01702880859375, -0.010019302368164062, -0.003009796142578125, 0.0039997100830078125, 0.01100921630859375, 0.018018722534179688, 0.025028228759765625, 0.03203773498535156, 0.0390472412109375, 0.04605674743652344, 0.053066253662109375, 0.06007575988769531, 0.06708526611328125, 0.07409477233886719, 0.08110427856445312, 0.08811378479003906, 0.095123291015625, 0.10213279724121094, 0.10914230346679688, 0.11615180969238281, 0.12316131591796875, 0.1301708221435547, 0.13718032836914062, 0.14418983459472656, 0.1511993408203125, 0.15820884704589844, 0.16521835327148438, 0.1722278594970703, 0.17923736572265625, 0.1862468719482422, 0.19325637817382812, 0.20026588439941406, 0.207275390625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 3.0, 9.0, 11.0, 7.0, 5.0, 9.0, 17.0, 25.0, 27.0, 31.0, 42.0, 44.0, 83.0, 75.0, 99.0, 85.0, 95.0, 87.0, 44.0, 39.0, 35.0, 30.0, 19.0, 13.0, 9.0, 9.0, 9.0, 6.0, 4.0, 9.0, 7.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.27490234375, -0.26787757873535156, -0.2608528137207031, -0.2538280487060547, -0.24680328369140625, -0.2397785186767578, -0.23275375366210938, -0.22572898864746094, -0.2187042236328125, -0.21167945861816406, -0.20465469360351562, -0.1976299285888672, -0.19060516357421875, -0.1835803985595703, -0.17655563354492188, -0.16953086853027344, -0.162506103515625, -0.15548133850097656, -0.14845657348632812, -0.1414318084716797, -0.13440704345703125, -0.1273822784423828, -0.12035751342773438, -0.11333274841308594, -0.1063079833984375, -0.09928321838378906, -0.09225845336914062, -0.08523368835449219, -0.07820892333984375, -0.07118415832519531, -0.06415939331054688, -0.05713462829589844, -0.05010986328125, -0.04308509826660156, -0.036060333251953125, -0.029035568237304688, -0.02201080322265625, -0.014986038208007812, -0.007961273193359375, -0.0009365081787109375, 0.0060882568359375, 0.013113021850585938, 0.020137786865234375, 0.027162551879882812, 0.03418731689453125, 0.04121208190917969, 0.048236846923828125, 0.05526161193847656, 0.062286376953125, 0.06931114196777344, 0.07633590698242188, 0.08336067199707031, 0.09038543701171875, 0.09741020202636719, 0.10443496704101562, 0.11145973205566406, 0.1184844970703125, 0.12550926208496094, 0.13253402709960938, 0.1395587921142578, 0.14658355712890625, 0.1536083221435547, 0.16063308715820312, 0.16765785217285156, 0.1746826171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 6.0, 8.0, 17.0, 33.0, 76.0, 111.0, 183.0, 239.0, 135.0, 105.0, 41.0, 19.0, 9.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 5.0], "bins": [-8.287578582763672, -8.1261568069458, -7.9647345542907715, -7.803312301635742, -7.641890525817871, -7.48046875, -7.319046497344971, -7.157624244689941, -6.99620246887207, -6.834780693054199, -6.67335844039917, -6.511936187744141, -6.3505144119262695, -6.189092636108398, -6.027670383453369, -5.86624813079834, -5.704826354980469, -5.543404579162598, -5.381982326507568, -5.220560073852539, -5.059138298034668, -4.897716522216797, -4.736294269561768, -4.574872016906738, -4.413450241088867, -4.252028465270996, -4.090606212615967, -3.9291841983795166, -3.7677621841430664, -3.606340169906616, -3.444918155670166, -3.283496141433716, -3.122074604034424, -2.9606525897979736, -2.7992305755615234, -2.6378085613250732, -2.476386547088623, -2.314964532852173, -2.1535425186157227, -1.9921205043792725, -1.8306984901428223, -1.669276475906372, -1.5078544616699219, -1.3464324474334717, -1.1850104331970215, -1.0235884189605713, -0.8621664047241211, -0.7007443904876709, -0.5393223762512207, -0.3779003620147705, -0.2164783477783203, -0.05505633354187012, 0.10636568069458008, 0.2677876949310303, 0.42920970916748047, 0.5906317234039307, 0.7520537376403809, 0.913475751876831, 1.0748977661132812, 1.2363197803497314, 1.3977417945861816, 1.5591638088226318, 1.720585823059082, 1.8820078372955322, 2.0434298515319824]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 10.0, 10.0, 15.0, 14.0, 22.0, 29.0, 22.0, 35.0, 38.0, 35.0, 35.0, 43.0, 45.0, 49.0, 59.0, 56.0, 48.0, 55.0, 30.0, 58.0, 41.0, 44.0, 35.0, 21.0, 26.0, 23.0, 15.0, 13.0, 13.0, 7.0, 8.0, 7.0, 6.0, 12.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6760222911834717, -2.6025078296661377, -2.5289933681488037, -2.4554789066314697, -2.3819644451141357, -2.3084499835968018, -2.2349355220794678, -2.161421060562134, -2.0879065990448, -2.014392137527466, -1.9408776760101318, -1.8673632144927979, -1.7938487529754639, -1.7203342914581299, -1.646819829940796, -1.573305368423462, -1.499790906906128, -1.426276445388794, -1.35276198387146, -1.279247522354126, -1.205733060836792, -1.132218599319458, -1.058704137802124, -0.98518967628479, -0.911675214767456, -0.8381607532501221, -0.7646462917327881, -0.6911318302154541, -0.6176173686981201, -0.5441029071807861, -0.47058844566345215, -0.39707398414611816, -0.3235592842102051, -0.2500448226928711, -0.1765303611755371, -0.10301589965820312, -0.02950143814086914, 0.044013023376464844, 0.11752748489379883, 0.1910419464111328, 0.2645564079284668, 0.3380708694458008, 0.41158533096313477, 0.48509979248046875, 0.5586142539978027, 0.6321287155151367, 0.7056431770324707, 0.7791576385498047, 0.8526721000671387, 0.9261865615844727, 0.9997010231018066, 1.0732154846191406, 1.1467299461364746, 1.2202444076538086, 1.2937588691711426, 1.3672733306884766, 1.4407877922058105, 1.5143022537231445, 1.5878167152404785, 1.6613311767578125, 1.7348456382751465, 1.8083600997924805, 1.8818745613098145, 1.9553890228271484, 2.0289034843444824]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 9.0, 6.0, 8.0, 7.0, 26.0, 21.0, 42.0, 52.0, 96.0, 124.0, 285.0, 1776.0, 207574.0, 3978296.0, 5127.0, 398.0, 163.0, 89.0, 57.0, 34.0, 23.0, 18.0, 15.0, 9.0, 7.0, 4.0, 6.0, 5.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5208740234375, -1.470458984375, -1.4200439453125, -1.36962890625, -1.3192138671875, -1.268798828125, -1.2183837890625, -1.16796875, -1.1175537109375, -1.067138671875, -1.0167236328125, -0.96630859375, -0.9158935546875, -0.865478515625, -0.8150634765625, -0.7646484375, -0.7142333984375, -0.663818359375, -0.6134033203125, -0.56298828125, -0.5125732421875, -0.462158203125, -0.4117431640625, -0.361328125, -0.3109130859375, -0.260498046875, -0.2100830078125, -0.15966796875, -0.1092529296875, -0.058837890625, -0.0084228515625, 0.0419921875, 0.0924072265625, 0.142822265625, 0.1932373046875, 0.24365234375, 0.2940673828125, 0.344482421875, 0.3948974609375, 0.4453125, 0.4957275390625, 0.546142578125, 0.5965576171875, 0.64697265625, 0.6973876953125, 0.747802734375, 0.7982177734375, 0.8486328125, 0.8990478515625, 0.949462890625, 0.9998779296875, 1.05029296875, 1.1007080078125, 1.151123046875, 1.2015380859375, 1.251953125, 1.3023681640625, 1.352783203125, 1.4031982421875, 1.45361328125, 1.5040283203125, 1.554443359375, 1.6048583984375, 1.6552734375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 0.0, 4.0, 3.0, 5.0, 8.0, 13.0, 7.0, 11.0, 10.0, 23.0, 23.0, 19.0, 34.0, 27.0, 45.0, 40.0, 47.0, 45.0, 48.0, 53.0, 43.0, 47.0, 40.0, 50.0, 42.0, 43.0, 41.0, 30.0, 31.0, 32.0, 24.0, 14.0, 24.0, 18.0, 12.0, 15.0, 5.0, 8.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.12139892578125, -0.11770820617675781, -0.11401748657226562, -0.11032676696777344, -0.10663604736328125, -0.10294532775878906, -0.09925460815429688, -0.09556388854980469, -0.0918731689453125, -0.08818244934082031, -0.08449172973632812, -0.08080101013183594, -0.07711029052734375, -0.07341957092285156, -0.06972885131835938, -0.06603813171386719, -0.062347412109375, -0.05865669250488281, -0.054965972900390625, -0.05127525329589844, -0.04758453369140625, -0.04389381408691406, -0.040203094482421875, -0.03651237487792969, -0.0328216552734375, -0.029130935668945312, -0.025440216064453125, -0.021749496459960938, -0.01805877685546875, -0.014368057250976562, -0.010677337646484375, -0.0069866180419921875, -0.0032958984375, 0.0003948211669921875, 0.004085540771484375, 0.0077762603759765625, 0.01146697998046875, 0.015157699584960938, 0.018848419189453125, 0.022539138793945312, 0.0262298583984375, 0.029920578002929688, 0.033611297607421875, 0.03730201721191406, 0.04099273681640625, 0.04468345642089844, 0.048374176025390625, 0.05206489562988281, 0.055755615234375, 0.05944633483886719, 0.06313705444335938, 0.06682777404785156, 0.07051849365234375, 0.07420921325683594, 0.07789993286132812, 0.08159065246582031, 0.0852813720703125, 0.08897209167480469, 0.09266281127929688, 0.09635353088378906, 0.10004425048828125, 0.10373497009277344, 0.10742568969726562, 0.11111640930175781, 0.11480712890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 16.0, 19.0, 43.0, 70.0, 101.0, 185.0, 351.0, 674.0, 1463.0, 3237.0, 7645.0, 22158.0, 85202.0, 601673.0, 3026407.0, 352020.0, 63521.0, 18240.0, 6377.0, 2609.0, 1148.0, 525.0, 266.0, 126.0, 80.0, 41.0, 23.0, 21.0, 10.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.412841796875, -0.40149688720703125, -0.3901519775390625, -0.37880706787109375, -0.367462158203125, -0.35611724853515625, -0.3447723388671875, -0.33342742919921875, -0.32208251953125, -0.31073760986328125, -0.2993927001953125, -0.28804779052734375, -0.276702880859375, -0.26535797119140625, -0.2540130615234375, -0.24266815185546875, -0.2313232421875, -0.21997833251953125, -0.2086334228515625, -0.19728851318359375, -0.185943603515625, -0.17459869384765625, -0.1632537841796875, -0.15190887451171875, -0.14056396484375, -0.12921905517578125, -0.1178741455078125, -0.10652923583984375, -0.095184326171875, -0.08383941650390625, -0.0724945068359375, -0.06114959716796875, -0.0498046875, -0.03845977783203125, -0.0271148681640625, -0.01576995849609375, -0.004425048828125, 0.00691986083984375, 0.0182647705078125, 0.02960968017578125, 0.04095458984375, 0.05229949951171875, 0.0636444091796875, 0.07498931884765625, 0.086334228515625, 0.09767913818359375, 0.1090240478515625, 0.12036895751953125, 0.1317138671875, 0.14305877685546875, 0.1544036865234375, 0.16574859619140625, 0.177093505859375, 0.18843841552734375, 0.1997833251953125, 0.21112823486328125, 0.22247314453125, 0.23381805419921875, 0.2451629638671875, 0.25650787353515625, 0.267852783203125, 0.27919769287109375, 0.2905426025390625, 0.30188751220703125, 0.313232421875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 6.0, 5.0, 12.0, 7.0, 11.0, 17.0, 21.0, 37.0, 33.0, 56.0, 88.0, 141.0, 194.0, 300.0, 518.0, 702.0, 644.0, 437.0, 257.0, 159.0, 110.0, 74.0, 60.0, 39.0, 28.0, 18.0, 20.0, 13.0, 15.0, 18.0, 7.0, 6.0, 7.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.411376953125, -0.40019989013671875, -0.3890228271484375, -0.37784576416015625, -0.366668701171875, -0.35549163818359375, -0.3443145751953125, -0.33313751220703125, -0.32196044921875, -0.31078338623046875, -0.2996063232421875, -0.28842926025390625, -0.277252197265625, -0.26607513427734375, -0.2548980712890625, -0.24372100830078125, -0.2325439453125, -0.22136688232421875, -0.2101898193359375, -0.19901275634765625, -0.187835693359375, -0.17665863037109375, -0.1654815673828125, -0.15430450439453125, -0.14312744140625, -0.13195037841796875, -0.1207733154296875, -0.10959625244140625, -0.098419189453125, -0.08724212646484375, -0.0760650634765625, -0.06488800048828125, -0.0537109375, -0.04253387451171875, -0.0313568115234375, -0.02017974853515625, -0.009002685546875, 0.00217437744140625, 0.0133514404296875, 0.02452850341796875, 0.03570556640625, 0.04688262939453125, 0.0580596923828125, 0.06923675537109375, 0.080413818359375, 0.09159088134765625, 0.1027679443359375, 0.11394500732421875, 0.1251220703125, 0.13629913330078125, 0.1474761962890625, 0.15865325927734375, 0.169830322265625, 0.18100738525390625, 0.1921844482421875, 0.20336151123046875, 0.21453857421875, 0.22571563720703125, 0.2368927001953125, 0.24806976318359375, 0.259246826171875, 0.27042388916015625, 0.2816009521484375, 0.29277801513671875, 0.303955078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 11.0, 24.0, 53.0, 102.0, 208.0, 232.0, 194.0, 91.0, 40.0, 14.0, 12.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.134166717529297, -4.979875564575195, -4.825584411621094, -4.67129373550415, -4.517002582550049, -4.362711429595947, -4.208420276641846, -4.054129600524902, -3.899838447570801, -3.745547294616699, -3.5912563800811768, -3.436965227127075, -3.2826743125915527, -3.128383159637451, -2.9740920066833496, -2.819801092147827, -2.6655099391937256, -2.511218786239624, -2.3569278717041016, -2.20263671875, -2.0483458042144775, -1.894054651260376, -1.739763617515564, -1.585472583770752, -1.43118155002594, -1.276890516281128, -1.122599482536316, -0.9683083891868591, -0.8140173554420471, -0.6597263216972351, -0.5054352283477783, -0.3511441946029663, -0.1968531608581543, -0.04256211221218109, 0.11172893643379211, 0.2660199999809265, 0.4203110337257385, 0.5746020674705505, 0.7288931608200073, 0.8831841945648193, 1.0374752283096313, 1.1917662620544434, 1.3460572957992554, 1.5003483295440674, 1.654639482498169, 1.8089303970336914, 1.963221549987793, 2.1175127029418945, 2.271803617477417, 2.4260947704315186, 2.580385684967041, 2.7346768379211426, 2.888967752456665, 3.0432589054107666, 3.197549819946289, 3.3518409729003906, 3.506132125854492, 3.6604232788085938, 3.814714193344116, 3.9690053462982178, 4.12329626083374, 4.277587413787842, 4.431878566741943, 4.586169242858887, 4.740460395812988]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 7.0, 8.0, 7.0, 5.0, 8.0, 12.0, 10.0, 13.0, 13.0, 28.0, 20.0, 25.0, 22.0, 36.0, 29.0, 25.0, 41.0, 30.0, 32.0, 46.0, 41.0, 38.0, 37.0, 38.0, 28.0, 29.0, 42.0, 38.0, 30.0, 28.0, 26.0, 25.0, 25.0, 18.0, 23.0, 17.0, 10.0, 15.0, 7.0, 10.0, 11.0, 6.0, 5.0, 9.0, 11.0, 6.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.3456482887268066, -1.3037354946136475, -1.2618228197097778, -1.2199100255966187, -1.177997350692749, -1.1360845565795898, -1.0941717624664307, -1.052259087562561, -1.0103462934494019, -0.9684335589408875, -0.926520824432373, -0.8846080303192139, -0.8426952958106995, -0.8007825613021851, -0.7588698267936707, -0.7169570922851562, -0.6750443577766418, -0.6331316232681274, -0.591218888759613, -0.5493061542510986, -0.5073933601379395, -0.46548062562942505, -0.42356789112091064, -0.38165512681007385, -0.33974239230155945, -0.29782965779304504, -0.25591689348220825, -0.21400415897369385, -0.17209140956401825, -0.13017866015434265, -0.08826592564582825, -0.046353161334991455, -0.004440426826477051, 0.03747231885790825, 0.07938506454229355, 0.12129780650138855, 0.16321055591106415, 0.20512330532073975, 0.24703603982925415, 0.28894880414009094, 0.33086153864860535, 0.37277427315711975, 0.41468703746795654, 0.45659977197647095, 0.49851250648498535, 0.5404253005981445, 0.5823379755020142, 0.6242507696151733, 0.6661635041236877, 0.7080762386322021, 0.7499889731407166, 0.791901707649231, 0.8338145017623901, 0.8757272362709045, 0.917639970779419, 0.9595527648925781, 1.0014654397964478, 1.043378233909607, 1.0852909088134766, 1.1272037029266357, 1.1691163778305054, 1.2110291719436646, 1.2529418468475342, 1.2948546409606934, 1.3367674350738525]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 7.0, 5.0, 8.0, 8.0, 13.0, 14.0, 22.0, 25.0, 44.0, 55.0, 80.0, 142.0, 164.0, 251.0, 364.0, 488.0, 737.0, 1056.0, 1598.0, 2583.0, 4064.0, 6603.0, 11168.0, 20298.0, 39289.0, 94038.0, 274791.0, 354801.0, 127284.0, 50026.0, 24126.0, 13141.0, 7751.0, 4818.0, 2924.0, 1855.0, 1249.0, 805.0, 598.0, 361.0, 277.0, 195.0, 130.0, 84.0, 58.0, 39.0, 38.0, 20.0, 19.0, 15.0, 9.0, 12.0, 5.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.245361328125, -0.2381763458251953, -0.23099136352539062, -0.22380638122558594, -0.21662139892578125, -0.20943641662597656, -0.20225143432617188, -0.1950664520263672, -0.1878814697265625, -0.1806964874267578, -0.17351150512695312, -0.16632652282714844, -0.15914154052734375, -0.15195655822753906, -0.14477157592773438, -0.1375865936279297, -0.130401611328125, -0.12321662902832031, -0.11603164672851562, -0.10884666442871094, -0.10166168212890625, -0.09447669982910156, -0.08729171752929688, -0.08010673522949219, -0.0729217529296875, -0.06573677062988281, -0.058551788330078125, -0.05136680603027344, -0.04418182373046875, -0.03699684143066406, -0.029811859130859375, -0.022626876831054688, -0.01544189453125, -0.008256912231445312, -0.001071929931640625, 0.0061130523681640625, 0.01329803466796875, 0.020483016967773438, 0.027667999267578125, 0.03485298156738281, 0.0420379638671875, 0.04922294616699219, 0.056407928466796875, 0.06359291076660156, 0.07077789306640625, 0.07796287536621094, 0.08514785766601562, 0.09233283996582031, 0.099517822265625, 0.10670280456542969, 0.11388778686523438, 0.12107276916503906, 0.12825775146484375, 0.13544273376464844, 0.14262771606445312, 0.1498126983642578, 0.1569976806640625, 0.1641826629638672, 0.17136764526367188, 0.17855262756347656, 0.18573760986328125, 0.19292259216308594, 0.20010757446289062, 0.2072925567626953, 0.2144775390625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 7.0, 11.0, 12.0, 15.0, 18.0, 29.0, 23.0, 27.0, 33.0, 31.0, 30.0, 42.0, 41.0, 38.0, 49.0, 45.0, 46.0, 44.0, 43.0, 43.0, 36.0, 49.0, 39.0, 21.0, 21.0, 29.0, 24.0, 30.0, 24.0, 21.0, 14.0, 13.0, 10.0, 4.0, 6.0, 3.0, 4.0, 2.0, 5.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11163330078125, -0.1077280044555664, -0.10382270812988281, -0.09991741180419922, -0.09601211547851562, -0.09210681915283203, -0.08820152282714844, -0.08429622650146484, -0.08039093017578125, -0.07648563385009766, -0.07258033752441406, -0.06867504119873047, -0.06476974487304688, -0.06086444854736328, -0.05695915222167969, -0.053053855895996094, -0.0491485595703125, -0.045243263244628906, -0.04133796691894531, -0.03743267059326172, -0.033527374267578125, -0.02962207794189453, -0.025716781616210938, -0.021811485290527344, -0.01790618896484375, -0.014000892639160156, -0.010095596313476562, -0.006190299987792969, -0.002285003662109375, 0.0016202926635742188, 0.0055255889892578125, 0.009430885314941406, 0.013336181640625, 0.017241477966308594, 0.021146774291992188, 0.02505207061767578, 0.028957366943359375, 0.03286266326904297, 0.03676795959472656, 0.040673255920410156, 0.04457855224609375, 0.048483848571777344, 0.05238914489746094, 0.05629444122314453, 0.060199737548828125, 0.06410503387451172, 0.06801033020019531, 0.0719156265258789, 0.0758209228515625, 0.0797262191772461, 0.08363151550292969, 0.08753681182861328, 0.09144210815429688, 0.09534740447998047, 0.09925270080566406, 0.10315799713134766, 0.10706329345703125, 0.11096858978271484, 0.11487388610839844, 0.11877918243408203, 0.12268447875976562, 0.12658977508544922, 0.1304950714111328, 0.1344003677368164, 0.1383056640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 6.0, 13.0, 12.0, 12.0, 18.0, 18.0, 34.0, 47.0, 63.0, 83.0, 118.0, 200.0, 342.0, 528.0, 1004.0, 1938.0, 4640.0, 13609.0, 52593.0, 563770.0, 346834.0, 43197.0, 11394.0, 4044.0, 1681.0, 959.0, 487.0, 292.0, 183.0, 122.0, 86.0, 63.0, 42.0, 27.0, 25.0, 10.0, 14.0, 10.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4655113220214844, -0.44884490966796875, -0.4321784973144531, -0.4155120849609375, -0.3988456726074219, -0.38217926025390625, -0.3655128479003906, -0.348846435546875, -0.3321800231933594, -0.31551361083984375, -0.2988471984863281, -0.2821807861328125, -0.2655143737792969, -0.24884796142578125, -0.23218154907226562, -0.21551513671875, -0.19884872436523438, -0.18218231201171875, -0.16551589965820312, -0.1488494873046875, -0.13218307495117188, -0.11551666259765625, -0.09885025024414062, -0.082183837890625, -0.06551742553710938, -0.04885101318359375, -0.032184600830078125, -0.0155181884765625, 0.001148223876953125, 0.01781463623046875, 0.034481048583984375, 0.0511474609375, 0.06781387329101562, 0.08448028564453125, 0.10114669799804688, 0.1178131103515625, 0.13447952270507812, 0.15114593505859375, 0.16781234741210938, 0.184478759765625, 0.20114517211914062, 0.21781158447265625, 0.23447799682617188, 0.2511444091796875, 0.2678108215332031, 0.28447723388671875, 0.3011436462402344, 0.31781005859375, 0.3344764709472656, 0.35114288330078125, 0.3678092956542969, 0.3844757080078125, 0.4011421203613281, 0.41780853271484375, 0.4344749450683594, 0.451141357421875, 0.4678077697753906, 0.48447418212890625, 0.5011405944824219, 0.5178070068359375, 0.5344734191894531, 0.5511398315429688, 0.5678062438964844, 0.58447265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 10.0, 6.0, 8.0, 10.0, 18.0, 15.0, 17.0, 31.0, 32.0, 40.0, 50.0, 53.0, 44.0, 50.0, 60.0, 56.0, 63.0, 43.0, 63.0, 31.0, 42.0, 42.0, 36.0, 35.0, 26.0, 23.0, 16.0, 17.0, 15.0, 11.0, 9.0, 7.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6650390625, -0.644622802734375, -0.62420654296875, -0.603790283203125, -0.5833740234375, -0.562957763671875, -0.54254150390625, -0.522125244140625, -0.501708984375, -0.481292724609375, -0.46087646484375, -0.440460205078125, -0.4200439453125, -0.399627685546875, -0.37921142578125, -0.358795166015625, -0.33837890625, -0.317962646484375, -0.29754638671875, -0.277130126953125, -0.2567138671875, -0.236297607421875, -0.21588134765625, -0.195465087890625, -0.175048828125, -0.154632568359375, -0.13421630859375, -0.113800048828125, -0.0933837890625, -0.072967529296875, -0.05255126953125, -0.032135009765625, -0.01171875, 0.008697509765625, 0.02911376953125, 0.049530029296875, 0.0699462890625, 0.090362548828125, 0.11077880859375, 0.131195068359375, 0.151611328125, 0.172027587890625, 0.19244384765625, 0.212860107421875, 0.2332763671875, 0.253692626953125, 0.27410888671875, 0.294525146484375, 0.31494140625, 0.335357666015625, 0.35577392578125, 0.376190185546875, 0.3966064453125, 0.417022705078125, 0.43743896484375, 0.457855224609375, 0.478271484375, 0.498687744140625, 0.51910400390625, 0.539520263671875, 0.5599365234375, 0.580352783203125, 0.60076904296875, 0.621185302734375, 0.6416015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 12.0, 9.0, 14.0, 19.0, 28.0, 41.0, 69.0, 130.0, 304.0, 784.0, 3050.0, 20099.0, 372471.0, 621624.0, 24686.0, 3626.0, 920.0, 326.0, 135.0, 70.0, 43.0, 28.0, 17.0, 12.0, 8.0, 8.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361328125, -0.3474578857421875, -0.333587646484375, -0.3197174072265625, -0.30584716796875, -0.2919769287109375, -0.278106689453125, -0.2642364501953125, -0.2503662109375, -0.2364959716796875, -0.222625732421875, -0.2087554931640625, -0.19488525390625, -0.1810150146484375, -0.167144775390625, -0.1532745361328125, -0.139404296875, -0.1255340576171875, -0.111663818359375, -0.0977935791015625, -0.08392333984375, -0.0700531005859375, -0.056182861328125, -0.0423126220703125, -0.0284423828125, -0.0145721435546875, -0.000701904296875, 0.0131683349609375, 0.02703857421875, 0.0409088134765625, 0.054779052734375, 0.0686492919921875, 0.08251953125, 0.0963897705078125, 0.110260009765625, 0.1241302490234375, 0.13800048828125, 0.1518707275390625, 0.165740966796875, 0.1796112060546875, 0.1934814453125, 0.2073516845703125, 0.221221923828125, 0.2350921630859375, 0.24896240234375, 0.2628326416015625, 0.276702880859375, 0.2905731201171875, 0.304443359375, 0.3183135986328125, 0.332183837890625, 0.3460540771484375, 0.35992431640625, 0.3737945556640625, 0.387664794921875, 0.4015350341796875, 0.4154052734375, 0.4292755126953125, 0.443145751953125, 0.4570159912109375, 0.47088623046875, 0.4847564697265625, 0.498626708984375, 0.5124969482421875, 0.5263671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 6.0, 10.0, 10.0, 9.0, 13.0, 11.0, 23.0, 19.0, 32.0, 46.0, 41.0, 76.0, 85.0, 105.0, 84.0, 100.0, 65.0, 55.0, 55.0, 26.0, 27.0, 16.0, 14.0, 9.0, 13.0, 10.0, 5.0, 5.0, 2.0, 3.0, 8.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.557868957519531e-05, -7.329694926738739e-05, -7.101520895957947e-05, -6.873346865177155e-05, -6.645172834396362e-05, -6.41699880361557e-05, -6.188824772834778e-05, -5.9606507420539856e-05, -5.7324767112731934e-05, -5.504302680492401e-05, -5.276128649711609e-05, -5.0479546189308167e-05, -4.8197805881500244e-05, -4.591606557369232e-05, -4.36343252658844e-05, -4.135258495807648e-05, -3.9070844650268555e-05, -3.678910434246063e-05, -3.450736403465271e-05, -3.222562372684479e-05, -2.9943883419036865e-05, -2.7662143111228943e-05, -2.538040280342102e-05, -2.3098662495613098e-05, -2.0816922187805176e-05, -1.8535181879997253e-05, -1.625344157218933e-05, -1.3971701264381409e-05, -1.1689960956573486e-05, -9.408220648765564e-06, -7.126480340957642e-06, -4.844740033149719e-06, -2.562999725341797e-06, -2.812594175338745e-07, 2.000480890274048e-06, 4.28222119808197e-06, 6.563961505889893e-06, 8.845701813697815e-06, 1.1127442121505737e-05, 1.340918242931366e-05, 1.5690922737121582e-05, 1.7972663044929504e-05, 2.0254403352737427e-05, 2.253614366054535e-05, 2.481788396835327e-05, 2.7099624276161194e-05, 2.9381364583969116e-05, 3.166310489177704e-05, 3.394484519958496e-05, 3.622658550739288e-05, 3.8508325815200806e-05, 4.079006612300873e-05, 4.307180643081665e-05, 4.535354673862457e-05, 4.7635287046432495e-05, 4.991702735424042e-05, 5.219876766204834e-05, 5.448050796985626e-05, 5.6762248277664185e-05, 5.904398858547211e-05, 6.132572889328003e-05, 6.360746920108795e-05, 6.588920950889587e-05, 6.81709498167038e-05, 7.045269012451172e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 6.0, 8.0, 14.0, 25.0, 40.0, 49.0, 64.0, 124.0, 218.0, 524.0, 1144.0, 2943.0, 9826.0, 68873.0, 836388.0, 109679.0, 12603.0, 3509.0, 1349.0, 553.0, 247.0, 144.0, 78.0, 45.0, 37.0, 25.0, 8.0, 5.0, 2.0, 9.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.367431640625, -0.35457611083984375, -0.3417205810546875, -0.32886505126953125, -0.316009521484375, -0.30315399169921875, -0.2902984619140625, -0.27744293212890625, -0.26458740234375, -0.25173187255859375, -0.2388763427734375, -0.22602081298828125, -0.213165283203125, -0.20030975341796875, -0.1874542236328125, -0.17459869384765625, -0.1617431640625, -0.14888763427734375, -0.1360321044921875, -0.12317657470703125, -0.110321044921875, -0.09746551513671875, -0.0846099853515625, -0.07175445556640625, -0.05889892578125, -0.04604339599609375, -0.0331878662109375, -0.02033233642578125, -0.007476806640625, 0.00537872314453125, 0.0182342529296875, 0.03108978271484375, 0.0439453125, 0.05680084228515625, 0.0696563720703125, 0.08251190185546875, 0.095367431640625, 0.10822296142578125, 0.1210784912109375, 0.13393402099609375, 0.14678955078125, 0.15964508056640625, 0.1725006103515625, 0.18535614013671875, 0.198211669921875, 0.21106719970703125, 0.2239227294921875, 0.23677825927734375, 0.2496337890625, 0.26248931884765625, 0.2753448486328125, 0.28820037841796875, 0.301055908203125, 0.31391143798828125, 0.3267669677734375, 0.33962249755859375, 0.35247802734375, 0.36533355712890625, 0.3781890869140625, 0.39104461669921875, 0.403900146484375, 0.41675567626953125, 0.4296112060546875, 0.44246673583984375, 0.455322265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 5.0, 6.0, 5.0, 8.0, 11.0, 21.0, 10.0, 25.0, 29.0, 42.0, 50.0, 54.0, 72.0, 85.0, 100.0, 86.0, 73.0, 65.0, 49.0, 53.0, 35.0, 27.0, 18.0, 12.0, 16.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.260009765625, -0.25267601013183594, -0.24534225463867188, -0.2380084991455078, -0.23067474365234375, -0.2233409881591797, -0.21600723266601562, -0.20867347717285156, -0.2013397216796875, -0.19400596618652344, -0.18667221069335938, -0.1793384552001953, -0.17200469970703125, -0.1646709442138672, -0.15733718872070312, -0.15000343322753906, -0.142669677734375, -0.13533592224121094, -0.12800216674804688, -0.12066841125488281, -0.11333465576171875, -0.10600090026855469, -0.09866714477539062, -0.09133338928222656, -0.0839996337890625, -0.07666587829589844, -0.06933212280273438, -0.06199836730957031, -0.05466461181640625, -0.04733085632324219, -0.039997100830078125, -0.03266334533691406, -0.02532958984375, -0.017995834350585938, -0.010662078857421875, -0.0033283233642578125, 0.00400543212890625, 0.011339187622070312, 0.018672943115234375, 0.026006698608398438, 0.0333404541015625, 0.04067420959472656, 0.048007965087890625, 0.05534172058105469, 0.06267547607421875, 0.07000923156738281, 0.07734298706054688, 0.08467674255371094, 0.092010498046875, 0.09934425354003906, 0.10667800903320312, 0.11401176452636719, 0.12134552001953125, 0.1286792755126953, 0.13601303100585938, 0.14334678649902344, 0.1506805419921875, 0.15801429748535156, 0.16534805297851562, 0.1726818084716797, 0.18001556396484375, 0.1873493194580078, 0.19468307495117188, 0.20201683044433594, 0.2093505859375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 27.0, 62.0, 119.0, 264.0, 256.0, 139.0, 63.0, 18.0, 8.0, 7.0, 6.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.128609657287598, -3.9339144229888916, -3.7392191886901855, -3.5445239543914795, -3.3498287200927734, -3.1551334857940674, -2.9604382514953613, -2.7657430171966553, -2.571047782897949, -2.376352548599243, -2.181657314300537, -1.986962080001831, -1.792266845703125, -1.597571611404419, -1.402876377105713, -1.2081811428070068, -1.0134859085083008, -0.8187906742095947, -0.6240954399108887, -0.4294002056121826, -0.23470497131347656, -0.04000973701477051, 0.15468549728393555, 0.3493807315826416, 0.5440759658813477, 0.7387712001800537, 0.9334664344787598, 1.1281616687774658, 1.3228569030761719, 1.517552137374878, 1.712247371673584, 1.90694260597229, 2.101637840270996, 2.296333074569702, 2.491028308868408, 2.6857235431671143, 2.8804187774658203, 3.0751140117645264, 3.2698092460632324, 3.4645044803619385, 3.6591997146606445, 3.8538949489593506, 4.048590183258057, 4.243285179138184, 4.437980651855469, 4.632676124572754, 4.827371120452881, 5.022066116333008, 5.216761589050293, 5.411457061767578, 5.606152057647705, 5.800847053527832, 5.995542526245117, 6.190237998962402, 6.384932994842529, 6.579627990722656, 6.774323463439941, 6.969018936157227, 7.1637139320373535, 7.3584089279174805, 7.553104400634766, 7.747799873352051, 7.942494869232178, 8.137189865112305, 8.33188533782959]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 13.0, 13.0, 10.0, 16.0, 14.0, 17.0, 18.0, 20.0, 26.0, 33.0, 39.0, 42.0, 30.0, 46.0, 52.0, 69.0, 71.0, 75.0, 62.0, 37.0, 40.0, 42.0, 36.0, 30.0, 25.0, 27.0, 23.0, 10.0, 15.0, 7.0, 16.0, 11.0, 2.0, 3.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.73716139793396, -2.6523704528808594, -2.5675792694091797, -2.4827880859375, -2.3979971408843994, -2.313206195831299, -2.228415012359619, -2.1436238288879395, -2.058832883834839, -1.9740418195724487, -1.8892507553100586, -1.8044596910476685, -1.7196686267852783, -1.6348775625228882, -1.550086498260498, -1.465295433998108, -1.3805043697357178, -1.2957133054733276, -1.2109222412109375, -1.1261311769485474, -1.0413401126861572, -0.9565490484237671, -0.871757984161377, -0.7869669198989868, -0.7021758556365967, -0.6173847913742065, -0.5325937271118164, -0.44780266284942627, -0.36301159858703613, -0.278220534324646, -0.19342947006225586, -0.10863840579986572, -0.023847579956054688, 0.06094348430633545, 0.14573454856872559, 0.23052561283111572, 0.31531667709350586, 0.400107741355896, 0.48489880561828613, 0.5696898698806763, 0.6544809341430664, 0.7392719984054565, 0.8240630626678467, 0.9088541269302368, 0.993645191192627, 1.078436255455017, 1.1632273197174072, 1.2480183839797974, 1.3328094482421875, 1.4176005125045776, 1.5023915767669678, 1.587182641029358, 1.671973705291748, 1.7567647695541382, 1.8415558338165283, 1.9263468980789185, 2.0111379623413086, 2.0959291458129883, 2.180720090866089, 2.2655110359191895, 2.350302219390869, 2.435093402862549, 2.5198843479156494, 2.60467529296875, 2.6894664764404297]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 10.0, 5.0, 5.0, 8.0, 8.0, 18.0, 18.0, 39.0, 42.0, 87.0, 175.0, 346.0, 764.0, 1654.0, 3947.0, 10492.0, 30552.0, 110568.0, 638063.0, 2546574.0, 683440.0, 117942.0, 32015.0, 10520.0, 3939.0, 1605.0, 676.0, 325.0, 201.0, 88.0, 52.0, 38.0, 25.0, 18.0, 12.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.31201171875, -0.3039112091064453, -0.2958106994628906, -0.28771018981933594, -0.27960968017578125, -0.27150917053222656, -0.2634086608886719, -0.2553081512451172, -0.2472076416015625, -0.2391071319580078, -0.23100662231445312, -0.22290611267089844, -0.21480560302734375, -0.20670509338378906, -0.19860458374023438, -0.1905040740966797, -0.182403564453125, -0.1743030548095703, -0.16620254516601562, -0.15810203552246094, -0.15000152587890625, -0.14190101623535156, -0.13380050659179688, -0.1256999969482422, -0.1175994873046875, -0.10949897766113281, -0.10139846801757812, -0.09329795837402344, -0.08519744873046875, -0.07709693908691406, -0.06899642944335938, -0.06089591979980469, -0.05279541015625, -0.04469490051269531, -0.036594390869140625, -0.028493881225585938, -0.02039337158203125, -0.012292861938476562, -0.004192352294921875, 0.0039081573486328125, 0.0120086669921875, 0.020109176635742188, 0.028209686279296875, 0.03631019592285156, 0.04441070556640625, 0.05251121520996094, 0.060611724853515625, 0.06871223449707031, 0.076812744140625, 0.08491325378417969, 0.09301376342773438, 0.10111427307128906, 0.10921478271484375, 0.11731529235839844, 0.12541580200195312, 0.1335163116455078, 0.1416168212890625, 0.1497173309326172, 0.15781784057617188, 0.16591835021972656, 0.17401885986328125, 0.18211936950683594, 0.19021987915039062, 0.1983203887939453, 0.2064208984375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 7.0, 7.0, 9.0, 17.0, 10.0, 16.0, 34.0, 20.0, 22.0, 23.0, 34.0, 28.0, 39.0, 35.0, 49.0, 52.0, 40.0, 58.0, 45.0, 55.0, 33.0, 43.0, 54.0, 36.0, 35.0, 28.0, 21.0, 21.0, 27.0, 19.0, 18.0, 8.0, 13.0, 10.0, 4.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1265869140625, -0.1228036880493164, -0.11902046203613281, -0.11523723602294922, -0.11145401000976562, -0.10767078399658203, -0.10388755798339844, -0.10010433197021484, -0.09632110595703125, -0.09253787994384766, -0.08875465393066406, -0.08497142791748047, -0.08118820190429688, -0.07740497589111328, -0.07362174987792969, -0.0698385238647461, -0.0660552978515625, -0.062272071838378906, -0.05848884582519531, -0.05470561981201172, -0.050922393798828125, -0.04713916778564453, -0.04335594177246094, -0.039572715759277344, -0.03578948974609375, -0.032006263732910156, -0.028223037719726562, -0.02443981170654297, -0.020656585693359375, -0.01687335968017578, -0.013090133666992188, -0.009306907653808594, -0.005523681640625, -0.0017404556274414062, 0.0020427703857421875, 0.005825996398925781, 0.009609222412109375, 0.013392448425292969, 0.017175674438476562, 0.020958900451660156, 0.02474212646484375, 0.028525352478027344, 0.03230857849121094, 0.03609180450439453, 0.039875030517578125, 0.04365825653076172, 0.04744148254394531, 0.051224708557128906, 0.0550079345703125, 0.058791160583496094, 0.06257438659667969, 0.06635761260986328, 0.07014083862304688, 0.07392406463623047, 0.07770729064941406, 0.08149051666259766, 0.08527374267578125, 0.08905696868896484, 0.09284019470214844, 0.09662342071533203, 0.10040664672851562, 0.10418987274169922, 0.10797309875488281, 0.1117563247680664, 0.11553955078125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 3.0, 5.0, 5.0, 5.0, 6.0, 17.0, 23.0, 44.0, 57.0, 56.0, 112.0, 180.0, 309.0, 503.0, 913.0, 1635.0, 3435.0, 7938.0, 19511.0, 55943.0, 189594.0, 945082.0, 2281870.0, 498104.0, 123345.0, 39321.0, 14650.0, 5832.0, 2706.0, 1316.0, 697.0, 404.0, 238.0, 147.0, 88.0, 66.0, 42.0, 25.0, 16.0, 14.0, 7.0, 10.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2408447265625, -0.23262977600097656, -0.22441482543945312, -0.2161998748779297, -0.20798492431640625, -0.1997699737548828, -0.19155502319335938, -0.18334007263183594, -0.1751251220703125, -0.16691017150878906, -0.15869522094726562, -0.1504802703857422, -0.14226531982421875, -0.1340503692626953, -0.12583541870117188, -0.11762046813964844, -0.109405517578125, -0.10119056701660156, -0.09297561645507812, -0.08476066589355469, -0.07654571533203125, -0.06833076477050781, -0.060115814208984375, -0.05190086364746094, -0.0436859130859375, -0.03547096252441406, -0.027256011962890625, -0.019041061401367188, -0.01082611083984375, -0.0026111602783203125, 0.005603790283203125, 0.013818740844726562, 0.02203369140625, 0.030248641967773438, 0.038463592529296875, 0.04667854309082031, 0.05489349365234375, 0.06310844421386719, 0.07132339477539062, 0.07953834533691406, 0.0877532958984375, 0.09596824645996094, 0.10418319702148438, 0.11239814758300781, 0.12061309814453125, 0.1288280487060547, 0.13704299926757812, 0.14525794982910156, 0.153472900390625, 0.16168785095214844, 0.16990280151367188, 0.1781177520751953, 0.18633270263671875, 0.1945476531982422, 0.20276260375976562, 0.21097755432128906, 0.2191925048828125, 0.22740745544433594, 0.23562240600585938, 0.2438373565673828, 0.25205230712890625, 0.2602672576904297, 0.2684822082519531, 0.27669715881347656, 0.284912109375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 9.0, 13.0, 10.0, 13.0, 23.0, 29.0, 43.0, 61.0, 70.0, 80.0, 142.0, 129.0, 201.0, 356.0, 483.0, 502.0, 455.0, 356.0, 273.0, 197.0, 124.0, 108.0, 101.0, 78.0, 57.0, 52.0, 23.0, 16.0, 18.0, 14.0, 10.0, 8.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.4091796875, -0.3977394104003906, -0.38629913330078125, -0.3748588562011719, -0.3634185791015625, -0.3519783020019531, -0.34053802490234375, -0.3290977478027344, -0.317657470703125, -0.3062171936035156, -0.29477691650390625, -0.2833366394042969, -0.2718963623046875, -0.2604560852050781, -0.24901580810546875, -0.23757553100585938, -0.22613525390625, -0.21469497680664062, -0.20325469970703125, -0.19181442260742188, -0.1803741455078125, -0.16893386840820312, -0.15749359130859375, -0.14605331420898438, -0.134613037109375, -0.12317276000976562, -0.11173248291015625, -0.10029220581054688, -0.0888519287109375, -0.07741165161132812, -0.06597137451171875, -0.054531097412109375, -0.0430908203125, -0.031650543212890625, -0.02021026611328125, -0.008769989013671875, 0.0026702880859375, 0.014110565185546875, 0.02555084228515625, 0.036991119384765625, 0.048431396484375, 0.059871673583984375, 0.07131195068359375, 0.08275222778320312, 0.0941925048828125, 0.10563278198242188, 0.11707305908203125, 0.12851333618164062, 0.13995361328125, 0.15139389038085938, 0.16283416748046875, 0.17427444458007812, 0.1857147216796875, 0.19715499877929688, 0.20859527587890625, 0.22003555297851562, 0.231475830078125, 0.24291610717773438, 0.25435638427734375, 0.2657966613769531, 0.2772369384765625, 0.2886772155761719, 0.30011749267578125, 0.3115577697753906, 0.322998046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 4.0, 7.0, 19.0, 51.0, 107.0, 181.0, 220.0, 211.0, 105.0, 37.0, 18.0, 11.0, 6.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.286144733428955, -4.109877586364746, -3.933610439300537, -3.7573435306549072, -3.5810763835906982, -3.4048092365264893, -3.2285423278808594, -3.0522751808166504, -2.8760080337524414, -2.6997408866882324, -2.5234737396240234, -2.3472068309783936, -2.1709396839141846, -1.9946725368499756, -1.8184055089950562, -1.6421384811401367, -1.4658713340759277, -1.2896041870117188, -1.1133371591567993, -0.9370700716972351, -0.7608029842376709, -0.5845358967781067, -0.4082688093185425, -0.23200178146362305, -0.05573463439941406, 0.12053245306015015, 0.29679954051971436, 0.47306662797927856, 0.6493337154388428, 0.825600802898407, 1.0018678903579712, 1.1781349182128906, 1.3544015884399414, 1.5306687355041504, 1.7069357633590698, 1.8832027912139893, 2.0594699382781982, 2.2357370853424072, 2.412003993988037, 2.588271141052246, 2.764538288116455, 2.940805435180664, 3.117072582244873, 3.293339490890503, 3.469606637954712, 3.645873785018921, 3.822140693664551, 3.9984078407287598, 4.174674987792969, 4.350942134857178, 4.527209281921387, 4.703476428985596, 4.879743576049805, 5.0560102462768555, 5.2322773933410645, 5.408544540405273, 5.584811687469482, 5.761078834533691, 5.9373459815979, 6.113613128662109, 6.28987979888916, 6.466146945953369, 6.642414093017578, 6.818681240081787, 6.994948387145996]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 1.0, 7.0, 10.0, 13.0, 11.0, 15.0, 18.0, 12.0, 17.0, 25.0, 34.0, 26.0, 33.0, 45.0, 50.0, 53.0, 51.0, 42.0, 47.0, 40.0, 43.0, 47.0, 46.0, 47.0, 30.0, 38.0, 30.0, 24.0, 26.0, 21.0, 22.0, 13.0, 16.0, 8.0, 12.0, 3.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.864199161529541, -1.7974910736083984, -1.7307828664779663, -1.6640747785568237, -1.5973665714263916, -1.530658483505249, -1.4639503955841064, -1.3972423076629639, -1.3305341005325317, -1.2638260126113892, -1.197117805480957, -1.1304097175598145, -1.0637016296386719, -0.9969934225082397, -0.9302853345870972, -0.8635771870613098, -0.7968690395355225, -0.7301608920097351, -0.6634527444839478, -0.5967446565628052, -0.5300365090370178, -0.46332836151123047, -0.3966202437877655, -0.32991212606430054, -0.2632039785385132, -0.19649584591388702, -0.12978771328926086, -0.0630795806646347, 0.003628551959991455, 0.07033669948577881, 0.13704481720924377, 0.20375293493270874, 0.2704613208770752, 0.33716946840286255, 0.4038775861263275, 0.4705857038497925, 0.5372938513755798, 0.6040019989013672, 0.6707100868225098, 0.7374182343482971, 0.8041263818740845, 0.8708345293998718, 0.9375426769256592, 1.0042507648468018, 1.0709588527679443, 1.1376670598983765, 1.204375147819519, 1.2710833549499512, 1.3377914428710938, 1.4044995307922363, 1.4712077379226685, 1.537915825843811, 1.6046240329742432, 1.6713321208953857, 1.7380402088165283, 1.804748296737671, 1.871456503868103, 1.9381645917892456, 2.0048727989196777, 2.0715808868408203, 2.138288974761963, 2.2049970626831055, 2.271705389022827, 2.3384134769439697, 2.4051215648651123]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 8.0, 13.0, 11.0, 16.0, 26.0, 28.0, 46.0, 56.0, 97.0, 159.0, 235.0, 372.0, 616.0, 963.0, 1620.0, 2718.0, 5015.0, 9445.0, 17996.0, 36195.0, 76643.0, 190889.0, 375772.0, 182215.0, 74294.0, 35131.0, 17456.0, 8969.0, 4851.0, 2662.0, 1591.0, 896.0, 576.0, 349.0, 218.0, 133.0, 86.0, 60.0, 39.0, 25.0, 22.0, 12.0, 14.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3076171875, -0.2986946105957031, -0.28977203369140625, -0.2808494567871094, -0.2719268798828125, -0.2630043029785156, -0.25408172607421875, -0.24515914916992188, -0.236236572265625, -0.22731399536132812, -0.21839141845703125, -0.20946884155273438, -0.2005462646484375, -0.19162368774414062, -0.18270111083984375, -0.17377853393554688, -0.16485595703125, -0.15593338012695312, -0.14701080322265625, -0.13808822631835938, -0.1291656494140625, -0.12024307250976562, -0.11132049560546875, -0.10239791870117188, -0.093475341796875, -0.08455276489257812, -0.07563018798828125, -0.06670761108398438, -0.0577850341796875, -0.048862457275390625, -0.03993988037109375, -0.031017303466796875, -0.0220947265625, -0.013172149658203125, -0.00424957275390625, 0.004673004150390625, 0.0135955810546875, 0.022518157958984375, 0.03144073486328125, 0.040363311767578125, 0.049285888671875, 0.058208465576171875, 0.06713104248046875, 0.07605361938476562, 0.0849761962890625, 0.09389877319335938, 0.10282135009765625, 0.11174392700195312, 0.12066650390625, 0.12958908081054688, 0.13851165771484375, 0.14743423461914062, 0.1563568115234375, 0.16527938842773438, 0.17420196533203125, 0.18312454223632812, 0.192047119140625, 0.20096969604492188, 0.20989227294921875, 0.21881484985351562, 0.2277374267578125, 0.23666000366210938, 0.24558258056640625, 0.2545051574707031, 0.263427734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 14.0, 13.0, 11.0, 15.0, 20.0, 20.0, 35.0, 25.0, 34.0, 51.0, 49.0, 45.0, 65.0, 60.0, 65.0, 57.0, 56.0, 59.0, 51.0, 47.0, 41.0, 33.0, 17.0, 35.0, 20.0, 15.0, 13.0, 13.0, 4.0, 4.0, 4.0, 2.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.1584949493408203, -0.15329360961914062, -0.14809226989746094, -0.14289093017578125, -0.13768959045410156, -0.13248825073242188, -0.1272869110107422, -0.1220855712890625, -0.11688423156738281, -0.11168289184570312, -0.10648155212402344, -0.10128021240234375, -0.09607887268066406, -0.09087753295898438, -0.08567619323730469, -0.080474853515625, -0.07527351379394531, -0.07007217407226562, -0.06487083435058594, -0.05966949462890625, -0.05446815490722656, -0.049266815185546875, -0.04406547546386719, -0.0388641357421875, -0.03366279602050781, -0.028461456298828125, -0.023260116577148438, -0.01805877685546875, -0.012857437133789062, -0.007656097412109375, -0.0024547576904296875, 0.00274658203125, 0.007947921752929688, 0.013149261474609375, 0.018350601196289062, 0.02355194091796875, 0.028753280639648438, 0.033954620361328125, 0.03915596008300781, 0.0443572998046875, 0.04955863952636719, 0.054759979248046875, 0.05996131896972656, 0.06516265869140625, 0.07036399841308594, 0.07556533813476562, 0.08076667785644531, 0.085968017578125, 0.09116935729980469, 0.09637069702148438, 0.10157203674316406, 0.10677337646484375, 0.11197471618652344, 0.11717605590820312, 0.12237739562988281, 0.1275787353515625, 0.1327800750732422, 0.13798141479492188, 0.14318275451660156, 0.14838409423828125, 0.15358543395996094, 0.15878677368164062, 0.1639881134033203, 0.169189453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 4.0, 15.0, 11.0, 13.0, 21.0, 31.0, 34.0, 42.0, 51.0, 70.0, 109.0, 142.0, 213.0, 291.0, 461.0, 699.0, 1162.0, 1968.0, 4022.0, 10363.0, 38459.0, 256636.0, 641945.0, 65302.0, 14918.0, 5232.0, 2453.0, 1335.0, 767.0, 536.0, 357.0, 248.0, 167.0, 133.0, 94.0, 59.0, 51.0, 38.0, 27.0, 13.0, 12.0, 11.0, 5.0, 7.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.6259765625, -0.6058883666992188, -0.5858001708984375, -0.5657119750976562, -0.545623779296875, -0.5255355834960938, -0.5054473876953125, -0.48535919189453125, -0.46527099609375, -0.44518280029296875, -0.4250946044921875, -0.40500640869140625, -0.384918212890625, -0.36483001708984375, -0.3447418212890625, -0.32465362548828125, -0.3045654296875, -0.28447723388671875, -0.2643890380859375, -0.24430084228515625, -0.224212646484375, -0.20412445068359375, -0.1840362548828125, -0.16394805908203125, -0.14385986328125, -0.12377166748046875, -0.1036834716796875, -0.08359527587890625, -0.063507080078125, -0.04341888427734375, -0.0233306884765625, -0.00324249267578125, 0.016845703125, 0.03693389892578125, 0.0570220947265625, 0.07711029052734375, 0.097198486328125, 0.11728668212890625, 0.1373748779296875, 0.15746307373046875, 0.17755126953125, 0.19763946533203125, 0.2177276611328125, 0.23781585693359375, 0.257904052734375, 0.27799224853515625, 0.2980804443359375, 0.31816864013671875, 0.3382568359375, 0.35834503173828125, 0.3784332275390625, 0.39852142333984375, 0.418609619140625, 0.43869781494140625, 0.4587860107421875, 0.47887420654296875, 0.49896240234375, 0.5190505981445312, 0.5391387939453125, 0.5592269897460938, 0.579315185546875, 0.5994033813476562, 0.6194915771484375, 0.6395797729492188, 0.65966796875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 8.0, 6.0, 18.0, 14.0, 12.0, 16.0, 20.0, 25.0, 26.0, 34.0, 28.0, 21.0, 33.0, 53.0, 53.0, 57.0, 40.0, 49.0, 46.0, 55.0, 50.0, 40.0, 48.0, 39.0, 24.0, 24.0, 28.0, 22.0, 17.0, 11.0, 17.0, 14.0, 9.0, 10.0, 7.0, 4.0, 2.0, 4.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60498046875, -0.5840911865234375, -0.563201904296875, -0.5423126220703125, -0.52142333984375, -0.5005340576171875, -0.479644775390625, -0.4587554931640625, -0.4378662109375, -0.4169769287109375, -0.396087646484375, -0.3751983642578125, -0.35430908203125, -0.3334197998046875, -0.312530517578125, -0.2916412353515625, -0.270751953125, -0.2498626708984375, -0.228973388671875, -0.2080841064453125, -0.18719482421875, -0.1663055419921875, -0.145416259765625, -0.1245269775390625, -0.1036376953125, -0.0827484130859375, -0.061859130859375, -0.0409698486328125, -0.02008056640625, 0.0008087158203125, 0.021697998046875, 0.0425872802734375, 0.0634765625, 0.0843658447265625, 0.105255126953125, 0.1261444091796875, 0.14703369140625, 0.1679229736328125, 0.188812255859375, 0.2097015380859375, 0.2305908203125, 0.2514801025390625, 0.272369384765625, 0.2932586669921875, 0.31414794921875, 0.3350372314453125, 0.355926513671875, 0.3768157958984375, 0.397705078125, 0.4185943603515625, 0.439483642578125, 0.4603729248046875, 0.48126220703125, 0.5021514892578125, 0.523040771484375, 0.5439300537109375, 0.5648193359375, 0.5857086181640625, 0.606597900390625, 0.6274871826171875, 0.64837646484375, 0.6692657470703125, 0.690155029296875, 0.7110443115234375, 0.73193359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 8.0, 12.0, 23.0, 28.0, 40.0, 29.0, 63.0, 78.0, 123.0, 224.0, 304.0, 508.0, 884.0, 1759.0, 3947.0, 10376.0, 32241.0, 125353.0, 637810.0, 170847.0, 41538.0, 12740.0, 4769.0, 2147.0, 1141.0, 547.0, 319.0, 207.0, 112.0, 98.0, 75.0, 46.0, 39.0, 19.0, 20.0, 15.0, 13.0, 10.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 6.0, 2.0, 3.0], "bins": [-0.2335205078125, -0.2269611358642578, -0.22040176391601562, -0.21384239196777344, -0.20728302001953125, -0.20072364807128906, -0.19416427612304688, -0.1876049041748047, -0.1810455322265625, -0.1744861602783203, -0.16792678833007812, -0.16136741638183594, -0.15480804443359375, -0.14824867248535156, -0.14168930053710938, -0.1351299285888672, -0.128570556640625, -0.12201118469238281, -0.11545181274414062, -0.10889244079589844, -0.10233306884765625, -0.09577369689941406, -0.08921432495117188, -0.08265495300292969, -0.0760955810546875, -0.06953620910644531, -0.06297683715820312, -0.05641746520996094, -0.04985809326171875, -0.04329872131347656, -0.036739349365234375, -0.030179977416992188, -0.02362060546875, -0.017061233520507812, -0.010501861572265625, -0.0039424896240234375, 0.00261688232421875, 0.009176254272460938, 0.015735626220703125, 0.022294998168945312, 0.0288543701171875, 0.03541374206542969, 0.041973114013671875, 0.04853248596191406, 0.05509185791015625, 0.06165122985839844, 0.06821060180664062, 0.07476997375488281, 0.081329345703125, 0.08788871765136719, 0.09444808959960938, 0.10100746154785156, 0.10756683349609375, 0.11412620544433594, 0.12068557739257812, 0.1272449493408203, 0.1338043212890625, 0.1403636932373047, 0.14692306518554688, 0.15348243713378906, 0.16004180908203125, 0.16660118103027344, 0.17316055297851562, 0.1797199249267578, 0.186279296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 8.0, 4.0, 7.0, 8.0, 10.0, 16.0, 18.0, 12.0, 22.0, 34.0, 34.0, 49.0, 47.0, 80.0, 82.0, 104.0, 90.0, 66.0, 64.0, 48.0, 25.0, 31.0, 19.0, 18.0, 18.0, 18.0, 9.0, 12.0, 11.0, 5.0, 6.0, 4.0, 4.0, 8.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.147954940795898e-05, -7.880479097366333e-05, -7.613003253936768e-05, -7.345527410507202e-05, -7.078051567077637e-05, -6.810575723648071e-05, -6.543099880218506e-05, -6.27562403678894e-05, -6.008148193359375e-05, -5.7406723499298096e-05, -5.473196506500244e-05, -5.205720663070679e-05, -4.938244819641113e-05, -4.670768976211548e-05, -4.4032931327819824e-05, -4.135817289352417e-05, -3.8683414459228516e-05, -3.600865602493286e-05, -3.333389759063721e-05, -3.065913915634155e-05, -2.79843807220459e-05, -2.5309622287750244e-05, -2.263486385345459e-05, -1.9960105419158936e-05, -1.728534698486328e-05, -1.4610588550567627e-05, -1.1935830116271973e-05, -9.261071681976318e-06, -6.586313247680664e-06, -3.91155481338501e-06, -1.2367963790893555e-06, 1.4379620552062988e-06, 4.112720489501953e-06, 6.787478923797607e-06, 9.462237358093262e-06, 1.2136995792388916e-05, 1.481175422668457e-05, 1.7486512660980225e-05, 2.016127109527588e-05, 2.2836029529571533e-05, 2.5510787963867188e-05, 2.8185546398162842e-05, 3.0860304832458496e-05, 3.353506326675415e-05, 3.6209821701049805e-05, 3.888458013534546e-05, 4.155933856964111e-05, 4.423409700393677e-05, 4.690885543823242e-05, 4.9583613872528076e-05, 5.225837230682373e-05, 5.4933130741119385e-05, 5.760788917541504e-05, 6.028264760971069e-05, 6.295740604400635e-05, 6.5632164478302e-05, 6.830692291259766e-05, 7.098168134689331e-05, 7.365643978118896e-05, 7.633119821548462e-05, 7.900595664978027e-05, 8.168071508407593e-05, 8.435547351837158e-05, 8.703023195266724e-05, 8.970499038696289e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 8.0, 11.0, 23.0, 25.0, 32.0, 65.0, 85.0, 215.0, 442.0, 908.0, 2322.0, 7648.0, 55244.0, 857245.0, 108618.0, 10587.0, 2938.0, 1114.0, 474.0, 235.0, 126.0, 78.0, 38.0, 22.0, 14.0, 9.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.442138671875, -0.42858123779296875, -0.4150238037109375, -0.40146636962890625, -0.387908935546875, -0.37435150146484375, -0.3607940673828125, -0.34723663330078125, -0.33367919921875, -0.32012176513671875, -0.3065643310546875, -0.29300689697265625, -0.279449462890625, -0.26589202880859375, -0.2523345947265625, -0.23877716064453125, -0.2252197265625, -0.21166229248046875, -0.1981048583984375, -0.18454742431640625, -0.170989990234375, -0.15743255615234375, -0.1438751220703125, -0.13031768798828125, -0.11676025390625, -0.10320281982421875, -0.0896453857421875, -0.07608795166015625, -0.062530517578125, -0.04897308349609375, -0.0354156494140625, -0.02185821533203125, -0.00830078125, 0.00525665283203125, 0.0188140869140625, 0.03237152099609375, 0.045928955078125, 0.05948638916015625, 0.0730438232421875, 0.08660125732421875, 0.10015869140625, 0.11371612548828125, 0.1272735595703125, 0.14083099365234375, 0.154388427734375, 0.16794586181640625, 0.1815032958984375, 0.19506072998046875, 0.2086181640625, 0.22217559814453125, 0.2357330322265625, 0.24929046630859375, 0.262847900390625, 0.27640533447265625, 0.2899627685546875, 0.30352020263671875, 0.31707763671875, 0.33063507080078125, 0.3441925048828125, 0.35774993896484375, 0.371307373046875, 0.38486480712890625, 0.3984222412109375, 0.41197967529296875, 0.425537109375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 4.0, 12.0, 7.0, 13.0, 19.0, 21.0, 39.0, 42.0, 47.0, 39.0, 46.0, 94.0, 86.0, 111.0, 96.0, 66.0, 57.0, 36.0, 36.0, 23.0, 20.0, 16.0, 9.0, 11.0, 7.0, 12.0, 8.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.29345703125, -0.28507232666015625, -0.2766876220703125, -0.26830291748046875, -0.259918212890625, -0.25153350830078125, -0.2431488037109375, -0.23476409912109375, -0.22637939453125, -0.21799468994140625, -0.2096099853515625, -0.20122528076171875, -0.192840576171875, -0.18445587158203125, -0.1760711669921875, -0.16768646240234375, -0.1593017578125, -0.15091705322265625, -0.1425323486328125, -0.13414764404296875, -0.125762939453125, -0.11737823486328125, -0.1089935302734375, -0.10060882568359375, -0.09222412109375, -0.08383941650390625, -0.0754547119140625, -0.06707000732421875, -0.058685302734375, -0.05030059814453125, -0.0419158935546875, -0.03353118896484375, -0.025146484375, -0.01676177978515625, -0.0083770751953125, 7.62939453125e-06, 0.008392333984375, 0.01677703857421875, 0.0251617431640625, 0.03354644775390625, 0.04193115234375, 0.05031585693359375, 0.0587005615234375, 0.06708526611328125, 0.075469970703125, 0.08385467529296875, 0.0922393798828125, 0.10062408447265625, 0.1090087890625, 0.11739349365234375, 0.1257781982421875, 0.13416290283203125, 0.142547607421875, 0.15093231201171875, 0.1593170166015625, 0.16770172119140625, 0.17608642578125, 0.18447113037109375, 0.1928558349609375, 0.20124053955078125, 0.209625244140625, 0.21800994873046875, 0.2263946533203125, 0.23477935791015625, 0.2431640625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 5.0, 4.0, 11.0, 25.0, 128.0, 297.0, 340.0, 135.0, 27.0, 18.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.926177978515625, -12.611329078674316, -12.296481132507324, -11.981632232666016, -11.666784286499023, -11.351935386657715, -11.037087440490723, -10.722238540649414, -10.407390594482422, -10.092541694641113, -9.777693748474121, -9.462844848632812, -9.14799690246582, -8.833148002624512, -8.51830005645752, -8.203451156616211, -7.888602256774902, -7.573753833770752, -7.258905410766602, -6.944056987762451, -6.629208564758301, -6.314359664916992, -5.999511241912842, -5.684662818908691, -5.369814395904541, -5.054965972900391, -4.74011754989624, -4.42526912689209, -4.110420227050781, -3.79557204246521, -3.4807233810424805, -3.16587495803833, -2.851027488708496, -2.5361790657043457, -2.2213306427001953, -1.9064819812774658, -1.5916335582733154, -1.276785135269165, -0.9619365930557251, -0.6470880508422852, -0.33223962783813477, -0.0173911452293396, 0.29745733737945557, 0.6123058199882507, 0.9271543025970459, 1.2420027256011963, 1.5568512678146362, 1.8716998100280762, 2.1865482330322266, 2.501396656036377, 2.8162450790405273, 3.131093740463257, 3.4459421634674072, 3.7607905864715576, 4.075639247894287, 4.3904876708984375, 4.705336093902588, 5.020184516906738, 5.335032939910889, 5.649881362915039, 5.964730262756348, 6.27957820892334, 6.594427108764648, 6.909275531768799, 7.224123954772949]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 2.0, 7.0, 11.0, 15.0, 16.0, 13.0, 20.0, 18.0, 34.0, 22.0, 33.0, 46.0, 31.0, 51.0, 55.0, 57.0, 71.0, 67.0, 58.0, 41.0, 46.0, 26.0, 30.0, 33.0, 30.0, 30.0, 20.0, 17.0, 17.0, 10.0, 12.0, 11.0, 9.0, 4.0, 8.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.563842296600342, -2.479626417160034, -2.3954105377197266, -2.31119441986084, -2.2269785404205322, -2.1427626609802246, -2.058546781539917, -1.9743309020996094, -1.8901149034500122, -1.8058990240097046, -1.7216830253601074, -1.6374671459197998, -1.5532512664794922, -1.469035267829895, -1.3848193883895874, -1.3006033897399902, -1.2163875102996826, -1.132171630859375, -1.0479556322097778, -0.9637397527694702, -0.8795238137245178, -0.7953078746795654, -0.7110919952392578, -0.6268760561943054, -0.542660117149353, -0.45844417810440063, -0.37422826886177063, -0.2900123596191406, -0.20579642057418823, -0.12158048152923584, -0.03736460208892822, 0.04685133695602417, 0.13106727600097656, 0.21528320014476776, 0.29949912428855896, 0.38371503353118896, 0.46793097257614136, 0.5521469116210938, 0.6363627910614014, 0.7205787301063538, 0.8047946691513062, 0.8890106081962585, 0.9732265472412109, 1.0574424266815186, 1.1416583061218262, 1.2258743047714233, 1.310090184211731, 1.3943061828613281, 1.4785220623016357, 1.5627379417419434, 1.6469539403915405, 1.7311698198318481, 1.8153858184814453, 1.899601697921753, 1.9838175773620605, 2.068033456802368, 2.152249336242676, 2.2364652156829834, 2.320681095123291, 2.4048972129821777, 2.4891130924224854, 2.573328971862793, 2.6575448513031006, 2.741760730743408, 2.825976848602295]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 10.0, 18.0, 10.0, 23.0, 38.0, 78.0, 136.0, 299.0, 618.0, 1521.0, 4102.0, 12535.0, 46551.0, 244330.0, 2054875.0, 1587099.0, 186698.0, 38449.0, 10621.0, 3637.0, 1316.0, 653.0, 270.0, 161.0, 66.0, 43.0, 36.0, 16.0, 12.0, 12.0, 8.0, 10.0, 7.0, 3.0, 6.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2440185546875, -0.23528099060058594, -0.22654342651367188, -0.2178058624267578, -0.20906829833984375, -0.2003307342529297, -0.19159317016601562, -0.18285560607910156, -0.1741180419921875, -0.16538047790527344, -0.15664291381835938, -0.1479053497314453, -0.13916778564453125, -0.1304302215576172, -0.12169265747070312, -0.11295509338378906, -0.104217529296875, -0.09547996520996094, -0.08674240112304688, -0.07800483703613281, -0.06926727294921875, -0.06052970886230469, -0.051792144775390625, -0.04305458068847656, -0.0343170166015625, -0.025579452514648438, -0.016841888427734375, -0.008104324340820312, 0.00063323974609375, 0.009370803833007812, 0.018108367919921875, 0.026845932006835938, 0.03558349609375, 0.04432106018066406, 0.053058624267578125, 0.06179618835449219, 0.07053375244140625, 0.07927131652832031, 0.08800888061523438, 0.09674644470214844, 0.1054840087890625, 0.11422157287597656, 0.12295913696289062, 0.1316967010498047, 0.14043426513671875, 0.1491718292236328, 0.15790939331054688, 0.16664695739746094, 0.175384521484375, 0.18412208557128906, 0.19285964965820312, 0.2015972137451172, 0.21033477783203125, 0.2190723419189453, 0.22780990600585938, 0.23654747009277344, 0.2452850341796875, 0.25402259826660156, 0.2627601623535156, 0.2714977264404297, 0.28023529052734375, 0.2889728546142578, 0.2977104187011719, 0.30644798278808594, 0.315185546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 7.0, 4.0, 11.0, 4.0, 8.0, 9.0, 22.0, 17.0, 25.0, 24.0, 20.0, 30.0, 26.0, 35.0, 38.0, 37.0, 51.0, 42.0, 41.0, 50.0, 45.0, 34.0, 48.0, 32.0, 46.0, 54.0, 36.0, 33.0, 23.0, 23.0, 21.0, 17.0, 17.0, 12.0, 13.0, 6.0, 10.0, 6.0, 4.0, 2.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.15283203125, -0.14876365661621094, -0.14469528198242188, -0.1406269073486328, -0.13655853271484375, -0.1324901580810547, -0.12842178344726562, -0.12435340881347656, -0.1202850341796875, -0.11621665954589844, -0.11214828491210938, -0.10807991027832031, -0.10401153564453125, -0.09994316101074219, -0.09587478637695312, -0.09180641174316406, -0.087738037109375, -0.08366966247558594, -0.07960128784179688, -0.07553291320800781, -0.07146453857421875, -0.06739616394042969, -0.06332778930664062, -0.05925941467285156, -0.0551910400390625, -0.05112266540527344, -0.047054290771484375, -0.04298591613769531, -0.03891754150390625, -0.03484916687011719, -0.030780792236328125, -0.026712417602539062, -0.02264404296875, -0.018575668334960938, -0.014507293701171875, -0.010438919067382812, -0.00637054443359375, -0.0023021697998046875, 0.001766204833984375, 0.0058345794677734375, 0.0099029541015625, 0.013971328735351562, 0.018039703369140625, 0.022108078002929688, 0.02617645263671875, 0.030244827270507812, 0.034313201904296875, 0.03838157653808594, 0.042449951171875, 0.04651832580566406, 0.050586700439453125, 0.05465507507324219, 0.05872344970703125, 0.06279182434082031, 0.06686019897460938, 0.07092857360839844, 0.0749969482421875, 0.07906532287597656, 0.08313369750976562, 0.08720207214355469, 0.09127044677734375, 0.09533882141113281, 0.09940719604492188, 0.10347557067871094, 0.1075439453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 11.0, 15.0, 17.0, 19.0, 39.0, 65.0, 108.0, 188.0, 337.0, 723.0, 1851.0, 5382.0, 18309.0, 75503.0, 454144.0, 2751928.0, 739996.0, 108779.0, 24889.0, 7302.0, 2512.0, 1026.0, 473.0, 280.0, 148.0, 84.0, 40.0, 35.0, 22.0, 11.0, 15.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.402587890625, -0.3915901184082031, -0.38059234619140625, -0.3695945739746094, -0.3585968017578125, -0.3475990295410156, -0.33660125732421875, -0.3256034851074219, -0.314605712890625, -0.3036079406738281, -0.29261016845703125, -0.2816123962402344, -0.2706146240234375, -0.2596168518066406, -0.24861907958984375, -0.23762130737304688, -0.22662353515625, -0.21562576293945312, -0.20462799072265625, -0.19363021850585938, -0.1826324462890625, -0.17163467407226562, -0.16063690185546875, -0.14963912963867188, -0.138641357421875, -0.12764358520507812, -0.11664581298828125, -0.10564804077148438, -0.0946502685546875, -0.08365249633789062, -0.07265472412109375, -0.061656951904296875, -0.0506591796875, -0.039661407470703125, -0.02866363525390625, -0.017665863037109375, -0.0066680908203125, 0.004329681396484375, 0.01532745361328125, 0.026325225830078125, 0.037322998046875, 0.048320770263671875, 0.05931854248046875, 0.07031631469726562, 0.0813140869140625, 0.09231185913085938, 0.10330963134765625, 0.11430740356445312, 0.12530517578125, 0.13630294799804688, 0.14730072021484375, 0.15829849243164062, 0.1692962646484375, 0.18029403686523438, 0.19129180908203125, 0.20228958129882812, 0.213287353515625, 0.22428512573242188, 0.23528289794921875, 0.24628067016601562, 0.2572784423828125, 0.2682762145996094, 0.27927398681640625, 0.2902717590332031, 0.30126953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 5.0, 5.0, 3.0, 7.0, 10.0, 16.0, 13.0, 16.0, 32.0, 28.0, 48.0, 39.0, 75.0, 103.0, 128.0, 176.0, 275.0, 339.0, 403.0, 478.0, 420.0, 377.0, 266.0, 199.0, 143.0, 112.0, 93.0, 48.0, 43.0, 52.0, 23.0, 21.0, 19.0, 12.0, 17.0, 7.0, 11.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2672309875488281, -0.25638580322265625, -0.24554061889648438, -0.2346954345703125, -0.22385025024414062, -0.21300506591796875, -0.20215988159179688, -0.191314697265625, -0.18046951293945312, -0.16962432861328125, -0.15877914428710938, -0.1479339599609375, -0.13708877563476562, -0.12624359130859375, -0.11539840698242188, -0.10455322265625, -0.09370803833007812, -0.08286285400390625, -0.07201766967773438, -0.0611724853515625, -0.050327301025390625, -0.03948211669921875, -0.028636932373046875, -0.017791748046875, -0.006946563720703125, 0.00389862060546875, 0.014743804931640625, 0.0255889892578125, 0.036434173583984375, 0.04727935791015625, 0.058124542236328125, 0.0689697265625, 0.07981491088867188, 0.09066009521484375, 0.10150527954101562, 0.1123504638671875, 0.12319564819335938, 0.13404083251953125, 0.14488601684570312, 0.155731201171875, 0.16657638549804688, 0.17742156982421875, 0.18826675415039062, 0.1991119384765625, 0.20995712280273438, 0.22080230712890625, 0.23164749145507812, 0.24249267578125, 0.2533378601074219, 0.26418304443359375, 0.2750282287597656, 0.2858734130859375, 0.2967185974121094, 0.30756378173828125, 0.3184089660644531, 0.329254150390625, 0.3400993347167969, 0.35094451904296875, 0.3617897033691406, 0.3726348876953125, 0.3834800720214844, 0.39432525634765625, 0.4051704406738281, 0.416015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 9.0, 15.0, 26.0, 47.0, 93.0, 137.0, 201.0, 167.0, 117.0, 81.0, 38.0, 25.0, 9.0, 6.0, 4.0, 7.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.917229652404785, -3.7754342555999756, -3.633638858795166, -3.4918434619903564, -3.350048065185547, -3.208252429962158, -3.0664570331573486, -2.924661636352539, -2.7828662395477295, -2.64107084274292, -2.4992754459381104, -2.357480049133301, -2.215684413909912, -2.0738892555236816, -1.932093620300293, -1.7902982234954834, -1.6485028266906738, -1.5067074298858643, -1.3649120330810547, -1.2231165170669556, -1.081321120262146, -0.9395257234573364, -0.7977302670478821, -0.6559348106384277, -0.5141394138336182, -0.3723439872264862, -0.23054856061935425, -0.08875313401222229, 0.05304229259490967, 0.19483768939971924, 0.3366331458091736, 0.47842860221862793, 0.6202239990234375, 0.7620193958282471, 0.9038148522377014, 1.0456103086471558, 1.1874057054519653, 1.329201102256775, 1.470996618270874, 1.6127920150756836, 1.7545874118804932, 1.8963828086853027, 2.0381782054901123, 2.179973602294922, 2.3217692375183105, 2.463564395904541, 2.6053600311279297, 2.7471554279327393, 2.888950824737549, 3.0307462215423584, 3.172541618347168, 3.3143370151519775, 3.456132411956787, 3.597928047180176, 3.7397234439849854, 3.881518840789795, 4.023314476013184, 4.165110111236572, 4.306905269622803, 4.448700904846191, 4.590496063232422, 4.7322916984558105, 4.874086856842041, 5.01588249206543, 5.15767765045166]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 9.0, 3.0, 2.0, 4.0, 7.0, 9.0, 10.0, 12.0, 15.0, 17.0, 16.0, 20.0, 20.0, 24.0, 29.0, 32.0, 27.0, 27.0, 34.0, 47.0, 36.0, 34.0, 37.0, 47.0, 32.0, 37.0, 55.0, 38.0, 34.0, 38.0, 30.0, 35.0, 31.0, 15.0, 23.0, 27.0, 19.0, 16.0, 9.0, 12.0, 6.0, 7.0, 4.0, 1.0, 4.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-1.8330843448638916, -1.777659296989441, -1.7222343683242798, -1.666809320449829, -1.6113842725753784, -1.5559592247009277, -1.5005342960357666, -1.445109248161316, -1.3896842002868652, -1.3342591524124146, -1.2788342237472534, -1.2234091758728027, -1.167984127998352, -1.1125590801239014, -1.0571341514587402, -1.0017091035842896, -0.9462841749191284, -0.8908591866493225, -0.8354341387748718, -0.7800091505050659, -0.7245841026306152, -0.6691591143608093, -0.6137341260910034, -0.5583090782165527, -0.5028840899467468, -0.44745907187461853, -0.39203405380249023, -0.3366090655326843, -0.28118404746055603, -0.22575902938842773, -0.17033404111862183, -0.11490902304649353, -0.059484124183654785, -0.004059113562107086, 0.05136589705944061, 0.10679090023040771, 0.162215918302536, 0.2176409363746643, 0.2730659246444702, 0.3284909427165985, 0.3839159607887268, 0.4393409788608551, 0.4947659969329834, 0.5501909852027893, 0.6056159734725952, 0.6610410213470459, 0.7164660096168518, 0.7718909978866577, 0.8273160457611084, 0.8827410340309143, 0.938166081905365, 0.9935910701751709, 1.0490161180496216, 1.1044411659240723, 1.1598660945892334, 1.215291142463684, 1.2707161903381348, 1.3261412382125854, 1.3815661668777466, 1.4369912147521973, 1.492416262626648, 1.5478413105010986, 1.6032662391662598, 1.6586912870407104, 1.7141162157058716]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 6.0, 18.0, 17.0, 31.0, 59.0, 100.0, 188.0, 306.0, 547.0, 1129.0, 2350.0, 4961.0, 11994.0, 33036.0, 122831.0, 536307.0, 249478.0, 54054.0, 17644.0, 6962.0, 3226.0, 1569.0, 780.0, 418.0, 236.0, 113.0, 78.0, 48.0, 19.0, 12.0, 6.0, 9.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.41536712646484375, -0.4022674560546875, -0.38916778564453125, -0.376068115234375, -0.36296844482421875, -0.3498687744140625, -0.33676910400390625, -0.32366943359375, -0.31056976318359375, -0.2974700927734375, -0.28437042236328125, -0.271270751953125, -0.25817108154296875, -0.2450714111328125, -0.23197174072265625, -0.2188720703125, -0.20577239990234375, -0.1926727294921875, -0.17957305908203125, -0.166473388671875, -0.15337371826171875, -0.1402740478515625, -0.12717437744140625, -0.11407470703125, -0.10097503662109375, -0.0878753662109375, -0.07477569580078125, -0.061676025390625, -0.04857635498046875, -0.0354766845703125, -0.02237701416015625, -0.00927734375, 0.00382232666015625, 0.0169219970703125, 0.03002166748046875, 0.043121337890625, 0.05622100830078125, 0.0693206787109375, 0.08242034912109375, 0.09552001953125, 0.10861968994140625, 0.1217193603515625, 0.13481903076171875, 0.147918701171875, 0.16101837158203125, 0.1741180419921875, 0.18721771240234375, 0.2003173828125, 0.21341705322265625, 0.2265167236328125, 0.23961639404296875, 0.252716064453125, 0.26581573486328125, 0.2789154052734375, 0.29201507568359375, 0.30511474609375, 0.31821441650390625, 0.3313140869140625, 0.34441375732421875, 0.357513427734375, 0.37061309814453125, 0.3837127685546875, 0.39681243896484375, 0.409912109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 13.0, 7.0, 20.0, 13.0, 19.0, 36.0, 33.0, 25.0, 42.0, 35.0, 47.0, 52.0, 52.0, 58.0, 60.0, 53.0, 66.0, 55.0, 64.0, 38.0, 39.0, 40.0, 23.0, 24.0, 21.0, 12.0, 13.0, 10.0, 5.0, 2.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1702880859375, -0.16463470458984375, -0.1589813232421875, -0.15332794189453125, -0.147674560546875, -0.14202117919921875, -0.1363677978515625, -0.13071441650390625, -0.12506103515625, -0.11940765380859375, -0.1137542724609375, -0.10810089111328125, -0.102447509765625, -0.09679412841796875, -0.0911407470703125, -0.08548736572265625, -0.079833984375, -0.07418060302734375, -0.0685272216796875, -0.06287384033203125, -0.057220458984375, -0.05156707763671875, -0.0459136962890625, -0.04026031494140625, -0.03460693359375, -0.02895355224609375, -0.0233001708984375, -0.01764678955078125, -0.011993408203125, -0.00634002685546875, -0.0006866455078125, 0.00496673583984375, 0.0106201171875, 0.01627349853515625, 0.0219268798828125, 0.02758026123046875, 0.033233642578125, 0.03888702392578125, 0.0445404052734375, 0.05019378662109375, 0.05584716796875, 0.06150054931640625, 0.0671539306640625, 0.07280731201171875, 0.078460693359375, 0.08411407470703125, 0.0897674560546875, 0.09542083740234375, 0.10107421875, 0.10672760009765625, 0.1123809814453125, 0.11803436279296875, 0.123687744140625, 0.12934112548828125, 0.1349945068359375, 0.14064788818359375, 0.14630126953125, 0.15195465087890625, 0.1576080322265625, 0.16326141357421875, 0.168914794921875, 0.17456817626953125, 0.1802215576171875, 0.18587493896484375, 0.1915283203125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 12.0, 15.0, 14.0, 19.0, 39.0, 71.0, 91.0, 141.0, 197.0, 314.0, 526.0, 1007.0, 2019.0, 5521.0, 22956.0, 216526.0, 737264.0, 46718.0, 9119.0, 2855.0, 1307.0, 661.0, 390.0, 246.0, 155.0, 126.0, 69.0, 43.0, 29.0, 23.0, 26.0, 11.0, 7.0, 11.0, 8.0, 5.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.806640625, -0.783721923828125, -0.76080322265625, -0.737884521484375, -0.7149658203125, -0.692047119140625, -0.66912841796875, -0.646209716796875, -0.623291015625, -0.600372314453125, -0.57745361328125, -0.554534912109375, -0.5316162109375, -0.508697509765625, -0.48577880859375, -0.462860107421875, -0.43994140625, -0.417022705078125, -0.39410400390625, -0.371185302734375, -0.3482666015625, -0.325347900390625, -0.30242919921875, -0.279510498046875, -0.256591796875, -0.233673095703125, -0.21075439453125, -0.187835693359375, -0.1649169921875, -0.141998291015625, -0.11907958984375, -0.096160888671875, -0.0732421875, -0.050323486328125, -0.02740478515625, -0.004486083984375, 0.0184326171875, 0.041351318359375, 0.06427001953125, 0.087188720703125, 0.110107421875, 0.133026123046875, 0.15594482421875, 0.178863525390625, 0.2017822265625, 0.224700927734375, 0.24761962890625, 0.270538330078125, 0.29345703125, 0.316375732421875, 0.33929443359375, 0.362213134765625, 0.3851318359375, 0.408050537109375, 0.43096923828125, 0.453887939453125, 0.476806640625, 0.499725341796875, 0.52264404296875, 0.545562744140625, 0.5684814453125, 0.591400146484375, 0.61431884765625, 0.637237548828125, 0.66015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 10.0, 4.0, 8.0, 5.0, 4.0, 8.0, 10.0, 9.0, 17.0, 12.0, 16.0, 19.0, 22.0, 29.0, 33.0, 23.0, 34.0, 27.0, 38.0, 53.0, 45.0, 50.0, 44.0, 38.0, 45.0, 46.0, 41.0, 46.0, 31.0, 30.0, 27.0, 29.0, 26.0, 13.0, 13.0, 14.0, 10.0, 10.0, 7.0, 15.0, 7.0, 8.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.55126953125, -0.5335311889648438, -0.5157928466796875, -0.49805450439453125, -0.480316162109375, -0.46257781982421875, -0.4448394775390625, -0.42710113525390625, -0.40936279296875, -0.39162445068359375, -0.3738861083984375, -0.35614776611328125, -0.338409423828125, -0.32067108154296875, -0.3029327392578125, -0.28519439697265625, -0.2674560546875, -0.24971771240234375, -0.2319793701171875, -0.21424102783203125, -0.196502685546875, -0.17876434326171875, -0.1610260009765625, -0.14328765869140625, -0.12554931640625, -0.10781097412109375, -0.0900726318359375, -0.07233428955078125, -0.054595947265625, -0.03685760498046875, -0.0191192626953125, -0.00138092041015625, 0.016357421875, 0.03409576416015625, 0.0518341064453125, 0.06957244873046875, 0.087310791015625, 0.10504913330078125, 0.1227874755859375, 0.14052581787109375, 0.15826416015625, 0.17600250244140625, 0.1937408447265625, 0.21147918701171875, 0.229217529296875, 0.24695587158203125, 0.2646942138671875, 0.28243255615234375, 0.3001708984375, 0.31790924072265625, 0.3356475830078125, 0.35338592529296875, 0.371124267578125, 0.38886260986328125, 0.4066009521484375, 0.42433929443359375, 0.44207763671875, 0.45981597900390625, 0.4775543212890625, 0.49529266357421875, 0.513031005859375, 0.5307693481445312, 0.5485076904296875, 0.5662460327148438, 0.583984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 8.0, 10.0, 17.0, 15.0, 21.0, 31.0, 31.0, 56.0, 100.0, 158.0, 263.0, 528.0, 1052.0, 2652.0, 7726.0, 28807.0, 154564.0, 704144.0, 114105.0, 23384.0, 6454.0, 2268.0, 950.0, 475.0, 258.0, 140.0, 103.0, 58.0, 44.0, 32.0, 25.0, 21.0, 9.0, 9.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.264404296875, -0.2571449279785156, -0.24988555908203125, -0.24262619018554688, -0.2353668212890625, -0.22810745239257812, -0.22084808349609375, -0.21358871459960938, -0.206329345703125, -0.19906997680664062, -0.19181060791015625, -0.18455123901367188, -0.1772918701171875, -0.17003250122070312, -0.16277313232421875, -0.15551376342773438, -0.14825439453125, -0.14099502563476562, -0.13373565673828125, -0.12647628784179688, -0.1192169189453125, -0.11195755004882812, -0.10469818115234375, -0.09743881225585938, -0.090179443359375, -0.08292007446289062, -0.07566070556640625, -0.06840133666992188, -0.0611419677734375, -0.053882598876953125, -0.04662322998046875, -0.039363861083984375, -0.0321044921875, -0.024845123291015625, -0.01758575439453125, -0.010326385498046875, -0.0030670166015625, 0.004192352294921875, 0.01145172119140625, 0.018711090087890625, 0.025970458984375, 0.033229827880859375, 0.04048919677734375, 0.047748565673828125, 0.0550079345703125, 0.062267303466796875, 0.06952667236328125, 0.07678604125976562, 0.08404541015625, 0.09130477905273438, 0.09856414794921875, 0.10582351684570312, 0.1130828857421875, 0.12034225463867188, 0.12760162353515625, 0.13486099243164062, 0.142120361328125, 0.14937973022460938, 0.15663909912109375, 0.16389846801757812, 0.1711578369140625, 0.17841720581054688, 0.18567657470703125, 0.19293594360351562, 0.2001953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 9.0, 0.0, 8.0, 4.0, 21.0, 19.0, 20.0, 30.0, 25.0, 50.0, 60.0, 83.0, 111.0, 100.0, 91.0, 82.0, 62.0, 41.0, 34.0, 37.0, 22.0, 18.0, 15.0, 6.0, 7.0, 11.0, 5.0, 4.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.147954940795898e-05, -7.905811071395874e-05, -7.66366720199585e-05, -7.421523332595825e-05, -7.179379463195801e-05, -6.937235593795776e-05, -6.695091724395752e-05, -6.452947854995728e-05, -6.210803985595703e-05, -5.968660116195679e-05, -5.726516246795654e-05, -5.48437237739563e-05, -5.2422285079956055e-05, -5.000084638595581e-05, -4.7579407691955566e-05, -4.515796899795532e-05, -4.273653030395508e-05, -4.0315091609954834e-05, -3.789365291595459e-05, -3.5472214221954346e-05, -3.30507755279541e-05, -3.062933683395386e-05, -2.8207898139953613e-05, -2.578645944595337e-05, -2.3365020751953125e-05, -2.094358205795288e-05, -1.8522143363952637e-05, -1.6100704669952393e-05, -1.3679265975952148e-05, -1.1257827281951904e-05, -8.83638858795166e-06, -6.414949893951416e-06, -3.993511199951172e-06, -1.5720725059509277e-06, 8.493661880493164e-07, 3.2708048820495605e-06, 5.692243576049805e-06, 8.113682270050049e-06, 1.0535120964050293e-05, 1.2956559658050537e-05, 1.537799835205078e-05, 1.7799437046051025e-05, 2.022087574005127e-05, 2.2642314434051514e-05, 2.5063753128051758e-05, 2.7485191822052002e-05, 2.9906630516052246e-05, 3.232806921005249e-05, 3.4749507904052734e-05, 3.717094659805298e-05, 3.959238529205322e-05, 4.201382398605347e-05, 4.443526268005371e-05, 4.6856701374053955e-05, 4.92781400680542e-05, 5.169957876205444e-05, 5.412101745605469e-05, 5.654245615005493e-05, 5.8963894844055176e-05, 6.138533353805542e-05, 6.380677223205566e-05, 6.622821092605591e-05, 6.864964962005615e-05, 7.10710883140564e-05, 7.349252700805664e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 13.0, 16.0, 20.0, 24.0, 49.0, 48.0, 91.0, 119.0, 195.0, 277.0, 483.0, 827.0, 1516.0, 3131.0, 7155.0, 21365.0, 89115.0, 639993.0, 221478.0, 41106.0, 11924.0, 4589.0, 2075.0, 1073.0, 712.0, 373.0, 242.0, 173.0, 120.0, 61.0, 48.0, 27.0, 32.0, 12.0, 16.0, 7.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2056884765625, -0.19940757751464844, -0.19312667846679688, -0.1868457794189453, -0.18056488037109375, -0.1742839813232422, -0.16800308227539062, -0.16172218322753906, -0.1554412841796875, -0.14916038513183594, -0.14287948608398438, -0.1365985870361328, -0.13031768798828125, -0.12403678894042969, -0.11775588989257812, -0.11147499084472656, -0.105194091796875, -0.09891319274902344, -0.09263229370117188, -0.08635139465332031, -0.08007049560546875, -0.07378959655761719, -0.06750869750976562, -0.06122779846191406, -0.0549468994140625, -0.04866600036621094, -0.042385101318359375, -0.03610420227050781, -0.02982330322265625, -0.023542404174804688, -0.017261505126953125, -0.010980606079101562, -0.00469970703125, 0.0015811920166015625, 0.007862091064453125, 0.014142990112304688, 0.02042388916015625, 0.026704788208007812, 0.032985687255859375, 0.03926658630371094, 0.0455474853515625, 0.05182838439941406, 0.058109283447265625, 0.06439018249511719, 0.07067108154296875, 0.07695198059082031, 0.08323287963867188, 0.08951377868652344, 0.095794677734375, 0.10207557678222656, 0.10835647583007812, 0.11463737487792969, 0.12091827392578125, 0.1271991729736328, 0.13348007202148438, 0.13976097106933594, 0.1460418701171875, 0.15232276916503906, 0.15860366821289062, 0.1648845672607422, 0.17116546630859375, 0.1774463653564453, 0.18372726440429688, 0.19000816345214844, 0.1962890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 8.0, 4.0, 9.0, 16.0, 13.0, 15.0, 26.0, 35.0, 38.0, 47.0, 76.0, 87.0, 114.0, 118.0, 97.0, 57.0, 51.0, 38.0, 22.0, 24.0, 24.0, 18.0, 15.0, 10.0, 9.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189453125, -0.18309783935546875, -0.1767425537109375, -0.17038726806640625, -0.164031982421875, -0.15767669677734375, -0.1513214111328125, -0.14496612548828125, -0.13861083984375, -0.13225555419921875, -0.1259002685546875, -0.11954498291015625, -0.113189697265625, -0.10683441162109375, -0.1004791259765625, -0.09412384033203125, -0.0877685546875, -0.08141326904296875, -0.0750579833984375, -0.06870269775390625, -0.062347412109375, -0.05599212646484375, -0.0496368408203125, -0.04328155517578125, -0.03692626953125, -0.03057098388671875, -0.0242156982421875, -0.01786041259765625, -0.011505126953125, -0.00514984130859375, 0.0012054443359375, 0.00756072998046875, 0.013916015625, 0.02027130126953125, 0.0266265869140625, 0.03298187255859375, 0.039337158203125, 0.04569244384765625, 0.0520477294921875, 0.05840301513671875, 0.06475830078125, 0.07111358642578125, 0.0774688720703125, 0.08382415771484375, 0.090179443359375, 0.09653472900390625, 0.1028900146484375, 0.10924530029296875, 0.1156005859375, 0.12195587158203125, 0.1283111572265625, 0.13466644287109375, 0.141021728515625, 0.14737701416015625, 0.1537322998046875, 0.16008758544921875, 0.16644287109375, 0.17279815673828125, 0.1791534423828125, 0.18550872802734375, 0.191864013671875, 0.19821929931640625, 0.2045745849609375, 0.21092987060546875, 0.21728515625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 5.0, 8.0, 15.0, 46.0, 157.0, 328.0, 268.0, 101.0, 35.0, 7.0, 5.0, 6.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.837558746337891, -6.629733562469482, -6.421907901763916, -6.214082717895508, -6.006257057189941, -5.798431873321533, -5.590606689453125, -5.382781028747559, -5.17495584487915, -4.967130661010742, -4.759305000305176, -4.551479816436768, -4.343654155731201, -4.135828971862793, -3.9280035495758057, -3.7201781272888184, -3.512352705001831, -3.3045272827148438, -3.0967018604278564, -2.888876438140869, -2.681051254272461, -2.4732258319854736, -2.2654004096984863, -2.057575225830078, -1.8497496843338013, -1.641924262046814, -1.4340989589691162, -1.226273536682129, -1.0184481143951416, -0.8106228113174438, -0.6027973890304565, -0.3949720859527588, -0.18714666366577148, 0.02067871391773224, 0.22850409150123596, 0.4363294839859009, 0.6441548466682434, 0.8519802093505859, 1.0598056316375732, 1.267630934715271, 1.4754563570022583, 1.6832817792892456, 1.8911070823669434, 2.0989325046539307, 2.306757926940918, 2.514583110809326, 2.7224087715148926, 2.930233955383301, 3.138059377670288, 3.3458847999572754, 3.5537102222442627, 3.76153564453125, 3.969360828399658, 4.177186012268066, 4.385011672973633, 4.592836856842041, 4.800662517547607, 5.008487701416016, 5.216313362121582, 5.42413854598999, 5.631964206695557, 5.839789390563965, 6.047615051269531, 6.2554402351379395, 6.463265419006348]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 11.0, 8.0, 7.0, 12.0, 12.0, 16.0, 15.0, 17.0, 29.0, 29.0, 36.0, 32.0, 28.0, 44.0, 40.0, 71.0, 67.0, 66.0, 58.0, 67.0, 38.0, 41.0, 38.0, 29.0, 27.0, 21.0, 24.0, 21.0, 20.0, 18.0, 4.0, 16.0, 7.0, 9.0, 4.0, 5.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.346055030822754, -2.266205310821533, -2.1863555908203125, -2.106505870819092, -2.026656150817871, -1.9468064308166504, -1.8669567108154297, -1.787106990814209, -1.7072572708129883, -1.6274075508117676, -1.5475578308105469, -1.4677081108093262, -1.3878583908081055, -1.3080086708068848, -1.228158950805664, -1.1483092308044434, -1.0684596300125122, -0.9886099100112915, -0.9087601900100708, -0.8289104700088501, -0.7490607500076294, -0.6692110300064087, -0.5893613696098328, -0.5095116496086121, -0.42966192960739136, -0.34981220960617065, -0.26996248960494995, -0.19011279940605164, -0.11026307940483093, -0.03041335940361023, 0.049436330795288086, 0.1292860507965088, 0.2091357707977295, 0.2889854907989502, 0.3688352108001709, 0.4486849009990692, 0.5285346508026123, 0.608384370803833, 0.6882340312004089, 0.7680837512016296, 0.8479334712028503, 0.927783191204071, 1.007632851600647, 1.0874825716018677, 1.1673322916030884, 1.247182011604309, 1.3270317316055298, 1.4068814516067505, 1.4867311716079712, 1.566580891609192, 1.6464306116104126, 1.7262803316116333, 1.806130051612854, 1.8859797716140747, 1.9658293724060059, 2.0456790924072266, 2.1255288124084473, 2.205378532409668, 2.2852282524108887, 2.3650779724121094, 2.44492769241333, 2.524777412414551, 2.6046271324157715, 2.684476852416992, 2.764326572418213]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 4.0, 15.0, 10.0, 16.0, 25.0, 33.0, 42.0, 62.0, 131.0, 287.0, 611.0, 1641.0, 5344.0, 21855.0, 145670.0, 2388782.0, 1514496.0, 92551.0, 16034.0, 4172.0, 1379.0, 508.0, 246.0, 121.0, 66.0, 50.0, 33.0, 22.0, 16.0, 14.0, 9.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.376953125, -0.3661537170410156, -0.35535430908203125, -0.3445549011230469, -0.3337554931640625, -0.3229560852050781, -0.31215667724609375, -0.3013572692871094, -0.290557861328125, -0.2797584533691406, -0.26895904541015625, -0.2581596374511719, -0.2473602294921875, -0.23656082153320312, -0.22576141357421875, -0.21496200561523438, -0.20416259765625, -0.19336318969726562, -0.18256378173828125, -0.17176437377929688, -0.1609649658203125, -0.15016555786132812, -0.13936614990234375, -0.12856674194335938, -0.117767333984375, -0.10696792602539062, -0.09616851806640625, -0.08536911010742188, -0.0745697021484375, -0.06377029418945312, -0.05297088623046875, -0.042171478271484375, -0.0313720703125, -0.020572662353515625, -0.00977325439453125, 0.001026153564453125, 0.0118255615234375, 0.022624969482421875, 0.03342437744140625, 0.044223785400390625, 0.055023193359375, 0.06582260131835938, 0.07662200927734375, 0.08742141723632812, 0.0982208251953125, 0.10902023315429688, 0.11981964111328125, 0.13061904907226562, 0.14141845703125, 0.15221786499023438, 0.16301727294921875, 0.17381668090820312, 0.1846160888671875, 0.19541549682617188, 0.20621490478515625, 0.21701431274414062, 0.227813720703125, 0.23861312866210938, 0.24941253662109375, 0.2602119445800781, 0.2710113525390625, 0.2818107604980469, 0.29261016845703125, 0.3034095764160156, 0.314208984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 10.0, 9.0, 8.0, 8.0, 10.0, 16.0, 16.0, 20.0, 30.0, 24.0, 35.0, 35.0, 37.0, 44.0, 36.0, 49.0, 32.0, 48.0, 64.0, 53.0, 43.0, 46.0, 38.0, 28.0, 37.0, 29.0, 32.0, 26.0, 29.0, 18.0, 14.0, 16.0, 10.0, 10.0, 6.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.11444091796875, -0.11026477813720703, -0.10608863830566406, -0.1019124984741211, -0.09773635864257812, -0.09356021881103516, -0.08938407897949219, -0.08520793914794922, -0.08103179931640625, -0.07685565948486328, -0.07267951965332031, -0.06850337982177734, -0.06432723999023438, -0.060151100158691406, -0.05597496032714844, -0.05179882049560547, -0.0476226806640625, -0.04344654083251953, -0.03927040100097656, -0.035094261169433594, -0.030918121337890625, -0.026741981506347656, -0.022565841674804688, -0.01838970184326172, -0.01421356201171875, -0.010037422180175781, -0.0058612823486328125, -0.0016851425170898438, 0.002490997314453125, 0.006667137145996094, 0.010843276977539062, 0.015019416809082031, 0.019195556640625, 0.02337169647216797, 0.027547836303710938, 0.031723976135253906, 0.035900115966796875, 0.040076255798339844, 0.04425239562988281, 0.04842853546142578, 0.05260467529296875, 0.05678081512451172, 0.06095695495605469, 0.06513309478759766, 0.06930923461914062, 0.0734853744506836, 0.07766151428222656, 0.08183765411376953, 0.0860137939453125, 0.09018993377685547, 0.09436607360839844, 0.0985422134399414, 0.10271835327148438, 0.10689449310302734, 0.11107063293457031, 0.11524677276611328, 0.11942291259765625, 0.12359905242919922, 0.1277751922607422, 0.13195133209228516, 0.13612747192382812, 0.1403036117553711, 0.14447975158691406, 0.14865589141845703, 0.15283203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 9.0, 13.0, 18.0, 17.0, 31.0, 50.0, 84.0, 183.0, 386.0, 917.0, 2562.0, 9569.0, 65802.0, 1562390.0, 2442958.0, 92214.0, 12039.0, 2996.0, 1038.0, 477.0, 207.0, 124.0, 52.0, 46.0, 22.0, 19.0, 11.0, 12.0, 9.0, 2.0, 6.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5881843566894531, -0.5718765258789062, -0.5555686950683594, -0.5392608642578125, -0.5229530334472656, -0.5066452026367188, -0.4903373718261719, -0.474029541015625, -0.4577217102050781, -0.44141387939453125, -0.4251060485839844, -0.4087982177734375, -0.3924903869628906, -0.37618255615234375, -0.3598747253417969, -0.34356689453125, -0.3272590637207031, -0.31095123291015625, -0.2946434020996094, -0.2783355712890625, -0.2620277404785156, -0.24571990966796875, -0.22941207885742188, -0.213104248046875, -0.19679641723632812, -0.18048858642578125, -0.16418075561523438, -0.1478729248046875, -0.13156509399414062, -0.11525726318359375, -0.09894943237304688, -0.0826416015625, -0.06633377075195312, -0.05002593994140625, -0.033718109130859375, -0.0174102783203125, -0.001102447509765625, 0.01520538330078125, 0.031513214111328125, 0.047821044921875, 0.06412887573242188, 0.08043670654296875, 0.09674453735351562, 0.1130523681640625, 0.12936019897460938, 0.14566802978515625, 0.16197586059570312, 0.17828369140625, 0.19459152221679688, 0.21089935302734375, 0.22720718383789062, 0.2435150146484375, 0.2598228454589844, 0.27613067626953125, 0.2924385070800781, 0.308746337890625, 0.3250541687011719, 0.34136199951171875, 0.3576698303222656, 0.3739776611328125, 0.3902854919433594, 0.40659332275390625, 0.4229011535644531, 0.439208984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 9.0, 10.0, 11.0, 18.0, 21.0, 29.0, 57.0, 71.0, 109.0, 165.0, 245.0, 417.0, 629.0, 659.0, 574.0, 357.0, 225.0, 138.0, 116.0, 74.0, 36.0, 34.0, 18.0, 15.0, 9.0, 11.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3744850158691406, -0.36127471923828125, -0.3480644226074219, -0.3348541259765625, -0.3216438293457031, -0.30843353271484375, -0.2952232360839844, -0.282012939453125, -0.2688026428222656, -0.25559234619140625, -0.24238204956054688, -0.2291717529296875, -0.21596145629882812, -0.20275115966796875, -0.18954086303710938, -0.17633056640625, -0.16312026977539062, -0.14990997314453125, -0.13669967651367188, -0.1234893798828125, -0.11027908325195312, -0.09706878662109375, -0.08385848999023438, -0.070648193359375, -0.057437896728515625, -0.04422760009765625, -0.031017303466796875, -0.0178070068359375, -0.004596710205078125, 0.00861358642578125, 0.021823883056640625, 0.0350341796875, 0.048244476318359375, 0.06145477294921875, 0.07466506958007812, 0.0878753662109375, 0.10108566284179688, 0.11429595947265625, 0.12750625610351562, 0.140716552734375, 0.15392684936523438, 0.16713714599609375, 0.18034744262695312, 0.1935577392578125, 0.20676803588867188, 0.21997833251953125, 0.23318862915039062, 0.24639892578125, 0.2596092224121094, 0.27281951904296875, 0.2860298156738281, 0.2992401123046875, 0.3124504089355469, 0.32566070556640625, 0.3388710021972656, 0.352081298828125, 0.3652915954589844, 0.37850189208984375, 0.3917121887207031, 0.4049224853515625, 0.4181327819824219, 0.43134307861328125, 0.4445533752441406, 0.457763671875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 11.0, 7.0, 15.0, 24.0, 75.0, 145.0, 234.0, 268.0, 119.0, 54.0, 20.0, 10.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.050366401672363, -5.881232261657715, -5.712097644805908, -5.542963027954102, -5.373828887939453, -5.204694747924805, -5.035560131072998, -4.866425514221191, -4.697291374206543, -4.5281572341918945, -4.359022617340088, -4.189888000488281, -4.020753860473633, -3.8516194820404053, -3.6824851036071777, -3.51335072517395, -3.3442163467407227, -3.175081968307495, -3.0059475898742676, -2.83681321144104, -2.6676788330078125, -2.498544454574585, -2.3294100761413574, -2.16027569770813, -1.9911413192749023, -1.8220069408416748, -1.6528725624084473, -1.4837381839752197, -1.3146038055419922, -1.1454694271087646, -0.9763350486755371, -0.8072006702423096, -0.6380658149719238, -0.4689314365386963, -0.29979705810546875, -0.1306626796722412, 0.03847169876098633, 0.20760607719421387, 0.3767404556274414, 0.545874834060669, 0.7150092124938965, 0.884143590927124, 1.0532779693603516, 1.222412347793579, 1.3915467262268066, 1.5606811046600342, 1.7298154830932617, 1.8989498615264893, 2.068084239959717, 2.2372186183929443, 2.406352996826172, 2.5754873752593994, 2.744621753692627, 2.9137561321258545, 3.082890510559082, 3.2520248889923096, 3.421159267425537, 3.5902936458587646, 3.759428024291992, 3.9285624027252197, 4.097696781158447, 4.266831398010254, 4.435965538024902, 4.605099678039551, 4.774234294891357]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 12.0, 32.0, 22.0, 23.0, 39.0, 51.0, 60.0, 56.0, 76.0, 83.0, 68.0, 63.0, 70.0, 58.0, 61.0, 49.0, 41.0, 34.0, 21.0, 20.0, 15.0, 11.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8514225482940674, -2.7698893547058105, -2.6883559226989746, -2.6068227291107178, -2.525289297103882, -2.443756103515625, -2.362222671508789, -2.2806894779205322, -2.1991562843322754, -2.1176230907440186, -2.0360896587371826, -1.9545563459396362, -1.8730230331420898, -1.791489839553833, -1.7099565267562866, -1.6284232139587402, -1.5468897819519043, -1.465356469154358, -1.3838231563568115, -1.3022898435592651, -1.2207565307617188, -1.139223337173462, -1.0576900243759155, -0.9761567115783691, -0.8946233987808228, -0.8130900859832764, -0.73155677318573, -0.6500235199928284, -0.568490207195282, -0.4869568943977356, -0.4054236114025116, -0.3238903284072876, -0.2423572540283203, -0.16082395613193512, -0.07929065823554993, 0.002242639660835266, 0.08377593755722046, 0.16530925035476685, 0.24684253334999084, 0.32837581634521484, 0.40990912914276123, 0.4914424419403076, 0.572975754737854, 0.6545090079307556, 0.736042320728302, 0.8175756335258484, 0.89910888671875, 0.9806421995162964, 1.0621755123138428, 1.1437088251113892, 1.2252421379089355, 1.306775450706482, 1.3883087635040283, 1.4698419570922852, 1.5513752698898315, 1.632908582687378, 1.7144418954849243, 1.7959752082824707, 1.877508521080017, 1.9590418338775635, 2.0405750274658203, 2.1221084594726562, 2.203641653060913, 2.28517484664917, 2.366708278656006]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 6.0, 6.0, 10.0, 8.0, 8.0, 13.0, 19.0, 28.0, 53.0, 73.0, 110.0, 229.0, 435.0, 868.0, 1704.0, 3894.0, 10015.0, 37642.0, 233447.0, 573683.0, 146493.0, 25954.0, 7733.0, 3159.0, 1415.0, 691.0, 355.0, 205.0, 91.0, 62.0, 47.0, 31.0, 18.0, 11.0, 12.0, 6.0, 4.0, 6.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.399658203125, -0.38924407958984375, -0.3788299560546875, -0.36841583251953125, -0.358001708984375, -0.34758758544921875, -0.3371734619140625, -0.32675933837890625, -0.31634521484375, -0.30593109130859375, -0.2955169677734375, -0.28510284423828125, -0.274688720703125, -0.26427459716796875, -0.2538604736328125, -0.24344635009765625, -0.2330322265625, -0.22261810302734375, -0.2122039794921875, -0.20178985595703125, -0.191375732421875, -0.18096160888671875, -0.1705474853515625, -0.16013336181640625, -0.14971923828125, -0.13930511474609375, -0.1288909912109375, -0.11847686767578125, -0.108062744140625, -0.09764862060546875, -0.0872344970703125, -0.07682037353515625, -0.06640625, -0.05599212646484375, -0.0455780029296875, -0.03516387939453125, -0.024749755859375, -0.01433563232421875, -0.0039215087890625, 0.00649261474609375, 0.01690673828125, 0.02732086181640625, 0.0377349853515625, 0.04814910888671875, 0.058563232421875, 0.06897735595703125, 0.0793914794921875, 0.08980560302734375, 0.1002197265625, 0.11063385009765625, 0.1210479736328125, 0.13146209716796875, 0.141876220703125, 0.15229034423828125, 0.1627044677734375, 0.17311859130859375, 0.18353271484375, 0.19394683837890625, 0.2043609619140625, 0.21477508544921875, 0.225189208984375, 0.23560333251953125, 0.2460174560546875, 0.25643157958984375, 0.266845703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 8.0, 5.0, 6.0, 11.0, 11.0, 10.0, 15.0, 29.0, 26.0, 19.0, 26.0, 39.0, 38.0, 40.0, 34.0, 41.0, 53.0, 41.0, 48.0, 40.0, 42.0, 44.0, 40.0, 39.0, 48.0, 38.0, 24.0, 27.0, 18.0, 22.0, 22.0, 16.0, 12.0, 17.0, 6.0, 9.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1397705078125, -0.1353759765625, -0.1309814453125, -0.1265869140625, -0.1221923828125, -0.1177978515625, -0.1134033203125, -0.1090087890625, -0.1046142578125, -0.1002197265625, -0.0958251953125, -0.0914306640625, -0.0870361328125, -0.0826416015625, -0.0782470703125, -0.0738525390625, -0.0694580078125, -0.0650634765625, -0.0606689453125, -0.0562744140625, -0.0518798828125, -0.0474853515625, -0.0430908203125, -0.0386962890625, -0.0343017578125, -0.0299072265625, -0.0255126953125, -0.0211181640625, -0.0167236328125, -0.0123291015625, -0.0079345703125, -0.0035400390625, 0.0008544921875, 0.0052490234375, 0.0096435546875, 0.0140380859375, 0.0184326171875, 0.0228271484375, 0.0272216796875, 0.0316162109375, 0.0360107421875, 0.0404052734375, 0.0447998046875, 0.0491943359375, 0.0535888671875, 0.0579833984375, 0.0623779296875, 0.0667724609375, 0.0711669921875, 0.0755615234375, 0.0799560546875, 0.0843505859375, 0.0887451171875, 0.0931396484375, 0.0975341796875, 0.1019287109375, 0.1063232421875, 0.1107177734375, 0.1151123046875, 0.1195068359375, 0.1239013671875, 0.1282958984375, 0.1326904296875, 0.1370849609375, 0.1414794921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 10.0, 6.0, 14.0, 22.0, 40.0, 64.0, 97.0, 197.0, 418.0, 953.0, 2952.0, 13145.0, 192070.0, 787938.0, 42193.0, 5597.0, 1604.0, 573.0, 269.0, 162.0, 75.0, 57.0, 33.0, 13.0, 15.0, 8.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4384765625, -0.421112060546875, -0.40374755859375, -0.386383056640625, -0.3690185546875, -0.351654052734375, -0.33428955078125, -0.316925048828125, -0.299560546875, -0.282196044921875, -0.26483154296875, -0.247467041015625, -0.2301025390625, -0.212738037109375, -0.19537353515625, -0.178009033203125, -0.16064453125, -0.143280029296875, -0.12591552734375, -0.108551025390625, -0.0911865234375, -0.073822021484375, -0.05645751953125, -0.039093017578125, -0.021728515625, -0.004364013671875, 0.01300048828125, 0.030364990234375, 0.0477294921875, 0.065093994140625, 0.08245849609375, 0.099822998046875, 0.1171875, 0.134552001953125, 0.15191650390625, 0.169281005859375, 0.1866455078125, 0.204010009765625, 0.22137451171875, 0.238739013671875, 0.256103515625, 0.273468017578125, 0.29083251953125, 0.308197021484375, 0.3255615234375, 0.342926025390625, 0.36029052734375, 0.377655029296875, 0.39501953125, 0.412384033203125, 0.42974853515625, 0.447113037109375, 0.4644775390625, 0.481842041015625, 0.49920654296875, 0.516571044921875, 0.533935546875, 0.551300048828125, 0.56866455078125, 0.586029052734375, 0.6033935546875, 0.620758056640625, 0.63812255859375, 0.655487060546875, 0.6728515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 7.0, 6.0, 9.0, 8.0, 15.0, 11.0, 23.0, 24.0, 13.0, 29.0, 39.0, 31.0, 41.0, 44.0, 43.0, 45.0, 57.0, 51.0, 53.0, 53.0, 38.0, 47.0, 41.0, 39.0, 22.0, 26.0, 33.0, 23.0, 23.0, 14.0, 16.0, 13.0, 17.0, 8.0, 7.0, 5.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.5791015625, -0.5621871948242188, -0.5452728271484375, -0.5283584594726562, -0.511444091796875, -0.49452972412109375, -0.4776153564453125, -0.46070098876953125, -0.44378662109375, -0.42687225341796875, -0.4099578857421875, -0.39304351806640625, -0.376129150390625, -0.35921478271484375, -0.3423004150390625, -0.32538604736328125, -0.3084716796875, -0.29155731201171875, -0.2746429443359375, -0.25772857666015625, -0.240814208984375, -0.22389984130859375, -0.2069854736328125, -0.19007110595703125, -0.17315673828125, -0.15624237060546875, -0.1393280029296875, -0.12241363525390625, -0.105499267578125, -0.08858489990234375, -0.0716705322265625, -0.05475616455078125, -0.037841796875, -0.02092742919921875, -0.0040130615234375, 0.01290130615234375, 0.029815673828125, 0.04673004150390625, 0.0636444091796875, 0.08055877685546875, 0.09747314453125, 0.11438751220703125, 0.1313018798828125, 0.14821624755859375, 0.165130615234375, 0.18204498291015625, 0.1989593505859375, 0.21587371826171875, 0.2327880859375, 0.24970245361328125, 0.2666168212890625, 0.28353118896484375, 0.300445556640625, 0.31735992431640625, 0.3342742919921875, 0.35118865966796875, 0.36810302734375, 0.38501739501953125, 0.4019317626953125, 0.41884613037109375, 0.435760498046875, 0.45267486572265625, 0.4695892333984375, 0.48650360107421875, 0.50341796875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 10.0, 9.0, 24.0, 23.0, 28.0, 55.0, 65.0, 111.0, 192.0, 368.0, 624.0, 1454.0, 3241.0, 7488.0, 20955.0, 73703.0, 300826.0, 511000.0, 88318.0, 24669.0, 8674.0, 3438.0, 1582.0, 733.0, 376.0, 184.0, 151.0, 98.0, 54.0, 33.0, 13.0, 13.0, 15.0, 13.0, 9.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09912109375, -0.095458984375, -0.091796875, -0.088134765625, -0.08447265625, -0.080810546875, -0.0771484375, -0.073486328125, -0.06982421875, -0.066162109375, -0.0625, -0.058837890625, -0.05517578125, -0.051513671875, -0.0478515625, -0.044189453125, -0.04052734375, -0.036865234375, -0.033203125, -0.029541015625, -0.02587890625, -0.022216796875, -0.0185546875, -0.014892578125, -0.01123046875, -0.007568359375, -0.00390625, -0.000244140625, 0.00341796875, 0.007080078125, 0.0107421875, 0.014404296875, 0.01806640625, 0.021728515625, 0.025390625, 0.029052734375, 0.03271484375, 0.036376953125, 0.0400390625, 0.043701171875, 0.04736328125, 0.051025390625, 0.0546875, 0.058349609375, 0.06201171875, 0.065673828125, 0.0693359375, 0.072998046875, 0.07666015625, 0.080322265625, 0.083984375, 0.087646484375, 0.09130859375, 0.094970703125, 0.0986328125, 0.102294921875, 0.10595703125, 0.109619140625, 0.11328125, 0.116943359375, 0.12060546875, 0.124267578125, 0.1279296875, 0.131591796875, 0.13525390625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 3.0, 6.0, 8.0, 5.0, 7.0, 21.0, 18.0, 27.0, 46.0, 60.0, 60.0, 75.0, 89.0, 93.0, 94.0, 77.0, 64.0, 58.0, 45.0, 29.0, 21.0, 29.0, 13.0, 13.0, 11.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.817413330078125e-05, -5.659274756908417e-05, -5.5011361837387085e-05, -5.342997610569e-05, -5.184859037399292e-05, -5.026720464229584e-05, -4.8685818910598755e-05, -4.710443317890167e-05, -4.552304744720459e-05, -4.394166171550751e-05, -4.2360275983810425e-05, -4.077889025211334e-05, -3.919750452041626e-05, -3.761611878871918e-05, -3.6034733057022095e-05, -3.445334732532501e-05, -3.287196159362793e-05, -3.129057586193085e-05, -2.9709190130233765e-05, -2.8127804398536682e-05, -2.65464186668396e-05, -2.4965032935142517e-05, -2.3383647203445435e-05, -2.1802261471748352e-05, -2.022087574005127e-05, -1.8639490008354187e-05, -1.7058104276657104e-05, -1.5476718544960022e-05, -1.389533281326294e-05, -1.2313947081565857e-05, -1.0732561349868774e-05, -9.151175618171692e-06, -7.569789886474609e-06, -5.988404154777527e-06, -4.407018423080444e-06, -2.825632691383362e-06, -1.2442469596862793e-06, 3.371387720108032e-07, 1.9185245037078857e-06, 3.4999102354049683e-06, 5.081295967102051e-06, 6.662681698799133e-06, 8.244067430496216e-06, 9.825453162193298e-06, 1.1406838893890381e-05, 1.2988224625587463e-05, 1.4569610357284546e-05, 1.615099608898163e-05, 1.773238182067871e-05, 1.9313767552375793e-05, 2.0895153284072876e-05, 2.247653901576996e-05, 2.405792474746704e-05, 2.5639310479164124e-05, 2.7220696210861206e-05, 2.880208194255829e-05, 3.038346767425537e-05, 3.1964853405952454e-05, 3.3546239137649536e-05, 3.512762486934662e-05, 3.67090106010437e-05, 3.8290396332740784e-05, 3.9871782064437866e-05, 4.145316779613495e-05, 4.303455352783203e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 7.0, 8.0, 9.0, 17.0, 32.0, 50.0, 74.0, 149.0, 305.0, 707.0, 2069.0, 8154.0, 49308.0, 602710.0, 337911.0, 37503.0, 6521.0, 1806.0, 614.0, 286.0, 132.0, 88.0, 32.0, 22.0, 15.0, 11.0, 9.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18359375, -0.1772480010986328, -0.17090225219726562, -0.16455650329589844, -0.15821075439453125, -0.15186500549316406, -0.14551925659179688, -0.1391735076904297, -0.1328277587890625, -0.1264820098876953, -0.12013626098632812, -0.11379051208496094, -0.10744476318359375, -0.10109901428222656, -0.09475326538085938, -0.08840751647949219, -0.082061767578125, -0.07571601867675781, -0.06937026977539062, -0.06302452087402344, -0.05667877197265625, -0.05033302307128906, -0.043987274169921875, -0.03764152526855469, -0.0312957763671875, -0.024950027465820312, -0.018604278564453125, -0.012258529663085938, -0.00591278076171875, 0.0004329681396484375, 0.006778717041015625, 0.013124465942382812, 0.01947021484375, 0.025815963745117188, 0.032161712646484375, 0.03850746154785156, 0.04485321044921875, 0.05119895935058594, 0.057544708251953125, 0.06389045715332031, 0.0702362060546875, 0.07658195495605469, 0.08292770385742188, 0.08927345275878906, 0.09561920166015625, 0.10196495056152344, 0.10831069946289062, 0.11465644836425781, 0.121002197265625, 0.1273479461669922, 0.13369369506835938, 0.14003944396972656, 0.14638519287109375, 0.15273094177246094, 0.15907669067382812, 0.1654224395751953, 0.1717681884765625, 0.1781139373779297, 0.18445968627929688, 0.19080543518066406, 0.19715118408203125, 0.20349693298339844, 0.20984268188476562, 0.2161884307861328, 0.2225341796875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 16.0, 7.0, 14.0, 16.0, 17.0, 18.0, 23.0, 38.0, 37.0, 47.0, 73.0, 65.0, 74.0, 74.0, 95.0, 67.0, 55.0, 42.0, 38.0, 48.0, 26.0, 17.0, 13.0, 20.0, 12.0, 9.0, 5.0, 5.0, 2.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1212158203125, -0.11757659912109375, -0.1139373779296875, -0.11029815673828125, -0.106658935546875, -0.10301971435546875, -0.0993804931640625, -0.09574127197265625, -0.09210205078125, -0.08846282958984375, -0.0848236083984375, -0.08118438720703125, -0.077545166015625, -0.07390594482421875, -0.0702667236328125, -0.06662750244140625, -0.06298828125, -0.05934906005859375, -0.0557098388671875, -0.05207061767578125, -0.048431396484375, -0.04479217529296875, -0.0411529541015625, -0.03751373291015625, -0.03387451171875, -0.03023529052734375, -0.0265960693359375, -0.02295684814453125, -0.019317626953125, -0.01567840576171875, -0.0120391845703125, -0.00839996337890625, -0.0047607421875, -0.00112152099609375, 0.0025177001953125, 0.00615692138671875, 0.009796142578125, 0.01343536376953125, 0.0170745849609375, 0.02071380615234375, 0.02435302734375, 0.02799224853515625, 0.0316314697265625, 0.03527069091796875, 0.038909912109375, 0.04254913330078125, 0.0461883544921875, 0.04982757568359375, 0.053466796875, 0.05710601806640625, 0.0607452392578125, 0.06438446044921875, 0.068023681640625, 0.07166290283203125, 0.0753021240234375, 0.07894134521484375, 0.08258056640625, 0.08621978759765625, 0.0898590087890625, 0.09349822998046875, 0.097137451171875, 0.10077667236328125, 0.1044158935546875, 0.10805511474609375, 0.1116943359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 3.0, 4.0, 3.0, 8.0, 9.0, 19.0, 40.0, 81.0, 111.0, 248.0, 181.0, 135.0, 78.0, 34.0, 12.0, 11.0, 3.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.750999927520752, -2.6521968841552734, -2.553393840789795, -2.4545907974243164, -2.355787754058838, -2.2569847106933594, -2.158181667327881, -2.0593786239624023, -1.9605754613876343, -1.8617724180221558, -1.7629693746566772, -1.6641662120819092, -1.5653631687164307, -1.4665601253509521, -1.3677570819854736, -1.2689540386199951, -1.1701509952545166, -1.071347951889038, -0.9725449085235596, -0.8737418055534363, -0.7749387621879578, -0.6761357188224792, -0.577332615852356, -0.47852957248687744, -0.3797265291213989, -0.2809234857559204, -0.1821204125881195, -0.0833173394203186, 0.015485703945159912, 0.11428874731063843, 0.21309185028076172, 0.31189489364624023, 0.41069769859313965, 0.5095007419586182, 0.6083037853240967, 0.70710688829422, 0.8059099316596985, 0.904712975025177, 1.0035160779953003, 1.1023191213607788, 1.2011221647262573, 1.2999252080917358, 1.3987282514572144, 1.4975314140319824, 1.596334457397461, 1.6951375007629395, 1.793940544128418, 1.8927435874938965, 1.991546630859375, 2.0903496742248535, 2.189152717590332, 2.2879557609558105, 2.386758804321289, 2.4855618476867676, 2.584364891052246, 2.6831679344177246, 2.781970977783203, 2.8807740211486816, 2.97957706451416, 3.0783801078796387, 3.177183151245117, 3.2759861946105957, 3.374789237976074, 3.4735922813415527, 3.5723955631256104]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 6.0, 9.0, 9.0, 11.0, 16.0, 13.0, 30.0, 27.0, 29.0, 25.0, 43.0, 41.0, 50.0, 58.0, 78.0, 83.0, 89.0, 62.0, 49.0, 40.0, 32.0, 35.0, 21.0, 23.0, 25.0, 21.0, 14.0, 13.0, 15.0, 7.0, 6.0, 2.0, 4.0, 6.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5994820594787598, -2.5223748683929443, -2.445267677307129, -2.3681602478027344, -2.291053056716919, -2.2139458656311035, -2.136838674545288, -2.0597314834594727, -1.9826240539550781, -1.9055168628692627, -1.8284095525741577, -1.7513023614883423, -1.6741950511932373, -1.5970878601074219, -1.5199806690216064, -1.4428733587265015, -1.365766167640686, -1.2886589765548706, -1.2115516662597656, -1.1344444751739502, -1.0573371648788452, -0.9802299737930298, -0.9031227231025696, -0.8260154724121094, -0.7489082217216492, -0.671800971031189, -0.5946937203407288, -0.5175864696502686, -0.44047924876213074, -0.36337199807167053, -0.2862647771835327, -0.2091575264930725, -0.1320502758026123, -0.0549430325627327, 0.02216421067714691, 0.09927144646644592, 0.17637869715690613, 0.25348594784736633, 0.33059316873550415, 0.40770041942596436, 0.48480767011642456, 0.5619149208068848, 0.639022171497345, 0.7161294221878052, 0.7932366132736206, 0.8703439235687256, 0.947451114654541, 1.0245583057403564, 1.1016656160354614, 1.1787728071212769, 1.2558801174163818, 1.3329873085021973, 1.4100946187973022, 1.4872018098831177, 1.5643091201782227, 1.641416311264038, 1.7185235023498535, 1.795630693435669, 1.872738003730774, 1.9498451948165894, 2.0269525051116943, 2.1040596961975098, 2.181166887283325, 2.2582740783691406, 2.335381507873535]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 8.0, 3.0, 5.0, 6.0, 6.0, 8.0, 19.0, 16.0, 29.0, 37.0, 70.0, 156.0, 405.0, 1085.0, 4111.0, 19520.0, 168978.0, 2909569.0, 1017544.0, 59727.0, 9510.0, 2208.0, 721.0, 273.0, 108.0, 54.0, 21.0, 28.0, 19.0, 15.0, 4.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37939453125, -0.3684883117675781, -0.35758209228515625, -0.3466758728027344, -0.3357696533203125, -0.3248634338378906, -0.31395721435546875, -0.3030509948730469, -0.292144775390625, -0.2812385559082031, -0.27033233642578125, -0.2594261169433594, -0.2485198974609375, -0.23761367797851562, -0.22670745849609375, -0.21580123901367188, -0.20489501953125, -0.19398880004882812, -0.18308258056640625, -0.17217636108398438, -0.1612701416015625, -0.15036392211914062, -0.13945770263671875, -0.12855148315429688, -0.117645263671875, -0.10673904418945312, -0.09583282470703125, -0.08492660522460938, -0.0740203857421875, -0.06311416625976562, -0.05220794677734375, -0.041301727294921875, -0.0303955078125, -0.019489288330078125, -0.00858306884765625, 0.002323150634765625, 0.0132293701171875, 0.024135589599609375, 0.03504180908203125, 0.045948028564453125, 0.056854248046875, 0.06776046752929688, 0.07866668701171875, 0.08957290649414062, 0.1004791259765625, 0.11138534545898438, 0.12229156494140625, 0.13319778442382812, 0.14410400390625, 0.15501022338867188, 0.16591644287109375, 0.17682266235351562, 0.1877288818359375, 0.19863510131835938, 0.20954132080078125, 0.22044754028320312, 0.231353759765625, 0.24225997924804688, 0.25316619873046875, 0.2640724182128906, 0.2749786376953125, 0.2858848571777344, 0.29679107666015625, 0.3076972961425781, 0.318603515625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 1.0, 0.0, 3.0, 9.0, 4.0, 9.0, 6.0, 16.0, 15.0, 21.0, 29.0, 34.0, 33.0, 36.0, 35.0, 42.0, 42.0, 59.0, 52.0, 54.0, 46.0, 46.0, 55.0, 54.0, 50.0, 42.0, 32.0, 23.0, 18.0, 22.0, 26.0, 16.0, 17.0, 16.0, 13.0, 11.0, 2.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1429443359375, -0.13803482055664062, -0.13312530517578125, -0.12821578979492188, -0.1233062744140625, -0.11839675903320312, -0.11348724365234375, -0.10857772827148438, -0.103668212890625, -0.09875869750976562, -0.09384918212890625, -0.08893966674804688, -0.0840301513671875, -0.07912063598632812, -0.07421112060546875, -0.06930160522460938, -0.06439208984375, -0.059482574462890625, -0.05457305908203125, -0.049663543701171875, -0.0447540283203125, -0.039844512939453125, -0.03493499755859375, -0.030025482177734375, -0.025115966796875, -0.020206451416015625, -0.01529693603515625, -0.010387420654296875, -0.0054779052734375, -0.000568389892578125, 0.00434112548828125, 0.009250640869140625, 0.01416015625, 0.019069671630859375, 0.02397918701171875, 0.028888702392578125, 0.0337982177734375, 0.038707733154296875, 0.04361724853515625, 0.048526763916015625, 0.053436279296875, 0.058345794677734375, 0.06325531005859375, 0.06816482543945312, 0.0730743408203125, 0.07798385620117188, 0.08289337158203125, 0.08780288696289062, 0.09271240234375, 0.09762191772460938, 0.10253143310546875, 0.10744094848632812, 0.1123504638671875, 0.11725997924804688, 0.12216949462890625, 0.12707901000976562, 0.131988525390625, 0.13689804077148438, 0.14180755615234375, 0.14671707153320312, 0.1516265869140625, 0.15653610229492188, 0.16144561767578125, 0.16635513305664062, 0.1712646484375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 1.0, 4.0, 6.0, 11.0, 6.0, 12.0, 22.0, 33.0, 42.0, 67.0, 120.0, 234.0, 560.0, 2023.0, 11973.0, 129527.0, 3364816.0, 646010.0, 32891.0, 4237.0, 978.0, 312.0, 156.0, 82.0, 37.0, 42.0, 24.0, 8.0, 12.0, 9.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.474609375, -0.45916748046875, -0.4437255859375, -0.42828369140625, -0.412841796875, -0.39739990234375, -0.3819580078125, -0.36651611328125, -0.35107421875, -0.33563232421875, -0.3201904296875, -0.30474853515625, -0.289306640625, -0.27386474609375, -0.2584228515625, -0.24298095703125, -0.2275390625, -0.21209716796875, -0.1966552734375, -0.18121337890625, -0.165771484375, -0.15032958984375, -0.1348876953125, -0.11944580078125, -0.10400390625, -0.08856201171875, -0.0731201171875, -0.05767822265625, -0.042236328125, -0.02679443359375, -0.0113525390625, 0.00408935546875, 0.01953125, 0.03497314453125, 0.0504150390625, 0.06585693359375, 0.081298828125, 0.09674072265625, 0.1121826171875, 0.12762451171875, 0.14306640625, 0.15850830078125, 0.1739501953125, 0.18939208984375, 0.204833984375, 0.22027587890625, 0.2357177734375, 0.25115966796875, 0.2666015625, 0.28204345703125, 0.2974853515625, 0.31292724609375, 0.328369140625, 0.34381103515625, 0.3592529296875, 0.37469482421875, 0.39013671875, 0.40557861328125, 0.4210205078125, 0.43646240234375, 0.451904296875, 0.46734619140625, 0.4827880859375, 0.49822998046875, 0.513671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 15.0, 13.0, 19.0, 24.0, 37.0, 43.0, 57.0, 94.0, 126.0, 201.0, 350.0, 458.0, 539.0, 670.0, 480.0, 307.0, 196.0, 121.0, 99.0, 51.0, 55.0, 27.0, 23.0, 17.0, 9.0, 7.0, 7.0, 9.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33642578125, -0.3259239196777344, -0.31542205810546875, -0.3049201965332031, -0.2944183349609375, -0.2839164733886719, -0.27341461181640625, -0.2629127502441406, -0.252410888671875, -0.24190902709960938, -0.23140716552734375, -0.22090530395507812, -0.2104034423828125, -0.19990158081054688, -0.18939971923828125, -0.17889785766601562, -0.16839599609375, -0.15789413452148438, -0.14739227294921875, -0.13689041137695312, -0.1263885498046875, -0.11588668823242188, -0.10538482666015625, -0.09488296508789062, -0.084381103515625, -0.07387924194335938, -0.06337738037109375, -0.052875518798828125, -0.0423736572265625, -0.031871795654296875, -0.02136993408203125, -0.010868072509765625, -0.0003662109375, 0.010135650634765625, 0.02063751220703125, 0.031139373779296875, 0.0416412353515625, 0.052143096923828125, 0.06264495849609375, 0.07314682006835938, 0.083648681640625, 0.09415054321289062, 0.10465240478515625, 0.11515426635742188, 0.1256561279296875, 0.13615798950195312, 0.14665985107421875, 0.15716171264648438, 0.16766357421875, 0.17816543579101562, 0.18866729736328125, 0.19916915893554688, 0.2096710205078125, 0.22017288208007812, 0.23067474365234375, 0.24117660522460938, 0.251678466796875, 0.2621803283691406, 0.27268218994140625, 0.2831840515136719, 0.2936859130859375, 0.3041877746582031, 0.31468963623046875, 0.3251914978027344, 0.335693359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 15.0, 27.0, 143.0, 316.0, 338.0, 102.0, 32.0, 15.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.793111801147461, -11.566461563110352, -11.339810371398926, -11.113160133361816, -10.886509895324707, -10.659858703613281, -10.433208465576172, -10.206558227539062, -9.979907035827637, -9.753256797790527, -9.526605606079102, -9.299955368041992, -9.073305130004883, -8.846653938293457, -8.620003700256348, -8.393353462219238, -8.166703224182129, -7.940052509307861, -7.713402271270752, -7.486751556396484, -7.260100841522217, -7.033450603485107, -6.80679988861084, -6.5801496505737305, -6.353498458862305, -6.126847743988037, -5.900197505950928, -5.67354679107666, -5.446896076202393, -5.220245838165283, -4.993595123291016, -4.766944885253906, -4.5402936935424805, -4.313642978668213, -4.0869927406311035, -3.860342025756836, -3.6336915493011475, -3.407041072845459, -3.1803903579711914, -2.953739881515503, -2.7270894050598145, -2.500438928604126, -2.2737882137298584, -2.04713773727417, -1.8204872608184814, -1.5938366651535034, -1.3671860694885254, -1.140535593032837, -0.9138851165771484, -0.6872345805168152, -0.46058401465415955, -0.2339334487915039, -0.007282912731170654, 0.2193676233291626, 0.4460182189941406, 0.6726686954498291, 0.8993192911148071, 1.1259698867797852, 1.3526203632354736, 1.5792709589004517, 1.8059215545654297, 2.032572031021118, 2.2592225074768066, 2.485873222351074, 2.7125236988067627]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 6.0, 6.0, 5.0, 5.0, 11.0, 11.0, 12.0, 9.0, 7.0, 11.0, 18.0, 12.0, 23.0, 24.0, 24.0, 21.0, 33.0, 33.0, 39.0, 26.0, 38.0, 36.0, 22.0, 40.0, 32.0, 41.0, 32.0, 25.0, 37.0, 44.0, 28.0, 34.0, 31.0, 32.0, 23.0, 21.0, 21.0, 23.0, 16.0, 10.0, 18.0, 9.0, 10.0, 10.0, 10.0, 3.0, 4.0, 3.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0], "bins": [-1.1417587995529175, -1.106102466583252, -1.0704461336135864, -1.034789800643921, -0.9991334676742554, -0.9634771347045898, -0.9278208017349243, -0.8921644687652588, -0.8565081357955933, -0.8208518028259277, -0.7851954698562622, -0.7495391368865967, -0.7138828039169312, -0.6782264709472656, -0.6425701379776001, -0.6069138050079346, -0.5712575316429138, -0.5356011986732483, -0.49994486570358276, -0.46428853273391724, -0.4286321997642517, -0.3929758667945862, -0.35731956362724304, -0.3216632306575775, -0.286006897687912, -0.25035056471824646, -0.21469423174858093, -0.1790379136800766, -0.14338158071041107, -0.10772524774074554, -0.07206892967224121, -0.036412596702575684, -0.0007562637329101562, 0.03490006551146507, 0.0705563947558403, 0.10621272027492523, 0.14186905324459076, 0.1775253862142563, 0.21318170428276062, 0.24883803725242615, 0.2844943702220917, 0.3201507031917572, 0.35580703616142273, 0.39146333932876587, 0.4271196722984314, 0.4627760052680969, 0.49843233823776245, 0.534088671207428, 0.5697450041770935, 0.605401337146759, 0.6410576701164246, 0.6767140030860901, 0.7123703360557556, 0.7480266690254211, 0.7836829423904419, 0.8193392753601074, 0.854995608329773, 0.8906519412994385, 0.926308274269104, 0.9619646072387695, 0.9976209402084351, 1.0332772731781006, 1.0689336061477661, 1.1045899391174316, 1.1402462720870972]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 8.0, 7.0, 7.0, 14.0, 10.0, 22.0, 32.0, 40.0, 45.0, 75.0, 129.0, 186.0, 270.0, 354.0, 614.0, 953.0, 1560.0, 2932.0, 5791.0, 13231.0, 35589.0, 120050.0, 390408.0, 330964.0, 93723.0, 28747.0, 11098.0, 5143.0, 2697.0, 1392.0, 822.0, 575.0, 337.0, 241.0, 146.0, 100.0, 68.0, 50.0, 40.0, 22.0, 16.0, 13.0, 15.0, 13.0, 3.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.20849609375, -0.2017498016357422, -0.19500350952148438, -0.18825721740722656, -0.18151092529296875, -0.17476463317871094, -0.16801834106445312, -0.1612720489501953, -0.1545257568359375, -0.1477794647216797, -0.14103317260742188, -0.13428688049316406, -0.12754058837890625, -0.12079429626464844, -0.11404800415039062, -0.10730171203613281, -0.100555419921875, -0.09380912780761719, -0.08706283569335938, -0.08031654357910156, -0.07357025146484375, -0.06682395935058594, -0.060077667236328125, -0.05333137512207031, -0.0465850830078125, -0.03983879089355469, -0.033092498779296875, -0.026346206665039062, -0.01959991455078125, -0.012853622436523438, -0.006107330322265625, 0.0006389617919921875, 0.00738525390625, 0.014131546020507812, 0.020877838134765625, 0.027624130249023438, 0.03437042236328125, 0.04111671447753906, 0.047863006591796875, 0.05460929870605469, 0.0613555908203125, 0.06810188293457031, 0.07484817504882812, 0.08159446716308594, 0.08834075927734375, 0.09508705139160156, 0.10183334350585938, 0.10857963562011719, 0.115325927734375, 0.12207221984863281, 0.12881851196289062, 0.13556480407714844, 0.14231109619140625, 0.14905738830566406, 0.15580368041992188, 0.1625499725341797, 0.1692962646484375, 0.1760425567626953, 0.18278884887695312, 0.18953514099121094, 0.19628143310546875, 0.20302772521972656, 0.20977401733398438, 0.2165203094482422, 0.2232666015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 6.0, 7.0, 11.0, 16.0, 21.0, 29.0, 23.0, 24.0, 41.0, 27.0, 39.0, 35.0, 41.0, 46.0, 42.0, 53.0, 45.0, 61.0, 56.0, 56.0, 37.0, 31.0, 38.0, 39.0, 29.0, 29.0, 24.0, 16.0, 18.0, 8.0, 13.0, 5.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1436767578125, -0.13857460021972656, -0.13347244262695312, -0.1283702850341797, -0.12326812744140625, -0.11816596984863281, -0.11306381225585938, -0.10796165466308594, -0.1028594970703125, -0.09775733947753906, -0.09265518188476562, -0.08755302429199219, -0.08245086669921875, -0.07734870910644531, -0.07224655151367188, -0.06714439392089844, -0.062042236328125, -0.05694007873535156, -0.051837921142578125, -0.04673576354980469, -0.04163360595703125, -0.03653144836425781, -0.031429290771484375, -0.026327133178710938, -0.0212249755859375, -0.016122817993164062, -0.011020660400390625, -0.0059185028076171875, -0.00081634521484375, 0.0042858123779296875, 0.009387969970703125, 0.014490127563476562, 0.01959228515625, 0.024694442749023438, 0.029796600341796875, 0.03489875793457031, 0.04000091552734375, 0.04510307312011719, 0.050205230712890625, 0.05530738830566406, 0.0604095458984375, 0.06551170349121094, 0.07061386108398438, 0.07571601867675781, 0.08081817626953125, 0.08592033386230469, 0.09102249145507812, 0.09612464904785156, 0.101226806640625, 0.10632896423339844, 0.11143112182617188, 0.11653327941894531, 0.12163543701171875, 0.1267375946044922, 0.13183975219726562, 0.13694190979003906, 0.1420440673828125, 0.14714622497558594, 0.15224838256835938, 0.1573505401611328, 0.16245269775390625, 0.1675548553466797, 0.17265701293945312, 0.17775917053222656, 0.182861328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 6.0, 5.0, 15.0, 21.0, 19.0, 32.0, 31.0, 49.0, 68.0, 146.0, 206.0, 279.0, 569.0, 1157.0, 2932.0, 10884.0, 77215.0, 791950.0, 140172.0, 15867.0, 3844.0, 1451.0, 641.0, 351.0, 216.0, 136.0, 72.0, 59.0, 38.0, 35.0, 24.0, 16.0, 7.0, 13.0, 8.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.42431640625, -0.41089630126953125, -0.3974761962890625, -0.38405609130859375, -0.370635986328125, -0.35721588134765625, -0.3437957763671875, -0.33037567138671875, -0.31695556640625, -0.30353546142578125, -0.2901153564453125, -0.27669525146484375, -0.263275146484375, -0.24985504150390625, -0.2364349365234375, -0.22301483154296875, -0.2095947265625, -0.19617462158203125, -0.1827545166015625, -0.16933441162109375, -0.155914306640625, -0.14249420166015625, -0.1290740966796875, -0.11565399169921875, -0.10223388671875, -0.08881378173828125, -0.0753936767578125, -0.06197357177734375, -0.048553466796875, -0.03513336181640625, -0.0217132568359375, -0.00829315185546875, 0.005126953125, 0.01854705810546875, 0.0319671630859375, 0.04538726806640625, 0.058807373046875, 0.07222747802734375, 0.0856475830078125, 0.09906768798828125, 0.11248779296875, 0.12590789794921875, 0.1393280029296875, 0.15274810791015625, 0.166168212890625, 0.17958831787109375, 0.1930084228515625, 0.20642852783203125, 0.2198486328125, 0.23326873779296875, 0.2466888427734375, 0.26010894775390625, 0.273529052734375, 0.28694915771484375, 0.3003692626953125, 0.31378936767578125, 0.32720947265625, 0.34062957763671875, 0.3540496826171875, 0.36746978759765625, 0.380889892578125, 0.39430999755859375, 0.4077301025390625, 0.42115020751953125, 0.4345703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 8.0, 6.0, 11.0, 9.0, 15.0, 15.0, 20.0, 22.0, 33.0, 43.0, 39.0, 41.0, 54.0, 52.0, 37.0, 70.0, 64.0, 63.0, 42.0, 59.0, 43.0, 50.0, 27.0, 36.0, 25.0, 23.0, 17.0, 14.0, 17.0, 8.0, 6.0, 6.0, 2.0, 5.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59228515625, -0.5718154907226562, -0.5513458251953125, -0.5308761596679688, -0.510406494140625, -0.48993682861328125, -0.4694671630859375, -0.44899749755859375, -0.42852783203125, -0.40805816650390625, -0.3875885009765625, -0.36711883544921875, -0.346649169921875, -0.32617950439453125, -0.3057098388671875, -0.28524017333984375, -0.2647705078125, -0.24430084228515625, -0.2238311767578125, -0.20336151123046875, -0.182891845703125, -0.16242218017578125, -0.1419525146484375, -0.12148284912109375, -0.10101318359375, -0.08054351806640625, -0.0600738525390625, -0.03960418701171875, -0.019134521484375, 0.00133514404296875, 0.0218048095703125, 0.04227447509765625, 0.062744140625, 0.08321380615234375, 0.1036834716796875, 0.12415313720703125, 0.144622802734375, 0.16509246826171875, 0.1855621337890625, 0.20603179931640625, 0.22650146484375, 0.24697113037109375, 0.2674407958984375, 0.28791046142578125, 0.308380126953125, 0.32884979248046875, 0.3493194580078125, 0.36978912353515625, 0.3902587890625, 0.41072845458984375, 0.4311981201171875, 0.45166778564453125, 0.472137451171875, 0.49260711669921875, 0.5130767822265625, 0.5335464477539062, 0.55401611328125, 0.5744857788085938, 0.5949554443359375, 0.6154251098632812, 0.635894775390625, 0.6563644409179688, 0.6768341064453125, 0.6973037719726562, 0.7177734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 5.0, 10.0, 12.0, 18.0, 35.0, 55.0, 92.0, 198.0, 337.0, 653.0, 1366.0, 3278.0, 8952.0, 31766.0, 179772.0, 710198.0, 83045.0, 18403.0, 5953.0, 2254.0, 1026.0, 502.0, 248.0, 149.0, 75.0, 55.0, 38.0, 21.0, 11.0, 8.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.167236328125, -0.16318702697753906, -0.15913772583007812, -0.1550884246826172, -0.15103912353515625, -0.1469898223876953, -0.14294052124023438, -0.13889122009277344, -0.1348419189453125, -0.13079261779785156, -0.12674331665039062, -0.12269401550292969, -0.11864471435546875, -0.11459541320800781, -0.11054611206054688, -0.10649681091308594, -0.102447509765625, -0.09839820861816406, -0.09434890747070312, -0.09029960632324219, -0.08625030517578125, -0.08220100402832031, -0.07815170288085938, -0.07410240173339844, -0.0700531005859375, -0.06600379943847656, -0.061954498291015625, -0.05790519714355469, -0.05385589599609375, -0.04980659484863281, -0.045757293701171875, -0.04170799255371094, -0.03765869140625, -0.03360939025878906, -0.029560089111328125, -0.025510787963867188, -0.02146148681640625, -0.017412185668945312, -0.013362884521484375, -0.009313583374023438, -0.0052642822265625, -0.0012149810791015625, 0.002834320068359375, 0.0068836212158203125, 0.01093292236328125, 0.014982223510742188, 0.019031524658203125, 0.023080825805664062, 0.027130126953125, 0.031179428100585938, 0.035228729248046875, 0.03927803039550781, 0.04332733154296875, 0.04737663269042969, 0.051425933837890625, 0.05547523498535156, 0.0595245361328125, 0.06357383728027344, 0.06762313842773438, 0.07167243957519531, 0.07572174072265625, 0.07977104187011719, 0.08382034301757812, 0.08786964416503906, 0.0919189453125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 10.0, 14.0, 17.0, 24.0, 31.0, 65.0, 100.0, 106.0, 115.0, 129.0, 127.0, 81.0, 51.0, 32.0, 30.0, 22.0, 10.0, 5.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59687614440918e-05, -5.395989865064621e-05, -5.195103585720062e-05, -4.9942173063755035e-05, -4.793331027030945e-05, -4.592444747686386e-05, -4.3915584683418274e-05, -4.190672188997269e-05, -3.98978590965271e-05, -3.788899630308151e-05, -3.5880133509635925e-05, -3.387127071619034e-05, -3.186240792274475e-05, -2.9853545129299164e-05, -2.7844682335853577e-05, -2.583581954240799e-05, -2.3826956748962402e-05, -2.1818093955516815e-05, -1.9809231162071228e-05, -1.780036836862564e-05, -1.5791505575180054e-05, -1.3782642781734467e-05, -1.177377998828888e-05, -9.764917194843292e-06, -7.756054401397705e-06, -5.747191607952118e-06, -3.7383288145065308e-06, -1.7294660210609436e-06, 2.7939677238464355e-07, 2.2882595658302307e-06, 4.297122359275818e-06, 6.305985152721405e-06, 8.314847946166992e-06, 1.032371073961258e-05, 1.2332573533058167e-05, 1.4341436326503754e-05, 1.635029911994934e-05, 1.8359161913394928e-05, 2.0368024706840515e-05, 2.2376887500286102e-05, 2.438575029373169e-05, 2.6394613087177277e-05, 2.8403475880622864e-05, 3.041233867406845e-05, 3.242120146751404e-05, 3.4430064260959625e-05, 3.643892705440521e-05, 3.84477898478508e-05, 4.045665264129639e-05, 4.2465515434741974e-05, 4.447437822818756e-05, 4.648324102163315e-05, 4.8492103815078735e-05, 5.050096660852432e-05, 5.250982940196991e-05, 5.45186921954155e-05, 5.6527554988861084e-05, 5.853641778230667e-05, 6.054528057575226e-05, 6.255414336919785e-05, 6.456300616264343e-05, 6.657186895608902e-05, 6.858073174953461e-05, 7.05895945429802e-05, 7.259845733642578e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 7.0, 8.0, 16.0, 26.0, 43.0, 55.0, 106.0, 184.0, 319.0, 626.0, 1426.0, 3329.0, 9452.0, 34015.0, 190586.0, 695328.0, 83976.0, 18705.0, 5981.0, 2219.0, 1033.0, 453.0, 271.0, 145.0, 80.0, 56.0, 38.0, 21.0, 13.0, 7.0, 6.0, 7.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1334228515625, -0.12915802001953125, -0.1248931884765625, -0.12062835693359375, -0.116363525390625, -0.11209869384765625, -0.1078338623046875, -0.10356903076171875, -0.09930419921875, -0.09503936767578125, -0.0907745361328125, -0.08650970458984375, -0.082244873046875, -0.07798004150390625, -0.0737152099609375, -0.06945037841796875, -0.065185546875, -0.06092071533203125, -0.0566558837890625, -0.05239105224609375, -0.048126220703125, -0.04386138916015625, -0.0395965576171875, -0.03533172607421875, -0.03106689453125, -0.02680206298828125, -0.0225372314453125, -0.01827239990234375, -0.014007568359375, -0.00974273681640625, -0.0054779052734375, -0.00121307373046875, 0.0030517578125, 0.00731658935546875, 0.0115814208984375, 0.01584625244140625, 0.020111083984375, 0.02437591552734375, 0.0286407470703125, 0.03290557861328125, 0.03717041015625, 0.04143524169921875, 0.0457000732421875, 0.04996490478515625, 0.054229736328125, 0.05849456787109375, 0.0627593994140625, 0.06702423095703125, 0.0712890625, 0.07555389404296875, 0.0798187255859375, 0.08408355712890625, 0.088348388671875, 0.09261322021484375, 0.0968780517578125, 0.10114288330078125, 0.10540771484375, 0.10967254638671875, 0.1139373779296875, 0.11820220947265625, 0.122467041015625, 0.12673187255859375, 0.1309967041015625, 0.13526153564453125, 0.1395263671875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 2.0, 8.0, 11.0, 8.0, 13.0, 25.0, 16.0, 25.0, 26.0, 44.0, 48.0, 70.0, 84.0, 102.0, 92.0, 105.0, 73.0, 59.0, 45.0, 26.0, 24.0, 16.0, 14.0, 12.0, 5.0, 6.0, 5.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09637451171875, -0.0927896499633789, -0.08920478820800781, -0.08561992645263672, -0.08203506469726562, -0.07845020294189453, -0.07486534118652344, -0.07128047943115234, -0.06769561767578125, -0.06411075592041016, -0.06052589416503906, -0.05694103240966797, -0.053356170654296875, -0.04977130889892578, -0.04618644714355469, -0.042601585388183594, -0.0390167236328125, -0.035431861877441406, -0.03184700012207031, -0.02826213836669922, -0.024677276611328125, -0.02109241485595703, -0.017507553100585938, -0.013922691345214844, -0.01033782958984375, -0.006752967834472656, -0.0031681060791015625, 0.00041675567626953125, 0.004001617431640625, 0.007586479187011719, 0.011171340942382812, 0.014756202697753906, 0.018341064453125, 0.021925926208496094, 0.025510787963867188, 0.02909564971923828, 0.032680511474609375, 0.03626537322998047, 0.03985023498535156, 0.043435096740722656, 0.04701995849609375, 0.050604820251464844, 0.05418968200683594, 0.05777454376220703, 0.061359405517578125, 0.06494426727294922, 0.06852912902832031, 0.0721139907836914, 0.0756988525390625, 0.0792837142944336, 0.08286857604980469, 0.08645343780517578, 0.09003829956054688, 0.09362316131591797, 0.09720802307128906, 0.10079288482666016, 0.10437774658203125, 0.10796260833740234, 0.11154747009277344, 0.11513233184814453, 0.11871719360351562, 0.12230205535888672, 0.1258869171142578, 0.1294717788696289, 0.133056640625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 9.0, 15.0, 18.0, 53.0, 117.0, 191.0, 297.0, 151.0, 72.0, 28.0, 22.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9592761993408203, -1.8519467115402222, -1.744617223739624, -1.6372878551483154, -1.5299582481384277, -1.4226288795471191, -1.315299391746521, -1.2079699039459229, -1.1006404161453247, -0.9933109283447266, -0.8859814405441284, -0.778652012348175, -0.6713225245475769, -0.5639930367469788, -0.4566636085510254, -0.34933412075042725, -0.2420046329498291, -0.13467516005039215, -0.0273456871509552, 0.07998377084732056, 0.1873132586479187, 0.29464274644851685, 0.4019721746444702, 0.5093016624450684, 0.6166311502456665, 0.7239606380462646, 0.8312901258468628, 0.9386195540428162, 1.0459489822387695, 1.1532785892486572, 1.2606079578399658, 1.367937445640564, 1.475266933441162, 1.5825964212417603, 1.6899259090423584, 1.797255277633667, 1.9045848846435547, 2.0119142532348633, 2.119243621826172, 2.2265732288360596, 2.3339028358459473, 2.441232204437256, 2.5485618114471436, 2.655891180038452, 2.76322078704834, 2.8705501556396484, 2.977879524230957, 3.0852091312408447, 3.1925384998321533, 3.299867868423462, 3.4071974754333496, 3.514526844024658, 3.621856451034546, 3.7291858196258545, 3.836515426635742, 3.943844795227051, 4.051174163818359, 4.158503532409668, 4.265832901000977, 4.373162746429443, 4.480492115020752, 4.5878214836120605, 4.695150852203369, 4.802480697631836, 4.9098100662231445]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 7.0, 4.0, 11.0, 5.0, 9.0, 18.0, 18.0, 17.0, 28.0, 33.0, 24.0, 27.0, 41.0, 39.0, 60.0, 102.0, 103.0, 91.0, 52.0, 50.0, 34.0, 28.0, 28.0, 30.0, 25.0, 16.0, 22.0, 17.0, 13.0, 9.0, 11.0, 5.0, 7.0, 4.0, 1.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.645404100418091, -2.5691723823547363, -2.4929404258728027, -2.4167087078094482, -2.3404769897460938, -2.26424503326416, -2.1880133152008057, -2.111781597137451, -2.0355496406555176, -1.9593178033828735, -1.8830859661102295, -1.806854248046875, -1.730622410774231, -1.654390573501587, -1.5781588554382324, -1.5019270181655884, -1.4256951808929443, -1.3494633436203003, -1.2732315063476562, -1.1969997882843018, -1.1207679510116577, -1.0445361137390137, -0.9683043360710144, -0.8920725584030151, -0.8158407211303711, -0.739608883857727, -0.6633771061897278, -0.5871453285217285, -0.5109134912490845, -0.4346816837787628, -0.35844987630844116, -0.2822180986404419, -0.20598649978637695, -0.1297546923160553, -0.05352288484573364, 0.022708922624588013, 0.09894073009490967, 0.17517253756523132, 0.251404345035553, 0.32763612270355225, 0.4038679599761963, 0.48009976744651794, 0.5563315749168396, 0.6325633525848389, 0.7087951898574829, 0.785027027130127, 0.8612588047981262, 0.9374905824661255, 1.0137224197387695, 1.0899542570114136, 1.1661860942840576, 1.242417812347412, 1.3186496496200562, 1.3948814868927002, 1.4711132049560547, 1.5473450422286987, 1.6235768795013428, 1.6998087167739868, 1.7760405540466309, 1.8522722721099854, 1.9285041093826294, 2.0047359466552734, 2.080967664718628, 2.1571993827819824, 2.233431339263916]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 4.0, 6.0, 10.0, 20.0, 12.0, 32.0, 43.0, 39.0, 112.0, 186.0, 403.0, 872.0, 2054.0, 5017.0, 14696.0, 53734.0, 295129.0, 1985511.0, 1560115.0, 216967.0, 40617.0, 11464.0, 3884.0, 1656.0, 715.0, 360.0, 197.0, 106.0, 63.0, 58.0, 31.0, 30.0, 24.0, 22.0, 14.0, 5.0, 8.0, 10.0, 11.0, 9.0, 4.0, 5.0, 2.0, 5.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1776123046875, -0.1704845428466797, -0.16335678100585938, -0.15622901916503906, -0.14910125732421875, -0.14197349548339844, -0.13484573364257812, -0.1277179718017578, -0.1205902099609375, -0.11346244812011719, -0.10633468627929688, -0.09920692443847656, -0.09207916259765625, -0.08495140075683594, -0.07782363891601562, -0.07069587707519531, -0.063568115234375, -0.05644035339355469, -0.049312591552734375, -0.04218482971191406, -0.03505706787109375, -0.027929306030273438, -0.020801544189453125, -0.013673782348632812, -0.0065460205078125, 0.0005817413330078125, 0.007709503173828125, 0.014837265014648438, 0.02196502685546875, 0.029092788696289062, 0.036220550537109375, 0.04334831237792969, 0.05047607421875, 0.05760383605957031, 0.06473159790039062, 0.07185935974121094, 0.07898712158203125, 0.08611488342285156, 0.09324264526367188, 0.10037040710449219, 0.1074981689453125, 0.11462593078613281, 0.12175369262695312, 0.12888145446777344, 0.13600921630859375, 0.14313697814941406, 0.15026473999023438, 0.1573925018310547, 0.164520263671875, 0.1716480255126953, 0.17877578735351562, 0.18590354919433594, 0.19303131103515625, 0.20015907287597656, 0.20728683471679688, 0.2144145965576172, 0.2215423583984375, 0.2286701202392578, 0.23579788208007812, 0.24292564392089844, 0.25005340576171875, 0.25718116760253906, 0.2643089294433594, 0.2714366912841797, 0.278564453125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 6.0, 8.0, 15.0, 19.0, 15.0, 16.0, 26.0, 34.0, 28.0, 34.0, 37.0, 37.0, 44.0, 49.0, 31.0, 53.0, 60.0, 42.0, 51.0, 51.0, 56.0, 37.0, 33.0, 43.0, 37.0, 23.0, 23.0, 24.0, 12.0, 9.0, 8.0, 3.0, 6.0, 7.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1328125, -0.127838134765625, -0.12286376953125, -0.117889404296875, -0.1129150390625, -0.107940673828125, -0.10296630859375, -0.097991943359375, -0.093017578125, -0.088043212890625, -0.08306884765625, -0.078094482421875, -0.0731201171875, -0.068145751953125, -0.06317138671875, -0.058197021484375, -0.05322265625, -0.048248291015625, -0.04327392578125, -0.038299560546875, -0.0333251953125, -0.028350830078125, -0.02337646484375, -0.018402099609375, -0.013427734375, -0.008453369140625, -0.00347900390625, 0.001495361328125, 0.0064697265625, 0.011444091796875, 0.01641845703125, 0.021392822265625, 0.0263671875, 0.031341552734375, 0.03631591796875, 0.041290283203125, 0.0462646484375, 0.051239013671875, 0.05621337890625, 0.061187744140625, 0.066162109375, 0.071136474609375, 0.07611083984375, 0.081085205078125, 0.0860595703125, 0.091033935546875, 0.09600830078125, 0.100982666015625, 0.10595703125, 0.110931396484375, 0.11590576171875, 0.120880126953125, 0.1258544921875, 0.130828857421875, 0.13580322265625, 0.140777587890625, 0.145751953125, 0.150726318359375, 0.15570068359375, 0.160675048828125, 0.1656494140625, 0.170623779296875, 0.17559814453125, 0.180572509765625, 0.185546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 4.0, 11.0, 6.0, 12.0, 13.0, 15.0, 33.0, 39.0, 58.0, 96.0, 162.0, 300.0, 777.0, 2368.0, 10195.0, 72270.0, 1555945.0, 2433734.0, 101017.0, 12807.0, 2691.0, 852.0, 341.0, 172.0, 107.0, 58.0, 47.0, 33.0, 27.0, 18.0, 17.0, 9.0, 12.0, 6.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.443359375, -0.43071746826171875, -0.4180755615234375, -0.40543365478515625, -0.392791748046875, -0.38014984130859375, -0.3675079345703125, -0.35486602783203125, -0.34222412109375, -0.32958221435546875, -0.3169403076171875, -0.30429840087890625, -0.291656494140625, -0.27901458740234375, -0.2663726806640625, -0.25373077392578125, -0.2410888671875, -0.22844696044921875, -0.2158050537109375, -0.20316314697265625, -0.190521240234375, -0.17787933349609375, -0.1652374267578125, -0.15259552001953125, -0.13995361328125, -0.12731170654296875, -0.1146697998046875, -0.10202789306640625, -0.089385986328125, -0.07674407958984375, -0.0641021728515625, -0.05146026611328125, -0.038818359375, -0.02617645263671875, -0.0135345458984375, -0.00089263916015625, 0.011749267578125, 0.02439117431640625, 0.0370330810546875, 0.04967498779296875, 0.06231689453125, 0.07495880126953125, 0.0876007080078125, 0.10024261474609375, 0.112884521484375, 0.12552642822265625, 0.1381683349609375, 0.15081024169921875, 0.1634521484375, 0.17609405517578125, 0.1887359619140625, 0.20137786865234375, 0.214019775390625, 0.22666168212890625, 0.2393035888671875, 0.25194549560546875, 0.26458740234375, 0.27722930908203125, 0.2898712158203125, 0.30251312255859375, 0.315155029296875, 0.32779693603515625, 0.3404388427734375, 0.35308074951171875, 0.36572265625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 11.0, 4.0, 10.0, 5.0, 11.0, 17.0, 19.0, 28.0, 23.0, 41.0, 55.0, 64.0, 98.0, 118.0, 160.0, 220.0, 307.0, 383.0, 507.0, 439.0, 404.0, 276.0, 207.0, 182.0, 117.0, 79.0, 65.0, 62.0, 31.0, 31.0, 21.0, 15.0, 14.0, 5.0, 9.0, 8.0, 7.0, 5.0, 1.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.276123046875, -0.2682323455810547, -0.2603416442871094, -0.25245094299316406, -0.24456024169921875, -0.23666954040527344, -0.22877883911132812, -0.2208881378173828, -0.2129974365234375, -0.2051067352294922, -0.19721603393554688, -0.18932533264160156, -0.18143463134765625, -0.17354393005371094, -0.16565322875976562, -0.1577625274658203, -0.149871826171875, -0.1419811248779297, -0.13409042358398438, -0.12619972229003906, -0.11830902099609375, -0.11041831970214844, -0.10252761840820312, -0.09463691711425781, -0.0867462158203125, -0.07885551452636719, -0.07096481323242188, -0.06307411193847656, -0.05518341064453125, -0.04729270935058594, -0.039402008056640625, -0.03151130676269531, -0.02362060546875, -0.015729904174804688, -0.007839202880859375, 5.14984130859375e-05, 0.00794219970703125, 0.015832901000976562, 0.023723602294921875, 0.03161430358886719, 0.0395050048828125, 0.04739570617675781, 0.055286407470703125, 0.06317710876464844, 0.07106781005859375, 0.07895851135253906, 0.08684921264648438, 0.09473991394042969, 0.102630615234375, 0.11052131652832031, 0.11841201782226562, 0.12630271911621094, 0.13419342041015625, 0.14208412170410156, 0.14997482299804688, 0.1578655242919922, 0.1657562255859375, 0.1736469268798828, 0.18153762817382812, 0.18942832946777344, 0.19731903076171875, 0.20520973205566406, 0.21310043334960938, 0.2209911346435547, 0.2288818359375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 8.0, 8.0, 4.0, 16.0, 28.0, 56.0, 67.0, 87.0, 118.0, 136.0, 134.0, 115.0, 75.0, 52.0, 29.0, 20.0, 11.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1091694831848145, -2.0345773696899414, -1.9599854946136475, -1.8853933811187744, -1.810801386833191, -1.7362093925476074, -1.6616172790527344, -1.5870252847671509, -1.5124332904815674, -1.4378412961959839, -1.3632493019104004, -1.2886571884155273, -1.2140651941299438, -1.1394731998443604, -1.0648810863494873, -0.9902890920639038, -0.9156970977783203, -0.8411051034927368, -0.7665130496025085, -0.6919209957122803, -0.6173290014266968, -0.5427370071411133, -0.468144953250885, -0.39355289936065674, -0.31896090507507324, -0.24436888098716736, -0.16977685689926147, -0.09518483281135559, -0.020592808723449707, 0.05399921536445618, 0.12859123945236206, 0.20318329334259033, 0.27777528762817383, 0.3523673117160797, 0.4269593358039856, 0.5015513896942139, 0.5761433839797974, 0.6507353782653809, 0.7253274321556091, 0.7999194860458374, 0.8745114803314209, 0.9491034746170044, 1.023695468902588, 1.098287582397461, 1.1728795766830444, 1.247471570968628, 1.322063684463501, 1.3966556787490845, 1.471247673034668, 1.5458396673202515, 1.620431661605835, 1.695023775100708, 1.7696157693862915, 1.844207763671875, 1.918799877166748, 1.9933918714523315, 2.067983865737915, 2.142575979232788, 2.217167854309082, 2.291759967803955, 2.366352081298828, 2.440943956375122, 2.515536069869995, 2.590127944946289, 2.664720058441162]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 4.0, 3.0, 11.0, 13.0, 17.0, 16.0, 33.0, 41.0, 28.0, 47.0, 50.0, 67.0, 49.0, 44.0, 46.0, 51.0, 52.0, 60.0, 69.0, 48.0, 48.0, 31.0, 36.0, 25.0, 24.0, 23.0, 15.0, 14.0, 4.0, 8.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6510562896728516, -1.595447063446045, -1.5398379564285278, -1.4842288494110107, -1.428619623184204, -1.3730103969573975, -1.3174012899398804, -1.2617921829223633, -1.2061829566955566, -1.15057373046875, -1.094964623451233, -1.0393555164337158, -0.9837462902069092, -0.9281371235847473, -0.8725279569625854, -0.8169187903404236, -0.7613096237182617, -0.7057004570960999, -0.650091290473938, -0.5944821238517761, -0.5388729572296143, -0.4832637906074524, -0.4276546239852905, -0.37204545736312866, -0.3164362907409668, -0.26082712411880493, -0.20521795749664307, -0.1496087908744812, -0.09399962425231934, -0.03839045763015747, 0.017218708992004395, 0.07282787561416626, 0.12843692302703857, 0.18404608964920044, 0.2396552562713623, 0.29526442289352417, 0.35087358951568604, 0.4064827561378479, 0.46209192276000977, 0.5177010893821716, 0.5733102560043335, 0.6289194226264954, 0.6845285892486572, 0.7401377558708191, 0.795746922492981, 0.8513560891151428, 0.9069652557373047, 0.9625744223594666, 1.0181835889816284, 1.0737926959991455, 1.1294019222259521, 1.1850111484527588, 1.2406202554702759, 1.296229362487793, 1.3518385887145996, 1.4074478149414062, 1.4630569219589233, 1.5186660289764404, 1.574275255203247, 1.6298844814300537, 1.6854935884475708, 1.741102695465088, 1.7967119216918945, 1.8523211479187012, 1.9079302549362183]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 14.0, 13.0, 24.0, 28.0, 36.0, 59.0, 98.0, 154.0, 273.0, 502.0, 959.0, 1836.0, 4151.0, 10276.0, 28209.0, 91262.0, 354952.0, 398920.0, 104578.0, 31777.0, 11322.0, 4740.0, 2070.0, 1050.0, 496.0, 280.0, 168.0, 125.0, 67.0, 39.0, 27.0, 15.0, 8.0, 9.0, 7.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2366943359375, -0.2288188934326172, -0.22094345092773438, -0.21306800842285156, -0.20519256591796875, -0.19731712341308594, -0.18944168090820312, -0.1815662384033203, -0.1736907958984375, -0.1658153533935547, -0.15793991088867188, -0.15006446838378906, -0.14218902587890625, -0.13431358337402344, -0.12643814086914062, -0.11856269836425781, -0.110687255859375, -0.10281181335449219, -0.09493637084960938, -0.08706092834472656, -0.07918548583984375, -0.07131004333496094, -0.06343460083007812, -0.05555915832519531, -0.0476837158203125, -0.03980827331542969, -0.031932830810546875, -0.024057388305664062, -0.01618194580078125, -0.008306503295898438, -0.000431060791015625, 0.0074443817138671875, 0.01531982421875, 0.023195266723632812, 0.031070709228515625, 0.03894615173339844, 0.04682159423828125, 0.05469703674316406, 0.06257247924804688, 0.07044792175292969, 0.0783233642578125, 0.08619880676269531, 0.09407424926757812, 0.10194969177246094, 0.10982513427734375, 0.11770057678222656, 0.12557601928710938, 0.1334514617919922, 0.141326904296875, 0.1492023468017578, 0.15707778930664062, 0.16495323181152344, 0.17282867431640625, 0.18070411682128906, 0.18857955932617188, 0.1964550018310547, 0.2043304443359375, 0.2122058868408203, 0.22008132934570312, 0.22795677185058594, 0.23583221435546875, 0.24370765686035156, 0.2515830993652344, 0.2594585418701172, 0.267333984375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 6.0, 5.0, 5.0, 6.0, 6.0, 6.0, 14.0, 7.0, 22.0, 16.0, 23.0, 28.0, 27.0, 21.0, 26.0, 30.0, 41.0, 39.0, 50.0, 38.0, 31.0, 39.0, 39.0, 58.0, 55.0, 38.0, 42.0, 43.0, 34.0, 33.0, 29.0, 29.0, 18.0, 23.0, 11.0, 12.0, 9.0, 6.0, 9.0, 10.0, 7.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1270751953125, -0.12250709533691406, -0.11793899536132812, -0.11337089538574219, -0.10880279541015625, -0.10423469543457031, -0.09966659545898438, -0.09509849548339844, -0.0905303955078125, -0.08596229553222656, -0.08139419555664062, -0.07682609558105469, -0.07225799560546875, -0.06768989562988281, -0.06312179565429688, -0.05855369567871094, -0.053985595703125, -0.04941749572753906, -0.044849395751953125, -0.04028129577636719, -0.03571319580078125, -0.031145095825195312, -0.026576995849609375, -0.022008895874023438, -0.0174407958984375, -0.012872695922851562, -0.008304595947265625, -0.0037364959716796875, 0.00083160400390625, 0.0053997039794921875, 0.009967803955078125, 0.014535903930664062, 0.01910400390625, 0.023672103881835938, 0.028240203857421875, 0.03280830383300781, 0.03737640380859375, 0.04194450378417969, 0.046512603759765625, 0.05108070373535156, 0.0556488037109375, 0.06021690368652344, 0.06478500366210938, 0.06935310363769531, 0.07392120361328125, 0.07848930358886719, 0.08305740356445312, 0.08762550354003906, 0.092193603515625, 0.09676170349121094, 0.10132980346679688, 0.10589790344238281, 0.11046600341796875, 0.11503410339355469, 0.11960220336914062, 0.12417030334472656, 0.1287384033203125, 0.13330650329589844, 0.13787460327148438, 0.1424427032470703, 0.14701080322265625, 0.1515789031982422, 0.15614700317382812, 0.16071510314941406, 0.165283203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 2.0, 2.0, 5.0, 4.0, 6.0, 9.0, 7.0, 14.0, 18.0, 27.0, 46.0, 69.0, 96.0, 136.0, 224.0, 366.0, 629.0, 1295.0, 3302.0, 11767.0, 74097.0, 798402.0, 132942.0, 17000.0, 4407.0, 1621.0, 751.0, 476.0, 280.0, 172.0, 126.0, 85.0, 47.0, 25.0, 19.0, 20.0, 15.0, 11.0, 6.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.45751953125, -0.4439125061035156, -0.43030548095703125, -0.4166984558105469, -0.4030914306640625, -0.3894844055175781, -0.37587738037109375, -0.3622703552246094, -0.348663330078125, -0.3350563049316406, -0.32144927978515625, -0.3078422546386719, -0.2942352294921875, -0.2806282043457031, -0.26702117919921875, -0.2534141540527344, -0.23980712890625, -0.22620010375976562, -0.21259307861328125, -0.19898605346679688, -0.1853790283203125, -0.17177200317382812, -0.15816497802734375, -0.14455795288085938, -0.130950927734375, -0.11734390258789062, -0.10373687744140625, -0.09012985229492188, -0.0765228271484375, -0.06291580200195312, -0.04930877685546875, -0.035701751708984375, -0.0220947265625, -0.008487701416015625, 0.00511932373046875, 0.018726348876953125, 0.0323333740234375, 0.045940399169921875, 0.05954742431640625, 0.07315444946289062, 0.086761474609375, 0.10036849975585938, 0.11397552490234375, 0.12758255004882812, 0.1411895751953125, 0.15479660034179688, 0.16840362548828125, 0.18201065063476562, 0.19561767578125, 0.20922470092773438, 0.22283172607421875, 0.23643875122070312, 0.2500457763671875, 0.2636528015136719, 0.27725982666015625, 0.2908668518066406, 0.304473876953125, 0.3180809020996094, 0.33168792724609375, 0.3452949523925781, 0.3589019775390625, 0.3725090026855469, 0.38611602783203125, 0.3997230529785156, 0.413330078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 10.0, 1.0, 7.0, 13.0, 23.0, 16.0, 12.0, 20.0, 28.0, 31.0, 33.0, 36.0, 49.0, 36.0, 55.0, 60.0, 62.0, 51.0, 59.0, 56.0, 46.0, 42.0, 28.0, 47.0, 31.0, 28.0, 31.0, 22.0, 8.0, 10.0, 11.0, 7.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.7158203125, -0.6964263916015625, -0.677032470703125, -0.6576385498046875, -0.63824462890625, -0.6188507080078125, -0.599456787109375, -0.5800628662109375, -0.5606689453125, -0.5412750244140625, -0.521881103515625, -0.5024871826171875, -0.48309326171875, -0.4636993408203125, -0.444305419921875, -0.4249114990234375, -0.405517578125, -0.3861236572265625, -0.366729736328125, -0.3473358154296875, -0.32794189453125, -0.3085479736328125, -0.289154052734375, -0.2697601318359375, -0.2503662109375, -0.2309722900390625, -0.211578369140625, -0.1921844482421875, -0.17279052734375, -0.1533966064453125, -0.134002685546875, -0.1146087646484375, -0.09521484375, -0.0758209228515625, -0.056427001953125, -0.0370330810546875, -0.01763916015625, 0.0017547607421875, 0.021148681640625, 0.0405426025390625, 0.0599365234375, 0.0793304443359375, 0.098724365234375, 0.1181182861328125, 0.13751220703125, 0.1569061279296875, 0.176300048828125, 0.1956939697265625, 0.215087890625, 0.2344818115234375, 0.253875732421875, 0.2732696533203125, 0.29266357421875, 0.3120574951171875, 0.331451416015625, 0.3508453369140625, 0.3702392578125, 0.3896331787109375, 0.409027099609375, 0.4284210205078125, 0.44781494140625, 0.4672088623046875, 0.486602783203125, 0.5059967041015625, 0.525390625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 10.0, 20.0, 17.0, 36.0, 52.0, 86.0, 128.0, 227.0, 408.0, 773.0, 1749.0, 4377.0, 12799.0, 48759.0, 425663.0, 483622.0, 49158.0, 12777.0, 4318.0, 1709.0, 840.0, 421.0, 213.0, 138.0, 73.0, 47.0, 35.0, 25.0, 12.0, 13.0, 8.0, 8.0, 5.0, 8.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.102294921875, -0.09899520874023438, -0.09569549560546875, -0.09239578247070312, -0.0890960693359375, -0.08579635620117188, -0.08249664306640625, -0.07919692993164062, -0.075897216796875, -0.07259750366210938, -0.06929779052734375, -0.06599807739257812, -0.0626983642578125, -0.059398651123046875, -0.05609893798828125, -0.052799224853515625, -0.04949951171875, -0.046199798583984375, -0.04290008544921875, -0.039600372314453125, -0.0363006591796875, -0.033000946044921875, -0.02970123291015625, -0.026401519775390625, -0.023101806640625, -0.019802093505859375, -0.01650238037109375, -0.013202667236328125, -0.0099029541015625, -0.006603240966796875, -0.00330352783203125, -3.814697265625e-06, 0.0032958984375, 0.006595611572265625, 0.00989532470703125, 0.013195037841796875, 0.0164947509765625, 0.019794464111328125, 0.02309417724609375, 0.026393890380859375, 0.029693603515625, 0.032993316650390625, 0.03629302978515625, 0.039592742919921875, 0.0428924560546875, 0.046192169189453125, 0.04949188232421875, 0.052791595458984375, 0.05609130859375, 0.059391021728515625, 0.06269073486328125, 0.06599044799804688, 0.0692901611328125, 0.07258987426757812, 0.07588958740234375, 0.07918930053710938, 0.082489013671875, 0.08578872680664062, 0.08908843994140625, 0.09238815307617188, 0.0956878662109375, 0.09898757934570312, 0.10228729248046875, 0.10558700561523438, 0.10888671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 15.0, 19.0, 28.0, 42.0, 84.0, 115.0, 138.0, 125.0, 113.0, 88.0, 63.0, 45.0, 31.0, 21.0, 11.0, 10.0, 4.0, 3.0, 6.0, 5.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.84721565246582e-05, -5.65405935049057e-05, -5.46090304851532e-05, -5.2677467465400696e-05, -5.074590444564819e-05, -4.881434142589569e-05, -4.688277840614319e-05, -4.4951215386390686e-05, -4.3019652366638184e-05, -4.108808934688568e-05, -3.915652632713318e-05, -3.7224963307380676e-05, -3.5293400287628174e-05, -3.336183726787567e-05, -3.143027424812317e-05, -2.9498711228370667e-05, -2.7567148208618164e-05, -2.563558518886566e-05, -2.370402216911316e-05, -2.1772459149360657e-05, -1.9840896129608154e-05, -1.7909333109855652e-05, -1.597777009010315e-05, -1.4046207070350647e-05, -1.2114644050598145e-05, -1.0183081030845642e-05, -8.25151801109314e-06, -6.319954991340637e-06, -4.388391971588135e-06, -2.4568289518356323e-06, -5.252659320831299e-07, 1.4062970876693726e-06, 3.337860107421875e-06, 5.2694231271743774e-06, 7.20098614692688e-06, 9.132549166679382e-06, 1.1064112186431885e-05, 1.2995675206184387e-05, 1.492723822593689e-05, 1.6858801245689392e-05, 1.8790364265441895e-05, 2.0721927285194397e-05, 2.26534903049469e-05, 2.4585053324699402e-05, 2.6516616344451904e-05, 2.8448179364204407e-05, 3.037974238395691e-05, 3.231130540370941e-05, 3.4242868423461914e-05, 3.6174431443214417e-05, 3.810599446296692e-05, 4.003755748271942e-05, 4.1969120502471924e-05, 4.3900683522224426e-05, 4.583224654197693e-05, 4.776380956172943e-05, 4.9695372581481934e-05, 5.1626935601234436e-05, 5.355849862098694e-05, 5.549006164073944e-05, 5.742162466049194e-05, 5.9353187680244446e-05, 6.128475069999695e-05, 6.321631371974945e-05, 6.514787673950195e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 12.0, 14.0, 22.0, 54.0, 66.0, 118.0, 184.0, 304.0, 531.0, 1027.0, 2111.0, 5439.0, 16579.0, 62500.0, 585472.0, 296190.0, 54146.0, 14740.0, 4765.0, 1953.0, 987.0, 552.0, 277.0, 218.0, 113.0, 64.0, 37.0, 29.0, 9.0, 11.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10064697265625, -0.09749698638916016, -0.09434700012207031, -0.09119701385498047, -0.08804702758789062, -0.08489704132080078, -0.08174705505371094, -0.0785970687866211, -0.07544708251953125, -0.0722970962524414, -0.06914710998535156, -0.06599712371826172, -0.06284713745117188, -0.05969715118408203, -0.05654716491699219, -0.053397178649902344, -0.0502471923828125, -0.047097206115722656, -0.04394721984863281, -0.04079723358154297, -0.037647247314453125, -0.03449726104736328, -0.03134727478027344, -0.028197288513183594, -0.02504730224609375, -0.021897315979003906, -0.018747329711914062, -0.015597343444824219, -0.012447357177734375, -0.009297370910644531, -0.0061473846435546875, -0.0029973983764648438, 0.000152587890625, 0.0033025741577148438, 0.0064525604248046875, 0.009602546691894531, 0.012752532958984375, 0.01590251922607422, 0.019052505493164062, 0.022202491760253906, 0.02535247802734375, 0.028502464294433594, 0.03165245056152344, 0.03480243682861328, 0.037952423095703125, 0.04110240936279297, 0.04425239562988281, 0.047402381896972656, 0.0505523681640625, 0.053702354431152344, 0.05685234069824219, 0.06000232696533203, 0.06315231323242188, 0.06630229949951172, 0.06945228576660156, 0.0726022720336914, 0.07575225830078125, 0.0789022445678711, 0.08205223083496094, 0.08520221710205078, 0.08835220336914062, 0.09150218963623047, 0.09465217590332031, 0.09780216217041016, 0.1009521484375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 8.0, 9.0, 6.0, 6.0, 8.0, 19.0, 13.0, 24.0, 24.0, 24.0, 37.0, 54.0, 71.0, 100.0, 104.0, 87.0, 95.0, 65.0, 47.0, 52.0, 30.0, 21.0, 21.0, 20.0, 11.0, 8.0, 7.0, 8.0, 7.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09503173828125, -0.09174251556396484, -0.08845329284667969, -0.08516407012939453, -0.08187484741210938, -0.07858562469482422, -0.07529640197753906, -0.0720071792602539, -0.06871795654296875, -0.0654287338256836, -0.06213951110839844, -0.05885028839111328, -0.055561065673828125, -0.05227184295654297, -0.04898262023925781, -0.045693397521972656, -0.0424041748046875, -0.039114952087402344, -0.03582572937011719, -0.03253650665283203, -0.029247283935546875, -0.02595806121826172, -0.022668838500976562, -0.019379615783691406, -0.01609039306640625, -0.012801170349121094, -0.009511947631835938, -0.006222724914550781, -0.002933502197265625, 0.00035572052001953125, 0.0036449432373046875, 0.006934165954589844, 0.010223388671875, 0.013512611389160156, 0.016801834106445312, 0.02009105682373047, 0.023380279541015625, 0.02666950225830078, 0.029958724975585938, 0.033247947692871094, 0.03653717041015625, 0.039826393127441406, 0.04311561584472656, 0.04640483856201172, 0.049694061279296875, 0.05298328399658203, 0.05627250671386719, 0.059561729431152344, 0.0628509521484375, 0.06614017486572266, 0.06942939758300781, 0.07271862030029297, 0.07600784301757812, 0.07929706573486328, 0.08258628845214844, 0.0858755111694336, 0.08916473388671875, 0.0924539566040039, 0.09574317932128906, 0.09903240203857422, 0.10232162475585938, 0.10561084747314453, 0.10890007019042969, 0.11218929290771484, 0.115478515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 14.0, 24.0, 49.0, 84.0, 184.0, 397.0, 136.0, 44.0, 33.0, 14.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.743709087371826, -5.617029190063477, -5.490349292755127, -5.363669395446777, -5.236989498138428, -5.110309600830078, -4.9836297035217285, -4.856949806213379, -4.730269432067871, -4.6035895347595215, -4.476909637451172, -4.350229740142822, -4.223549842834473, -4.096869945526123, -3.9701898097991943, -3.8435099124908447, -3.716830253601074, -3.5901503562927246, -3.463470458984375, -3.3367905616760254, -3.210110664367676, -3.083430767059326, -2.9567506313323975, -2.830070734024048, -2.7033908367156982, -2.5767109394073486, -2.450031042098999, -2.3233511447906494, -2.1966710090637207, -2.069991111755371, -1.9433112144470215, -1.8166313171386719, -1.6899516582489014, -1.5632717609405518, -1.4365918636322021, -1.309911847114563, -1.1832319498062134, -1.0565520524978638, -0.9298720955848694, -0.803192138671875, -0.6765122413635254, -0.5498323440551758, -0.4231523871421814, -0.2964724600315094, -0.1697925329208374, -0.04311263561248779, 0.08356732130050659, 0.21024727821350098, 0.3369271755218506, 0.4636071026325226, 0.5902870297431946, 0.716966986656189, 0.8436468839645386, 0.9703267812728882, 1.0970067977905273, 1.223686695098877, 1.3503665924072266, 1.4770464897155762, 1.6037263870239258, 1.730406403541565, 1.8570863008499146, 1.9837661981582642, 2.1104462146759033, 2.237126111984253, 2.3638060092926025]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 3.0, 7.0, 11.0, 12.0, 8.0, 13.0, 14.0, 22.0, 23.0, 28.0, 31.0, 25.0, 33.0, 28.0, 45.0, 96.0, 132.0, 123.0, 56.0, 43.0, 28.0, 35.0, 33.0, 34.0, 16.0, 23.0, 17.0, 8.0, 10.0, 10.0, 4.0, 9.0, 7.0, 4.0, 1.0, 6.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.7638497352600098, -2.688305377960205, -2.6127607822418213, -2.5372164249420166, -2.461671829223633, -2.386127471923828, -2.3105831146240234, -2.2350385189056396, -2.159494161605835, -2.0839498043060303, -2.0084052085876465, -1.9328608512878418, -1.8573163747787476, -1.7817718982696533, -1.706227421760559, -1.6306829452514648, -1.5551384687423706, -1.4795939922332764, -1.4040495157241821, -1.328505039215088, -1.2529606819152832, -1.177416205406189, -1.1018717288970947, -1.02632737159729, -0.950782835483551, -0.8752383589744568, -0.7996939420700073, -0.7241494655609131, -0.6486049890518188, -0.5730605721473694, -0.49751609563827515, -0.4219716787338257, -0.34642720222473145, -0.2708827555179596, -0.19533829391002655, -0.1197938323020935, -0.044249385595321655, 0.031295061111450195, 0.10683953762054443, 0.1823839545249939, 0.25792843103408813, 0.33347287774086, 0.40901732444763184, 0.4845618009567261, 0.5601062774658203, 0.6356506943702698, 0.711195170879364, 0.7867395877838135, 0.8622840642929077, 0.937828540802002, 1.0133730173110962, 1.0889174938201904, 1.1644618511199951, 1.2400063276290894, 1.3155508041381836, 1.3910951614379883, 1.466639757156372, 1.5421842336654663, 1.6177287101745605, 1.6932730674743652, 1.7688175439834595, 1.8443620204925537, 1.919906497001648, 1.9954509735107422, 2.070995330810547]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 4.0, 4.0, 3.0, 5.0, 11.0, 12.0, 6.0, 12.0, 9.0, 26.0, 22.0, 41.0, 42.0, 58.0, 83.0, 170.0, 222.0, 395.0, 752.0, 1396.0, 2923.0, 7093.0, 20880.0, 74194.0, 356379.0, 1698814.0, 1597046.0, 332861.0, 69171.0, 19093.0, 6820.0, 2717.0, 1316.0, 672.0, 366.0, 233.0, 114.0, 99.0, 50.0, 42.0, 23.0, 21.0, 18.0, 14.0, 16.0, 10.0, 4.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.344482421875, -0.33490753173828125, -0.3253326416015625, -0.31575775146484375, -0.306182861328125, -0.29660797119140625, -0.2870330810546875, -0.27745819091796875, -0.26788330078125, -0.25830841064453125, -0.2487335205078125, -0.23915863037109375, -0.229583740234375, -0.22000885009765625, -0.2104339599609375, -0.20085906982421875, -0.1912841796875, -0.18170928955078125, -0.1721343994140625, -0.16255950927734375, -0.152984619140625, -0.14340972900390625, -0.1338348388671875, -0.12425994873046875, -0.11468505859375, -0.10511016845703125, -0.0955352783203125, -0.08596038818359375, -0.076385498046875, -0.06681060791015625, -0.0572357177734375, -0.04766082763671875, -0.0380859375, -0.02851104736328125, -0.0189361572265625, -0.00936126708984375, 0.000213623046875, 0.00978851318359375, 0.0193634033203125, 0.02893829345703125, 0.03851318359375, 0.04808807373046875, 0.0576629638671875, 0.06723785400390625, 0.076812744140625, 0.08638763427734375, 0.0959625244140625, 0.10553741455078125, 0.1151123046875, 0.12468719482421875, 0.1342620849609375, 0.14383697509765625, 0.153411865234375, 0.16298675537109375, 0.1725616455078125, 0.18213653564453125, 0.19171142578125, 0.20128631591796875, 0.2108612060546875, 0.22043609619140625, 0.230010986328125, 0.23958587646484375, 0.2491607666015625, 0.25873565673828125, 0.268310546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 2.0, 3.0, 4.0, 6.0, 9.0, 9.0, 9.0, 17.0, 14.0, 16.0, 20.0, 33.0, 32.0, 31.0, 27.0, 35.0, 41.0, 37.0, 47.0, 39.0, 41.0, 53.0, 46.0, 48.0, 37.0, 31.0, 49.0, 43.0, 36.0, 39.0, 33.0, 23.0, 20.0, 16.0, 10.0, 7.0, 9.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.132568359375, -0.1278705596923828, -0.12317276000976562, -0.11847496032714844, -0.11377716064453125, -0.10907936096191406, -0.10438156127929688, -0.09968376159667969, -0.0949859619140625, -0.09028816223144531, -0.08559036254882812, -0.08089256286621094, -0.07619476318359375, -0.07149696350097656, -0.06679916381835938, -0.06210136413574219, -0.057403564453125, -0.05270576477050781, -0.048007965087890625, -0.04331016540527344, -0.03861236572265625, -0.03391456604003906, -0.029216766357421875, -0.024518966674804688, -0.0198211669921875, -0.015123367309570312, -0.010425567626953125, -0.0057277679443359375, -0.00102996826171875, 0.0036678314208984375, 0.008365631103515625, 0.013063430786132812, 0.01776123046875, 0.022459030151367188, 0.027156829833984375, 0.03185462951660156, 0.03655242919921875, 0.04125022888183594, 0.045948028564453125, 0.05064582824707031, 0.0553436279296875, 0.06004142761230469, 0.06473922729492188, 0.06943702697753906, 0.07413482666015625, 0.07883262634277344, 0.08353042602539062, 0.08822822570800781, 0.092926025390625, 0.09762382507324219, 0.10232162475585938, 0.10701942443847656, 0.11171722412109375, 0.11641502380371094, 0.12111282348632812, 0.1258106231689453, 0.1305084228515625, 0.1352062225341797, 0.13990402221679688, 0.14460182189941406, 0.14929962158203125, 0.15399742126464844, 0.15869522094726562, 0.1633930206298828, 0.1680908203125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 10.0, 16.0, 23.0, 28.0, 59.0, 74.0, 178.0, 375.0, 791.0, 2402.0, 21277.0, 3996459.0, 165708.0, 4704.0, 1216.0, 465.0, 227.0, 104.0, 80.0, 24.0, 16.0, 7.0, 11.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4765625, -1.4268646240234375, -1.377166748046875, -1.3274688720703125, -1.27777099609375, -1.2280731201171875, -1.178375244140625, -1.1286773681640625, -1.0789794921875, -1.0292816162109375, -0.979583740234375, -0.9298858642578125, -0.88018798828125, -0.8304901123046875, -0.780792236328125, -0.7310943603515625, -0.681396484375, -0.6316986083984375, -0.582000732421875, -0.5323028564453125, -0.48260498046875, -0.4329071044921875, -0.383209228515625, -0.3335113525390625, -0.2838134765625, -0.2341156005859375, -0.184417724609375, -0.1347198486328125, -0.08502197265625, -0.0353240966796875, 0.014373779296875, 0.0640716552734375, 0.11376953125, 0.1634674072265625, 0.213165283203125, 0.2628631591796875, 0.31256103515625, 0.3622589111328125, 0.411956787109375, 0.4616546630859375, 0.5113525390625, 0.5610504150390625, 0.610748291015625, 0.6604461669921875, 0.71014404296875, 0.7598419189453125, 0.809539794921875, 0.8592376708984375, 0.908935546875, 0.9586334228515625, 1.008331298828125, 1.0580291748046875, 1.10772705078125, 1.1574249267578125, 1.207122802734375, 1.2568206787109375, 1.3065185546875, 1.3562164306640625, 1.405914306640625, 1.4556121826171875, 1.50531005859375, 1.5550079345703125, 1.604705810546875, 1.6544036865234375, 1.7041015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 6.0, 12.0, 17.0, 30.0, 59.0, 121.0, 180.0, 368.0, 626.0, 867.0, 799.0, 439.0, 244.0, 145.0, 81.0, 40.0, 20.0, 16.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0927734375, -1.0622177124023438, -1.0316619873046875, -1.0011062622070312, -0.970550537109375, -0.9399948120117188, -0.9094390869140625, -0.8788833618164062, -0.84832763671875, -0.8177719116210938, -0.7872161865234375, -0.7566604614257812, -0.726104736328125, -0.6955490112304688, -0.6649932861328125, -0.6344375610351562, -0.6038818359375, -0.5733261108398438, -0.5427703857421875, -0.5122146606445312, -0.481658935546875, -0.45110321044921875, -0.4205474853515625, -0.38999176025390625, -0.35943603515625, -0.32888031005859375, -0.2983245849609375, -0.26776885986328125, -0.237213134765625, -0.20665740966796875, -0.1761016845703125, -0.14554595947265625, -0.114990234375, -0.08443450927734375, -0.0538787841796875, -0.02332305908203125, 0.007232666015625, 0.03778839111328125, 0.0683441162109375, 0.09889984130859375, 0.12945556640625, 0.16001129150390625, 0.1905670166015625, 0.22112274169921875, 0.251678466796875, 0.28223419189453125, 0.3127899169921875, 0.34334564208984375, 0.3739013671875, 0.40445709228515625, 0.4350128173828125, 0.46556854248046875, 0.496124267578125, 0.5266799926757812, 0.5572357177734375, 0.5877914428710938, 0.61834716796875, 0.6489028930664062, 0.6794586181640625, 0.7100143432617188, 0.740570068359375, 0.7711257934570312, 0.8016815185546875, 0.8322372436523438, 0.86279296875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 20.0, 34.0, 61.0, 133.0, 219.0, 245.0, 133.0, 71.0, 24.0, 20.0, 13.0, 2.0, 1.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.410016059875488, -6.1209869384765625, -5.831958293914795, -5.542929172515869, -5.253900527954102, -4.964871406555176, -4.67584228515625, -4.386813163757324, -4.097784519195557, -3.80875563621521, -3.5197267532348633, -3.2306976318359375, -2.941668748855591, -2.652639865875244, -2.3636107444763184, -2.0745818614959717, -1.785552978515625, -1.4965240955352783, -1.207495093345642, -0.9184661507606506, -0.6294372081756592, -0.3404083251953125, -0.05137932300567627, 0.23764967918395996, 0.5266785621643066, 0.8157075047492981, 1.1047364473342896, 1.3937654495239258, 1.6827943325042725, 1.9718232154846191, 2.260852336883545, 2.5498812198638916, 2.8389110565185547, 3.1279399394989014, 3.416968822479248, 3.705997943878174, 3.9950268268585205, 4.284055709838867, 4.573084831237793, 4.862113952636719, 5.151142597198486, 5.440171718597412, 5.72920036315918, 6.0182294845581055, 6.307258605957031, 6.596287250518799, 6.885316371917725, 7.174345016479492, 7.463374137878418, 7.752403259277344, 8.04143238067627, 8.330460548400879, 8.619489669799805, 8.90851879119873, 9.197547912597656, 9.486577033996582, 9.775606155395508, 10.064635276794434, 10.35366439819336, 10.642692565917969, 10.931721687316895, 11.22075080871582, 11.509779930114746, 11.798809051513672, 12.087837219238281]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 3.0, 7.0, 9.0, 4.0, 14.0, 17.0, 14.0, 22.0, 17.0, 25.0, 28.0, 28.0, 22.0, 30.0, 33.0, 48.0, 41.0, 47.0, 47.0, 56.0, 53.0, 41.0, 35.0, 40.0, 39.0, 35.0, 33.0, 17.0, 28.0, 22.0, 24.0, 15.0, 23.0, 17.0, 10.0, 10.0, 14.0, 5.0, 6.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.464331865310669, -2.3768444061279297, -2.2893569469451904, -2.201869487762451, -2.114382028579712, -2.0268945693969727, -1.9394069910049438, -1.8519195318222046, -1.7644320726394653, -1.676944613456726, -1.5894571542739868, -1.501969575881958, -1.4144821166992188, -1.3269946575164795, -1.2395071983337402, -1.152019739151001, -1.0645322799682617, -0.9770448207855225, -0.8895573616027832, -0.8020698428153992, -0.7145823836326599, -0.6270949244499207, -0.5396074056625366, -0.45211994647979736, -0.3646324872970581, -0.27714502811431885, -0.1896575391292572, -0.10217005014419556, -0.014682590961456299, 0.07280486822128296, 0.160292387008667, 0.24777984619140625, 0.3352675437927246, 0.42275500297546387, 0.5102424621582031, 0.5977299809455872, 0.6852174401283264, 0.7727048993110657, 0.8601924180984497, 0.947679877281189, 1.0351673364639282, 1.1226547956466675, 1.2101422548294067, 1.2976298332214355, 1.3851172924041748, 1.472604751586914, 1.5600922107696533, 1.6475796699523926, 1.7350671291351318, 1.822554588317871, 1.9100420475006104, 1.9975295066833496, 2.085016965866089, 2.172504425048828, 2.2599921226501465, 2.3474793434143066, 2.434967041015625, 2.5224545001983643, 2.6099419593811035, 2.6974294185638428, 2.784916877746582, 2.8724043369293213, 2.9598917961120605, 3.047379493713379, 3.134866714477539]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 5.0, 9.0, 10.0, 12.0, 27.0, 32.0, 55.0, 72.0, 115.0, 165.0, 263.0, 434.0, 694.0, 1090.0, 1889.0, 3451.0, 6634.0, 13385.0, 32593.0, 92773.0, 378092.0, 366202.0, 90311.0, 31982.0, 13583.0, 6434.0, 3361.0, 1946.0, 1103.0, 653.0, 389.0, 245.0, 194.0, 117.0, 63.0, 56.0, 33.0, 33.0, 10.0, 9.0, 7.0, 7.0, 2.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.222900390625, -0.21570777893066406, -0.20851516723632812, -0.2013225555419922, -0.19412994384765625, -0.1869373321533203, -0.17974472045898438, -0.17255210876464844, -0.1653594970703125, -0.15816688537597656, -0.15097427368164062, -0.1437816619873047, -0.13658905029296875, -0.1293964385986328, -0.12220382690429688, -0.11501121520996094, -0.107818603515625, -0.10062599182128906, -0.09343338012695312, -0.08624076843261719, -0.07904815673828125, -0.07185554504394531, -0.06466293334960938, -0.05747032165527344, -0.0502777099609375, -0.04308509826660156, -0.035892486572265625, -0.028699874877929688, -0.02150726318359375, -0.014314651489257812, -0.007122039794921875, 7.05718994140625e-05, 0.00726318359375, 0.014455795288085938, 0.021648406982421875, 0.028841018676757812, 0.03603363037109375, 0.04322624206542969, 0.050418853759765625, 0.05761146545410156, 0.0648040771484375, 0.07199668884277344, 0.07918930053710938, 0.08638191223144531, 0.09357452392578125, 0.10076713562011719, 0.10795974731445312, 0.11515235900878906, 0.122344970703125, 0.12953758239746094, 0.13673019409179688, 0.1439228057861328, 0.15111541748046875, 0.1583080291748047, 0.16550064086914062, 0.17269325256347656, 0.1798858642578125, 0.18707847595214844, 0.19427108764648438, 0.2014636993408203, 0.20865631103515625, 0.2158489227294922, 0.22304153442382812, 0.23023414611816406, 0.2374267578125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 16.0, 12.0, 17.0, 15.0, 24.0, 33.0, 29.0, 37.0, 49.0, 61.0, 70.0, 56.0, 39.0, 49.0, 55.0, 59.0, 58.0, 40.0, 39.0, 40.0, 39.0, 34.0, 16.0, 20.0, 20.0, 21.0, 9.0, 7.0, 8.0, 7.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.219482421875, -0.21088027954101562, -0.20227813720703125, -0.19367599487304688, -0.1850738525390625, -0.17647171020507812, -0.16786956787109375, -0.15926742553710938, -0.150665283203125, -0.14206314086914062, -0.13346099853515625, -0.12485885620117188, -0.1162567138671875, -0.10765457153320312, -0.09905242919921875, -0.09045028686523438, -0.08184814453125, -0.07324600219726562, -0.06464385986328125, -0.056041717529296875, -0.0474395751953125, -0.038837432861328125, -0.03023529052734375, -0.021633148193359375, -0.013031005859375, -0.004428863525390625, 0.00417327880859375, 0.012775421142578125, 0.0213775634765625, 0.029979705810546875, 0.03858184814453125, 0.047183990478515625, 0.0557861328125, 0.06438827514648438, 0.07299041748046875, 0.08159255981445312, 0.0901947021484375, 0.09879684448242188, 0.10739898681640625, 0.11600112915039062, 0.124603271484375, 0.13320541381835938, 0.14180755615234375, 0.15040969848632812, 0.1590118408203125, 0.16761398315429688, 0.17621612548828125, 0.18481826782226562, 0.19342041015625, 0.20202255249023438, 0.21062469482421875, 0.21922683715820312, 0.2278289794921875, 0.23643112182617188, 0.24503326416015625, 0.2536354064941406, 0.262237548828125, 0.2708396911621094, 0.27944183349609375, 0.2880439758300781, 0.2966461181640625, 0.3052482604980469, 0.31385040283203125, 0.3224525451660156, 0.3310546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 2.0, 7.0, 9.0, 6.0, 24.0, 32.0, 47.0, 85.0, 160.0, 374.0, 971.0, 4140.0, 44484.0, 951071.0, 41410.0, 3970.0, 982.0, 362.0, 165.0, 101.0, 62.0, 28.0, 17.0, 12.0, 12.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6521377563476562, -0.6314239501953125, -0.6107101440429688, -0.589996337890625, -0.5692825317382812, -0.5485687255859375, -0.5278549194335938, -0.50714111328125, -0.48642730712890625, -0.4657135009765625, -0.44499969482421875, -0.424285888671875, -0.40357208251953125, -0.3828582763671875, -0.36214447021484375, -0.3414306640625, -0.32071685791015625, -0.3000030517578125, -0.27928924560546875, -0.258575439453125, -0.23786163330078125, -0.2171478271484375, -0.19643402099609375, -0.17572021484375, -0.15500640869140625, -0.1342926025390625, -0.11357879638671875, -0.092864990234375, -0.07215118408203125, -0.0514373779296875, -0.03072357177734375, -0.010009765625, 0.01070404052734375, 0.0314178466796875, 0.05213165283203125, 0.072845458984375, 0.09355926513671875, 0.1142730712890625, 0.13498687744140625, 0.15570068359375, 0.17641448974609375, 0.1971282958984375, 0.21784210205078125, 0.238555908203125, 0.25926971435546875, 0.2799835205078125, 0.30069732666015625, 0.3214111328125, 0.34212493896484375, 0.3628387451171875, 0.38355255126953125, 0.404266357421875, 0.42498016357421875, 0.4456939697265625, 0.46640777587890625, 0.48712158203125, 0.5078353881835938, 0.5285491943359375, 0.5492630004882812, 0.569976806640625, 0.5906906127929688, 0.6114044189453125, 0.6321182250976562, 0.65283203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 12.0, 13.0, 10.0, 13.0, 22.0, 23.0, 24.0, 48.0, 44.0, 65.0, 70.0, 106.0, 86.0, 72.0, 78.0, 45.0, 42.0, 35.0, 30.0, 27.0, 27.0, 19.0, 10.0, 13.0, 11.0, 9.0, 8.0, 7.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2373046875, -1.2040176391601562, -1.1707305908203125, -1.1374435424804688, -1.104156494140625, -1.0708694458007812, -1.0375823974609375, -1.0042953491210938, -0.97100830078125, -0.9377212524414062, -0.9044342041015625, -0.8711471557617188, -0.837860107421875, -0.8045730590820312, -0.7712860107421875, -0.7379989624023438, -0.7047119140625, -0.6714248657226562, -0.6381378173828125, -0.6048507690429688, -0.571563720703125, -0.5382766723632812, -0.5049896240234375, -0.47170257568359375, -0.43841552734375, -0.40512847900390625, -0.3718414306640625, -0.33855438232421875, -0.305267333984375, -0.27198028564453125, -0.2386932373046875, -0.20540618896484375, -0.172119140625, -0.13883209228515625, -0.1055450439453125, -0.07225799560546875, -0.038970947265625, -0.00568389892578125, 0.0276031494140625, 0.06089019775390625, 0.09417724609375, 0.12746429443359375, 0.1607513427734375, 0.19403839111328125, 0.227325439453125, 0.26061248779296875, 0.2938995361328125, 0.32718658447265625, 0.3604736328125, 0.39376068115234375, 0.4270477294921875, 0.46033477783203125, 0.493621826171875, 0.5269088745117188, 0.5601959228515625, 0.5934829711914062, 0.62677001953125, 0.6600570678710938, 0.6933441162109375, 0.7266311645507812, 0.759918212890625, 0.7932052612304688, 0.8264923095703125, 0.8597793579101562, 0.89306640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 5.0, 10.0, 17.0, 21.0, 38.0, 42.0, 72.0, 120.0, 210.0, 409.0, 1003.0, 3074.0, 13674.0, 138764.0, 854233.0, 28873.0, 5202.0, 1471.0, 588.0, 260.0, 153.0, 94.0, 56.0, 45.0, 36.0, 18.0, 19.0, 12.0, 9.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.09600830078125, -0.09260272979736328, -0.08919715881347656, -0.08579158782958984, -0.08238601684570312, -0.0789804458618164, -0.07557487487792969, -0.07216930389404297, -0.06876373291015625, -0.06535816192626953, -0.06195259094238281, -0.058547019958496094, -0.055141448974609375, -0.051735877990722656, -0.04833030700683594, -0.04492473602294922, -0.0415191650390625, -0.03811359405517578, -0.03470802307128906, -0.031302452087402344, -0.027896881103515625, -0.024491310119628906, -0.021085739135742188, -0.01768016815185547, -0.01427459716796875, -0.010869026184082031, -0.0074634552001953125, -0.004057884216308594, -0.000652313232421875, 0.0027532577514648438, 0.0061588287353515625, 0.009564399719238281, 0.012969970703125, 0.01637554168701172, 0.019781112670898438, 0.023186683654785156, 0.026592254638671875, 0.029997825622558594, 0.03340339660644531, 0.03680896759033203, 0.04021453857421875, 0.04362010955810547, 0.04702568054199219, 0.050431251525878906, 0.053836822509765625, 0.057242393493652344, 0.06064796447753906, 0.06405353546142578, 0.0674591064453125, 0.07086467742919922, 0.07427024841308594, 0.07767581939697266, 0.08108139038085938, 0.0844869613647461, 0.08789253234863281, 0.09129810333251953, 0.09470367431640625, 0.09810924530029297, 0.10151481628417969, 0.1049203872680664, 0.10832595825195312, 0.11173152923583984, 0.11513710021972656, 0.11854267120361328, 0.1219482421875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 14.0, 6.0, 12.0, 12.0, 13.0, 15.0, 16.0, 15.0, 24.0, 33.0, 44.0, 48.0, 64.0, 64.0, 75.0, 74.0, 85.0, 53.0, 53.0, 48.0, 33.0, 33.0, 26.0, 24.0, 15.0, 15.0, 12.0, 8.0, 9.0, 6.0, 11.0, 9.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.0994415283203125e-05, -2.9935501515865326e-05, -2.8876587748527527e-05, -2.7817673981189728e-05, -2.675876021385193e-05, -2.569984644651413e-05, -2.464093267917633e-05, -2.358201891183853e-05, -2.2523105144500732e-05, -2.1464191377162933e-05, -2.0405277609825134e-05, -1.9346363842487335e-05, -1.8287450075149536e-05, -1.7228536307811737e-05, -1.6169622540473938e-05, -1.5110708773136139e-05, -1.405179500579834e-05, -1.299288123846054e-05, -1.1933967471122742e-05, -1.0875053703784943e-05, -9.816139936447144e-06, -8.757226169109344e-06, -7.698312401771545e-06, -6.639398634433746e-06, -5.580484867095947e-06, -4.521571099758148e-06, -3.462657332420349e-06, -2.40374356508255e-06, -1.344829797744751e-06, -2.859160304069519e-07, 7.729977369308472e-07, 1.8319115042686462e-06, 2.8908252716064453e-06, 3.949739038944244e-06, 5.0086528062820435e-06, 6.0675665736198425e-06, 7.126480340957642e-06, 8.18539410829544e-06, 9.24430787563324e-06, 1.0303221642971039e-05, 1.1362135410308838e-05, 1.2421049177646637e-05, 1.3479962944984436e-05, 1.4538876712322235e-05, 1.5597790479660034e-05, 1.6656704246997833e-05, 1.7715618014335632e-05, 1.877453178167343e-05, 1.983344554901123e-05, 2.089235931634903e-05, 2.195127308368683e-05, 2.3010186851024628e-05, 2.4069100618362427e-05, 2.5128014385700226e-05, 2.6186928153038025e-05, 2.7245841920375824e-05, 2.8304755687713623e-05, 2.9363669455051422e-05, 3.042258322238922e-05, 3.148149698972702e-05, 3.254041075706482e-05, 3.359932452440262e-05, 3.465823829174042e-05, 3.5717152059078217e-05, 3.6776065826416016e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 9.0, 12.0, 19.0, 22.0, 38.0, 65.0, 87.0, 162.0, 281.0, 424.0, 764.0, 1510.0, 3369.0, 8534.0, 26563.0, 140907.0, 787311.0, 54296.0, 14526.0, 5039.0, 2194.0, 1028.0, 550.0, 326.0, 199.0, 118.0, 67.0, 36.0, 32.0, 20.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.08612060546875, -0.08353042602539062, -0.08094024658203125, -0.07835006713867188, -0.0757598876953125, -0.07316970825195312, -0.07057952880859375, -0.06798934936523438, -0.065399169921875, -0.06280899047851562, -0.06021881103515625, -0.057628631591796875, -0.0550384521484375, -0.052448272705078125, -0.04985809326171875, -0.047267913818359375, -0.044677734375, -0.042087554931640625, -0.03949737548828125, -0.036907196044921875, -0.0343170166015625, -0.031726837158203125, -0.02913665771484375, -0.026546478271484375, -0.023956298828125, -0.021366119384765625, -0.01877593994140625, -0.016185760498046875, -0.0135955810546875, -0.011005401611328125, -0.00841522216796875, -0.005825042724609375, -0.00323486328125, -0.000644683837890625, 0.00194549560546875, 0.004535675048828125, 0.0071258544921875, 0.009716033935546875, 0.01230621337890625, 0.014896392822265625, 0.017486572265625, 0.020076751708984375, 0.02266693115234375, 0.025257110595703125, 0.0278472900390625, 0.030437469482421875, 0.03302764892578125, 0.035617828369140625, 0.0382080078125, 0.040798187255859375, 0.04338836669921875, 0.045978546142578125, 0.0485687255859375, 0.051158905029296875, 0.05374908447265625, 0.056339263916015625, 0.058929443359375, 0.061519622802734375, 0.06410980224609375, 0.06669998168945312, 0.0692901611328125, 0.07188034057617188, 0.07447052001953125, 0.07706069946289062, 0.07965087890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 2.0, 7.0, 16.0, 13.0, 12.0, 13.0, 16.0, 30.0, 38.0, 79.0, 110.0, 124.0, 156.0, 109.0, 70.0, 50.0, 37.0, 19.0, 14.0, 12.0, 14.0, 7.0, 4.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10992431640625, -0.10679149627685547, -0.10365867614746094, -0.1005258560180664, -0.09739303588867188, -0.09426021575927734, -0.09112739562988281, -0.08799457550048828, -0.08486175537109375, -0.08172893524169922, -0.07859611511230469, -0.07546329498291016, -0.07233047485351562, -0.0691976547241211, -0.06606483459472656, -0.06293201446533203, -0.0597991943359375, -0.05666637420654297, -0.05353355407714844, -0.050400733947753906, -0.047267913818359375, -0.044135093688964844, -0.04100227355957031, -0.03786945343017578, -0.03473663330078125, -0.03160381317138672, -0.028470993041992188, -0.025338172912597656, -0.022205352783203125, -0.019072532653808594, -0.015939712524414062, -0.012806892395019531, -0.009674072265625, -0.006541252136230469, -0.0034084320068359375, -0.00027561187744140625, 0.002857208251953125, 0.005990028381347656, 0.009122848510742188, 0.012255668640136719, 0.01538848876953125, 0.01852130889892578, 0.021654129028320312, 0.024786949157714844, 0.027919769287109375, 0.031052589416503906, 0.03418540954589844, 0.03731822967529297, 0.0404510498046875, 0.04358386993408203, 0.04671669006347656, 0.049849510192871094, 0.052982330322265625, 0.056115150451660156, 0.05924797058105469, 0.06238079071044922, 0.06551361083984375, 0.06864643096923828, 0.07177925109863281, 0.07491207122802734, 0.07804489135742188, 0.0811777114868164, 0.08431053161621094, 0.08744335174560547, 0.090576171875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 18.0, 24.0, 53.0, 118.0, 509.0, 167.0, 55.0, 22.0, 16.0, 10.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.491363048553467, -3.32965350151062, -3.1679439544677734, -3.0062344074249268, -2.84452486038208, -2.6828153133392334, -2.5211057662963867, -2.35939621925354, -2.1976866722106934, -2.0359771251678467, -1.874267578125, -1.7125580310821533, -1.5508484840393066, -1.38913893699646, -1.2274293899536133, -1.0657198429107666, -0.9040102958679199, -0.7423007488250732, -0.5805912017822266, -0.4188816547393799, -0.2571721076965332, -0.09546256065368652, 0.06624698638916016, 0.22795653343200684, 0.3896660804748535, 0.5513756275177002, 0.7130851745605469, 0.8747947216033936, 1.0365042686462402, 1.198213815689087, 1.3599233627319336, 1.5216329097747803, 1.6833429336547852, 1.8450524806976318, 2.0067620277404785, 2.168471574783325, 2.330181121826172, 2.4918906688690186, 2.6536002159118652, 2.815309762954712, 2.9770193099975586, 3.1387288570404053, 3.300438404083252, 3.4621479511260986, 3.6238574981689453, 3.785567045211792, 3.9472765922546387, 4.108985900878906, 4.270695686340332, 4.432405471801758, 4.594114780426025, 4.755824089050293, 4.917533874511719, 5.0792436599731445, 5.240952968597412, 5.40266227722168, 5.5643720626831055, 5.726081848144531, 5.887791156768799, 6.049500465393066, 6.211210250854492, 6.372920036315918, 6.5346293449401855, 6.696338653564453, 6.858048439025879]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 10.0, 4.0, 5.0, 3.0, 12.0, 7.0, 8.0, 16.0, 16.0, 18.0, 13.0, 31.0, 12.0, 27.0, 35.0, 69.0, 114.0, 147.0, 133.0, 81.0, 53.0, 26.0, 17.0, 23.0, 17.0, 17.0, 16.0, 18.0, 6.0, 12.0, 9.0, 9.0, 7.0, 3.0, 9.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6377370357513428, -2.5515856742858887, -2.4654340744018555, -2.3792827129364014, -2.2931313514709473, -2.206979990005493, -2.12082839012146, -2.034677028656006, -1.9485256671905518, -1.862374186515808, -1.776222825050354, -1.6900713443756104, -1.6039199829101562, -1.5177685022354126, -1.431617021560669, -1.3454656600952148, -1.2593141794204712, -1.1731626987457275, -1.0870113372802734, -1.0008598566055298, -0.9147084951400757, -0.828557014465332, -0.7424055933952332, -0.6562541723251343, -0.5701027512550354, -0.4839513301849365, -0.39779990911483765, -0.3116484582424164, -0.2254970371723175, -0.13934561610221863, -0.05319416522979736, 0.032957255840301514, 0.11910867691040039, 0.20526009798049927, 0.29141151905059814, 0.3775629699230194, 0.4637143909931183, 0.5498658418655396, 0.6360172629356384, 0.7221686840057373, 0.8083201050758362, 0.8944715261459351, 0.9806229472160339, 1.0667743682861328, 1.1529258489608765, 1.2390772104263306, 1.3252286911010742, 1.4113800525665283, 1.497531533241272, 1.5836830139160156, 1.6698343753814697, 1.7559858560562134, 1.8421372175216675, 1.9282886981964111, 2.0144400596618652, 2.1005916595458984, 2.1867430210113525, 2.2728943824768066, 2.35904598236084, 2.445197343826294, 2.531348705291748, 2.617500066757202, 2.7036516666412354, 2.7898030281066895, 2.8759543895721436]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 6.0, 9.0, 11.0, 13.0, 18.0, 17.0, 17.0, 17.0, 27.0, 25.0, 32.0, 31.0, 38.0, 47.0, 96.0, 168.0, 97.0, 50.0, 26.0, 27.0, 24.0, 26.0, 24.0, 28.0, 18.0, 17.0, 17.0, 17.0, 8.0, 8.0, 4.0, 9.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.219482421875, -0.21248626708984375, -0.2054901123046875, -0.19849395751953125, -0.191497802734375, -0.18450164794921875, -0.1775054931640625, -0.17050933837890625, -0.16351318359375, -0.15651702880859375, -0.1495208740234375, -0.14252471923828125, -0.135528564453125, -0.12853240966796875, -0.1215362548828125, -0.11454010009765625, -0.1075439453125, -0.10054779052734375, -0.0935516357421875, -0.08655548095703125, -0.079559326171875, -0.07256317138671875, -0.0655670166015625, -0.05857086181640625, -0.05157470703125, -0.04457855224609375, -0.0375823974609375, -0.03058624267578125, -0.023590087890625, -0.01659393310546875, -0.0095977783203125, -0.00260162353515625, 0.00439453125, 0.01139068603515625, 0.0183868408203125, 0.02538299560546875, 0.032379150390625, 0.03937530517578125, 0.0463714599609375, 0.05336761474609375, 0.06036376953125, 0.06735992431640625, 0.0743560791015625, 0.08135223388671875, 0.088348388671875, 0.09534454345703125, 0.1023406982421875, 0.10933685302734375, 0.1163330078125, 0.12332916259765625, 0.1303253173828125, 0.13732147216796875, 0.144317626953125, 0.15131378173828125, 0.1583099365234375, 0.16530609130859375, 0.17230224609375, 0.17929840087890625, 0.1862945556640625, 0.19329071044921875, 0.200286865234375, 0.20728302001953125, 0.2142791748046875, 0.22127532958984375, 0.228271484375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 1.0, 1.0, 0.0, 4.0, 8.0, 5.0, 12.0, 9.0, 9.0, 11.0, 22.0, 18.0, 51.0, 69.0, 105.0, 217.0, 378.0, 1232.0, 5160.0, 81662.0, 8288168.0, 8507.0, 1805.0, 547.0, 220.0, 127.0, 71.0, 32.0, 39.0, 19.0, 12.0, 13.0, 10.0, 5.0, 5.0, 2.0, 5.0, 3.0, 14.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.226417064666748, -2.1664845943450928, -2.1065521240234375, -2.046619415283203, -1.9866869449615479, -1.9267544746398926, -1.8668218851089478, -1.806889295578003, -1.7469568252563477, -1.6870243549346924, -1.6270917654037476, -1.5671591758728027, -1.5072267055511475, -1.4472942352294922, -1.3873616456985474, -1.3274290561676025, -1.2674965858459473, -1.207564115524292, -1.1476315259933472, -1.0876989364624023, -1.027766466140747, -0.967833936214447, -0.907901406288147, -0.8479688763618469, -0.7880363464355469, -0.7281038165092468, -0.6681712865829468, -0.6082387566566467, -0.5483062267303467, -0.48837369680404663, -0.4284411668777466, -0.36850863695144653, -0.30857622623443604, -0.248643696308136, -0.18871116638183594, -0.1287786364555359, -0.06884610652923584, -0.008913576602935791, 0.05101895332336426, 0.1109514832496643, 0.17088401317596436, 0.2308165431022644, 0.29074907302856445, 0.3506816029548645, 0.41061413288116455, 0.4705466628074646, 0.5304791927337646, 0.5904117226600647, 0.6503442525863647, 0.7102767825126648, 0.7702093124389648, 0.8301418423652649, 0.8900743722915649, 0.950006902217865, 1.009939432144165, 1.0698719024658203, 1.1298044919967651, 1.18973708152771, 1.2496695518493652, 1.3096020221710205, 1.3695346117019653, 1.4294672012329102, 1.4893996715545654, 1.5493321418762207, 1.6092647314071655]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 1.0, 4.0, 6.0, 2.0, 9.0, 1.0, 4.0, 6.0, 2.0, 6.0, 7.0, 7.0, 3.0, 6.0, 3.0, 7.0, 3.0, 3.0, 0.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.300006628036499, -2.208965301513672, -2.1179239749908447, -2.0268826484680176, -1.9358413219451904, -1.8447999954223633, -1.7537587881088257, -1.6627174615859985, -1.5716761350631714, -1.4806348085403442, -1.389593482017517, -1.2985522747039795, -1.2075109481811523, -1.1164696216583252, -1.025428295135498, -0.9343869686126709, -0.8433456420898438, -0.7523043155670166, -0.6612629890441895, -0.5702217221260071, -0.47918039560317993, -0.3881390690803528, -0.2970978021621704, -0.20605647563934326, -0.11501514911651611, -0.02397383749485016, 0.0670674741268158, 0.15810877084732056, 0.2491500973701477, 0.34019142389297485, 0.4312326908111572, 0.5222740173339844, 0.6133155822753906, 0.7043569087982178, 0.7953982353210449, 0.8864395022392273, 0.9774808287620544, 1.0685222148895264, 1.159563422203064, 1.2506047487258911, 1.3416460752487183, 1.4326874017715454, 1.5237287282943726, 1.6147699356079102, 1.7058112621307373, 1.7968525886535645, 1.8878939151763916, 1.9789352416992188, 2.069976568222046, 2.161017894744873, 2.2520592212677, 2.3431005477905273, 2.4341418743133545, 2.5251832008361816, 2.6162242889404297, 2.707265853881836, 2.798306941986084, 2.889348268508911, 2.9803895950317383, 3.0714309215545654, 3.1624722480773926, 3.2535135746002197, 3.344554901123047, 3.435595989227295, 3.526637554168701]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 3.0, 13.0, 13.0, 15.0, 21.0, 38.0, 23.0, 41.0, 51.0, 55.0, 51.0, 61.0, 69.0, 60.0, 60.0, 66.0, 56.0, 61.0, 59.0, 45.0, 30.0, 20.0, 16.0, 12.0, 14.0, 18.0, 8.0, 9.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2430419921875, -0.23597145080566406, -0.22890090942382812, -0.2218303680419922, -0.21475982666015625, -0.2076892852783203, -0.20061874389648438, -0.19354820251464844, -0.1864776611328125, -0.17940711975097656, -0.17233657836914062, -0.1652660369873047, -0.15819549560546875, -0.1511249542236328, -0.14405441284179688, -0.13698387145996094, -0.129913330078125, -0.12284278869628906, -0.11577224731445312, -0.10870170593261719, -0.10163116455078125, -0.09456062316894531, -0.08749008178710938, -0.08041954040527344, -0.0733489990234375, -0.06627845764160156, -0.059207916259765625, -0.05213737487792969, -0.04506683349609375, -0.03799629211425781, -0.030925750732421875, -0.023855209350585938, -0.01678466796875, -0.009714126586914062, -0.002643585205078125, 0.0044269561767578125, 0.01149749755859375, 0.018568038940429688, 0.025638580322265625, 0.03270912170410156, 0.0397796630859375, 0.04685020446777344, 0.053920745849609375, 0.06099128723144531, 0.06806182861328125, 0.07513236999511719, 0.08220291137695312, 0.08927345275878906, 0.096343994140625, 0.10341453552246094, 0.11048507690429688, 0.11755561828613281, 0.12462615966796875, 0.1316967010498047, 0.13876724243164062, 0.14583778381347656, 0.1529083251953125, 0.15997886657714844, 0.16704940795898438, 0.1741199493408203, 0.18119049072265625, 0.1882610321044922, 0.19533157348632812, 0.20240211486816406, 0.20947265625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 10.0, 13.0, 20.0, 32.0, 40.0, 47.0, 71.0, 94.0, 157.0, 267.0, 431.0, 787.0, 1625.0, 3180.0, 6979.0, 15868.0, 37509.0, 87101.0, 158705.0, 117519.0, 52331.0, 22589.0, 9903.0, 4450.0, 2066.0, 1004.0, 542.0, 305.0, 192.0, 121.0, 85.0, 51.0, 50.0, 31.0, 22.0, 16.0, 13.0, 12.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.98779296875, -0.9521255493164062, -0.9164581298828125, -0.8807907104492188, -0.845123291015625, -0.8094558715820312, -0.7737884521484375, -0.7381210327148438, -0.70245361328125, -0.6667861938476562, -0.6311187744140625, -0.5954513549804688, -0.559783935546875, -0.5241165161132812, -0.4884490966796875, -0.45278167724609375, -0.4171142578125, -0.38144683837890625, -0.3457794189453125, -0.31011199951171875, -0.274444580078125, -0.23877716064453125, -0.2031097412109375, -0.16744232177734375, -0.13177490234375, -0.09610748291015625, -0.0604400634765625, -0.02477264404296875, 0.010894775390625, 0.04656219482421875, 0.0822296142578125, 0.11789703369140625, 0.153564453125, 0.18923187255859375, 0.2248992919921875, 0.26056671142578125, 0.296234130859375, 0.33190155029296875, 0.3675689697265625, 0.40323638916015625, 0.43890380859375, 0.47457122802734375, 0.5102386474609375, 0.5459060668945312, 0.581573486328125, 0.6172409057617188, 0.6529083251953125, 0.6885757446289062, 0.7242431640625, 0.7599105834960938, 0.7955780029296875, 0.8312454223632812, 0.866912841796875, 0.9025802612304688, 0.9382476806640625, 0.9739151000976562, 1.00958251953125, 1.0452499389648438, 1.0809173583984375, 1.1165847778320312, 1.152252197265625, 1.1879196166992188, 1.2235870361328125, 1.2592544555664062, 1.294921875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 12.0, 13.0, 13.0, 17.0, 21.0, 20.0, 37.0, 39.0, 50.0, 64.0, 61.0, 66.0, 72.0, 66.0, 56.0, 73.0, 51.0, 43.0, 44.0, 42.0, 28.0, 26.0, 22.0, 14.0, 12.0, 6.0, 10.0, 1.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.208984375, -0.20121002197265625, -0.1934356689453125, -0.18566131591796875, -0.177886962890625, -0.17011260986328125, -0.1623382568359375, -0.15456390380859375, -0.14678955078125, -0.13901519775390625, -0.1312408447265625, -0.12346649169921875, -0.115692138671875, -0.10791778564453125, -0.1001434326171875, -0.09236907958984375, -0.0845947265625, -0.07682037353515625, -0.0690460205078125, -0.06127166748046875, -0.053497314453125, -0.04572296142578125, -0.0379486083984375, -0.03017425537109375, -0.02239990234375, -0.01462554931640625, -0.0068511962890625, 0.00092315673828125, 0.008697509765625, 0.01647186279296875, 0.0242462158203125, 0.03202056884765625, 0.039794921875, 0.04756927490234375, 0.0553436279296875, 0.06311798095703125, 0.070892333984375, 0.07866668701171875, 0.0864410400390625, 0.09421539306640625, 0.10198974609375, 0.10976409912109375, 0.1175384521484375, 0.12531280517578125, 0.133087158203125, 0.14086151123046875, 0.1486358642578125, 0.15641021728515625, 0.1641845703125, 0.17195892333984375, 0.1797332763671875, 0.18750762939453125, 0.195281982421875, 0.20305633544921875, 0.2108306884765625, 0.21860504150390625, 0.22637939453125, 0.23415374755859375, 0.2419281005859375, 0.24970245361328125, 0.257476806640625, 0.26525115966796875, 0.2730255126953125, 0.28079986572265625, 0.28857421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 3.0, 10.0, 9.0, 14.0, 49.0, 83.0, 92.0, 95.0, 51.0, 21.0, 8.0, 10.0, 4.0, 6.0, 3.0, 5.0, 0.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.053524971008301, -1.992791771888733, -1.932058572769165, -1.8713253736495972, -1.8105921745300293, -1.7498589754104614, -1.6891257762908936, -1.6283925771713257, -1.5676593780517578, -1.50692617893219, -1.446192979812622, -1.3854597806930542, -1.3247265815734863, -1.2639933824539185, -1.2032601833343506, -1.1425269842147827, -1.0817937850952148, -1.021060585975647, -0.9603273868560791, -0.8995941877365112, -0.8388609886169434, -0.7781277894973755, -0.7173945903778076, -0.6566613912582397, -0.5959280729293823, -0.5351948738098145, -0.4744616746902466, -0.4137284755706787, -0.35299527645111084, -0.2922620475292206, -0.2315288484096527, -0.17079564929008484, -0.11006247997283936, -0.049329277127981186, 0.011403925716876984, 0.07213713228702545, 0.13287033140659332, 0.1936035454273224, 0.25433674454689026, 0.31506994366645813, 0.375803142786026, 0.43653634190559387, 0.49726954102516174, 0.558002769947052, 0.6187359690666199, 0.6794691681861877, 0.7402023673057556, 0.8009355664253235, 0.8616687655448914, 0.9224019646644592, 0.9831351637840271, 1.0438684225082397, 1.1046016216278076, 1.1653348207473755, 1.2260680198669434, 1.2868012189865112, 1.347534418106079, 1.408267617225647, 1.4690008163452148, 1.5297340154647827, 1.5904672145843506, 1.6512004137039185, 1.7119336128234863, 1.7726668119430542, 1.833400011062622]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 7.0, 5.0, 4.0, 7.0, 7.0, 9.0, 27.0, 37.0, 65.0, 85.0, 74.0, 51.0, 23.0, 17.0, 11.0, 3.0, 6.0, 5.0, 7.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0230109691619873, -0.9876903891563416, -0.9523698091506958, -0.91704922914505, -0.8817286491394043, -0.8464081287384033, -0.8110875487327576, -0.7757669687271118, -0.7404463887214661, -0.7051258087158203, -0.6698052287101746, -0.6344846487045288, -0.5991641283035278, -0.5638434886932373, -0.5285229682922363, -0.4932023882865906, -0.4578818082809448, -0.4225612282752991, -0.3872406482696533, -0.35192009806632996, -0.3165995180606842, -0.28127893805503845, -0.2459583729505539, -0.21063780784606934, -0.17531722784042358, -0.13999664783477783, -0.10467608273029327, -0.06935551017522812, -0.034034937620162964, 0.001285642385482788, 0.036606207489967346, 0.0719267725944519, 0.10724735260009766, 0.1425679326057434, 0.17788849771022797, 0.21320906281471252, 0.24852964282035828, 0.28385022282600403, 0.3191707730293274, 0.35449135303497314, 0.3898119330406189, 0.42513251304626465, 0.4604530930519104, 0.49577364325523376, 0.5310941934585571, 0.5664148330688477, 0.6017353534698486, 0.6370559334754944, 0.6723765134811401, 0.7076970934867859, 0.7430176734924316, 0.7783382534980774, 0.8136588335037231, 0.8489793539047241, 0.8842999339103699, 0.9196205139160156, 0.9549410939216614, 0.9902616739273071, 1.025582194328308, 1.0609028339385986, 1.0962233543395996, 1.1315439939498901, 1.1668645143508911, 1.2021851539611816, 1.2375056743621826]}, "eval/loss": 0.36502909660339355, "eval/wer": 0.11207854026180088, "eval/runtime": 567.0865, "eval/samples_per_second": 4.659, "eval/steps_per_second": 0.584} \ No newline at end of file +{"train/loss": 0.2069, "train/learning_rate": 1.9512195121951218e-06, "train/epoch": 5.0, "train/global_step": 1115, "_runtime": 25980, "_timestamp": 1648263108, "_step": 1117, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 13.0, 18.0, 25.0, 50.0, 74.0, 109.0, 157.0, 160.0, 161.0, 89.0, 56.0, 41.0, 23.0, 17.0, 7.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.614524245262146, -0.5559785962104797, -0.4974329471588135, -0.4388873279094696, -0.38034167885780334, -0.3217960298061371, -0.2632504105567932, -0.20470476150512695, -0.1461591124534607, -0.08761347085237503, -0.029067829251289368, 0.029477804899215698, 0.08802345395088196, 0.14656910300254822, 0.2051147222518921, 0.26366037130355835, 0.3222060203552246, 0.38075166940689087, 0.43929731845855713, 0.497842937707901, 0.5563886165618896, 0.6149342060089111, 0.6734798550605774, 0.7320255041122437, 0.7905711531639099, 0.8491168022155762, 0.9076624512672424, 0.9662081003189087, 1.0247536897659302, 1.0832993984222412, 1.1418449878692627, 1.2003905773162842, 1.2589364051818848, 1.3174819946289062, 1.3760277032852173, 1.4345732927322388, 1.4931190013885498, 1.5516645908355713, 1.6102101802825928, 1.6687558889389038, 1.7273015975952148, 1.7858471870422363, 1.8443928956985474, 1.9029384851455688, 1.9614841938018799, 2.0200297832489014, 2.078575372695923, 2.1371212005615234, 2.195666790008545, 2.2542123794555664, 2.312757968902588, 2.3713037967681885, 2.42984938621521, 2.4883949756622314, 2.546940565109253, 2.6054863929748535, 2.664031744003296, 2.7225773334503174, 2.781122922897339, 2.8396687507629395, 2.898214340209961, 2.9567599296569824, 3.015305519104004, 3.0738511085510254, 3.132396936416626]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 4.0, 7.0, 7.0, 5.0, 8.0, 16.0, 17.0, 13.0, 14.0, 24.0, 20.0, 25.0, 31.0, 27.0, 24.0, 39.0, 29.0, 38.0, 51.0, 40.0, 46.0, 41.0, 32.0, 36.0, 41.0, 34.0, 39.0, 27.0, 32.0, 14.0, 23.0, 25.0, 27.0, 19.0, 19.0, 13.0, 9.0, 15.0, 14.0, 10.0, 5.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 5.0], "bins": [-0.7400795221328735, -0.7190272808074951, -0.6979750990867615, -0.6769228577613831, -0.6558706760406494, -0.634818434715271, -0.6137662529945374, -0.5927140116691589, -0.5716618299484253, -0.5506095886230469, -0.5295574069023132, -0.5085051655769348, -0.48745298385620117, -0.46640077233314514, -0.4453485608100891, -0.4242963194847107, -0.40324410796165466, -0.38219189643859863, -0.3611396849155426, -0.3400874733924866, -0.31903526186943054, -0.2979830503463745, -0.2769308090209961, -0.25587862730026245, -0.23482640087604523, -0.2137741893529892, -0.19272197782993317, -0.17166975140571594, -0.1506175398826599, -0.12956532835960388, -0.10851311683654785, -0.08746090531349182, -0.06640869379043579, -0.04535648226737976, -0.024304267019033432, -0.0032520517706871033, 0.017800159752368927, 0.03885237127542496, 0.059904590249061584, 0.08095680177211761, 0.10200901329517365, 0.12306122481822968, 0.1441134363412857, 0.16516566276550293, 0.18621787428855896, 0.207270085811615, 0.22832229733467102, 0.24937450885772705, 0.2704267203807831, 0.2914789319038391, 0.31253114342689514, 0.33358335494995117, 0.3546355664730072, 0.37568777799606323, 0.39674001932144165, 0.4177922010421753, 0.4388444423675537, 0.45989665389060974, 0.48094886541366577, 0.5020011067390442, 0.5230532884597778, 0.5441055297851562, 0.5651577115058899, 0.5862099528312683, 0.607262134552002]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 6.0, 17.0, 15.0, 26.0, 30.0, 35.0, 63.0, 97.0, 128.0, 188.0, 280.0, 440.0, 788.0, 1307.0, 2487.0, 5555.0, 14801.0, 99328.0, 1248391.0, 2544552.0, 235525.0, 25350.0, 7514.0, 3245.0, 1628.0, 850.0, 515.0, 345.0, 222.0, 156.0, 135.0, 69.0, 52.0, 37.0, 32.0, 17.0, 15.0, 9.0, 8.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0], "bins": [-3.935546875, -3.829681396484375, -3.72381591796875, -3.617950439453125, -3.5120849609375, -3.406219482421875, -3.30035400390625, -3.194488525390625, -3.088623046875, -2.982757568359375, -2.87689208984375, -2.771026611328125, -2.6651611328125, -2.559295654296875, -2.45343017578125, -2.347564697265625, -2.24169921875, -2.135833740234375, -2.02996826171875, -1.924102783203125, -1.8182373046875, -1.712371826171875, -1.60650634765625, -1.500640869140625, -1.394775390625, -1.288909912109375, -1.18304443359375, -1.077178955078125, -0.9713134765625, -0.865447998046875, -0.75958251953125, -0.653717041015625, -0.5478515625, -0.441986083984375, -0.33612060546875, -0.230255126953125, -0.1243896484375, -0.018524169921875, 0.08734130859375, 0.193206787109375, 0.299072265625, 0.404937744140625, 0.51080322265625, 0.616668701171875, 0.7225341796875, 0.828399658203125, 0.93426513671875, 1.040130615234375, 1.14599609375, 1.251861572265625, 1.35772705078125, 1.463592529296875, 1.5694580078125, 1.675323486328125, 1.78118896484375, 1.887054443359375, 1.992919921875, 2.098785400390625, 2.20465087890625, 2.310516357421875, 2.4163818359375, 2.522247314453125, 2.62811279296875, 2.733978271484375, 2.83984375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 8.0, 7.0, 9.0, 10.0, 8.0, 20.0, 18.0, 26.0, 21.0, 22.0, 34.0, 32.0, 29.0, 33.0, 45.0, 34.0, 57.0, 56.0, 54.0, 32.0, 41.0, 46.0, 38.0, 50.0, 33.0, 23.0, 30.0, 22.0, 29.0, 18.0, 22.0, 15.0, 10.0, 8.0, 12.0, 9.0, 9.0, 10.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.7158203125, -1.6680145263671875, -1.620208740234375, -1.5724029541015625, -1.52459716796875, -1.4767913818359375, -1.428985595703125, -1.3811798095703125, -1.3333740234375, -1.2855682373046875, -1.237762451171875, -1.1899566650390625, -1.14215087890625, -1.0943450927734375, -1.046539306640625, -0.9987335205078125, -0.950927734375, -0.9031219482421875, -0.855316162109375, -0.8075103759765625, -0.75970458984375, -0.7118988037109375, -0.664093017578125, -0.6162872314453125, -0.5684814453125, -0.5206756591796875, -0.472869873046875, -0.4250640869140625, -0.37725830078125, -0.3294525146484375, -0.281646728515625, -0.2338409423828125, -0.18603515625, -0.1382293701171875, -0.090423583984375, -0.0426177978515625, 0.00518798828125, 0.0529937744140625, 0.100799560546875, 0.1486053466796875, 0.1964111328125, 0.2442169189453125, 0.292022705078125, 0.3398284912109375, 0.38763427734375, 0.4354400634765625, 0.483245849609375, 0.5310516357421875, 0.578857421875, 0.6266632080078125, 0.674468994140625, 0.7222747802734375, 0.77008056640625, 0.8178863525390625, 0.865692138671875, 0.9134979248046875, 0.9613037109375, 1.0091094970703125, 1.056915283203125, 1.1047210693359375, 1.15252685546875, 1.2003326416015625, 1.248138427734375, 1.2959442138671875, 1.34375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 9.0, 13.0, 22.0, 17.0, 39.0, 74.0, 132.0, 333.0, 1811.0, 55303.0, 4126606.0, 8398.0, 912.0, 313.0, 113.0, 58.0, 41.0, 24.0, 17.0, 11.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9609375, -12.533203125, -12.10546875, -11.677734375, -11.25, -10.822265625, -10.39453125, -9.966796875, -9.5390625, -9.111328125, -8.68359375, -8.255859375, -7.828125, -7.400390625, -6.97265625, -6.544921875, -6.1171875, -5.689453125, -5.26171875, -4.833984375, -4.40625, -3.978515625, -3.55078125, -3.123046875, -2.6953125, -2.267578125, -1.83984375, -1.412109375, -0.984375, -0.556640625, -0.12890625, 0.298828125, 0.7265625, 1.154296875, 1.58203125, 2.009765625, 2.4375, 2.865234375, 3.29296875, 3.720703125, 4.1484375, 4.576171875, 5.00390625, 5.431640625, 5.859375, 6.287109375, 6.71484375, 7.142578125, 7.5703125, 7.998046875, 8.42578125, 8.853515625, 9.28125, 9.708984375, 10.13671875, 10.564453125, 10.9921875, 11.419921875, 11.84765625, 12.275390625, 12.703125, 13.130859375, 13.55859375, 13.986328125, 14.4140625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 4.0, 4.0, 9.0, 10.0, 24.0, 21.0, 44.0, 79.0, 118.0, 221.0, 658.0, 1295.0, 822.0, 338.0, 165.0, 90.0, 63.0, 32.0, 25.0, 15.0, 10.0, 4.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9208984375, -0.8875885009765625, -0.854278564453125, -0.8209686279296875, -0.78765869140625, -0.7543487548828125, -0.721038818359375, -0.6877288818359375, -0.6544189453125, -0.6211090087890625, -0.587799072265625, -0.5544891357421875, -0.52117919921875, -0.4878692626953125, -0.454559326171875, -0.4212493896484375, -0.387939453125, -0.3546295166015625, -0.321319580078125, -0.2880096435546875, -0.25469970703125, -0.2213897705078125, -0.188079833984375, -0.1547698974609375, -0.1214599609375, -0.0881500244140625, -0.054840087890625, -0.0215301513671875, 0.01177978515625, 0.0450897216796875, 0.078399658203125, 0.1117095947265625, 0.14501953125, 0.1783294677734375, 0.211639404296875, 0.2449493408203125, 0.27825927734375, 0.3115692138671875, 0.344879150390625, 0.3781890869140625, 0.4114990234375, 0.4448089599609375, 0.478118896484375, 0.5114288330078125, 0.54473876953125, 0.5780487060546875, 0.611358642578125, 0.6446685791015625, 0.677978515625, 0.7112884521484375, 0.744598388671875, 0.7779083251953125, 0.81121826171875, 0.8445281982421875, 0.877838134765625, 0.9111480712890625, 0.9444580078125, 0.9777679443359375, 1.011077880859375, 1.0443878173828125, 1.07769775390625, 1.1110076904296875, 1.144317626953125, 1.1776275634765625, 1.2109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 4.0, 7.0, 11.0, 17.0, 15.0, 18.0, 14.0, 20.0, 32.0, 35.0, 61.0, 62.0, 76.0, 86.0, 81.0, 95.0, 81.0, 64.0, 50.0, 33.0, 34.0, 23.0, 23.0, 12.0, 14.0, 11.0, 7.0, 10.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.188549280166626, -2.1190285682678223, -2.0495080947875977, -1.979987382888794, -1.9104666709899902, -1.840946078300476, -1.771425485610962, -1.7019047737121582, -1.632384181022644, -1.5628635883331299, -1.4933428764343262, -1.423822283744812, -1.3543016910552979, -1.2847809791564941, -1.21526038646698, -1.1457397937774658, -1.076219081878662, -1.006698489189148, -0.9371777772903442, -0.8676571846008301, -0.7981365323066711, -0.7286158800125122, -0.659095287322998, -0.5895746350288391, -0.5200539827346802, -0.45053333044052124, -0.3810127079486847, -0.31149208545684814, -0.2419714331626892, -0.17245078086853027, -0.10293015837669373, -0.03340953588485718, 0.03611111640930176, 0.1056317538022995, 0.17515239119529724, 0.24467302858829498, 0.3141936659812927, 0.38371431827545166, 0.4532349407672882, 0.5227555632591248, 0.5922762155532837, 0.6617968678474426, 0.7313175201416016, 0.8008381128311157, 0.8703587651252747, 0.9398794174194336, 1.0094000101089478, 1.078920602798462, 1.1484413146972656, 1.2179619073867798, 1.2874826192855835, 1.3570032119750977, 1.4265239238739014, 1.4960445165634155, 1.5655651092529297, 1.6350858211517334, 1.7046064138412476, 1.7741270065307617, 1.8436477184295654, 1.9131683111190796, 1.9826889038085938, 2.0522096157073975, 2.121730327606201, 2.191250801086426, 2.2607715129852295]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 8.0, 5.0, 14.0, 12.0, 11.0, 14.0, 19.0, 16.0, 28.0, 35.0, 36.0, 40.0, 39.0, 38.0, 44.0, 50.0, 42.0, 38.0, 56.0, 36.0, 38.0, 51.0, 35.0, 32.0, 40.0, 25.0, 32.0, 25.0, 25.0, 22.0, 16.0, 18.0, 9.0, 15.0, 8.0, 8.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.7684389352798462, -1.720792293548584, -1.6731456518173218, -1.6254990100860596, -1.5778523683547974, -1.5302057266235352, -1.482559084892273, -1.4349124431610107, -1.3872658014297485, -1.3396191596984863, -1.2919725179672241, -1.244325876235962, -1.1966792345046997, -1.1490325927734375, -1.1013859510421753, -1.053739309310913, -1.0060926675796509, -0.9584460258483887, -0.9107993841171265, -0.8631527423858643, -0.815506100654602, -0.7678594589233398, -0.7202128171920776, -0.6725661754608154, -0.6249195337295532, -0.577272891998291, -0.5296262502670288, -0.4819796085357666, -0.4343329668045044, -0.3866863250732422, -0.33903968334198, -0.2913930416107178, -0.24374651908874512, -0.1960998773574829, -0.1484532356262207, -0.1008065938949585, -0.05315995216369629, -0.005513310432434082, 0.042133331298828125, 0.08977997303009033, 0.13742661476135254, 0.18507325649261475, 0.23271989822387695, 0.28036653995513916, 0.32801318168640137, 0.3756598234176636, 0.4233064651489258, 0.470953106880188, 0.5185997486114502, 0.5662463903427124, 0.6138930320739746, 0.6615396738052368, 0.709186315536499, 0.7568329572677612, 0.8044795989990234, 0.8521262407302856, 0.8997728824615479, 0.9474195241928101, 0.9950661659240723, 1.0427128076553345, 1.0903594493865967, 1.1380060911178589, 1.185652732849121, 1.2332993745803833, 1.2809460163116455]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 5.0, 6.0, 12.0, 14.0, 30.0, 32.0, 40.0, 67.0, 108.0, 162.0, 249.0, 372.0, 607.0, 898.0, 1588.0, 2695.0, 5145.0, 9935.0, 21051.0, 46848.0, 108909.0, 254478.0, 324257.0, 151142.0, 64048.0, 27879.0, 13056.0, 6534.0, 3393.0, 1934.0, 1120.0, 672.0, 438.0, 292.0, 169.0, 120.0, 70.0, 46.0, 38.0, 32.0, 26.0, 17.0, 9.0, 4.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.755859375, -0.7308197021484375, -0.705780029296875, -0.6807403564453125, -0.65570068359375, -0.6306610107421875, -0.605621337890625, -0.5805816650390625, -0.5555419921875, -0.5305023193359375, -0.505462646484375, -0.4804229736328125, -0.45538330078125, -0.4303436279296875, -0.405303955078125, -0.3802642822265625, -0.355224609375, -0.3301849365234375, -0.305145263671875, -0.2801055908203125, -0.25506591796875, -0.2300262451171875, -0.204986572265625, -0.1799468994140625, -0.1549072265625, -0.1298675537109375, -0.104827880859375, -0.0797882080078125, -0.05474853515625, -0.0297088623046875, -0.004669189453125, 0.0203704833984375, 0.04541015625, 0.0704498291015625, 0.095489501953125, 0.1205291748046875, 0.14556884765625, 0.1706085205078125, 0.195648193359375, 0.2206878662109375, 0.2457275390625, 0.2707672119140625, 0.295806884765625, 0.3208465576171875, 0.34588623046875, 0.3709259033203125, 0.395965576171875, 0.4210052490234375, 0.446044921875, 0.4710845947265625, 0.496124267578125, 0.5211639404296875, 0.54620361328125, 0.5712432861328125, 0.596282958984375, 0.6213226318359375, 0.6463623046875, 0.6714019775390625, 0.696441650390625, 0.7214813232421875, 0.74652099609375, 0.7715606689453125, 0.796600341796875, 0.8216400146484375, 0.8466796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 7.0, 10.0, 10.0, 23.0, 10.0, 16.0, 19.0, 30.0, 30.0, 38.0, 42.0, 45.0, 43.0, 32.0, 37.0, 54.0, 42.0, 37.0, 43.0, 49.0, 38.0, 43.0, 39.0, 39.0, 27.0, 31.0, 26.0, 19.0, 21.0, 17.0, 9.0, 12.0, 9.0, 12.0, 12.0, 7.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.998291015625, -0.96826171875, -0.938232421875, -0.908203125, -0.878173828125, -0.84814453125, -0.818115234375, -0.7880859375, -0.758056640625, -0.72802734375, -0.697998046875, -0.66796875, -0.637939453125, -0.60791015625, -0.577880859375, -0.5478515625, -0.517822265625, -0.48779296875, -0.457763671875, -0.427734375, -0.397705078125, -0.36767578125, -0.337646484375, -0.3076171875, -0.277587890625, -0.24755859375, -0.217529296875, -0.1875, -0.157470703125, -0.12744140625, -0.097412109375, -0.0673828125, -0.037353515625, -0.00732421875, 0.022705078125, 0.052734375, 0.082763671875, 0.11279296875, 0.142822265625, 0.1728515625, 0.202880859375, 0.23291015625, 0.262939453125, 0.29296875, 0.322998046875, 0.35302734375, 0.383056640625, 0.4130859375, 0.443115234375, 0.47314453125, 0.503173828125, 0.533203125, 0.563232421875, 0.59326171875, 0.623291015625, 0.6533203125, 0.683349609375, 0.71337890625, 0.743408203125, 0.7734375, 0.803466796875, 0.83349609375, 0.863525390625, 0.8935546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 7.0, 13.0, 17.0, 28.0, 52.0, 85.0, 107.0, 175.0, 312.0, 434.0, 930.0, 1738.0, 3460.0, 8021.0, 20772.0, 64294.0, 239131.0, 472048.0, 163144.0, 45991.0, 15690.0, 6183.0, 2696.0, 1385.0, 761.0, 396.0, 246.0, 149.0, 87.0, 65.0, 33.0, 31.0, 19.0, 15.0, 8.0, 10.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8739700317382812, -0.8431549072265625, -0.8123397827148438, -0.781524658203125, -0.7507095336914062, -0.7198944091796875, -0.6890792846679688, -0.65826416015625, -0.6274490356445312, -0.5966339111328125, -0.5658187866210938, -0.535003662109375, -0.5041885375976562, -0.4733734130859375, -0.44255828857421875, -0.4117431640625, -0.38092803955078125, -0.3501129150390625, -0.31929779052734375, -0.288482666015625, -0.25766754150390625, -0.2268524169921875, -0.19603729248046875, -0.16522216796875, -0.13440704345703125, -0.1035919189453125, -0.07277679443359375, -0.041961669921875, -0.01114654541015625, 0.0196685791015625, 0.05048370361328125, 0.081298828125, 0.11211395263671875, 0.1429290771484375, 0.17374420166015625, 0.204559326171875, 0.23537445068359375, 0.2661895751953125, 0.29700469970703125, 0.32781982421875, 0.35863494873046875, 0.3894500732421875, 0.42026519775390625, 0.451080322265625, 0.48189544677734375, 0.5127105712890625, 0.5435256958007812, 0.5743408203125, 0.6051559448242188, 0.6359710693359375, 0.6667861938476562, 0.697601318359375, 0.7284164428710938, 0.7592315673828125, 0.7900466918945312, 0.82086181640625, 0.8516769409179688, 0.8824920654296875, 0.9133071899414062, 0.944122314453125, 0.9749374389648438, 1.0057525634765625, 1.0365676879882812, 1.0673828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 10.0, 16.0, 15.0, 13.0, 10.0, 22.0, 20.0, 16.0, 32.0, 44.0, 43.0, 35.0, 49.0, 47.0, 51.0, 32.0, 48.0, 46.0, 51.0, 33.0, 51.0, 42.0, 29.0, 29.0, 25.0, 22.0, 16.0, 18.0, 19.0, 11.0, 9.0, 11.0, 14.0, 6.0, 8.0, 7.0, 4.0, 3.0, 8.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.9306640625, -1.8682098388671875, -1.805755615234375, -1.7433013916015625, -1.68084716796875, -1.6183929443359375, -1.555938720703125, -1.4934844970703125, -1.4310302734375, -1.3685760498046875, -1.306121826171875, -1.2436676025390625, -1.18121337890625, -1.1187591552734375, -1.056304931640625, -0.9938507080078125, -0.931396484375, -0.8689422607421875, -0.806488037109375, -0.7440338134765625, -0.68157958984375, -0.6191253662109375, -0.556671142578125, -0.4942169189453125, -0.4317626953125, -0.3693084716796875, -0.306854248046875, -0.2444000244140625, -0.18194580078125, -0.1194915771484375, -0.057037353515625, 0.0054168701171875, 0.06787109375, 0.1303253173828125, 0.192779541015625, 0.2552337646484375, 0.31768798828125, 0.3801422119140625, 0.442596435546875, 0.5050506591796875, 0.5675048828125, 0.6299591064453125, 0.692413330078125, 0.7548675537109375, 0.81732177734375, 0.8797760009765625, 0.942230224609375, 1.0046844482421875, 1.067138671875, 1.1295928955078125, 1.192047119140625, 1.2545013427734375, 1.31695556640625, 1.3794097900390625, 1.441864013671875, 1.5043182373046875, 1.5667724609375, 1.6292266845703125, 1.691680908203125, 1.7541351318359375, 1.81658935546875, 1.8790435791015625, 1.941497802734375, 2.0039520263671875, 2.06640625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 12.0, 15.0, 35.0, 54.0, 45.0, 76.0, 145.0, 205.0, 311.0, 530.0, 876.0, 1483.0, 2792.0, 5473.0, 12108.0, 30805.0, 131137.0, 624842.0, 174003.0, 36964.0, 13422.0, 6118.0, 2921.0, 1680.0, 1002.0, 531.0, 346.0, 207.0, 121.0, 92.0, 54.0, 37.0, 25.0, 25.0, 12.0, 12.0, 10.0, 3.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2384033203125, -0.23130226135253906, -0.22420120239257812, -0.2171001434326172, -0.20999908447265625, -0.2028980255126953, -0.19579696655273438, -0.18869590759277344, -0.1815948486328125, -0.17449378967285156, -0.16739273071289062, -0.1602916717529297, -0.15319061279296875, -0.1460895538330078, -0.13898849487304688, -0.13188743591308594, -0.124786376953125, -0.11768531799316406, -0.11058425903320312, -0.10348320007324219, -0.09638214111328125, -0.08928108215332031, -0.08218002319335938, -0.07507896423339844, -0.0679779052734375, -0.06087684631347656, -0.053775787353515625, -0.04667472839355469, -0.03957366943359375, -0.03247261047363281, -0.025371551513671875, -0.018270492553710938, -0.01116943359375, -0.0040683746337890625, 0.003032684326171875, 0.010133743286132812, 0.01723480224609375, 0.024335861206054688, 0.031436920166015625, 0.03853797912597656, 0.0456390380859375, 0.05274009704589844, 0.059841156005859375, 0.06694221496582031, 0.07404327392578125, 0.08114433288574219, 0.08824539184570312, 0.09534645080566406, 0.102447509765625, 0.10954856872558594, 0.11664962768554688, 0.12375068664550781, 0.13085174560546875, 0.1379528045654297, 0.14505386352539062, 0.15215492248535156, 0.1592559814453125, 0.16635704040527344, 0.17345809936523438, 0.1805591583251953, 0.18766021728515625, 0.1947612762451172, 0.20186233520507812, 0.20896339416503906, 0.216064453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 6.0, 10.0, 18.0, 15.0, 39.0, 41.0, 103.0, 150.0, 203.0, 140.0, 85.0, 47.0, 30.0, 23.0, 21.0, 9.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020241737365722656, -0.0001963600516319275, -0.00019030272960662842, -0.00018424540758132935, -0.00017818808555603027, -0.0001721307635307312, -0.00016607344150543213, -0.00016001611948013306, -0.00015395879745483398, -0.0001479014754295349, -0.00014184415340423584, -0.00013578683137893677, -0.0001297295093536377, -0.00012367218732833862, -0.00011761486530303955, -0.00011155754327774048, -0.0001055002212524414, -9.944289922714233e-05, -9.338557720184326e-05, -8.732825517654419e-05, -8.127093315124512e-05, -7.521361112594604e-05, -6.915628910064697e-05, -6.30989670753479e-05, -5.704164505004883e-05, -5.0984323024749756e-05, -4.4927000999450684e-05, -3.886967897415161e-05, -3.281235694885254e-05, -2.6755034923553467e-05, -2.0697712898254395e-05, -1.4640390872955322e-05, -8.58306884765625e-06, -2.5257468223571777e-06, 3.5315752029418945e-06, 9.588897228240967e-06, 1.564621925354004e-05, 2.170354127883911e-05, 2.7760863304138184e-05, 3.3818185329437256e-05, 3.987550735473633e-05, 4.59328293800354e-05, 5.199015140533447e-05, 5.8047473430633545e-05, 6.410479545593262e-05, 7.016211748123169e-05, 7.621943950653076e-05, 8.227676153182983e-05, 8.83340835571289e-05, 9.439140558242798e-05, 0.00010044872760772705, 0.00010650604963302612, 0.0001125633716583252, 0.00011862069368362427, 0.00012467801570892334, 0.0001307353377342224, 0.00013679265975952148, 0.00014284998178482056, 0.00014890730381011963, 0.0001549646258354187, 0.00016102194786071777, 0.00016707926988601685, 0.00017313659191131592, 0.000179193913936615, 0.00018525123596191406]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 2.0, 4.0, 5.0, 3.0, 13.0, 14.0, 24.0, 28.0, 41.0, 96.0, 135.0, 308.0, 653.0, 1396.0, 3181.0, 8031.0, 24139.0, 112015.0, 642628.0, 202067.0, 35427.0, 10828.0, 4172.0, 1705.0, 808.0, 386.0, 180.0, 86.0, 48.0, 37.0, 25.0, 12.0, 15.0, 6.0, 10.0, 1.0, 3.0, 3.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.287109375, -0.2785758972167969, -0.27004241943359375, -0.2615089416503906, -0.2529754638671875, -0.24444198608398438, -0.23590850830078125, -0.22737503051757812, -0.218841552734375, -0.21030807495117188, -0.20177459716796875, -0.19324111938476562, -0.1847076416015625, -0.17617416381835938, -0.16764068603515625, -0.15910720825195312, -0.15057373046875, -0.14204025268554688, -0.13350677490234375, -0.12497329711914062, -0.1164398193359375, -0.10790634155273438, -0.09937286376953125, -0.09083938598632812, -0.082305908203125, -0.07377243041992188, -0.06523895263671875, -0.056705474853515625, -0.0481719970703125, -0.039638519287109375, -0.03110504150390625, -0.022571563720703125, -0.0140380859375, -0.005504608154296875, 0.00302886962890625, 0.011562347412109375, 0.0200958251953125, 0.028629302978515625, 0.03716278076171875, 0.045696258544921875, 0.054229736328125, 0.06276321411132812, 0.07129669189453125, 0.07983016967773438, 0.0883636474609375, 0.09689712524414062, 0.10543060302734375, 0.11396408081054688, 0.12249755859375, 0.13103103637695312, 0.13956451416015625, 0.14809799194335938, 0.1566314697265625, 0.16516494750976562, 0.17369842529296875, 0.18223190307617188, 0.190765380859375, 0.19929885864257812, 0.20783233642578125, 0.21636581420898438, 0.2248992919921875, 0.23343276977539062, 0.24196624755859375, 0.2504997253417969, 0.259033203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 10.0, 8.0, 15.0, 15.0, 18.0, 27.0, 44.0, 43.0, 61.0, 75.0, 82.0, 101.0, 95.0, 86.0, 59.0, 53.0, 30.0, 36.0, 27.0, 23.0, 7.0, 10.0, 13.0, 7.0, 4.0, 5.0, 6.0, 3.0, 2.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0701904296875, -0.0681161880493164, -0.06604194641113281, -0.06396770477294922, -0.061893463134765625, -0.05981922149658203, -0.05774497985839844, -0.055670738220214844, -0.05359649658203125, -0.051522254943847656, -0.04944801330566406, -0.04737377166748047, -0.045299530029296875, -0.04322528839111328, -0.04115104675292969, -0.039076805114746094, -0.0370025634765625, -0.034928321838378906, -0.03285408020019531, -0.03077983856201172, -0.028705596923828125, -0.02663135528564453, -0.024557113647460938, -0.022482872009277344, -0.02040863037109375, -0.018334388732910156, -0.016260147094726562, -0.014185905456542969, -0.012111663818359375, -0.010037422180175781, -0.007963180541992188, -0.005888938903808594, -0.003814697265625, -0.0017404556274414062, 0.0003337860107421875, 0.0024080276489257812, 0.004482269287109375, 0.006556510925292969, 0.008630752563476562, 0.010704994201660156, 0.01277923583984375, 0.014853477478027344, 0.016927719116210938, 0.01900196075439453, 0.021076202392578125, 0.02315044403076172, 0.025224685668945312, 0.027298927307128906, 0.0293731689453125, 0.031447410583496094, 0.03352165222167969, 0.03559589385986328, 0.037670135498046875, 0.03974437713623047, 0.04181861877441406, 0.043892860412597656, 0.04596710205078125, 0.048041343688964844, 0.05011558532714844, 0.05218982696533203, 0.054264068603515625, 0.05633831024169922, 0.05841255187988281, 0.060486793518066406, 0.06256103515625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 7.0, 13.0, 33.0, 42.0, 62.0, 98.0, 145.0, 196.0, 152.0, 105.0, 47.0, 40.0, 29.0, 10.0, 7.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.620237350463867, -2.541998863220215, -2.4637603759765625, -2.385521650314331, -2.3072831630706787, -2.2290446758270264, -2.150806188583374, -2.0725677013397217, -1.9943290948867798, -1.9160906076431274, -1.8378520011901855, -1.7596135139465332, -1.6813750267028809, -1.603136420249939, -1.5248979330062866, -1.4466593265533447, -1.3684208393096924, -1.29018235206604, -1.2119437456130981, -1.1337052583694458, -1.055466651916504, -0.9772281646728516, -0.8989896774291992, -0.8207511305809021, -0.742512583732605, -0.6642740368843079, -0.5860354900360107, -0.5077970027923584, -0.4295584559440613, -0.35131990909576416, -0.27308139204978943, -0.1948428750038147, -0.11660432815551758, -0.03836579620838165, 0.03987273573875427, 0.1181112676858902, 0.19634979963302612, 0.27458834648132324, 0.352826863527298, 0.4310653805732727, 0.5093039274215698, 0.5875424742698669, 0.6657810211181641, 0.7440195083618164, 0.8222580552101135, 0.9004966020584106, 0.978735089302063, 1.0569736957550049, 1.1352121829986572, 1.2134506702423096, 1.2916892766952515, 1.3699277639389038, 1.4481663703918457, 1.526404857635498, 1.6046433448791504, 1.6828818321228027, 1.7611204385757446, 1.839358925819397, 1.9175975322723389, 1.9958360195159912, 2.0740745067596436, 2.152313232421875, 2.2305517196655273, 2.3087902069091797, 2.387028694152832]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 8.0, 3.0, 7.0, 12.0, 21.0, 21.0, 18.0, 17.0, 27.0, 28.0, 34.0, 37.0, 38.0, 35.0, 38.0, 47.0, 43.0, 41.0, 41.0, 27.0, 46.0, 40.0, 49.0, 34.0, 33.0, 30.0, 30.0, 31.0, 27.0, 21.0, 20.0, 9.0, 7.0, 20.0, 10.0, 14.0, 6.0, 5.0, 3.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.9393354058265686, -0.9121330976486206, -0.8849307894706726, -0.8577284812927246, -0.8305262327194214, -0.8033239245414734, -0.7761216163635254, -0.7489193081855774, -0.7217170000076294, -0.6945146918296814, -0.6673123836517334, -0.6401101350784302, -0.6129078269004822, -0.5857055187225342, -0.5585032105445862, -0.5313009023666382, -0.504098653793335, -0.47689634561538696, -0.44969406723976135, -0.42249175906181335, -0.39528948068618774, -0.36808717250823975, -0.34088486433029175, -0.31368255615234375, -0.28648027777671814, -0.25927796959877014, -0.23207569122314453, -0.20487338304519653, -0.17767108976840973, -0.15046879649162292, -0.12326648831367493, -0.09606419503688812, -0.06886190176010132, -0.041659604758024216, -0.014457307755947113, 0.012744992971420288, 0.03994728624820709, 0.0671495795249939, 0.0943518877029419, 0.1215541809797287, 0.1487564742565155, 0.1759587675333023, 0.2031610608100891, 0.2303633689880371, 0.2575656771659851, 0.2847679555416107, 0.3119702637195587, 0.3391725420951843, 0.3663748502731323, 0.3935771584510803, 0.42077943682670593, 0.44798174500465393, 0.47518402338027954, 0.5023863315582275, 0.5295886397361755, 0.5567909479141235, 0.5839931964874268, 0.6111955046653748, 0.6383978128433228, 0.665600061416626, 0.692802369594574, 0.720004677772522, 0.74720698595047, 0.774409294128418, 0.801611602306366]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 7.0, 16.0, 12.0, 33.0, 37.0, 41.0, 50.0, 69.0, 115.0, 182.0, 279.0, 471.0, 820.0, 1381.0, 2596.0, 5119.0, 10773.0, 24766.0, 60498.0, 157344.0, 343180.0, 261970.0, 104436.0, 40859.0, 17267.0, 7853.0, 3695.0, 1915.0, 1006.0, 600.0, 358.0, 242.0, 179.0, 122.0, 76.0, 58.0, 33.0, 22.0, 21.0, 14.0, 8.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37939453125, -0.3674583435058594, -0.35552215576171875, -0.3435859680175781, -0.3316497802734375, -0.3197135925292969, -0.30777740478515625, -0.2958412170410156, -0.283905029296875, -0.2719688415527344, -0.26003265380859375, -0.24809646606445312, -0.2361602783203125, -0.22422409057617188, -0.21228790283203125, -0.20035171508789062, -0.18841552734375, -0.17647933959960938, -0.16454315185546875, -0.15260696411132812, -0.1406707763671875, -0.12873458862304688, -0.11679840087890625, -0.10486221313476562, -0.092926025390625, -0.08098983764648438, -0.06905364990234375, -0.057117462158203125, -0.0451812744140625, -0.033245086669921875, -0.02130889892578125, -0.009372711181640625, 0.0025634765625, 0.014499664306640625, 0.02643585205078125, 0.038372039794921875, 0.0503082275390625, 0.062244415283203125, 0.07418060302734375, 0.08611679077148438, 0.098052978515625, 0.10998916625976562, 0.12192535400390625, 0.13386154174804688, 0.1457977294921875, 0.15773391723632812, 0.16967010498046875, 0.18160629272460938, 0.19354248046875, 0.20547866821289062, 0.21741485595703125, 0.22935104370117188, 0.2412872314453125, 0.2532234191894531, 0.26515960693359375, 0.2770957946777344, 0.289031982421875, 0.3009681701660156, 0.31290435791015625, 0.3248405456542969, 0.3367767333984375, 0.3487129211425781, 0.36064910888671875, 0.3725852966308594, 0.384521484375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 11.0, 12.0, 11.0, 20.0, 15.0, 14.0, 23.0, 19.0, 30.0, 37.0, 36.0, 36.0, 40.0, 29.0, 44.0, 36.0, 39.0, 54.0, 48.0, 47.0, 31.0, 45.0, 42.0, 37.0, 37.0, 29.0, 31.0, 19.0, 16.0, 16.0, 14.0, 11.0, 13.0, 6.0, 8.0, 5.0, 4.0, 6.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.45703125, -5.3033447265625, -5.149658203125, -4.9959716796875, -4.84228515625, -4.6885986328125, -4.534912109375, -4.3812255859375, -4.2275390625, -4.0738525390625, -3.920166015625, -3.7664794921875, -3.61279296875, -3.4591064453125, -3.305419921875, -3.1517333984375, -2.998046875, -2.8443603515625, -2.690673828125, -2.5369873046875, -2.38330078125, -2.2296142578125, -2.075927734375, -1.9222412109375, -1.7685546875, -1.6148681640625, -1.461181640625, -1.3074951171875, -1.15380859375, -1.0001220703125, -0.846435546875, -0.6927490234375, -0.5390625, -0.3853759765625, -0.231689453125, -0.0780029296875, 0.07568359375, 0.2293701171875, 0.383056640625, 0.5367431640625, 0.6904296875, 0.8441162109375, 0.997802734375, 1.1514892578125, 1.30517578125, 1.4588623046875, 1.612548828125, 1.7662353515625, 1.919921875, 2.0736083984375, 2.227294921875, 2.3809814453125, 2.53466796875, 2.6883544921875, 2.842041015625, 2.9957275390625, 3.1494140625, 3.3031005859375, 3.456787109375, 3.6104736328125, 3.76416015625, 3.9178466796875, 4.071533203125, 4.2252197265625, 4.37890625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 10.0, 6.0, 9.0, 22.0, 13.0, 21.0, 29.0, 31.0, 41.0, 52.0, 58.0, 85.0, 124.0, 210.0, 385.0, 1213.0, 10878.0, 1012088.0, 20779.0, 1371.0, 450.0, 189.0, 108.0, 70.0, 62.0, 47.0, 42.0, 37.0, 22.0, 15.0, 14.0, 12.0, 11.0, 9.0, 10.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.157867431640625, -3.06378173828125, -2.969696044921875, -2.8756103515625, -2.781524658203125, -2.68743896484375, -2.593353271484375, -2.499267578125, -2.405181884765625, -2.31109619140625, -2.217010498046875, -2.1229248046875, -2.028839111328125, -1.93475341796875, -1.840667724609375, -1.74658203125, -1.652496337890625, -1.55841064453125, -1.464324951171875, -1.3702392578125, -1.276153564453125, -1.18206787109375, -1.087982177734375, -0.993896484375, -0.899810791015625, -0.80572509765625, -0.711639404296875, -0.6175537109375, -0.523468017578125, -0.42938232421875, -0.335296630859375, -0.2412109375, -0.147125244140625, -0.05303955078125, 0.041046142578125, 0.1351318359375, 0.229217529296875, 0.32330322265625, 0.417388916015625, 0.511474609375, 0.605560302734375, 0.69964599609375, 0.793731689453125, 0.8878173828125, 0.981903076171875, 1.07598876953125, 1.170074462890625, 1.26416015625, 1.358245849609375, 1.45233154296875, 1.546417236328125, 1.6405029296875, 1.734588623046875, 1.82867431640625, 1.922760009765625, 2.016845703125, 2.110931396484375, 2.20501708984375, 2.299102783203125, 2.3931884765625, 2.487274169921875, 2.58135986328125, 2.675445556640625, 2.76953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 3.0, 11.0, 5.0, 7.0, 20.0, 11.0, 18.0, 25.0, 26.0, 34.0, 34.0, 35.0, 33.0, 52.0, 40.0, 36.0, 46.0, 51.0, 51.0, 49.0, 43.0, 35.0, 34.0, 35.0, 35.0, 34.0, 24.0, 31.0, 29.0, 16.0, 16.0, 13.0, 10.0, 11.0, 10.0, 12.0, 5.0, 2.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.99945068359375, -4.8504638671875, -4.70147705078125, -4.552490234375, -4.40350341796875, -4.2545166015625, -4.10552978515625, -3.95654296875, -3.80755615234375, -3.6585693359375, -3.50958251953125, -3.360595703125, -3.21160888671875, -3.0626220703125, -2.91363525390625, -2.7646484375, -2.61566162109375, -2.4666748046875, -2.31768798828125, -2.168701171875, -2.01971435546875, -1.8707275390625, -1.72174072265625, -1.57275390625, -1.42376708984375, -1.2747802734375, -1.12579345703125, -0.976806640625, -0.82781982421875, -0.6788330078125, -0.52984619140625, -0.380859375, -0.23187255859375, -0.0828857421875, 0.06610107421875, 0.215087890625, 0.36407470703125, 0.5130615234375, 0.66204833984375, 0.81103515625, 0.96002197265625, 1.1090087890625, 1.25799560546875, 1.406982421875, 1.55596923828125, 1.7049560546875, 1.85394287109375, 2.0029296875, 2.15191650390625, 2.3009033203125, 2.44989013671875, 2.598876953125, 2.74786376953125, 2.8968505859375, 3.04583740234375, 3.19482421875, 3.34381103515625, 3.4927978515625, 3.64178466796875, 3.790771484375, 3.93975830078125, 4.0887451171875, 4.23773193359375, 4.38671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 8.0, 13.0, 9.0, 17.0, 14.0, 33.0, 31.0, 56.0, 62.0, 98.0, 164.0, 239.0, 396.0, 774.0, 1334.0, 2655.0, 5988.0, 16645.0, 92354.0, 818880.0, 81647.0, 15690.0, 5710.0, 2542.0, 1323.0, 694.0, 411.0, 244.0, 146.0, 118.0, 74.0, 46.0, 37.0, 26.0, 15.0, 16.0, 10.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.14990234375, -0.1451396942138672, -0.14037704467773438, -0.13561439514160156, -0.13085174560546875, -0.12608909606933594, -0.12132644653320312, -0.11656379699707031, -0.1118011474609375, -0.10703849792480469, -0.10227584838867188, -0.09751319885253906, -0.09275054931640625, -0.08798789978027344, -0.08322525024414062, -0.07846260070800781, -0.073699951171875, -0.06893730163574219, -0.06417465209960938, -0.05941200256347656, -0.05464935302734375, -0.04988670349121094, -0.045124053955078125, -0.04036140441894531, -0.0355987548828125, -0.030836105346679688, -0.026073455810546875, -0.021310806274414062, -0.01654815673828125, -0.011785507202148438, -0.007022857666015625, -0.0022602081298828125, 0.00250244140625, 0.0072650909423828125, 0.012027740478515625, 0.016790390014648438, 0.02155303955078125, 0.026315689086914062, 0.031078338623046875, 0.03584098815917969, 0.0406036376953125, 0.04536628723144531, 0.050128936767578125, 0.05489158630371094, 0.05965423583984375, 0.06441688537597656, 0.06917953491210938, 0.07394218444824219, 0.078704833984375, 0.08346748352050781, 0.08823013305664062, 0.09299278259277344, 0.09775543212890625, 0.10251808166503906, 0.10728073120117188, 0.11204338073730469, 0.1168060302734375, 0.12156867980957031, 0.12633132934570312, 0.13109397888183594, 0.13585662841796875, 0.14061927795410156, 0.14538192749023438, 0.1501445770263672, 0.1549072265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 4.0, 6.0, 7.0, 12.0, 29.0, 115.0, 453.0, 266.0, 61.0, 21.0, 11.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.128715515136719e-05, -6.92959874868393e-05, -6.73048198223114e-05, -6.531365215778351e-05, -6.332248449325562e-05, -6.133131682872772e-05, -5.934014916419983e-05, -5.7348981499671936e-05, -5.535781383514404e-05, -5.336664617061615e-05, -5.137547850608826e-05, -4.9384310841560364e-05, -4.739314317703247e-05, -4.540197551250458e-05, -4.3410807847976685e-05, -4.141964018344879e-05, -3.94284725189209e-05, -3.7437304854393005e-05, -3.544613718986511e-05, -3.345496952533722e-05, -3.1463801860809326e-05, -2.9472634196281433e-05, -2.748146653175354e-05, -2.5490298867225647e-05, -2.3499131202697754e-05, -2.150796353816986e-05, -1.9516795873641968e-05, -1.7525628209114075e-05, -1.553446054458618e-05, -1.3543292880058289e-05, -1.1552125215530396e-05, -9.560957551002502e-06, -7.569789886474609e-06, -5.578622221946716e-06, -3.5874545574188232e-06, -1.5962868928909302e-06, 3.948807716369629e-07, 2.386048436164856e-06, 4.377216100692749e-06, 6.368383765220642e-06, 8.359551429748535e-06, 1.0350719094276428e-05, 1.2341886758804321e-05, 1.4333054423332214e-05, 1.6324222087860107e-05, 1.8315389752388e-05, 2.0306557416915894e-05, 2.2297725081443787e-05, 2.428889274597168e-05, 2.6280060410499573e-05, 2.8271228075027466e-05, 3.026239573955536e-05, 3.225356340408325e-05, 3.4244731068611145e-05, 3.623589873313904e-05, 3.822706639766693e-05, 4.0218234062194824e-05, 4.220940172672272e-05, 4.420056939125061e-05, 4.6191737055778503e-05, 4.8182904720306396e-05, 5.017407238483429e-05, 5.216524004936218e-05, 5.4156407713890076e-05, 5.614757537841797e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 8.0, 5.0, 10.0, 10.0, 31.0, 40.0, 55.0, 91.0, 161.0, 300.0, 612.0, 1469.0, 4791.0, 21665.0, 666509.0, 329105.0, 17157.0, 3995.0, 1339.0, 558.0, 259.0, 163.0, 84.0, 52.0, 27.0, 20.0, 17.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1826171875, -0.17557525634765625, -0.1685333251953125, -0.16149139404296875, -0.154449462890625, -0.14740753173828125, -0.1403656005859375, -0.13332366943359375, -0.12628173828125, -0.11923980712890625, -0.1121978759765625, -0.10515594482421875, -0.098114013671875, -0.09107208251953125, -0.0840301513671875, -0.07698822021484375, -0.0699462890625, -0.06290435791015625, -0.0558624267578125, -0.04882049560546875, -0.041778564453125, -0.03473663330078125, -0.0276947021484375, -0.02065277099609375, -0.01361083984375, -0.00656890869140625, 0.0004730224609375, 0.00751495361328125, 0.014556884765625, 0.02159881591796875, 0.0286407470703125, 0.03568267822265625, 0.042724609375, 0.04976654052734375, 0.0568084716796875, 0.06385040283203125, 0.070892333984375, 0.07793426513671875, 0.0849761962890625, 0.09201812744140625, 0.09906005859375, 0.10610198974609375, 0.1131439208984375, 0.12018585205078125, 0.127227783203125, 0.13426971435546875, 0.1413116455078125, 0.14835357666015625, 0.1553955078125, 0.16243743896484375, 0.1694793701171875, 0.17652130126953125, 0.183563232421875, 0.19060516357421875, 0.1976470947265625, 0.20468902587890625, 0.21173095703125, 0.21877288818359375, 0.2258148193359375, 0.23285675048828125, 0.239898681640625, 0.24694061279296875, 0.2539825439453125, 0.26102447509765625, 0.26806640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 5.0, 6.0, 9.0, 15.0, 29.0, 43.0, 90.0, 198.0, 237.0, 145.0, 87.0, 43.0, 29.0, 23.0, 13.0, 6.0, 6.0, 4.0, 5.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1058349609375, -0.10308170318603516, -0.10032844543457031, -0.09757518768310547, -0.09482192993164062, -0.09206867218017578, -0.08931541442871094, -0.0865621566772461, -0.08380889892578125, -0.0810556411743164, -0.07830238342285156, -0.07554912567138672, -0.07279586791992188, -0.07004261016845703, -0.06728935241699219, -0.06453609466552734, -0.0617828369140625, -0.059029579162597656, -0.05627632141113281, -0.05352306365966797, -0.050769805908203125, -0.04801654815673828, -0.04526329040527344, -0.042510032653808594, -0.03975677490234375, -0.037003517150878906, -0.03425025939941406, -0.03149700164794922, -0.028743743896484375, -0.02599048614501953, -0.023237228393554688, -0.020483970642089844, -0.017730712890625, -0.014977455139160156, -0.012224197387695312, -0.009470939636230469, -0.006717681884765625, -0.003964424133300781, -0.0012111663818359375, 0.0015420913696289062, 0.00429534912109375, 0.007048606872558594, 0.009801864624023438, 0.012555122375488281, 0.015308380126953125, 0.01806163787841797, 0.020814895629882812, 0.023568153381347656, 0.0263214111328125, 0.029074668884277344, 0.03182792663574219, 0.03458118438720703, 0.037334442138671875, 0.04008769989013672, 0.04284095764160156, 0.045594215393066406, 0.04834747314453125, 0.051100730895996094, 0.05385398864746094, 0.05660724639892578, 0.059360504150390625, 0.06211376190185547, 0.06486701965332031, 0.06762027740478516, 0.07037353515625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 19.0, 17.0, 16.0, 34.0, 53.0, 49.0, 66.0, 102.0, 119.0, 116.0, 97.0, 82.0, 57.0, 44.0, 28.0, 26.0, 21.0, 13.0, 6.0, 10.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.479384660720825, -2.399658441543579, -2.319932460784912, -2.240206241607666, -2.16048002243042, -2.080754041671753, -2.001027822494507, -1.9213017225265503, -1.8415756225585938, -1.7618495225906372, -1.6821233034133911, -1.6023972034454346, -1.522671103477478, -1.4429450035095215, -1.3632187843322754, -1.2834926843643188, -1.2037664651870728, -1.1240403652191162, -1.0443141460418701, -0.9645880460739136, -0.884861946105957, -0.8051357865333557, -0.7254096269607544, -0.6456835269927979, -0.5659573674201965, -0.4862312376499176, -0.40650510787963867, -0.32677894830703735, -0.24705281853675842, -0.1673266887664795, -0.08760052919387817, -0.00787442922592163, 0.07185173034667969, 0.15157786011695862, 0.23130400478839874, 0.31103014945983887, 0.3907562792301178, 0.47048240900039673, 0.550208568572998, 0.6299346685409546, 0.7096608281135559, 0.7893869876861572, 0.8691130876541138, 0.9488392472267151, 1.0285654067993164, 1.108291506767273, 1.1880176067352295, 1.2677438259124756, 1.3474699258804321, 1.4271960258483887, 1.5069222450256348, 1.5866483449935913, 1.6663744449615479, 1.746100664138794, 1.8258267641067505, 1.905552864074707, 1.9852790832519531, 2.065005302429199, 2.144731283187866, 2.2244575023651123, 2.3041837215423584, 2.3839097023010254, 2.4636359214782715, 2.5433621406555176, 2.6230881214141846]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 11.0, 6.0, 6.0, 9.0, 13.0, 9.0, 9.0, 22.0, 21.0, 28.0, 28.0, 25.0, 28.0, 37.0, 26.0, 38.0, 31.0, 35.0, 27.0, 53.0, 40.0, 33.0, 34.0, 36.0, 43.0, 39.0, 29.0, 34.0, 28.0, 25.0, 29.0, 25.0, 24.0, 13.0, 21.0, 21.0, 11.0, 9.0, 9.0, 13.0, 3.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.507295608520508, -6.283201217651367, -6.059106349945068, -5.8350114822387695, -5.610917091369629, -5.386822700500488, -5.1627278327941895, -4.938632965087891, -4.71453857421875, -4.490444183349609, -4.2663493156433105, -4.042254447937012, -3.818160057067871, -3.5940654277801514, -3.3699707984924316, -3.145876169204712, -2.921781539916992, -2.6976869106292725, -2.4735922813415527, -2.249497652053833, -2.0254030227661133, -1.8013083934783936, -1.5772137641906738, -1.353119134902954, -1.1290245056152344, -0.9049298763275146, -0.6808352470397949, -0.4567406177520752, -0.23264598846435547, -0.008551359176635742, 0.21554327011108398, 0.4396378993988037, 0.6637330055236816, 0.8878276348114014, 1.111922264099121, 1.3360168933868408, 1.5601115226745605, 1.7842061519622803, 2.00830078125, 2.2323954105377197, 2.4564900398254395, 2.680584669113159, 2.904679298400879, 3.1287739276885986, 3.3528685569763184, 3.576963186264038, 3.801057815551758, 4.025152206420898, 4.249247074127197, 4.473341941833496, 4.697436332702637, 4.921530723571777, 5.145625591278076, 5.369720458984375, 5.593814849853516, 5.817909240722656, 6.042004108428955, 6.266098976135254, 6.4901933670043945, 6.714287757873535, 6.938382625579834, 7.162477493286133, 7.386571884155273, 7.610666275024414, 7.834761142730713]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 4.0, 12.0, 9.0, 8.0, 21.0, 22.0, 26.0, 48.0, 99.0, 156.0, 277.0, 616.0, 1469.0, 3742.0, 10691.0, 59128.0, 2125065.0, 1921191.0, 54649.0, 10837.0, 3561.0, 1409.0, 583.0, 268.0, 130.0, 69.0, 59.0, 16.0, 20.0, 13.0, 11.0, 13.0, 18.0, 7.0, 8.0, 3.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.103515625, -3.009429931640625, -2.91534423828125, -2.821258544921875, -2.7271728515625, -2.633087158203125, -2.53900146484375, -2.444915771484375, -2.350830078125, -2.256744384765625, -2.16265869140625, -2.068572998046875, -1.9744873046875, -1.880401611328125, -1.78631591796875, -1.692230224609375, -1.59814453125, -1.504058837890625, -1.40997314453125, -1.315887451171875, -1.2218017578125, -1.127716064453125, -1.03363037109375, -0.939544677734375, -0.845458984375, -0.751373291015625, -0.65728759765625, -0.563201904296875, -0.4691162109375, -0.375030517578125, -0.28094482421875, -0.186859130859375, -0.0927734375, 0.001312255859375, 0.09539794921875, 0.189483642578125, 0.2835693359375, 0.377655029296875, 0.47174072265625, 0.565826416015625, 0.659912109375, 0.753997802734375, 0.84808349609375, 0.942169189453125, 1.0362548828125, 1.130340576171875, 1.22442626953125, 1.318511962890625, 1.41259765625, 1.506683349609375, 1.60076904296875, 1.694854736328125, 1.7889404296875, 1.883026123046875, 1.97711181640625, 2.071197509765625, 2.165283203125, 2.259368896484375, 2.35345458984375, 2.447540283203125, 2.5416259765625, 2.635711669921875, 2.72979736328125, 2.823883056640625, 2.91796875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 7.0, 19.0, 9.0, 15.0, 23.0, 23.0, 28.0, 26.0, 37.0, 36.0, 37.0, 32.0, 39.0, 43.0, 48.0, 50.0, 44.0, 49.0, 42.0, 55.0, 44.0, 31.0, 33.0, 29.0, 32.0, 28.0, 25.0, 20.0, 19.0, 13.0, 9.0, 6.0, 7.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-1.2216796875, -1.1895370483398438, -1.1573944091796875, -1.1252517700195312, -1.093109130859375, -1.0609664916992188, -1.0288238525390625, -0.9966812133789062, -0.96453857421875, -0.9323959350585938, -0.9002532958984375, -0.8681106567382812, -0.835968017578125, -0.8038253784179688, -0.7716827392578125, -0.7395401000976562, -0.7073974609375, -0.6752548217773438, -0.6431121826171875, -0.6109695434570312, -0.578826904296875, -0.5466842651367188, -0.5145416259765625, -0.48239898681640625, -0.45025634765625, -0.41811370849609375, -0.3859710693359375, -0.35382843017578125, -0.321685791015625, -0.28954315185546875, -0.2574005126953125, -0.22525787353515625, -0.193115234375, -0.16097259521484375, -0.1288299560546875, -0.09668731689453125, -0.064544677734375, -0.03240203857421875, -0.0002593994140625, 0.03188323974609375, 0.06402587890625, 0.09616851806640625, 0.1283111572265625, 0.16045379638671875, 0.192596435546875, 0.22473907470703125, 0.2568817138671875, 0.28902435302734375, 0.3211669921875, 0.35330963134765625, 0.3854522705078125, 0.41759490966796875, 0.449737548828125, 0.48188018798828125, 0.5140228271484375, 0.5461654663085938, 0.57830810546875, 0.6104507446289062, 0.6425933837890625, 0.6747360229492188, 0.706878662109375, 0.7390213012695312, 0.7711639404296875, 0.8033065795898438, 0.83544921875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 10.0, 20.0, 37.0, 114.0, 1006.0, 4192238.0, 634.0, 114.0, 40.0, 27.0, 8.0, 14.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -21.9296875, -20.953125, -19.9765625, -19.0, -18.0234375, -17.046875, -16.0703125, -15.09375, -14.1171875, -13.140625, -12.1640625, -11.1875, -10.2109375, -9.234375, -8.2578125, -7.28125, -6.3046875, -5.328125, -4.3515625, -3.375, -2.3984375, -1.421875, -0.4453125, 0.53125, 1.5078125, 2.484375, 3.4609375, 4.4375, 5.4140625, 6.390625, 7.3671875, 8.34375, 9.3203125, 10.296875, 11.2734375, 12.25, 13.2265625, 14.203125, 15.1796875, 16.15625, 17.1328125, 18.109375, 19.0859375, 20.0625, 21.0390625, 22.015625, 22.9921875, 23.96875, 24.9453125, 25.921875, 26.8984375, 27.875, 28.8515625, 29.828125, 30.8046875, 31.78125, 32.7578125, 33.734375, 34.7109375, 35.6875, 36.6640625, 37.640625, 38.6171875, 39.59375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 11.0, 5.0, 15.0, 15.0, 37.0, 27.0, 49.0, 65.0, 106.0, 157.0, 351.0, 758.0, 1122.0, 624.0, 294.0, 138.0, 85.0, 54.0, 45.0, 29.0, 23.0, 21.0, 9.0, 6.0, 6.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71826171875, -0.6973495483398438, -0.6764373779296875, -0.6555252075195312, -0.634613037109375, -0.6137008666992188, -0.5927886962890625, -0.5718765258789062, -0.55096435546875, -0.5300521850585938, -0.5091400146484375, -0.48822784423828125, -0.467315673828125, -0.44640350341796875, -0.4254913330078125, -0.40457916259765625, -0.3836669921875, -0.36275482177734375, -0.3418426513671875, -0.32093048095703125, -0.300018310546875, -0.27910614013671875, -0.2581939697265625, -0.23728179931640625, -0.21636962890625, -0.19545745849609375, -0.1745452880859375, -0.15363311767578125, -0.132720947265625, -0.11180877685546875, -0.0908966064453125, -0.06998443603515625, -0.049072265625, -0.02816009521484375, -0.0072479248046875, 0.01366424560546875, 0.034576416015625, 0.05548858642578125, 0.0764007568359375, 0.09731292724609375, 0.11822509765625, 0.13913726806640625, 0.1600494384765625, 0.18096160888671875, 0.201873779296875, 0.22278594970703125, 0.2436981201171875, 0.26461029052734375, 0.2855224609375, 0.30643463134765625, 0.3273468017578125, 0.34825897216796875, 0.369171142578125, 0.39008331298828125, 0.4109954833984375, 0.43190765380859375, 0.45281982421875, 0.47373199462890625, 0.4946441650390625, 0.5155563354492188, 0.536468505859375, 0.5573806762695312, 0.5782928466796875, 0.5992050170898438, 0.6201171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 10.0, 18.0, 18.0, 28.0, 27.0, 32.0, 61.0, 96.0, 105.0, 97.0, 135.0, 85.0, 73.0, 53.0, 37.0, 34.0, 19.0, 16.0, 11.0, 9.0, 6.0, 8.0, 4.0, 6.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5102577209472656, -2.450434684753418, -2.3906118869781494, -2.3307888507843018, -2.270966053009033, -2.2111430168151855, -2.151320219039917, -2.0914971828460693, -2.031674385070801, -1.9718514680862427, -1.9120285511016846, -1.8522056341171265, -1.7923827171325684, -1.7325596809387207, -1.6727367639541626, -1.6129138469696045, -1.5530908107757568, -1.4932678937911987, -1.4334449768066406, -1.3736220598220825, -1.3137991428375244, -1.2539761066436768, -1.1941531896591187, -1.1343302726745605, -1.0745073556900024, -1.0146844387054443, -0.9548615217208862, -0.8950385451316833, -0.8352156281471252, -0.7753927111625671, -0.7155697345733643, -0.6557468175888062, -0.5959240198135376, -0.5361011028289795, -0.476278156042099, -0.4164552092552185, -0.3566322922706604, -0.2968093752861023, -0.2369864284992218, -0.1771634817123413, -0.1173405647277832, -0.057517632842063904, 0.0023052990436553955, 0.062128230929374695, 0.121951162815094, 0.1817740797996521, 0.2415970265865326, 0.3014199733734131, 0.3612428903579712, 0.4210658073425293, 0.4808887541294098, 0.5407117009162903, 0.6005346179008484, 0.6603575348854065, 0.7201805114746094, 0.7800034284591675, 0.8398263454437256, 0.8996492624282837, 0.9594721794128418, 1.0192950963974, 1.079118013381958, 1.1389410495758057, 1.1987639665603638, 1.2585868835449219, 1.31840980052948]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 6.0, 6.0, 15.0, 13.0, 14.0, 19.0, 28.0, 32.0, 31.0, 35.0, 33.0, 27.0, 25.0, 27.0, 33.0, 45.0, 51.0, 53.0, 46.0, 39.0, 42.0, 42.0, 32.0, 33.0, 37.0, 29.0, 23.0, 30.0, 26.0, 26.0, 11.0, 15.0, 7.0, 12.0, 6.0, 6.0, 4.0, 8.0, 7.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1077584028244019, -1.0767717361450195, -1.0457850694656372, -1.0147982835769653, -0.983811616897583, -0.9528249502182007, -0.9218382835388184, -0.8908515572547913, -0.8598648309707642, -0.8288781642913818, -0.7978914380073547, -0.7669047713279724, -0.7359180450439453, -0.704931378364563, -0.6739447116851807, -0.6429579854011536, -0.6119713187217712, -0.5809846520423889, -0.5499979257583618, -0.5190112590789795, -0.4880245327949524, -0.45703786611557007, -0.42605116963386536, -0.39506447315216064, -0.36407777667045593, -0.3330910801887512, -0.3021043837070465, -0.2711176872253418, -0.24013100564479828, -0.20914430916309357, -0.17815762758255005, -0.14717093110084534, -0.11618417501449585, -0.08519747853279114, -0.05421078950166702, -0.023224100470542908, 0.007762596011161804, 0.038749292492866516, 0.06973597407341003, 0.10072267055511475, 0.13170936703681946, 0.16269606351852417, 0.19368276000022888, 0.2246694415807724, 0.2556561231613159, 0.286642849445343, 0.31762951612472534, 0.34861621260643005, 0.37960290908813477, 0.4105896055698395, 0.4415763020515442, 0.4725629687309265, 0.5035496950149536, 0.5345363616943359, 0.5655230283737183, 0.5965097546577454, 0.6274964809417725, 0.6584831476211548, 0.6894698739051819, 0.7204565405845642, 0.7514432668685913, 0.7824299335479736, 0.813416600227356, 0.8444033265113831, 0.8753899931907654]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 8.0, 15.0, 14.0, 15.0, 28.0, 45.0, 82.0, 82.0, 114.0, 158.0, 217.0, 304.0, 486.0, 743.0, 1149.0, 1955.0, 3142.0, 5618.0, 10458.0, 22197.0, 51631.0, 140810.0, 387232.0, 264109.0, 87930.0, 35092.0, 15674.0, 7851.0, 4342.0, 2573.0, 1562.0, 984.0, 584.0, 417.0, 260.0, 188.0, 149.0, 102.0, 70.0, 50.0, 22.0, 28.0, 16.0, 17.0, 11.0, 7.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.488037109375, -0.4731483459472656, -0.45825958251953125, -0.4433708190917969, -0.4284820556640625, -0.4135932922363281, -0.39870452880859375, -0.3838157653808594, -0.368927001953125, -0.3540382385253906, -0.33914947509765625, -0.3242607116699219, -0.3093719482421875, -0.2944831848144531, -0.27959442138671875, -0.2647056579589844, -0.24981689453125, -0.23492813110351562, -0.22003936767578125, -0.20515060424804688, -0.1902618408203125, -0.17537307739257812, -0.16048431396484375, -0.14559555053710938, -0.130706787109375, -0.11581802368164062, -0.10092926025390625, -0.08604049682617188, -0.0711517333984375, -0.056262969970703125, -0.04137420654296875, -0.026485443115234375, -0.0115966796875, 0.003292083740234375, 0.01818084716796875, 0.033069610595703125, 0.0479583740234375, 0.06284713745117188, 0.07773590087890625, 0.09262466430664062, 0.107513427734375, 0.12240219116210938, 0.13729095458984375, 0.15217971801757812, 0.1670684814453125, 0.18195724487304688, 0.19684600830078125, 0.21173477172851562, 0.22662353515625, 0.24151229858398438, 0.25640106201171875, 0.2712898254394531, 0.2861785888671875, 0.3010673522949219, 0.31595611572265625, 0.3308448791503906, 0.345733642578125, 0.3606224060058594, 0.37551116943359375, 0.3903999328613281, 0.4052886962890625, 0.4201774597167969, 0.43506622314453125, 0.4499549865722656, 0.46484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 5.0, 4.0, 6.0, 10.0, 11.0, 5.0, 10.0, 14.0, 23.0, 35.0, 33.0, 22.0, 43.0, 37.0, 34.0, 27.0, 39.0, 37.0, 57.0, 47.0, 45.0, 51.0, 49.0, 39.0, 46.0, 29.0, 33.0, 23.0, 26.0, 29.0, 24.0, 21.0, 12.0, 16.0, 10.0, 8.0, 7.0, 6.0, 3.0, 3.0, 9.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.796875, -0.774658203125, -0.75244140625, -0.730224609375, -0.7080078125, -0.685791015625, -0.66357421875, -0.641357421875, -0.619140625, -0.596923828125, -0.57470703125, -0.552490234375, -0.5302734375, -0.508056640625, -0.48583984375, -0.463623046875, -0.44140625, -0.419189453125, -0.39697265625, -0.374755859375, -0.3525390625, -0.330322265625, -0.30810546875, -0.285888671875, -0.263671875, -0.241455078125, -0.21923828125, -0.197021484375, -0.1748046875, -0.152587890625, -0.13037109375, -0.108154296875, -0.0859375, -0.063720703125, -0.04150390625, -0.019287109375, 0.0029296875, 0.025146484375, 0.04736328125, 0.069580078125, 0.091796875, 0.114013671875, 0.13623046875, 0.158447265625, 0.1806640625, 0.202880859375, 0.22509765625, 0.247314453125, 0.26953125, 0.291748046875, 0.31396484375, 0.336181640625, 0.3583984375, 0.380615234375, 0.40283203125, 0.425048828125, 0.447265625, 0.469482421875, 0.49169921875, 0.513916015625, 0.5361328125, 0.558349609375, 0.58056640625, 0.602783203125, 0.625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 8.0, 10.0, 13.0, 19.0, 19.0, 24.0, 50.0, 72.0, 74.0, 136.0, 177.0, 270.0, 450.0, 604.0, 1059.0, 1822.0, 3393.0, 6704.0, 14834.0, 38305.0, 115876.0, 385495.0, 326855.0, 93807.0, 31969.0, 12940.0, 5936.0, 3014.0, 1744.0, 1015.0, 614.0, 361.0, 275.0, 168.0, 127.0, 86.0, 67.0, 48.0, 34.0, 17.0, 18.0, 13.0, 6.0, 6.0, 7.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.487060546875, -0.4722633361816406, -0.45746612548828125, -0.4426689147949219, -0.4278717041015625, -0.4130744934082031, -0.39827728271484375, -0.3834800720214844, -0.368682861328125, -0.3538856506347656, -0.33908843994140625, -0.3242912292480469, -0.3094940185546875, -0.2946968078613281, -0.27989959716796875, -0.2651023864746094, -0.25030517578125, -0.23550796508789062, -0.22071075439453125, -0.20591354370117188, -0.1911163330078125, -0.17631912231445312, -0.16152191162109375, -0.14672470092773438, -0.131927490234375, -0.11713027954101562, -0.10233306884765625, -0.08753585815429688, -0.0727386474609375, -0.057941436767578125, -0.04314422607421875, -0.028347015380859375, -0.0135498046875, 0.001247406005859375, 0.01604461669921875, 0.030841827392578125, 0.0456390380859375, 0.060436248779296875, 0.07523345947265625, 0.09003067016601562, 0.104827880859375, 0.11962509155273438, 0.13442230224609375, 0.14921951293945312, 0.1640167236328125, 0.17881393432617188, 0.19361114501953125, 0.20840835571289062, 0.22320556640625, 0.23800277709960938, 0.25279998779296875, 0.2675971984863281, 0.2823944091796875, 0.2971916198730469, 0.31198883056640625, 0.3267860412597656, 0.341583251953125, 0.3563804626464844, 0.37117767333984375, 0.3859748840332031, 0.4007720947265625, 0.4155693054199219, 0.43036651611328125, 0.4451637268066406, 0.4599609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 16.0, 12.0, 22.0, 23.0, 22.0, 37.0, 29.0, 47.0, 42.0, 42.0, 63.0, 55.0, 64.0, 60.0, 68.0, 62.0, 57.0, 34.0, 45.0, 40.0, 41.0, 28.0, 13.0, 18.0, 19.0, 7.0, 6.0, 6.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9990234375, -1.9416961669921875, -1.884368896484375, -1.8270416259765625, -1.76971435546875, -1.7123870849609375, -1.655059814453125, -1.5977325439453125, -1.5404052734375, -1.4830780029296875, -1.425750732421875, -1.3684234619140625, -1.31109619140625, -1.2537689208984375, -1.196441650390625, -1.1391143798828125, -1.081787109375, -1.0244598388671875, -0.967132568359375, -0.9098052978515625, -0.85247802734375, -0.7951507568359375, -0.737823486328125, -0.6804962158203125, -0.6231689453125, -0.5658416748046875, -0.508514404296875, -0.4511871337890625, -0.39385986328125, -0.3365325927734375, -0.279205322265625, -0.2218780517578125, -0.16455078125, -0.1072235107421875, -0.049896240234375, 0.0074310302734375, 0.06475830078125, 0.1220855712890625, 0.179412841796875, 0.2367401123046875, 0.2940673828125, 0.3513946533203125, 0.408721923828125, 0.4660491943359375, 0.52337646484375, 0.5807037353515625, 0.638031005859375, 0.6953582763671875, 0.752685546875, 0.8100128173828125, 0.867340087890625, 0.9246673583984375, 0.98199462890625, 1.0393218994140625, 1.096649169921875, 1.1539764404296875, 1.2113037109375, 1.2686309814453125, 1.325958251953125, 1.3832855224609375, 1.44061279296875, 1.4979400634765625, 1.555267333984375, 1.6125946044921875, 1.669921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 6.0, 9.0, 16.0, 18.0, 27.0, 33.0, 70.0, 124.0, 163.0, 284.0, 531.0, 960.0, 2233.0, 5241.0, 16280.0, 63873.0, 369235.0, 476382.0, 81931.0, 20028.0, 6236.0, 2441.0, 1108.0, 590.0, 315.0, 168.0, 94.0, 49.0, 42.0, 19.0, 12.0, 9.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125732421875, -0.12181282043457031, -0.11789321899414062, -0.11397361755371094, -0.11005401611328125, -0.10613441467285156, -0.10221481323242188, -0.09829521179199219, -0.0943756103515625, -0.09045600891113281, -0.08653640747070312, -0.08261680603027344, -0.07869720458984375, -0.07477760314941406, -0.07085800170898438, -0.06693840026855469, -0.063018798828125, -0.05909919738769531, -0.055179595947265625, -0.05125999450683594, -0.04734039306640625, -0.04342079162597656, -0.039501190185546875, -0.03558158874511719, -0.0316619873046875, -0.027742385864257812, -0.023822784423828125, -0.019903182983398438, -0.01598358154296875, -0.012063980102539062, -0.008144378662109375, -0.0042247772216796875, -0.00030517578125, 0.0036144256591796875, 0.007534027099609375, 0.011453628540039062, 0.01537322998046875, 0.019292831420898438, 0.023212432861328125, 0.027132034301757812, 0.0310516357421875, 0.03497123718261719, 0.038890838623046875, 0.04281044006347656, 0.04673004150390625, 0.05064964294433594, 0.054569244384765625, 0.05848884582519531, 0.062408447265625, 0.06632804870605469, 0.07024765014648438, 0.07416725158691406, 0.07808685302734375, 0.08200645446777344, 0.08592605590820312, 0.08984565734863281, 0.0937652587890625, 0.09768486022949219, 0.10160446166992188, 0.10552406311035156, 0.10944366455078125, 0.11336326599121094, 0.11728286743164062, 0.12120246887207031, 0.1251220703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 2.0, 2.0, 10.0, 12.0, 16.0, 19.0, 27.0, 32.0, 44.0, 58.0, 63.0, 77.0, 122.0, 100.0, 97.0, 79.0, 57.0, 39.0, 30.0, 28.0, 16.0, 15.0, 9.0, 8.0, 12.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.975101470947266e-05, -7.766392081975937e-05, -7.557682693004608e-05, -7.34897330403328e-05, -7.140263915061951e-05, -6.931554526090622e-05, -6.722845137119293e-05, -6.514135748147964e-05, -6.305426359176636e-05, -6.096716970205307e-05, -5.888007581233978e-05, -5.6792981922626495e-05, -5.470588803291321e-05, -5.261879414319992e-05, -5.053170025348663e-05, -4.8444606363773346e-05, -4.635751247406006e-05, -4.427041858434677e-05, -4.2183324694633484e-05, -4.0096230804920197e-05, -3.800913691520691e-05, -3.592204302549362e-05, -3.3834949135780334e-05, -3.174785524606705e-05, -2.966076135635376e-05, -2.7573667466640472e-05, -2.5486573576927185e-05, -2.3399479687213898e-05, -2.131238579750061e-05, -1.9225291907787323e-05, -1.7138198018074036e-05, -1.5051104128360748e-05, -1.2964010238647461e-05, -1.0876916348934174e-05, -8.789822459220886e-06, -6.702728569507599e-06, -4.6156346797943115e-06, -2.528540790081024e-06, -4.414469003677368e-07, 1.6456469893455505e-06, 3.732740879058838e-06, 5.819834768772125e-06, 7.906928658485413e-06, 9.9940225481987e-06, 1.2081116437911987e-05, 1.4168210327625275e-05, 1.6255304217338562e-05, 1.834239810705185e-05, 2.0429491996765137e-05, 2.2516585886478424e-05, 2.460367977619171e-05, 2.6690773665905e-05, 2.8777867555618286e-05, 3.0864961445331573e-05, 3.295205533504486e-05, 3.503914922475815e-05, 3.7126243114471436e-05, 3.921333700418472e-05, 4.130043089389801e-05, 4.33875247836113e-05, 4.5474618673324585e-05, 4.756171256303787e-05, 4.964880645275116e-05, 5.173590034246445e-05, 5.3822994232177734e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 9.0, 13.0, 5.0, 17.0, 25.0, 29.0, 36.0, 55.0, 128.0, 328.0, 835.0, 2394.0, 7607.0, 30121.0, 180654.0, 665984.0, 127269.0, 23585.0, 6176.0, 1971.0, 700.0, 278.0, 120.0, 81.0, 39.0, 23.0, 21.0, 10.0, 6.0, 5.0, 7.0, 9.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.136474609375, -0.13149642944335938, -0.12651824951171875, -0.12154006958007812, -0.1165618896484375, -0.11158370971679688, -0.10660552978515625, -0.10162734985351562, -0.096649169921875, -0.09167098999023438, -0.08669281005859375, -0.08171463012695312, -0.0767364501953125, -0.07175827026367188, -0.06678009033203125, -0.061801910400390625, -0.05682373046875, -0.051845550537109375, -0.04686737060546875, -0.041889190673828125, -0.0369110107421875, -0.031932830810546875, -0.02695465087890625, -0.021976470947265625, -0.016998291015625, -0.012020111083984375, -0.00704193115234375, -0.002063751220703125, 0.0029144287109375, 0.007892608642578125, 0.01287078857421875, 0.017848968505859375, 0.0228271484375, 0.027805328369140625, 0.03278350830078125, 0.037761688232421875, 0.0427398681640625, 0.047718048095703125, 0.05269622802734375, 0.057674407958984375, 0.062652587890625, 0.06763076782226562, 0.07260894775390625, 0.07758712768554688, 0.0825653076171875, 0.08754348754882812, 0.09252166748046875, 0.09749984741210938, 0.10247802734375, 0.10745620727539062, 0.11243438720703125, 0.11741256713867188, 0.1223907470703125, 0.12736892700195312, 0.13234710693359375, 0.13732528686523438, 0.142303466796875, 0.14728164672851562, 0.15225982666015625, 0.15723800659179688, 0.1622161865234375, 0.16719436645507812, 0.17217254638671875, 0.17715072631835938, 0.18212890625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 8.0, 0.0, 5.0, 7.0, 5.0, 7.0, 11.0, 10.0, 15.0, 19.0, 27.0, 28.0, 39.0, 56.0, 55.0, 55.0, 62.0, 71.0, 83.0, 92.0, 68.0, 63.0, 28.0, 35.0, 27.0, 28.0, 29.0, 7.0, 12.0, 10.0, 13.0, 7.0, 8.0, 6.0, 7.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032318115234375, -0.031420230865478516, -0.03052234649658203, -0.029624462127685547, -0.028726577758789062, -0.027828693389892578, -0.026930809020996094, -0.02603292465209961, -0.025135040283203125, -0.02423715591430664, -0.023339271545410156, -0.022441387176513672, -0.021543502807617188, -0.020645618438720703, -0.01974773406982422, -0.018849849700927734, -0.01795196533203125, -0.017054080963134766, -0.01615619659423828, -0.015258312225341797, -0.014360427856445312, -0.013462543487548828, -0.012564659118652344, -0.01166677474975586, -0.010768890380859375, -0.00987100601196289, -0.008973121643066406, -0.008075237274169922, -0.0071773529052734375, -0.006279468536376953, -0.005381584167480469, -0.004483699798583984, -0.0035858154296875, -0.0026879310607910156, -0.0017900466918945312, -0.0008921623229980469, 5.7220458984375e-06, 0.0009036064147949219, 0.0018014907836914062, 0.0026993751525878906, 0.003597259521484375, 0.004495143890380859, 0.005393028259277344, 0.006290912628173828, 0.0071887969970703125, 0.008086681365966797, 0.008984565734863281, 0.009882450103759766, 0.01078033447265625, 0.011678218841552734, 0.012576103210449219, 0.013473987579345703, 0.014371871948242188, 0.015269756317138672, 0.016167640686035156, 0.01706552505493164, 0.017963409423828125, 0.01886129379272461, 0.019759178161621094, 0.020657062530517578, 0.021554946899414062, 0.022452831268310547, 0.02335071563720703, 0.024248600006103516, 0.025146484375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 23.0, 37.0, 29.0, 68.0, 137.0, 200.0, 207.0, 105.0, 73.0, 37.0, 26.0, 17.0, 9.0, 11.0, 6.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.530160665512085, -2.473973512649536, -2.4177865982055664, -2.3615994453430176, -2.305412530899048, -2.249225378036499, -2.1930384635925293, -2.1368513107299805, -2.0806641578674316, -2.024477005004883, -1.968290090560913, -1.9121030569076538, -1.8559160232543945, -1.7997288703918457, -1.7435418367385864, -1.6873548030853271, -1.6311678886413574, -1.5749808549880981, -1.5187938213348389, -1.4626067876815796, -1.4064197540283203, -1.3502326011657715, -1.2940455675125122, -1.237858533859253, -1.1816715002059937, -1.1254844665527344, -1.069297432899475, -1.0131103992462158, -0.9569233059883118, -0.9007362723350525, -0.8445491790771484, -0.7883621454238892, -0.7321751117706299, -0.6759880781173706, -0.6198010444641113, -0.5636139512062073, -0.507426917552948, -0.4512398838996887, -0.39505282044410706, -0.3388657569885254, -0.2826787233352661, -0.22649167478084564, -0.17030462622642517, -0.1141175776720047, -0.05793052911758423, -0.0017434954643249512, 0.054443567991256714, 0.11063063144683838, 0.16681766510009766, 0.22300471365451813, 0.2791917622089386, 0.33537882566452026, 0.39156585931777954, 0.4477528929710388, 0.5039399862289429, 0.5601270198822021, 0.6163140535354614, 0.6725010871887207, 0.72868812084198, 0.784875214099884, 0.8410622477531433, 0.8972492814064026, 0.9534363746643066, 1.009623408317566, 1.0658104419708252]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 4.0, 5.0, 6.0, 18.0, 9.0, 15.0, 20.0, 27.0, 30.0, 32.0, 38.0, 33.0, 29.0, 18.0, 36.0, 53.0, 33.0, 49.0, 47.0, 31.0, 63.0, 37.0, 36.0, 41.0, 34.0, 40.0, 25.0, 31.0, 22.0, 27.0, 20.0, 12.0, 13.0, 8.0, 8.0, 10.0, 4.0, 5.0, 9.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7298775911331177, -0.708768367767334, -0.6876590847969055, -0.666549801826477, -0.6454405784606934, -0.6243313550949097, -0.6032220721244812, -0.5821127891540527, -0.561003565788269, -0.5398943424224854, -0.5187850594520569, -0.4976758062839508, -0.4765665531158447, -0.45545729994773865, -0.43434804677963257, -0.4132387936115265, -0.3921295404434204, -0.37102028727531433, -0.34991103410720825, -0.3288017809391022, -0.3076925277709961, -0.28658327460289, -0.26547402143478394, -0.24436476826667786, -0.22325551509857178, -0.2021462619304657, -0.18103700876235962, -0.15992775559425354, -0.13881850242614746, -0.11770924925804138, -0.0965999960899353, -0.07549074292182922, -0.054381489753723145, -0.033272236585617065, -0.012162983417510986, 0.008946269750595093, 0.030055522918701172, 0.05116477608680725, 0.07227402925491333, 0.09338328242301941, 0.11449253559112549, 0.13560178875923157, 0.15671104192733765, 0.17782029509544373, 0.1989295482635498, 0.22003880143165588, 0.24114805459976196, 0.26225730776786804, 0.2833665609359741, 0.3044758141040802, 0.3255850672721863, 0.34669432044029236, 0.36780357360839844, 0.3889128267765045, 0.4100220799446106, 0.4311313331127167, 0.45224058628082275, 0.47334983944892883, 0.4944590926170349, 0.5155683755874634, 0.5366775989532471, 0.5577868223190308, 0.5788961052894592, 0.6000053882598877, 0.6211146116256714]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 8.0, 11.0, 12.0, 19.0, 23.0, 34.0, 45.0, 68.0, 107.0, 118.0, 188.0, 259.0, 394.0, 541.0, 890.0, 1363.0, 2385.0, 5039.0, 12823.0, 47464.0, 290005.0, 557730.0, 92988.0, 20907.0, 7014.0, 3245.0, 1678.0, 1074.0, 622.0, 440.0, 308.0, 205.0, 148.0, 105.0, 69.0, 62.0, 46.0, 39.0, 23.0, 15.0, 9.0, 9.0, 8.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5087890625, -0.491943359375, -0.47509765625, -0.458251953125, -0.44140625, -0.424560546875, -0.40771484375, -0.390869140625, -0.3740234375, -0.357177734375, -0.34033203125, -0.323486328125, -0.306640625, -0.289794921875, -0.27294921875, -0.256103515625, -0.2392578125, -0.222412109375, -0.20556640625, -0.188720703125, -0.171875, -0.155029296875, -0.13818359375, -0.121337890625, -0.1044921875, -0.087646484375, -0.07080078125, -0.053955078125, -0.037109375, -0.020263671875, -0.00341796875, 0.013427734375, 0.0302734375, 0.047119140625, 0.06396484375, 0.080810546875, 0.09765625, 0.114501953125, 0.13134765625, 0.148193359375, 0.1650390625, 0.181884765625, 0.19873046875, 0.215576171875, 0.232421875, 0.249267578125, 0.26611328125, 0.282958984375, 0.2998046875, 0.316650390625, 0.33349609375, 0.350341796875, 0.3671875, 0.384033203125, 0.40087890625, 0.417724609375, 0.4345703125, 0.451416015625, 0.46826171875, 0.485107421875, 0.501953125, 0.518798828125, 0.53564453125, 0.552490234375, 0.5693359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 6.0, 4.0, 11.0, 8.0, 14.0, 8.0, 12.0, 19.0, 23.0, 31.0, 26.0, 35.0, 35.0, 28.0, 42.0, 36.0, 43.0, 44.0, 48.0, 43.0, 46.0, 56.0, 44.0, 43.0, 42.0, 25.0, 28.0, 24.0, 31.0, 28.0, 24.0, 22.0, 18.0, 17.0, 9.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-2.0703125, -2.01220703125, -1.9541015625, -1.89599609375, -1.837890625, -1.77978515625, -1.7216796875, -1.66357421875, -1.60546875, -1.54736328125, -1.4892578125, -1.43115234375, -1.373046875, -1.31494140625, -1.2568359375, -1.19873046875, -1.140625, -1.08251953125, -1.0244140625, -0.96630859375, -0.908203125, -0.85009765625, -0.7919921875, -0.73388671875, -0.67578125, -0.61767578125, -0.5595703125, -0.50146484375, -0.443359375, -0.38525390625, -0.3271484375, -0.26904296875, -0.2109375, -0.15283203125, -0.0947265625, -0.03662109375, 0.021484375, 0.07958984375, 0.1376953125, 0.19580078125, 0.25390625, 0.31201171875, 0.3701171875, 0.42822265625, 0.486328125, 0.54443359375, 0.6025390625, 0.66064453125, 0.71875, 0.77685546875, 0.8349609375, 0.89306640625, 0.951171875, 1.00927734375, 1.0673828125, 1.12548828125, 1.18359375, 1.24169921875, 1.2998046875, 1.35791015625, 1.416015625, 1.47412109375, 1.5322265625, 1.59033203125, 1.6484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 10.0, 12.0, 15.0, 25.0, 24.0, 22.0, 30.0, 36.0, 47.0, 68.0, 122.0, 487.0, 989194.0, 57705.0, 306.0, 98.0, 60.0, 46.0, 50.0, 32.0, 39.0, 29.0, 22.0, 20.0, 14.0, 15.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.5701904296875, -5.355224609375, -5.1402587890625, -4.92529296875, -4.7103271484375, -4.495361328125, -4.2803955078125, -4.0654296875, -3.8504638671875, -3.635498046875, -3.4205322265625, -3.20556640625, -2.9906005859375, -2.775634765625, -2.5606689453125, -2.345703125, -2.1307373046875, -1.915771484375, -1.7008056640625, -1.48583984375, -1.2708740234375, -1.055908203125, -0.8409423828125, -0.6259765625, -0.4110107421875, -0.196044921875, 0.0189208984375, 0.23388671875, 0.4488525390625, 0.663818359375, 0.8787841796875, 1.09375, 1.3087158203125, 1.523681640625, 1.7386474609375, 1.95361328125, 2.1685791015625, 2.383544921875, 2.5985107421875, 2.8134765625, 3.0284423828125, 3.243408203125, 3.4583740234375, 3.67333984375, 3.8883056640625, 4.103271484375, 4.3182373046875, 4.533203125, 4.7481689453125, 4.963134765625, 5.1781005859375, 5.39306640625, 5.6080322265625, 5.822998046875, 6.0379638671875, 6.2529296875, 6.4678955078125, 6.682861328125, 6.8978271484375, 7.11279296875, 7.3277587890625, 7.542724609375, 7.7576904296875, 7.97265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 8.0, 8.0, 9.0, 11.0, 15.0, 28.0, 24.0, 23.0, 30.0, 38.0, 37.0, 63.0, 68.0, 62.0, 84.0, 58.0, 54.0, 56.0, 47.0, 43.0, 51.0, 39.0, 30.0, 30.0, 23.0, 24.0, 8.0, 17.0, 3.0, 2.0, 1.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3046875, -2.218841552734375, -2.13299560546875, -2.047149658203125, -1.9613037109375, -1.875457763671875, -1.78961181640625, -1.703765869140625, -1.617919921875, -1.532073974609375, -1.44622802734375, -1.360382080078125, -1.2745361328125, -1.188690185546875, -1.10284423828125, -1.016998291015625, -0.93115234375, -0.845306396484375, -0.75946044921875, -0.673614501953125, -0.5877685546875, -0.501922607421875, -0.41607666015625, -0.330230712890625, -0.244384765625, -0.158538818359375, -0.07269287109375, 0.013153076171875, 0.0989990234375, 0.184844970703125, 0.27069091796875, 0.356536865234375, 0.4423828125, 0.528228759765625, 0.61407470703125, 0.699920654296875, 0.7857666015625, 0.871612548828125, 0.95745849609375, 1.043304443359375, 1.129150390625, 1.214996337890625, 1.30084228515625, 1.386688232421875, 1.4725341796875, 1.558380126953125, 1.64422607421875, 1.730072021484375, 1.81591796875, 1.901763916015625, 1.98760986328125, 2.073455810546875, 2.1593017578125, 2.245147705078125, 2.33099365234375, 2.416839599609375, 2.502685546875, 2.588531494140625, 2.67437744140625, 2.760223388671875, 2.8460693359375, 2.931915283203125, 3.01776123046875, 3.103607177734375, 3.189453125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 10.0, 21.0, 38.0, 145.0, 925.0, 151996.0, 893694.0, 1468.0, 156.0, 47.0, 16.0, 6.0, 5.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6500625610351562, -0.6140899658203125, -0.5781173706054688, -0.542144775390625, -0.5061721801757812, -0.4701995849609375, -0.43422698974609375, -0.39825439453125, -0.36228179931640625, -0.3263092041015625, -0.29033660888671875, -0.254364013671875, -0.21839141845703125, -0.1824188232421875, -0.14644622802734375, -0.1104736328125, -0.07450103759765625, -0.0385284423828125, -0.00255584716796875, 0.033416748046875, 0.06938934326171875, 0.1053619384765625, 0.14133453369140625, 0.17730712890625, 0.21327972412109375, 0.2492523193359375, 0.28522491455078125, 0.321197509765625, 0.35717010498046875, 0.3931427001953125, 0.42911529541015625, 0.465087890625, 0.5010604858398438, 0.5370330810546875, 0.5730056762695312, 0.608978271484375, 0.6449508666992188, 0.6809234619140625, 0.7168960571289062, 0.75286865234375, 0.7888412475585938, 0.8248138427734375, 0.8607864379882812, 0.896759033203125, 0.9327316284179688, 0.9687042236328125, 1.0046768188476562, 1.0406494140625, 1.0766220092773438, 1.1125946044921875, 1.1485671997070312, 1.184539794921875, 1.2205123901367188, 1.2564849853515625, 1.2924575805664062, 1.32843017578125, 1.3644027709960938, 1.4003753662109375, 1.4363479614257812, 1.472320556640625, 1.5082931518554688, 1.5442657470703125, 1.5802383422851562, 1.6162109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 6.0, 2.0, 12.0, 14.0, 7.0, 10.0, 19.0, 18.0, 36.0, 43.0, 82.0, 124.0, 213.0, 145.0, 102.0, 49.0, 22.0, 30.0, 17.0, 8.0, 16.0, 2.0, 7.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.74913215637207e-05, -3.637932240962982e-05, -3.526732325553894e-05, -3.415532410144806e-05, -3.304332494735718e-05, -3.1931325793266296e-05, -3.0819326639175415e-05, -2.9707327485084534e-05, -2.8595328330993652e-05, -2.748332917690277e-05, -2.637133002281189e-05, -2.5259330868721008e-05, -2.4147331714630127e-05, -2.3035332560539246e-05, -2.1923333406448364e-05, -2.0811334252357483e-05, -1.96993350982666e-05, -1.858733594417572e-05, -1.747533679008484e-05, -1.6363337635993958e-05, -1.5251338481903076e-05, -1.4139339327812195e-05, -1.3027340173721313e-05, -1.1915341019630432e-05, -1.080334186553955e-05, -9.69134271144867e-06, -8.579343557357788e-06, -7.467344403266907e-06, -6.355345249176025e-06, -5.243346095085144e-06, -4.131346940994263e-06, -3.0193477869033813e-06, -1.9073486328125e-06, -7.953494787216187e-07, 3.166496753692627e-07, 1.428648829460144e-06, 2.5406479835510254e-06, 3.6526471376419067e-06, 4.764646291732788e-06, 5.8766454458236694e-06, 6.988644599914551e-06, 8.100643754005432e-06, 9.212642908096313e-06, 1.0324642062187195e-05, 1.1436641216278076e-05, 1.2548640370368958e-05, 1.3660639524459839e-05, 1.477263867855072e-05, 1.58846378326416e-05, 1.6996636986732483e-05, 1.8108636140823364e-05, 1.9220635294914246e-05, 2.0332634449005127e-05, 2.1444633603096008e-05, 2.255663275718689e-05, 2.366863191127777e-05, 2.4780631065368652e-05, 2.5892630219459534e-05, 2.7004629373550415e-05, 2.8116628527641296e-05, 2.9228627681732178e-05, 3.034062683582306e-05, 3.145262598991394e-05, 3.256462514400482e-05, 3.36766242980957e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 17.0, 18.0, 52.0, 203.0, 1307.0, 34506.0, 1005344.0, 6271.0, 600.0, 121.0, 41.0, 19.0, 14.0, 6.0, 8.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.0888671875, -1.0625, -1.0361328125, -1.009765625, -0.9833984375, -0.95703125, -0.9306640625, -0.904296875, -0.8779296875, -0.8515625, -0.8251953125, -0.798828125, -0.7724609375, -0.74609375, -0.7197265625, -0.693359375, -0.6669921875, -0.640625, -0.6142578125, -0.587890625, -0.5615234375, -0.53515625, -0.5087890625, -0.482421875, -0.4560546875, -0.4296875, -0.4033203125, -0.376953125, -0.3505859375, -0.32421875, -0.2978515625, -0.271484375, -0.2451171875, -0.21875, -0.1923828125, -0.166015625, -0.1396484375, -0.11328125, -0.0869140625, -0.060546875, -0.0341796875, -0.0078125, 0.0185546875, 0.044921875, 0.0712890625, 0.09765625, 0.1240234375, 0.150390625, 0.1767578125, 0.203125, 0.2294921875, 0.255859375, 0.2822265625, 0.30859375, 0.3349609375, 0.361328125, 0.3876953125, 0.4140625, 0.4404296875, 0.466796875, 0.4931640625, 0.51953125, 0.5458984375, 0.572265625, 0.5986328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 7.0, 11.0, 18.0, 32.0, 46.0, 69.0, 128.0, 232.0, 189.0, 111.0, 57.0, 36.0, 25.0, 11.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320068359375, -0.0897207260131836, -0.08624076843261719, -0.08276081085205078, -0.07928085327148438, -0.07580089569091797, -0.07232093811035156, -0.06884098052978516, -0.06536102294921875, -0.061881065368652344, -0.05840110778808594, -0.05492115020751953, -0.051441192626953125, -0.04796123504638672, -0.04448127746582031, -0.041001319885253906, -0.0375213623046875, -0.034041404724121094, -0.030561447143554688, -0.02708148956298828, -0.023601531982421875, -0.02012157440185547, -0.016641616821289062, -0.013161659240722656, -0.00968170166015625, -0.006201744079589844, -0.0027217864990234375, 0.0007581710815429688, 0.004238128662109375, 0.007718086242675781, 0.011198043823242188, 0.014678001403808594, 0.018157958984375, 0.021637916564941406, 0.025117874145507812, 0.02859783172607422, 0.032077789306640625, 0.03555774688720703, 0.03903770446777344, 0.042517662048339844, 0.04599761962890625, 0.049477577209472656, 0.05295753479003906, 0.05643749237060547, 0.059917449951171875, 0.06339740753173828, 0.06687736511230469, 0.0703573226928711, 0.0738372802734375, 0.0773172378540039, 0.08079719543457031, 0.08427715301513672, 0.08775711059570312, 0.09123706817626953, 0.09471702575683594, 0.09819698333740234, 0.10167694091796875, 0.10515689849853516, 0.10863685607910156, 0.11211681365966797, 0.11559677124023438, 0.11907672882080078, 0.12255668640136719, 0.1260366439819336, 0.1295166015625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 6.0, 11.0, 23.0, 27.0, 48.0, 63.0, 116.0, 168.0, 193.0, 128.0, 74.0, 48.0, 28.0, 26.0, 11.0, 12.0, 4.0, 7.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.985243320465088, -2.889725923538208, -2.7942087650299072, -2.6986913681030273, -2.6031739711761475, -2.5076565742492676, -2.412139415740967, -2.316622018814087, -2.221104621887207, -2.125587224960327, -2.0300700664520264, -1.9345526695251465, -1.8390352725982666, -1.7435179948806763, -1.648000717163086, -1.552483320236206, -1.4569661617279053, -1.361448884010315, -1.265931487083435, -1.1704142093658447, -1.0748968124389648, -0.9793795347213745, -0.8838622570037842, -0.7883449196815491, -0.692827582359314, -0.5973102450370789, -0.5017929077148438, -0.4062756299972534, -0.3107582926750183, -0.2152409553527832, -0.11972367763519287, -0.024206340312957764, 0.07131099700927734, 0.16682831943035126, 0.26234564185142517, 0.3578629493713379, 0.453380286693573, 0.5488976240158081, 0.6444149017333984, 0.7399322390556335, 0.8354495763778687, 0.9309669137001038, 1.0264842510223389, 1.1220015287399292, 1.2175188064575195, 1.3130362033843994, 1.4085534811019897, 1.50407075881958, 1.59958815574646, 1.6951054334640503, 1.7906228303909302, 1.8861401081085205, 1.9816575050354004, 2.077174663543701, 2.172692060470581, 2.268209457397461, 2.3637266159057617, 2.4592440128326416, 2.5547611713409424, 2.6502785682678223, 2.745795965194702, 2.841313362121582, 2.936830520629883, 3.0323479175567627, 3.1278653144836426]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 8.0, 10.0, 13.0, 18.0, 14.0, 21.0, 24.0, 36.0, 22.0, 26.0, 34.0, 21.0, 39.0, 50.0, 45.0, 47.0, 39.0, 36.0, 46.0, 49.0, 42.0, 40.0, 37.0, 33.0, 33.0, 31.0, 28.0, 21.0, 20.0, 19.0, 12.0, 11.0, 14.0, 14.0, 10.0, 9.0, 5.0, 0.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6409285068511963, -2.5557265281677246, -2.470524311065674, -2.385322332382202, -2.3001201152801514, -2.2149181365966797, -2.129715919494629, -2.0445139408111572, -1.959311842918396, -1.8741097450256348, -1.7889076471328735, -1.7037055492401123, -1.6185035705566406, -1.5333013534545898, -1.4480993747711182, -1.362897276878357, -1.2776951789855957, -1.1924930810928345, -1.1072909832000732, -1.0220890045166016, -0.9368868470191956, -0.8516847491264343, -0.7664827108383179, -0.6812806129455566, -0.5960785150527954, -0.5108764171600342, -0.42567434906959534, -0.3404722809791565, -0.25527018308639526, -0.17006808519363403, -0.08486604690551758, 0.00033605098724365234, 0.08553814888000488, 0.17074023187160492, 0.25594231486320496, 0.3411443829536438, 0.42634648084640503, 0.5115485787391663, 0.5967506170272827, 0.681952714920044, 0.7671548128128052, 0.8523569107055664, 0.9375590085983276, 1.0227611064910889, 1.1079630851745605, 1.1931653022766113, 1.278367280960083, 1.3635693788528442, 1.4487714767456055, 1.5339735746383667, 1.619175672531128, 1.7043776512145996, 1.7895798683166504, 1.874781847000122, 1.9599839448928833, 2.0451860427856445, 2.1303882598876953, 2.215590238571167, 2.3007924556732178, 2.3859944343566895, 2.4711966514587402, 2.556398630142212, 2.6416006088256836, 2.7268028259277344, 2.812004804611206]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 8.0, 10.0, 10.0, 18.0, 13.0, 20.0, 15.0, 25.0, 34.0, 53.0, 58.0, 93.0, 131.0, 242.0, 390.0, 740.0, 1479.0, 3821.0, 12624.0, 107838.0, 3489281.0, 544494.0, 22975.0, 5720.0, 2053.0, 895.0, 439.0, 246.0, 159.0, 112.0, 77.0, 55.0, 28.0, 28.0, 23.0, 17.0, 21.0, 8.0, 9.0, 5.0, 11.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.76171875, -2.671722412109375, -2.58172607421875, -2.491729736328125, -2.4017333984375, -2.311737060546875, -2.22174072265625, -2.131744384765625, -2.041748046875, -1.951751708984375, -1.86175537109375, -1.771759033203125, -1.6817626953125, -1.591766357421875, -1.50177001953125, -1.411773681640625, -1.32177734375, -1.231781005859375, -1.14178466796875, -1.051788330078125, -0.9617919921875, -0.871795654296875, -0.78179931640625, -0.691802978515625, -0.601806640625, -0.511810302734375, -0.42181396484375, -0.331817626953125, -0.2418212890625, -0.151824951171875, -0.06182861328125, 0.028167724609375, 0.1181640625, 0.208160400390625, 0.29815673828125, 0.388153076171875, 0.4781494140625, 0.568145751953125, 0.65814208984375, 0.748138427734375, 0.838134765625, 0.928131103515625, 1.01812744140625, 1.108123779296875, 1.1981201171875, 1.288116455078125, 1.37811279296875, 1.468109130859375, 1.55810546875, 1.648101806640625, 1.73809814453125, 1.828094482421875, 1.9180908203125, 2.008087158203125, 2.09808349609375, 2.188079833984375, 2.278076171875, 2.368072509765625, 2.45806884765625, 2.548065185546875, 2.6380615234375, 2.728057861328125, 2.81805419921875, 2.908050537109375, 2.998046875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 7.0, 9.0, 10.0, 12.0, 24.0, 17.0, 16.0, 34.0, 24.0, 29.0, 41.0, 34.0, 31.0, 39.0, 41.0, 50.0, 52.0, 58.0, 49.0, 58.0, 49.0, 34.0, 38.0, 33.0, 21.0, 29.0, 27.0, 20.0, 19.0, 25.0, 10.0, 10.0, 8.0, 11.0, 6.0, 4.0, 2.0, 5.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.82470703125, -0.800506591796875, -0.77630615234375, -0.752105712890625, -0.7279052734375, -0.703704833984375, -0.67950439453125, -0.655303955078125, -0.631103515625, -0.606903076171875, -0.58270263671875, -0.558502197265625, -0.5343017578125, -0.510101318359375, -0.48590087890625, -0.461700439453125, -0.4375, -0.413299560546875, -0.38909912109375, -0.364898681640625, -0.3406982421875, -0.316497802734375, -0.29229736328125, -0.268096923828125, -0.243896484375, -0.219696044921875, -0.19549560546875, -0.171295166015625, -0.1470947265625, -0.122894287109375, -0.09869384765625, -0.074493408203125, -0.05029296875, -0.026092529296875, -0.00189208984375, 0.022308349609375, 0.0465087890625, 0.070709228515625, 0.09490966796875, 0.119110107421875, 0.143310546875, 0.167510986328125, 0.19171142578125, 0.215911865234375, 0.2401123046875, 0.264312744140625, 0.28851318359375, 0.312713623046875, 0.3369140625, 0.361114501953125, 0.38531494140625, 0.409515380859375, 0.4337158203125, 0.457916259765625, 0.48211669921875, 0.506317138671875, 0.530517578125, 0.554718017578125, 0.57891845703125, 0.603118896484375, 0.6273193359375, 0.651519775390625, 0.67572021484375, 0.699920654296875, 0.72412109375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 9.0, 16.0, 14.0, 30.0, 63.0, 95.0, 248.0, 669.0, 14865.0, 4169179.0, 8108.0, 550.0, 201.0, 93.0, 50.0, 34.0, 16.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.605224609375, -7.28076171875, -6.956298828125, -6.6318359375, -6.307373046875, -5.98291015625, -5.658447265625, -5.333984375, -5.009521484375, -4.68505859375, -4.360595703125, -4.0361328125, -3.711669921875, -3.38720703125, -3.062744140625, -2.73828125, -2.413818359375, -2.08935546875, -1.764892578125, -1.4404296875, -1.115966796875, -0.79150390625, -0.467041015625, -0.142578125, 0.181884765625, 0.50634765625, 0.830810546875, 1.1552734375, 1.479736328125, 1.80419921875, 2.128662109375, 2.453125, 2.777587890625, 3.10205078125, 3.426513671875, 3.7509765625, 4.075439453125, 4.39990234375, 4.724365234375, 5.048828125, 5.373291015625, 5.69775390625, 6.022216796875, 6.3466796875, 6.671142578125, 6.99560546875, 7.320068359375, 7.64453125, 7.968994140625, 8.29345703125, 8.617919921875, 8.9423828125, 9.266845703125, 9.59130859375, 9.915771484375, 10.240234375, 10.564697265625, 10.88916015625, 11.213623046875, 11.5380859375, 11.862548828125, 12.18701171875, 12.511474609375, 12.8359375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 3.0, 4.0, 5.0, 3.0, 6.0, 10.0, 9.0, 14.0, 14.0, 15.0, 20.0, 31.0, 44.0, 57.0, 87.0, 147.0, 216.0, 438.0, 737.0, 772.0, 573.0, 288.0, 166.0, 98.0, 85.0, 57.0, 36.0, 30.0, 23.0, 15.0, 20.0, 12.0, 11.0, 4.0, 4.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.50830078125, -0.49462890625, -0.48095703125, -0.46728515625, -0.45361328125, -0.43994140625, -0.42626953125, -0.41259765625, -0.39892578125, -0.38525390625, -0.37158203125, -0.35791015625, -0.34423828125, -0.33056640625, -0.31689453125, -0.30322265625, -0.28955078125, -0.27587890625, -0.26220703125, -0.24853515625, -0.23486328125, -0.22119140625, -0.20751953125, -0.19384765625, -0.18017578125, -0.16650390625, -0.15283203125, -0.13916015625, -0.12548828125, -0.11181640625, -0.09814453125, -0.08447265625, -0.07080078125, -0.05712890625, -0.04345703125, -0.02978515625, -0.01611328125, -0.00244140625, 0.01123046875, 0.02490234375, 0.03857421875, 0.05224609375, 0.06591796875, 0.07958984375, 0.09326171875, 0.10693359375, 0.12060546875, 0.13427734375, 0.14794921875, 0.16162109375, 0.17529296875, 0.18896484375, 0.20263671875, 0.21630859375, 0.22998046875, 0.24365234375, 0.25732421875, 0.27099609375, 0.28466796875, 0.29833984375, 0.31201171875, 0.32568359375, 0.33935546875, 0.35302734375, 0.36669921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 6.0, 2.0, 12.0, 13.0, 20.0, 30.0, 57.0, 69.0, 76.0, 91.0, 112.0, 134.0, 100.0, 75.0, 61.0, 38.0, 24.0, 14.0, 12.0, 8.0, 11.0, 8.0, 4.0, 9.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9296356439590454, -1.8824702501296997, -1.835304856300354, -1.7881394624710083, -1.7409741878509521, -1.6938087940216064, -1.6466434001922607, -1.599478006362915, -1.5523126125335693, -1.5051472187042236, -1.457981824874878, -1.4108164310455322, -1.3636510372161865, -1.3164857625961304, -1.2693203687667847, -1.222154974937439, -1.1749895811080933, -1.1278241872787476, -1.0806587934494019, -1.0334933996200562, -0.9863280653953552, -0.9391626715660095, -0.8919973373413086, -0.8448319435119629, -0.7976665496826172, -0.7505011558532715, -0.7033357620239258, -0.6561704277992249, -0.6090050339698792, -0.5618396401405334, -0.5146743059158325, -0.4675089120864868, -0.42034363746643066, -0.37317824363708496, -0.32601287961006165, -0.27884751558303833, -0.23168212175369263, -0.18451674282550812, -0.1373513638973236, -0.09018599987030029, -0.04302060604095459, 0.004144772887229919, 0.05131015181541443, 0.09847553074359894, 0.14564090967178345, 0.19280628859996796, 0.23997166752815247, 0.2871370315551758, 0.3343024253845215, 0.3814678192138672, 0.4286331832408905, 0.4757985472679138, 0.5229639410972595, 0.5701293349266052, 0.6172946691513062, 0.6644600629806519, 0.7116254568099976, 0.7587908506393433, 0.805956244468689, 0.8531215786933899, 0.9002869725227356, 0.9474523663520813, 0.9946177005767822, 1.041783094406128, 1.0889484882354736]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 7.0, 5.0, 6.0, 8.0, 6.0, 13.0, 12.0, 17.0, 16.0, 26.0, 24.0, 30.0, 20.0, 30.0, 22.0, 28.0, 26.0, 40.0, 44.0, 38.0, 38.0, 46.0, 31.0, 36.0, 40.0, 38.0, 28.0, 24.0, 25.0, 35.0, 24.0, 28.0, 25.0, 19.0, 15.0, 12.0, 17.0, 16.0, 13.0, 11.0, 7.0, 8.0, 14.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 5.0], "bins": [-0.7717801332473755, -0.7501706480979919, -0.7285611629486084, -0.7069516181945801, -0.6853421330451965, -0.663732647895813, -0.6421231031417847, -0.6205136179924011, -0.5989041328430176, -0.577294647693634, -0.5556851625442505, -0.5340756177902222, -0.5124661326408386, -0.4908566474914551, -0.46924713253974915, -0.4476376175880432, -0.42602813243865967, -0.4044186472892761, -0.3828091323375702, -0.36119961738586426, -0.3395901322364807, -0.31798064708709717, -0.29637113213539124, -0.2747616171836853, -0.25315213203430176, -0.23154263198375702, -0.20993313193321228, -0.18832363188266754, -0.1667141318321228, -0.14510463178157806, -0.12349513173103333, -0.10188563168048859, -0.08027607202529907, -0.058666571974754333, -0.037057071924209595, -0.015447571873664856, 0.006161928176879883, 0.02777142822742462, 0.04938092827796936, 0.0709904283285141, 0.09259992837905884, 0.11420942842960358, 0.13581892848014832, 0.15742842853069305, 0.1790379285812378, 0.20064742863178253, 0.22225692868232727, 0.243866428732872, 0.26547592878341675, 0.2870854139328003, 0.3086949288845062, 0.33030444383621216, 0.3519139289855957, 0.37352341413497925, 0.3951329290866852, 0.4167424440383911, 0.43835192918777466, 0.4599614143371582, 0.48157092928886414, 0.5031804442405701, 0.5247899293899536, 0.5463994145393372, 0.5680088996887207, 0.589618444442749, 0.6112279295921326]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 4.0, 7.0, 11.0, 9.0, 25.0, 36.0, 33.0, 51.0, 73.0, 120.0, 190.0, 230.0, 336.0, 505.0, 803.0, 1343.0, 1999.0, 3467.0, 6014.0, 11069.0, 21877.0, 49651.0, 155043.0, 503256.0, 184399.0, 56062.0, 23777.0, 11867.0, 6509.0, 3623.0, 2182.0, 1281.0, 881.0, 584.0, 408.0, 258.0, 173.0, 128.0, 80.0, 55.0, 38.0, 31.0, 22.0, 17.0, 11.0, 3.0, 2.0, 6.0, 5.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.36767578125, -0.356719970703125, -0.34576416015625, -0.334808349609375, -0.3238525390625, -0.312896728515625, -0.30194091796875, -0.290985107421875, -0.280029296875, -0.269073486328125, -0.25811767578125, -0.247161865234375, -0.2362060546875, -0.225250244140625, -0.21429443359375, -0.203338623046875, -0.1923828125, -0.181427001953125, -0.17047119140625, -0.159515380859375, -0.1485595703125, -0.137603759765625, -0.12664794921875, -0.115692138671875, -0.104736328125, -0.093780517578125, -0.08282470703125, -0.071868896484375, -0.0609130859375, -0.049957275390625, -0.03900146484375, -0.028045654296875, -0.01708984375, -0.006134033203125, 0.00482177734375, 0.015777587890625, 0.0267333984375, 0.037689208984375, 0.04864501953125, 0.059600830078125, 0.070556640625, 0.081512451171875, 0.09246826171875, 0.103424072265625, 0.1143798828125, 0.125335693359375, 0.13629150390625, 0.147247314453125, 0.158203125, 0.169158935546875, 0.18011474609375, 0.191070556640625, 0.2020263671875, 0.212982177734375, 0.22393798828125, 0.234893798828125, 0.245849609375, 0.256805419921875, 0.26776123046875, 0.278717041015625, 0.2896728515625, 0.300628662109375, 0.31158447265625, 0.322540283203125, 0.33349609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 8.0, 14.0, 10.0, 13.0, 9.0, 17.0, 22.0, 25.0, 25.0, 22.0, 28.0, 27.0, 36.0, 35.0, 46.0, 53.0, 46.0, 41.0, 35.0, 46.0, 49.0, 36.0, 39.0, 21.0, 38.0, 29.0, 40.0, 25.0, 26.0, 18.0, 12.0, 14.0, 11.0, 13.0, 10.0, 6.0, 7.0, 10.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.51904296875, -0.5046348571777344, -0.49022674560546875, -0.4758186340332031, -0.4614105224609375, -0.4470024108886719, -0.43259429931640625, -0.4181861877441406, -0.403778076171875, -0.3893699645996094, -0.37496185302734375, -0.3605537414550781, -0.3461456298828125, -0.3317375183105469, -0.31732940673828125, -0.3029212951660156, -0.28851318359375, -0.2741050720214844, -0.25969696044921875, -0.24528884887695312, -0.2308807373046875, -0.21647262573242188, -0.20206451416015625, -0.18765640258789062, -0.173248291015625, -0.15884017944335938, -0.14443206787109375, -0.13002395629882812, -0.1156158447265625, -0.10120773315429688, -0.08679962158203125, -0.07239151000976562, -0.0579833984375, -0.043575286865234375, -0.02916717529296875, -0.014759063720703125, -0.0003509521484375, 0.014057159423828125, 0.02846527099609375, 0.042873382568359375, 0.057281494140625, 0.07168960571289062, 0.08609771728515625, 0.10050582885742188, 0.1149139404296875, 0.12932205200195312, 0.14373016357421875, 0.15813827514648438, 0.17254638671875, 0.18695449829101562, 0.20136260986328125, 0.21577072143554688, 0.2301788330078125, 0.24458694458007812, 0.25899505615234375, 0.2734031677246094, 0.287811279296875, 0.3022193908691406, 0.31662750244140625, 0.3310356140136719, 0.3454437255859375, 0.3598518371582031, 0.37425994873046875, 0.3886680603027344, 0.403076171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 6.0, 12.0, 11.0, 16.0, 32.0, 56.0, 62.0, 89.0, 162.0, 219.0, 400.0, 698.0, 1205.0, 2160.0, 4256.0, 9319.0, 22358.0, 66622.0, 278490.0, 482237.0, 118759.0, 35235.0, 13476.0, 6018.0, 3011.0, 1536.0, 816.0, 491.0, 307.0, 165.0, 96.0, 80.0, 43.0, 27.0, 24.0, 12.0, 12.0, 12.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3017578125, -0.2923927307128906, -0.28302764892578125, -0.2736625671386719, -0.2642974853515625, -0.2549324035644531, -0.24556732177734375, -0.23620223999023438, -0.226837158203125, -0.21747207641601562, -0.20810699462890625, -0.19874191284179688, -0.1893768310546875, -0.18001174926757812, -0.17064666748046875, -0.16128158569335938, -0.15191650390625, -0.14255142211914062, -0.13318634033203125, -0.12382125854492188, -0.1144561767578125, -0.10509109497070312, -0.09572601318359375, -0.08636093139648438, -0.076995849609375, -0.06763076782226562, -0.05826568603515625, -0.048900604248046875, -0.0395355224609375, -0.030170440673828125, -0.02080535888671875, -0.011440277099609375, -0.0020751953125, 0.007289886474609375, 0.01665496826171875, 0.026020050048828125, 0.0353851318359375, 0.044750213623046875, 0.05411529541015625, 0.06348037719726562, 0.072845458984375, 0.08221054077148438, 0.09157562255859375, 0.10094070434570312, 0.1103057861328125, 0.11967086791992188, 0.12903594970703125, 0.13840103149414062, 0.14776611328125, 0.15713119506835938, 0.16649627685546875, 0.17586135864257812, 0.1852264404296875, 0.19459152221679688, 0.20395660400390625, 0.21332168579101562, 0.222686767578125, 0.23205184936523438, 0.24141693115234375, 0.2507820129394531, 0.2601470947265625, 0.2695121765136719, 0.27887725830078125, 0.2882423400878906, 0.297607421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 10.0, 3.0, 10.0, 6.0, 7.0, 10.0, 16.0, 9.0, 29.0, 21.0, 25.0, 23.0, 28.0, 24.0, 43.0, 29.0, 38.0, 47.0, 35.0, 50.0, 32.0, 41.0, 37.0, 50.0, 40.0, 44.0, 38.0, 31.0, 33.0, 28.0, 21.0, 22.0, 13.0, 17.0, 17.0, 16.0, 11.0, 9.0, 5.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.89453125, -0.868927001953125, -0.84332275390625, -0.817718505859375, -0.7921142578125, -0.766510009765625, -0.74090576171875, -0.715301513671875, -0.689697265625, -0.664093017578125, -0.63848876953125, -0.612884521484375, -0.5872802734375, -0.561676025390625, -0.53607177734375, -0.510467529296875, -0.48486328125, -0.459259033203125, -0.43365478515625, -0.408050537109375, -0.3824462890625, -0.356842041015625, -0.33123779296875, -0.305633544921875, -0.280029296875, -0.254425048828125, -0.22882080078125, -0.203216552734375, -0.1776123046875, -0.152008056640625, -0.12640380859375, -0.100799560546875, -0.0751953125, -0.049591064453125, -0.02398681640625, 0.001617431640625, 0.0272216796875, 0.052825927734375, 0.07843017578125, 0.104034423828125, 0.129638671875, 0.155242919921875, 0.18084716796875, 0.206451416015625, 0.2320556640625, 0.257659912109375, 0.28326416015625, 0.308868408203125, 0.33447265625, 0.360076904296875, 0.38568115234375, 0.411285400390625, 0.4368896484375, 0.462493896484375, 0.48809814453125, 0.513702392578125, 0.539306640625, 0.564910888671875, 0.59051513671875, 0.616119384765625, 0.6417236328125, 0.667327880859375, 0.69293212890625, 0.718536376953125, 0.744140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 2.0, 9.0, 5.0, 6.0, 10.0, 17.0, 22.0, 41.0, 70.0, 91.0, 129.0, 175.0, 254.0, 393.0, 643.0, 1107.0, 1989.0, 3899.0, 8491.0, 20573.0, 60794.0, 221003.0, 469716.0, 175889.0, 50035.0, 17564.0, 7359.0, 3583.0, 1833.0, 1042.0, 646.0, 389.0, 233.0, 158.0, 123.0, 82.0, 53.0, 32.0, 31.0, 16.0, 20.0, 12.0, 3.0, 7.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055755615234375, -0.05379343032836914, -0.05183124542236328, -0.04986906051635742, -0.04790687561035156, -0.0459446907043457, -0.043982505798339844, -0.042020320892333984, -0.040058135986328125, -0.038095951080322266, -0.036133766174316406, -0.03417158126831055, -0.03220939636230469, -0.030247211456298828, -0.02828502655029297, -0.02632284164428711, -0.02436065673828125, -0.02239847183227539, -0.02043628692626953, -0.018474102020263672, -0.016511917114257812, -0.014549732208251953, -0.012587547302246094, -0.010625362396240234, -0.008663177490234375, -0.006700992584228516, -0.004738807678222656, -0.002776622772216797, -0.0008144378662109375, 0.0011477470397949219, 0.0031099319458007812, 0.005072116851806641, 0.0070343017578125, 0.00899648666381836, 0.010958671569824219, 0.012920856475830078, 0.014883041381835938, 0.016845226287841797, 0.018807411193847656, 0.020769596099853516, 0.022731781005859375, 0.024693965911865234, 0.026656150817871094, 0.028618335723876953, 0.030580520629882812, 0.03254270553588867, 0.03450489044189453, 0.03646707534790039, 0.03842926025390625, 0.04039144515991211, 0.04235363006591797, 0.04431581497192383, 0.04627799987792969, 0.04824018478393555, 0.050202369689941406, 0.052164554595947266, 0.054126739501953125, 0.056088924407958984, 0.058051109313964844, 0.0600132942199707, 0.06197547912597656, 0.06393766403198242, 0.06589984893798828, 0.06786203384399414, 0.06982421875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 5.0, 10.0, 12.0, 14.0, 26.0, 42.0, 65.0, 120.0, 170.0, 193.0, 116.0, 76.0, 54.0, 32.0, 20.0, 10.0, 10.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61015510559082e-05, -6.347056478261948e-05, -6.083957850933075e-05, -5.820859223604202e-05, -5.5577605962753296e-05, -5.294661968946457e-05, -5.031563341617584e-05, -4.7684647142887115e-05, -4.505366086959839e-05, -4.242267459630966e-05, -3.9791688323020935e-05, -3.716070204973221e-05, -3.452971577644348e-05, -3.1898729503154755e-05, -2.9267743229866028e-05, -2.66367569565773e-05, -2.4005770683288574e-05, -2.1374784409999847e-05, -1.874379813671112e-05, -1.6112811863422394e-05, -1.3481825590133667e-05, -1.085083931684494e-05, -8.219853043556213e-06, -5.5888667702674866e-06, -2.9578804969787598e-06, -3.2689422369003296e-07, 2.304092049598694e-06, 4.935078322887421e-06, 7.5660645961761475e-06, 1.0197050869464874e-05, 1.2828037142753601e-05, 1.5459023416042328e-05, 1.8090009689331055e-05, 2.072099596261978e-05, 2.3351982235908508e-05, 2.5982968509197235e-05, 2.8613954782485962e-05, 3.124494105577469e-05, 3.3875927329063416e-05, 3.650691360235214e-05, 3.913789987564087e-05, 4.1768886148929596e-05, 4.439987242221832e-05, 4.703085869550705e-05, 4.9661844968795776e-05, 5.22928312420845e-05, 5.492381751537323e-05, 5.755480378866196e-05, 6.0185790061950684e-05, 6.281677633523941e-05, 6.544776260852814e-05, 6.807874888181686e-05, 7.070973515510559e-05, 7.334072142839432e-05, 7.597170770168304e-05, 7.860269397497177e-05, 8.12336802482605e-05, 8.386466652154922e-05, 8.649565279483795e-05, 8.912663906812668e-05, 9.17576253414154e-05, 9.438861161470413e-05, 9.701959788799286e-05, 9.965058416128159e-05, 0.00010228157043457031]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 16.0, 18.0, 18.0, 40.0, 91.0, 179.0, 369.0, 1203.0, 4064.0, 19456.0, 188405.0, 739131.0, 80440.0, 10998.0, 2724.0, 803.0, 291.0, 129.0, 60.0, 28.0, 20.0, 16.0, 4.0, 12.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.134521484375, -0.12993621826171875, -0.1253509521484375, -0.12076568603515625, -0.116180419921875, -0.11159515380859375, -0.1070098876953125, -0.10242462158203125, -0.09783935546875, -0.09325408935546875, -0.0886688232421875, -0.08408355712890625, -0.079498291015625, -0.07491302490234375, -0.0703277587890625, -0.06574249267578125, -0.0611572265625, -0.05657196044921875, -0.0519866943359375, -0.04740142822265625, -0.042816162109375, -0.03823089599609375, -0.0336456298828125, -0.02906036376953125, -0.02447509765625, -0.01988983154296875, -0.0153045654296875, -0.01071929931640625, -0.006134033203125, -0.00154876708984375, 0.0030364990234375, 0.00762176513671875, 0.01220703125, 0.01679229736328125, 0.0213775634765625, 0.02596282958984375, 0.030548095703125, 0.03513336181640625, 0.0397186279296875, 0.04430389404296875, 0.04888916015625, 0.05347442626953125, 0.0580596923828125, 0.06264495849609375, 0.067230224609375, 0.07181549072265625, 0.0764007568359375, 0.08098602294921875, 0.0855712890625, 0.09015655517578125, 0.0947418212890625, 0.09932708740234375, 0.103912353515625, 0.10849761962890625, 0.1130828857421875, 0.11766815185546875, 0.12225341796875, 0.12683868408203125, 0.1314239501953125, 0.13600921630859375, 0.140594482421875, 0.14517974853515625, 0.1497650146484375, 0.15435028076171875, 0.158935546875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 2.0, 5.0, 8.0, 12.0, 9.0, 10.0, 17.0, 22.0, 33.0, 37.0, 56.0, 63.0, 70.0, 65.0, 76.0, 74.0, 80.0, 52.0, 60.0, 64.0, 49.0, 28.0, 25.0, 23.0, 8.0, 11.0, 12.0, 7.0, 1.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0187530517578125, -0.01811075210571289, -0.01746845245361328, -0.016826152801513672, -0.016183853149414062, -0.015541553497314453, -0.014899253845214844, -0.014256954193115234, -0.013614654541015625, -0.012972354888916016, -0.012330055236816406, -0.011687755584716797, -0.011045455932617188, -0.010403156280517578, -0.009760856628417969, -0.00911855697631836, -0.00847625732421875, -0.00783395767211914, -0.007191658020019531, -0.006549358367919922, -0.0059070587158203125, -0.005264759063720703, -0.004622459411621094, -0.003980159759521484, -0.003337860107421875, -0.0026955604553222656, -0.0020532608032226562, -0.0014109611511230469, -0.0007686614990234375, -0.00012636184692382812, 0.0005159378051757812, 0.0011582374572753906, 0.001800537109375, 0.0024428367614746094, 0.0030851364135742188, 0.003727436065673828, 0.0043697357177734375, 0.005012035369873047, 0.005654335021972656, 0.006296634674072266, 0.006938934326171875, 0.007581233978271484, 0.008223533630371094, 0.008865833282470703, 0.009508132934570312, 0.010150432586669922, 0.010792732238769531, 0.01143503189086914, 0.01207733154296875, 0.01271963119506836, 0.013361930847167969, 0.014004230499267578, 0.014646530151367188, 0.015288829803466797, 0.015931129455566406, 0.016573429107666016, 0.017215728759765625, 0.017858028411865234, 0.018500328063964844, 0.019142627716064453, 0.019784927368164062, 0.020427227020263672, 0.02106952667236328, 0.02171182632446289, 0.0223541259765625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 9.0, 6.0, 7.0, 13.0, 15.0, 42.0, 38.0, 86.0, 109.0, 127.0, 181.0, 139.0, 76.0, 56.0, 32.0, 21.0, 17.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0980820655822754, -1.062807559967041, -1.027532935142517, -0.9922583699226379, -0.9569838047027588, -0.9217092990875244, -0.8864347338676453, -0.8511601686477661, -0.815885603427887, -0.7806110382080078, -0.7453364729881287, -0.7100619077682495, -0.6747874021530151, -0.6395127773284912, -0.6042382717132568, -0.5689637064933777, -0.5336891412734985, -0.4984145760536194, -0.46314001083374023, -0.42786547541618347, -0.3925909101963043, -0.35731634497642517, -0.3220418095588684, -0.28676724433898926, -0.2514926791191101, -0.21621811389923096, -0.180943563580513, -0.14566901326179504, -0.1103944480419159, -0.07511988282203674, -0.03984533250331879, -0.00457078218460083, 0.03070366382598877, 0.06597822159528732, 0.10125277936458588, 0.13652732968330383, 0.17180189490318298, 0.20707646012306213, 0.2423510104417801, 0.27762556076049805, 0.3129001259803772, 0.34817469120025635, 0.3834492564201355, 0.41872379183769226, 0.4539983570575714, 0.48927292227745056, 0.5245474576950073, 0.5598220229148865, 0.5950965881347656, 0.6303711533546448, 0.6656457185745239, 0.7009202837944031, 0.7361948490142822, 0.7714693546295166, 0.8067439198493958, 0.8420184850692749, 0.877293050289154, 0.9125676155090332, 0.9478421807289124, 0.9831167459487915, 1.0183912515640259, 1.0536658763885498, 1.0889403820037842, 1.1242148876190186, 1.1594895124435425]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 6.0, 5.0, 7.0, 10.0, 6.0, 7.0, 11.0, 17.0, 21.0, 11.0, 19.0, 21.0, 28.0, 29.0, 24.0, 19.0, 37.0, 26.0, 31.0, 34.0, 40.0, 51.0, 37.0, 51.0, 26.0, 38.0, 34.0, 25.0, 31.0, 30.0, 27.0, 35.0, 40.0, 17.0, 17.0, 19.0, 12.0, 18.0, 12.0, 9.0, 9.0, 15.0, 9.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0], "bins": [-0.449985146522522, -0.43745124340057373, -0.4249173402786255, -0.41238343715667725, -0.399849534034729, -0.38731563091278076, -0.37478169798851013, -0.3622477948665619, -0.34971389174461365, -0.3371799886226654, -0.32464608550071716, -0.3121121823787689, -0.2995782494544983, -0.28704434633255005, -0.2745104432106018, -0.26197654008865356, -0.24944263696670532, -0.23690873384475708, -0.22437483072280884, -0.2118409126996994, -0.19930700957775116, -0.18677310645580292, -0.17423918843269348, -0.16170528531074524, -0.149171382188797, -0.13663747906684875, -0.12410356849431992, -0.11156965792179108, -0.09903575479984283, -0.08650185167789459, -0.07396794110536575, -0.061434030532836914, -0.04890015721321106, -0.03636625036597252, -0.02383234351873398, -0.011298436671495438, 0.001235470175743103, 0.013769373297691345, 0.026303283870220184, 0.03883719444274902, 0.051371097564697266, 0.06390500068664551, 0.07643891125917435, 0.08897282183170319, 0.10150672495365143, 0.11404062807559967, 0.1265745460987091, 0.13910844922065735, 0.1516423523426056, 0.16417625546455383, 0.17671015858650208, 0.1892440766096115, 0.20177797973155975, 0.214311882853508, 0.22684580087661743, 0.23937970399856567, 0.2519136071205139, 0.26444751024246216, 0.2769814133644104, 0.28951531648635864, 0.3020492196083069, 0.3145831227302551, 0.32711705565452576, 0.339650958776474, 0.35218486189842224]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 13.0, 7.0, 13.0, 18.0, 21.0, 41.0, 62.0, 84.0, 155.0, 225.0, 370.0, 610.0, 1039.0, 1703.0, 2921.0, 5265.0, 10224.0, 21580.0, 59373.0, 283376.0, 500742.0, 100783.0, 31189.0, 13224.0, 6711.0, 3583.0, 2081.0, 1248.0, 662.0, 430.0, 275.0, 208.0, 100.0, 73.0, 52.0, 30.0, 23.0, 15.0, 5.0, 3.0, 10.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.2526664733886719, -0.24263763427734375, -0.23260879516601562, -0.2225799560546875, -0.21255111694335938, -0.20252227783203125, -0.19249343872070312, -0.182464599609375, -0.17243576049804688, -0.16240692138671875, -0.15237808227539062, -0.1423492431640625, -0.13232040405273438, -0.12229156494140625, -0.11226272583007812, -0.10223388671875, -0.09220504760742188, -0.08217620849609375, -0.07214736938476562, -0.0621185302734375, -0.052089691162109375, -0.04206085205078125, -0.032032012939453125, -0.022003173828125, -0.011974334716796875, -0.00194549560546875, 0.008083343505859375, 0.0181121826171875, 0.028141021728515625, 0.03816986083984375, 0.048198699951171875, 0.0582275390625, 0.06825637817382812, 0.07828521728515625, 0.08831405639648438, 0.0983428955078125, 0.10837173461914062, 0.11840057373046875, 0.12842941284179688, 0.138458251953125, 0.14848709106445312, 0.15851593017578125, 0.16854476928710938, 0.1785736083984375, 0.18860244750976562, 0.19863128662109375, 0.20866012573242188, 0.21868896484375, 0.22871780395507812, 0.23874664306640625, 0.24877548217773438, 0.2588043212890625, 0.2688331604003906, 0.27886199951171875, 0.2888908386230469, 0.298919677734375, 0.3089485168457031, 0.31897735595703125, 0.3290061950683594, 0.3390350341796875, 0.3490638732910156, 0.35909271240234375, 0.3691215515136719, 0.379150390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 6.0, 5.0, 17.0, 20.0, 12.0, 15.0, 24.0, 17.0, 43.0, 30.0, 19.0, 32.0, 41.0, 39.0, 40.0, 48.0, 46.0, 50.0, 43.0, 40.0, 37.0, 44.0, 32.0, 35.0, 30.0, 29.0, 29.0, 31.0, 21.0, 22.0, 11.0, 12.0, 14.0, 13.0, 8.0, 5.0, 7.0, 4.0, 6.0, 2.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0849609375, -1.0517578125, -1.0185546875, -0.9853515625, -0.9521484375, -0.9189453125, -0.8857421875, -0.8525390625, -0.8193359375, -0.7861328125, -0.7529296875, -0.7197265625, -0.6865234375, -0.6533203125, -0.6201171875, -0.5869140625, -0.5537109375, -0.5205078125, -0.4873046875, -0.4541015625, -0.4208984375, -0.3876953125, -0.3544921875, -0.3212890625, -0.2880859375, -0.2548828125, -0.2216796875, -0.1884765625, -0.1552734375, -0.1220703125, -0.0888671875, -0.0556640625, -0.0224609375, 0.0107421875, 0.0439453125, 0.0771484375, 0.1103515625, 0.1435546875, 0.1767578125, 0.2099609375, 0.2431640625, 0.2763671875, 0.3095703125, 0.3427734375, 0.3759765625, 0.4091796875, 0.4423828125, 0.4755859375, 0.5087890625, 0.5419921875, 0.5751953125, 0.6083984375, 0.6416015625, 0.6748046875, 0.7080078125, 0.7412109375, 0.7744140625, 0.8076171875, 0.8408203125, 0.8740234375, 0.9072265625, 0.9404296875, 0.9736328125, 1.0068359375, 1.0400390625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 9.0, 4.0, 10.0, 10.0, 9.0, 17.0, 20.0, 17.0, 20.0, 30.0, 22.0, 33.0, 53.0, 41.0, 35.0, 55.0, 131.0, 844078.0, 203443.0, 124.0, 47.0, 44.0, 46.0, 34.0, 36.0, 27.0, 27.0, 22.0, 18.0, 17.0, 12.0, 12.0, 6.0, 7.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.29296875, -5.1416015625, -4.990234375, -4.8388671875, -4.6875, -4.5361328125, -4.384765625, -4.2333984375, -4.08203125, -3.9306640625, -3.779296875, -3.6279296875, -3.4765625, -3.3251953125, -3.173828125, -3.0224609375, -2.87109375, -2.7197265625, -2.568359375, -2.4169921875, -2.265625, -2.1142578125, -1.962890625, -1.8115234375, -1.66015625, -1.5087890625, -1.357421875, -1.2060546875, -1.0546875, -0.9033203125, -0.751953125, -0.6005859375, -0.44921875, -0.2978515625, -0.146484375, 0.0048828125, 0.15625, 0.3076171875, 0.458984375, 0.6103515625, 0.76171875, 0.9130859375, 1.064453125, 1.2158203125, 1.3671875, 1.5185546875, 1.669921875, 1.8212890625, 1.97265625, 2.1240234375, 2.275390625, 2.4267578125, 2.578125, 2.7294921875, 2.880859375, 3.0322265625, 3.18359375, 3.3349609375, 3.486328125, 3.6376953125, 3.7890625, 3.9404296875, 4.091796875, 4.2431640625, 4.39453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 8.0, 9.0, 16.0, 19.0, 19.0, 20.0, 18.0, 29.0, 29.0, 32.0, 46.0, 46.0, 28.0, 54.0, 37.0, 62.0, 49.0, 55.0, 49.0, 42.0, 39.0, 38.0, 32.0, 26.0, 31.0, 22.0, 28.0, 14.0, 15.0, 10.0, 10.0, 8.0, 8.0, 4.0, 8.0, 7.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.1552734375, -1.1223373413085938, -1.0894012451171875, -1.0564651489257812, -1.023529052734375, -0.9905929565429688, -0.9576568603515625, -0.9247207641601562, -0.89178466796875, -0.8588485717773438, -0.8259124755859375, -0.7929763793945312, -0.760040283203125, -0.7271041870117188, -0.6941680908203125, -0.6612319946289062, -0.6282958984375, -0.5953598022460938, -0.5624237060546875, -0.5294876098632812, -0.496551513671875, -0.46361541748046875, -0.4306793212890625, -0.39774322509765625, -0.36480712890625, -0.33187103271484375, -0.2989349365234375, -0.26599884033203125, -0.233062744140625, -0.20012664794921875, -0.1671905517578125, -0.13425445556640625, -0.101318359375, -0.06838226318359375, -0.0354461669921875, -0.00251007080078125, 0.030426025390625, 0.06336212158203125, 0.0962982177734375, 0.12923431396484375, 0.16217041015625, 0.19510650634765625, 0.2280426025390625, 0.26097869873046875, 0.293914794921875, 0.32685089111328125, 0.3597869873046875, 0.39272308349609375, 0.4256591796875, 0.45859527587890625, 0.4915313720703125, 0.5244674682617188, 0.557403564453125, 0.5903396606445312, 0.6232757568359375, 0.6562118530273438, 0.68914794921875, 0.7220840454101562, 0.7550201416015625, 0.7879562377929688, 0.820892333984375, 0.8538284301757812, 0.8867645263671875, 0.9197006225585938, 0.95263671875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 22.0, 14.0, 23.0, 28.0, 60.0, 125.0, 324.0, 979.0, 4664.0, 38956.0, 947680.0, 48448.0, 5403.0, 1191.0, 344.0, 113.0, 60.0, 35.0, 20.0, 15.0, 9.0, 4.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44921875, -0.43497467041015625, -0.4207305908203125, -0.40648651123046875, -0.392242431640625, -0.37799835205078125, -0.3637542724609375, -0.34951019287109375, -0.33526611328125, -0.32102203369140625, -0.3067779541015625, -0.29253387451171875, -0.278289794921875, -0.26404571533203125, -0.2498016357421875, -0.23555755615234375, -0.2213134765625, -0.20706939697265625, -0.1928253173828125, -0.17858123779296875, -0.164337158203125, -0.15009307861328125, -0.1358489990234375, -0.12160491943359375, -0.10736083984375, -0.09311676025390625, -0.0788726806640625, -0.06462860107421875, -0.050384521484375, -0.03614044189453125, -0.0218963623046875, -0.00765228271484375, 0.006591796875, 0.02083587646484375, 0.0350799560546875, 0.04932403564453125, 0.063568115234375, 0.07781219482421875, 0.0920562744140625, 0.10630035400390625, 0.12054443359375, 0.13478851318359375, 0.1490325927734375, 0.16327667236328125, 0.177520751953125, 0.19176483154296875, 0.2060089111328125, 0.22025299072265625, 0.2344970703125, 0.24874114990234375, 0.2629852294921875, 0.27722930908203125, 0.291473388671875, 0.30571746826171875, 0.3199615478515625, 0.33420562744140625, 0.34844970703125, 0.36269378662109375, 0.3769378662109375, 0.39118194580078125, 0.405426025390625, 0.41967010498046875, 0.4339141845703125, 0.44815826416015625, 0.46240234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 10.0, 8.0, 10.0, 19.0, 26.0, 25.0, 32.0, 86.0, 173.0, 266.0, 123.0, 65.0, 45.0, 21.0, 22.0, 11.0, 7.0, 7.0, 4.0, 1.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.987550735473633e-05, -3.855675458908081e-05, -3.723800182342529e-05, -3.5919249057769775e-05, -3.460049629211426e-05, -3.328174352645874e-05, -3.196299076080322e-05, -3.0644237995147705e-05, -2.9325485229492188e-05, -2.800673246383667e-05, -2.6687979698181152e-05, -2.5369226932525635e-05, -2.4050474166870117e-05, -2.27317214012146e-05, -2.1412968635559082e-05, -2.0094215869903564e-05, -1.8775463104248047e-05, -1.745671033859253e-05, -1.6137957572937012e-05, -1.4819204807281494e-05, -1.3500452041625977e-05, -1.2181699275970459e-05, -1.0862946510314941e-05, -9.544193744659424e-06, -8.225440979003906e-06, -6.906688213348389e-06, -5.587935447692871e-06, -4.2691826820373535e-06, -2.950429916381836e-06, -1.6316771507263184e-06, -3.129243850708008e-07, 1.0058283805847168e-06, 2.3245811462402344e-06, 3.643333911895752e-06, 4.9620866775512695e-06, 6.280839443206787e-06, 7.599592208862305e-06, 8.918344974517822e-06, 1.023709774017334e-05, 1.1555850505828857e-05, 1.2874603271484375e-05, 1.4193356037139893e-05, 1.551210880279541e-05, 1.6830861568450928e-05, 1.8149614334106445e-05, 1.9468367099761963e-05, 2.078711986541748e-05, 2.2105872631072998e-05, 2.3424625396728516e-05, 2.4743378162384033e-05, 2.606213092803955e-05, 2.738088369369507e-05, 2.8699636459350586e-05, 3.0018389225006104e-05, 3.133714199066162e-05, 3.265589475631714e-05, 3.3974647521972656e-05, 3.5293400287628174e-05, 3.661215305328369e-05, 3.793090581893921e-05, 3.9249658584594727e-05, 4.0568411350250244e-05, 4.188716411590576e-05, 4.320591688156128e-05, 4.45246696472168e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 7.0, 9.0, 9.0, 20.0, 15.0, 34.0, 66.0, 126.0, 209.0, 333.0, 764.0, 1625.0, 3873.0, 12032.0, 59014.0, 825269.0, 117966.0, 18042.0, 5222.0, 2013.0, 946.0, 436.0, 219.0, 118.0, 66.0, 42.0, 22.0, 15.0, 15.0, 12.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.19244766235351562, -0.18494415283203125, -0.17744064331054688, -0.1699371337890625, -0.16243362426757812, -0.15493011474609375, -0.14742660522460938, -0.139923095703125, -0.13241958618164062, -0.12491607666015625, -0.11741256713867188, -0.1099090576171875, -0.10240554809570312, -0.09490203857421875, -0.08739852905273438, -0.07989501953125, -0.07239151000976562, -0.06488800048828125, -0.057384490966796875, -0.0498809814453125, -0.042377471923828125, -0.03487396240234375, -0.027370452880859375, -0.019866943359375, -0.012363433837890625, -0.00485992431640625, 0.002643585205078125, 0.0101470947265625, 0.017650604248046875, 0.02515411376953125, 0.032657623291015625, 0.0401611328125, 0.047664642333984375, 0.05516815185546875, 0.06267166137695312, 0.0701751708984375, 0.07767868041992188, 0.08518218994140625, 0.09268569946289062, 0.100189208984375, 0.10769271850585938, 0.11519622802734375, 0.12269973754882812, 0.1302032470703125, 0.13770675659179688, 0.14521026611328125, 0.15271377563476562, 0.16021728515625, 0.16772079467773438, 0.17522430419921875, 0.18272781372070312, 0.1902313232421875, 0.19773483276367188, 0.20523834228515625, 0.21274185180664062, 0.220245361328125, 0.22774887084960938, 0.23525238037109375, 0.24275588989257812, 0.2502593994140625, 0.2577629089355469, 0.26526641845703125, 0.2727699279785156, 0.2802734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 3.0, 2.0, 8.0, 12.0, 9.0, 15.0, 19.0, 15.0, 30.0, 49.0, 59.0, 78.0, 207.0, 192.0, 90.0, 62.0, 42.0, 23.0, 21.0, 16.0, 14.0, 11.0, 8.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1019287109375, -0.09931182861328125, -0.0966949462890625, -0.09407806396484375, -0.091461181640625, -0.08884429931640625, -0.0862274169921875, -0.08361053466796875, -0.08099365234375, -0.07837677001953125, -0.0757598876953125, -0.07314300537109375, -0.070526123046875, -0.06790924072265625, -0.0652923583984375, -0.06267547607421875, -0.06005859375, -0.05744171142578125, -0.0548248291015625, -0.05220794677734375, -0.049591064453125, -0.04697418212890625, -0.0443572998046875, -0.04174041748046875, -0.03912353515625, -0.03650665283203125, -0.0338897705078125, -0.03127288818359375, -0.028656005859375, -0.02603912353515625, -0.0234222412109375, -0.02080535888671875, -0.0181884765625, -0.01557159423828125, -0.0129547119140625, -0.01033782958984375, -0.007720947265625, -0.00510406494140625, -0.0024871826171875, 0.00012969970703125, 0.00274658203125, 0.00536346435546875, 0.0079803466796875, 0.01059722900390625, 0.013214111328125, 0.01583099365234375, 0.0184478759765625, 0.02106475830078125, 0.023681640625, 0.02629852294921875, 0.0289154052734375, 0.03153228759765625, 0.034149169921875, 0.03676605224609375, 0.0393829345703125, 0.04199981689453125, 0.04461669921875, 0.04723358154296875, 0.0498504638671875, 0.05246734619140625, 0.055084228515625, 0.05770111083984375, 0.0603179931640625, 0.06293487548828125, 0.0655517578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 7.0, 14.0, 22.0, 40.0, 102.0, 151.0, 212.0, 200.0, 119.0, 63.0, 26.0, 21.0, 7.0, 10.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0143203735351562, -1.917041540145874, -1.8197627067565918, -1.7224838733673096, -1.625205159187317, -1.5279263257980347, -1.4306474924087524, -1.3333687782287598, -1.2360899448394775, -1.1388111114501953, -1.041532278060913, -0.9442535042762756, -0.8469747304916382, -0.749695897102356, -0.6524170637130737, -0.5551382899284363, -0.4578593969345093, -0.36058059334754944, -0.2633017897605896, -0.16602295637130737, -0.06874415278434753, 0.028534650802612305, 0.12581348419189453, 0.22309225797653198, 0.3203710913658142, 0.41764989495277405, 0.5149286985397339, 0.6122075319290161, 0.7094863653182983, 0.8067651391029358, 0.904043972492218, 1.0013227462768555, 1.0986015796661377, 1.19588041305542, 1.2931592464447021, 1.3904380798339844, 1.487716794013977, 1.5849956274032593, 1.6822744607925415, 1.7795531749725342, 1.8768320083618164, 1.9741108417510986, 2.071389675140381, 2.168668508529663, 2.2659473419189453, 2.3632259368896484, 2.4605050086975098, 2.557783603668213, 2.655062675476074, 2.7523415088653564, 2.8496203422546387, 2.946899175643921, 3.044178009033203, 3.1414566040039062, 3.2387356758117676, 3.3360142707824707, 3.433293104171753, 3.530571937561035, 3.6278507709503174, 3.7251296043395996, 3.822408437728882, 3.919687271118164, 4.016965866088867, 4.1142449378967285, 4.211523532867432]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 5.0, 3.0, 5.0, 4.0, 8.0, 11.0, 12.0, 12.0, 17.0, 25.0, 20.0, 28.0, 35.0, 32.0, 41.0, 36.0, 36.0, 50.0, 48.0, 49.0, 40.0, 44.0, 52.0, 38.0, 28.0, 34.0, 29.0, 29.0, 31.0, 27.0, 21.0, 25.0, 24.0, 14.0, 15.0, 10.0, 11.0, 6.0, 6.0, 7.0, 6.0, 4.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.4211187362670898, -1.374914526939392, -1.3287103176116943, -1.2825061082839966, -1.2363018989562988, -1.1900975704193115, -1.1438934803009033, -1.097689151763916, -1.0514849424362183, -1.0052807331085205, -0.9590765237808228, -0.912872314453125, -0.8666680455207825, -0.8204638361930847, -0.774259626865387, -0.7280553579330444, -0.6818512082099915, -0.6356469988822937, -0.589442789554596, -0.5432385206222534, -0.49703431129455566, -0.4508301019668579, -0.40462589263916016, -0.35842165350914, -0.31221744418144226, -0.2660132348537445, -0.21980899572372437, -0.1736047863960266, -0.12740056216716766, -0.08119633793830872, -0.03499212861061096, 0.01121211051940918, 0.057416319847106934, 0.10362054407596588, 0.14982476830482483, 0.19602897763252258, 0.24223320186138153, 0.2884374260902405, 0.33464163541793823, 0.3808458745479584, 0.42705008387565613, 0.4732542932033539, 0.519458532333374, 0.5656627416610718, 0.6118669509887695, 0.6580711603164673, 0.704275369644165, 0.7504796385765076, 0.7966838479042053, 0.8428880572319031, 0.8890922665596008, 0.9352965354919434, 0.9815007448196411, 1.0277049541473389, 1.0739091634750366, 1.1201133728027344, 1.1663175821304321, 1.2125217914581299, 1.2587260007858276, 1.3049302101135254, 1.3511344194412231, 1.397338628768921, 1.4435429573059082, 1.489747166633606, 1.5359513759613037]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 6.0, 10.0, 14.0, 20.0, 16.0, 43.0, 41.0, 84.0, 107.0, 176.0, 269.0, 505.0, 832.0, 1548.0, 3307.0, 8509.0, 65841.0, 2569555.0, 1487336.0, 42401.0, 7347.0, 2958.0, 1426.0, 778.0, 410.0, 291.0, 152.0, 92.0, 72.0, 42.0, 26.0, 14.0, 20.0, 6.0, 12.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9326171875, -1.8720703125, -1.8115234375, -1.7509765625, -1.6904296875, -1.6298828125, -1.5693359375, -1.5087890625, -1.4482421875, -1.3876953125, -1.3271484375, -1.2666015625, -1.2060546875, -1.1455078125, -1.0849609375, -1.0244140625, -0.9638671875, -0.9033203125, -0.8427734375, -0.7822265625, -0.7216796875, -0.6611328125, -0.6005859375, -0.5400390625, -0.4794921875, -0.4189453125, -0.3583984375, -0.2978515625, -0.2373046875, -0.1767578125, -0.1162109375, -0.0556640625, 0.0048828125, 0.0654296875, 0.1259765625, 0.1865234375, 0.2470703125, 0.3076171875, 0.3681640625, 0.4287109375, 0.4892578125, 0.5498046875, 0.6103515625, 0.6708984375, 0.7314453125, 0.7919921875, 0.8525390625, 0.9130859375, 0.9736328125, 1.0341796875, 1.0947265625, 1.1552734375, 1.2158203125, 1.2763671875, 1.3369140625, 1.3974609375, 1.4580078125, 1.5185546875, 1.5791015625, 1.6396484375, 1.7001953125, 1.7607421875, 1.8212890625, 1.8818359375, 1.9423828125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 5.0, 8.0, 10.0, 12.0, 12.0, 12.0, 8.0, 13.0, 26.0, 19.0, 19.0, 44.0, 29.0, 35.0, 39.0, 39.0, 74.0, 43.0, 48.0, 52.0, 57.0, 51.0, 44.0, 49.0, 38.0, 29.0, 32.0, 24.0, 22.0, 15.0, 13.0, 12.0, 9.0, 12.0, 8.0, 9.0, 7.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.72509765625, -0.7042236328125, -0.683349609375, -0.6624755859375, -0.6416015625, -0.6207275390625, -0.599853515625, -0.5789794921875, -0.55810546875, -0.5372314453125, -0.516357421875, -0.4954833984375, -0.474609375, -0.4537353515625, -0.432861328125, -0.4119873046875, -0.39111328125, -0.3702392578125, -0.349365234375, -0.3284912109375, -0.3076171875, -0.2867431640625, -0.265869140625, -0.2449951171875, -0.22412109375, -0.2032470703125, -0.182373046875, -0.1614990234375, -0.140625, -0.1197509765625, -0.098876953125, -0.0780029296875, -0.05712890625, -0.0362548828125, -0.015380859375, 0.0054931640625, 0.0263671875, 0.0472412109375, 0.068115234375, 0.0889892578125, 0.10986328125, 0.1307373046875, 0.151611328125, 0.1724853515625, 0.193359375, 0.2142333984375, 0.235107421875, 0.2559814453125, 0.27685546875, 0.2977294921875, 0.318603515625, 0.3394775390625, 0.3603515625, 0.3812255859375, 0.402099609375, 0.4229736328125, 0.44384765625, 0.4647216796875, 0.485595703125, 0.5064697265625, 0.52734375, 0.5482177734375, 0.569091796875, 0.5899658203125, 0.61083984375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 4.0, 13.0, 15.0, 34.0, 61.0, 113.0, 253.0, 679.0, 2177.0, 9724.0, 99850.0, 3986075.0, 83403.0, 8761.0, 1931.0, 603.0, 291.0, 109.0, 69.0, 34.0, 24.0, 16.0, 11.0, 4.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8232421875, -1.7516632080078125, -1.680084228515625, -1.6085052490234375, -1.53692626953125, -1.4653472900390625, -1.393768310546875, -1.3221893310546875, -1.2506103515625, -1.1790313720703125, -1.107452392578125, -1.0358734130859375, -0.96429443359375, -0.8927154541015625, -0.821136474609375, -0.7495574951171875, -0.677978515625, -0.6063995361328125, -0.534820556640625, -0.4632415771484375, -0.39166259765625, -0.3200836181640625, -0.248504638671875, -0.1769256591796875, -0.1053466796875, -0.0337677001953125, 0.037811279296875, 0.1093902587890625, 0.18096923828125, 0.2525482177734375, 0.324127197265625, 0.3957061767578125, 0.46728515625, 0.5388641357421875, 0.610443115234375, 0.6820220947265625, 0.75360107421875, 0.8251800537109375, 0.896759033203125, 0.9683380126953125, 1.0399169921875, 1.1114959716796875, 1.183074951171875, 1.2546539306640625, 1.32623291015625, 1.3978118896484375, 1.469390869140625, 1.5409698486328125, 1.612548828125, 1.6841278076171875, 1.755706787109375, 1.8272857666015625, 1.89886474609375, 1.9704437255859375, 2.042022705078125, 2.1136016845703125, 2.1851806640625, 2.2567596435546875, 2.328338623046875, 2.3999176025390625, 2.47149658203125, 2.5430755615234375, 2.614654541015625, 2.6862335205078125, 2.7578125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 4.0, 5.0, 8.0, 6.0, 16.0, 15.0, 11.0, 24.0, 25.0, 23.0, 46.0, 56.0, 96.0, 146.0, 316.0, 605.0, 812.0, 762.0, 433.0, 247.0, 132.0, 79.0, 47.0, 32.0, 20.0, 20.0, 17.0, 15.0, 7.0, 10.0, 8.0, 8.0, 2.0, 1.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.28466796875, -0.2747764587402344, -0.26488494873046875, -0.2549934387207031, -0.2451019287109375, -0.23521041870117188, -0.22531890869140625, -0.21542739868164062, -0.205535888671875, -0.19564437866210938, -0.18575286865234375, -0.17586135864257812, -0.1659698486328125, -0.15607833862304688, -0.14618682861328125, -0.13629531860351562, -0.12640380859375, -0.11651229858398438, -0.10662078857421875, -0.09672927856445312, -0.0868377685546875, -0.07694625854492188, -0.06705474853515625, -0.057163238525390625, -0.047271728515625, -0.037380218505859375, -0.02748870849609375, -0.017597198486328125, -0.0077056884765625, 0.002185821533203125, 0.01207733154296875, 0.021968841552734375, 0.0318603515625, 0.041751861572265625, 0.05164337158203125, 0.061534881591796875, 0.0714263916015625, 0.08131790161132812, 0.09120941162109375, 0.10110092163085938, 0.110992431640625, 0.12088394165039062, 0.13077545166015625, 0.14066696166992188, 0.1505584716796875, 0.16044998168945312, 0.17034149169921875, 0.18023300170898438, 0.19012451171875, 0.20001602172851562, 0.20990753173828125, 0.21979904174804688, 0.2296905517578125, 0.23958206176757812, 0.24947357177734375, 0.2593650817871094, 0.269256591796875, 0.2791481018066406, 0.28903961181640625, 0.2989311218261719, 0.3088226318359375, 0.3187141418457031, 0.32860565185546875, 0.3384971618652344, 0.348388671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 12.0, 10.0, 17.0, 29.0, 40.0, 55.0, 70.0, 79.0, 130.0, 115.0, 117.0, 89.0, 52.0, 58.0, 33.0, 17.0, 11.0, 14.0, 11.0, 6.0, 6.0, 2.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5149469375610352, -1.4754689931869507, -1.4359909296035767, -1.3965129852294922, -1.3570350408554077, -1.3175570964813232, -1.2780790328979492, -1.2386010885238647, -1.1991231441497803, -1.1596451997756958, -1.1201671361923218, -1.0806891918182373, -1.0412112474441528, -1.0017333030700684, -0.9622552394866943, -0.9227772951126099, -0.8832992315292358, -0.8438212275505066, -0.8043432831764221, -0.7648652791976929, -0.7253873348236084, -0.6859093308448792, -0.6464313268661499, -0.6069533824920654, -0.5674753785133362, -0.5279973745346069, -0.48851943016052246, -0.4490414261817932, -0.40956345200538635, -0.3700854778289795, -0.33060747385025024, -0.2911294996738434, -0.2516516447067261, -0.2121736705303192, -0.17269568145275116, -0.1332176923751831, -0.09373971819877625, -0.054261744022369385, -0.01478375494480133, 0.024694234132766724, 0.06417220830917358, 0.10365018993616104, 0.1431281715631485, 0.18260616064071655, 0.2220841348171234, 0.2615621089935303, 0.3010401129722595, 0.3405180871486664, 0.37999606132507324, 0.4194740355014801, 0.45895200967788696, 0.4984300136566162, 0.5379079580307007, 0.5773859620094299, 0.6168639659881592, 0.6563419103622437, 0.6958199143409729, 0.7352979183197021, 0.7747758626937866, 0.8142538666725159, 0.8537318706512451, 0.8932098150253296, 0.9326878190040588, 0.9721658229827881, 1.0116437673568726]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 11.0, 11.0, 8.0, 12.0, 12.0, 13.0, 22.0, 31.0, 29.0, 25.0, 34.0, 30.0, 30.0, 33.0, 33.0, 31.0, 52.0, 52.0, 38.0, 31.0, 38.0, 40.0, 37.0, 33.0, 30.0, 38.0, 20.0, 27.0, 28.0, 21.0, 20.0, 22.0, 14.0, 10.0, 15.0, 11.0, 11.0, 12.0, 4.0, 5.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.6883559226989746, -0.668379008769989, -0.6484020948410034, -0.628425121307373, -0.6084482073783875, -0.5884712934494019, -0.5684943795204163, -0.5485174655914307, -0.5285404920578003, -0.5085635781288147, -0.4885866343975067, -0.4686097204685211, -0.44863277673721313, -0.42865586280822754, -0.40867894887924194, -0.38870200514793396, -0.36872509121894836, -0.34874817728996277, -0.3287712335586548, -0.3087943196296692, -0.2888173758983612, -0.2688404619693756, -0.24886353313922882, -0.22888660430908203, -0.20890967547893524, -0.18893274664878845, -0.16895581781864166, -0.14897888898849487, -0.12900197505950928, -0.10902503877878189, -0.0890481173992157, -0.06907118856906891, -0.04909425973892212, -0.02911733277142048, -0.009140405803918839, 0.010836519300937653, 0.030813448131084442, 0.05079037696123123, 0.07076729834079742, 0.09074422717094421, 0.110721156001091, 0.1306980848312378, 0.15067501366138458, 0.17065194249153137, 0.19062885642051697, 0.21060580015182495, 0.23058271408081055, 0.25055962800979614, 0.2705365717411041, 0.2905134856700897, 0.3104904294013977, 0.3304673433303833, 0.3504442870616913, 0.3704212009906769, 0.39039814472198486, 0.41037505865097046, 0.43035197257995605, 0.45032888650894165, 0.47030583024024963, 0.49028274416923523, 0.5102596879005432, 0.5302366018295288, 0.5502135157585144, 0.5701904296875, 0.5901674032211304]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 11.0, 14.0, 18.0, 28.0, 42.0, 56.0, 71.0, 137.0, 160.0, 234.0, 359.0, 465.0, 666.0, 1043.0, 1496.0, 2331.0, 3532.0, 5937.0, 11323.0, 24439.0, 74964.0, 492179.0, 327085.0, 56592.0, 20477.0, 9710.0, 5555.0, 3192.0, 2041.0, 1346.0, 945.0, 607.0, 432.0, 317.0, 232.0, 153.0, 102.0, 86.0, 57.0, 27.0, 22.0, 25.0, 14.0, 10.0, 6.0, 7.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.33544921875, -0.3249320983886719, -0.31441497802734375, -0.3038978576660156, -0.2933807373046875, -0.2828636169433594, -0.27234649658203125, -0.2618293762207031, -0.251312255859375, -0.24079513549804688, -0.23027801513671875, -0.21976089477539062, -0.2092437744140625, -0.19872665405273438, -0.18820953369140625, -0.17769241333007812, -0.16717529296875, -0.15665817260742188, -0.14614105224609375, -0.13562393188476562, -0.1251068115234375, -0.11458969116210938, -0.10407257080078125, -0.09355545043945312, -0.083038330078125, -0.07252120971679688, -0.06200408935546875, -0.051486968994140625, -0.0409698486328125, -0.030452728271484375, -0.01993560791015625, -0.009418487548828125, 0.0010986328125, 0.011615753173828125, 0.02213287353515625, 0.032649993896484375, 0.0431671142578125, 0.053684234619140625, 0.06420135498046875, 0.07471847534179688, 0.085235595703125, 0.09575271606445312, 0.10626983642578125, 0.11678695678710938, 0.1273040771484375, 0.13782119750976562, 0.14833831787109375, 0.15885543823242188, 0.16937255859375, 0.17988967895507812, 0.19040679931640625, 0.20092391967773438, 0.2114410400390625, 0.22195816040039062, 0.23247528076171875, 0.24299240112304688, 0.253509521484375, 0.2640266418457031, 0.27454376220703125, 0.2850608825683594, 0.2955780029296875, 0.3060951232910156, 0.31661224365234375, 0.3271293640136719, 0.337646484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 7.0, 11.0, 7.0, 10.0, 12.0, 14.0, 15.0, 19.0, 21.0, 30.0, 26.0, 28.0, 30.0, 34.0, 33.0, 36.0, 55.0, 53.0, 46.0, 52.0, 35.0, 48.0, 38.0, 43.0, 34.0, 39.0, 25.0, 24.0, 22.0, 22.0, 19.0, 18.0, 14.0, 11.0, 16.0, 9.0, 11.0, 7.0, 2.0, 5.0, 2.0, 5.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0], "bins": [-0.4453125, -0.4327545166015625, -0.420196533203125, -0.4076385498046875, -0.39508056640625, -0.3825225830078125, -0.369964599609375, -0.3574066162109375, -0.3448486328125, -0.3322906494140625, -0.319732666015625, -0.3071746826171875, -0.29461669921875, -0.2820587158203125, -0.269500732421875, -0.2569427490234375, -0.244384765625, -0.2318267822265625, -0.219268798828125, -0.2067108154296875, -0.19415283203125, -0.1815948486328125, -0.169036865234375, -0.1564788818359375, -0.1439208984375, -0.1313629150390625, -0.118804931640625, -0.1062469482421875, -0.09368896484375, -0.0811309814453125, -0.068572998046875, -0.0560150146484375, -0.04345703125, -0.0308990478515625, -0.018341064453125, -0.0057830810546875, 0.00677490234375, 0.0193328857421875, 0.031890869140625, 0.0444488525390625, 0.0570068359375, 0.0695648193359375, 0.082122802734375, 0.0946807861328125, 0.10723876953125, 0.1197967529296875, 0.132354736328125, 0.1449127197265625, 0.157470703125, 0.1700286865234375, 0.182586669921875, 0.1951446533203125, 0.20770263671875, 0.2202606201171875, 0.232818603515625, 0.2453765869140625, 0.2579345703125, 0.2704925537109375, 0.283050537109375, 0.2956085205078125, 0.30816650390625, 0.3207244873046875, 0.333282470703125, 0.3458404541015625, 0.3583984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 3.0, 10.0, 10.0, 25.0, 41.0, 50.0, 75.0, 112.0, 158.0, 266.0, 406.0, 605.0, 988.0, 1705.0, 2829.0, 5359.0, 10956.0, 26807.0, 80269.0, 318594.0, 424137.0, 112183.0, 34563.0, 13669.0, 6372.0, 3363.0, 1893.0, 1072.0, 692.0, 459.0, 320.0, 172.0, 115.0, 87.0, 56.0, 37.0, 35.0, 25.0, 14.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18313026428222656, -0.17705154418945312, -0.1709728240966797, -0.16489410400390625, -0.1588153839111328, -0.15273666381835938, -0.14665794372558594, -0.1405792236328125, -0.13450050354003906, -0.12842178344726562, -0.12234306335449219, -0.11626434326171875, -0.11018562316894531, -0.10410690307617188, -0.09802818298339844, -0.091949462890625, -0.08587074279785156, -0.07979202270507812, -0.07371330261230469, -0.06763458251953125, -0.06155586242675781, -0.055477142333984375, -0.04939842224121094, -0.0433197021484375, -0.03724098205566406, -0.031162261962890625, -0.025083541870117188, -0.01900482177734375, -0.012926101684570312, -0.006847381591796875, -0.0007686614990234375, 0.00531005859375, 0.011388778686523438, 0.017467498779296875, 0.023546218872070312, 0.02962493896484375, 0.03570365905761719, 0.041782379150390625, 0.04786109924316406, 0.0539398193359375, 0.06001853942871094, 0.06609725952148438, 0.07217597961425781, 0.07825469970703125, 0.08433341979980469, 0.09041213989257812, 0.09649085998535156, 0.102569580078125, 0.10864830017089844, 0.11472702026367188, 0.12080574035644531, 0.12688446044921875, 0.1329631805419922, 0.13904190063476562, 0.14512062072753906, 0.1511993408203125, 0.15727806091308594, 0.16335678100585938, 0.1694355010986328, 0.17551422119140625, 0.1815929412841797, 0.18767166137695312, 0.19375038146972656, 0.1998291015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 7.0, 6.0, 6.0, 10.0, 3.0, 15.0, 13.0, 14.0, 13.0, 17.0, 17.0, 32.0, 29.0, 25.0, 31.0, 32.0, 49.0, 56.0, 32.0, 50.0, 39.0, 47.0, 46.0, 39.0, 34.0, 40.0, 42.0, 33.0, 27.0, 27.0, 34.0, 18.0, 24.0, 12.0, 17.0, 8.0, 11.0, 11.0, 10.0, 10.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.69091796875, -0.6693344116210938, -0.6477508544921875, -0.6261672973632812, -0.604583740234375, -0.5830001831054688, -0.5614166259765625, -0.5398330688476562, -0.51824951171875, -0.49666595458984375, -0.4750823974609375, -0.45349884033203125, -0.431915283203125, -0.41033172607421875, -0.3887481689453125, -0.36716461181640625, -0.3455810546875, -0.32399749755859375, -0.3024139404296875, -0.28083038330078125, -0.259246826171875, -0.23766326904296875, -0.2160797119140625, -0.19449615478515625, -0.17291259765625, -0.15132904052734375, -0.1297454833984375, -0.10816192626953125, -0.086578369140625, -0.06499481201171875, -0.0434112548828125, -0.02182769775390625, -0.000244140625, 0.02133941650390625, 0.0429229736328125, 0.06450653076171875, 0.086090087890625, 0.10767364501953125, 0.1292572021484375, 0.15084075927734375, 0.17242431640625, 0.19400787353515625, 0.2155914306640625, 0.23717498779296875, 0.258758544921875, 0.28034210205078125, 0.3019256591796875, 0.32350921630859375, 0.3450927734375, 0.36667633056640625, 0.3882598876953125, 0.40984344482421875, 0.431427001953125, 0.45301055908203125, 0.4745941162109375, 0.49617767333984375, 0.51776123046875, 0.5393447875976562, 0.5609283447265625, 0.5825119018554688, 0.604095458984375, 0.6256790161132812, 0.6472625732421875, 0.6688461303710938, 0.6904296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 12.0, 18.0, 18.0, 42.0, 54.0, 85.0, 132.0, 225.0, 357.0, 611.0, 1193.0, 2235.0, 4614.0, 10980.0, 28990.0, 92764.0, 350725.0, 392717.0, 107487.0, 32894.0, 12104.0, 5141.0, 2388.0, 1163.0, 645.0, 356.0, 234.0, 129.0, 88.0, 44.0, 24.0, 22.0, 16.0, 10.0, 10.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0421142578125, -0.04084014892578125, -0.0395660400390625, -0.03829193115234375, -0.037017822265625, -0.03574371337890625, -0.0344696044921875, -0.03319549560546875, -0.03192138671875, -0.03064727783203125, -0.0293731689453125, -0.02809906005859375, -0.026824951171875, -0.02555084228515625, -0.0242767333984375, -0.02300262451171875, -0.021728515625, -0.02045440673828125, -0.0191802978515625, -0.01790618896484375, -0.016632080078125, -0.01535797119140625, -0.0140838623046875, -0.01280975341796875, -0.01153564453125, -0.01026153564453125, -0.0089874267578125, -0.00771331787109375, -0.006439208984375, -0.00516510009765625, -0.0038909912109375, -0.00261688232421875, -0.0013427734375, -6.866455078125e-05, 0.0012054443359375, 0.00247955322265625, 0.003753662109375, 0.00502777099609375, 0.0063018798828125, 0.00757598876953125, 0.00885009765625, 0.01012420654296875, 0.0113983154296875, 0.01267242431640625, 0.013946533203125, 0.01522064208984375, 0.0164947509765625, 0.01776885986328125, 0.01904296875, 0.02031707763671875, 0.0215911865234375, 0.02286529541015625, 0.024139404296875, 0.02541351318359375, 0.0266876220703125, 0.02796173095703125, 0.02923583984375, 0.03050994873046875, 0.0317840576171875, 0.03305816650390625, 0.034332275390625, 0.03560638427734375, 0.0368804931640625, 0.03815460205078125, 0.0394287109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 11.0, 17.0, 15.0, 30.0, 45.0, 58.0, 85.0, 133.0, 141.0, 130.0, 102.0, 83.0, 42.0, 34.0, 23.0, 10.0, 17.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.075599670410156e-05, -2.964399755001068e-05, -2.85319983959198e-05, -2.741999924182892e-05, -2.6308000087738037e-05, -2.5196000933647156e-05, -2.4084001779556274e-05, -2.2972002625465393e-05, -2.1860003471374512e-05, -2.074800431728363e-05, -1.963600516319275e-05, -1.8524006009101868e-05, -1.7412006855010986e-05, -1.6300007700920105e-05, -1.5188008546829224e-05, -1.4076009392738342e-05, -1.2964010238647461e-05, -1.185201108455658e-05, -1.0740011930465698e-05, -9.628012776374817e-06, -8.516013622283936e-06, -7.404014468193054e-06, -6.292015314102173e-06, -5.1800161600112915e-06, -4.06801700592041e-06, -2.956017851829529e-06, -1.8440186977386475e-06, -7.320195436477661e-07, 3.7997961044311523e-07, 1.4919787645339966e-06, 2.603977918624878e-06, 3.7159770727157593e-06, 4.827976226806641e-06, 5.939975380897522e-06, 7.051974534988403e-06, 8.163973689079285e-06, 9.275972843170166e-06, 1.0387971997261047e-05, 1.1499971151351929e-05, 1.261197030544281e-05, 1.3723969459533691e-05, 1.4835968613624573e-05, 1.5947967767715454e-05, 1.7059966921806335e-05, 1.8171966075897217e-05, 1.9283965229988098e-05, 2.039596438407898e-05, 2.150796353816986e-05, 2.2619962692260742e-05, 2.3731961846351624e-05, 2.4843961000442505e-05, 2.5955960154533386e-05, 2.7067959308624268e-05, 2.817995846271515e-05, 2.929195761680603e-05, 3.040395677089691e-05, 3.151595592498779e-05, 3.2627955079078674e-05, 3.3739954233169556e-05, 3.485195338726044e-05, 3.596395254135132e-05, 3.70759516954422e-05, 3.818795084953308e-05, 3.929995000362396e-05, 4.0411949157714844e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 9.0, 18.0, 23.0, 49.0, 72.0, 149.0, 340.0, 801.0, 2560.0, 10482.0, 57410.0, 487737.0, 425676.0, 50122.0, 9385.0, 2370.0, 718.0, 298.0, 133.0, 72.0, 32.0, 27.0, 9.0, 20.0, 8.0, 5.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08709716796875, -0.0845327377319336, -0.08196830749511719, -0.07940387725830078, -0.07683944702148438, -0.07427501678466797, -0.07171058654785156, -0.06914615631103516, -0.06658172607421875, -0.06401729583740234, -0.06145286560058594, -0.05888843536376953, -0.056324005126953125, -0.05375957489013672, -0.05119514465332031, -0.048630714416503906, -0.0460662841796875, -0.043501853942871094, -0.04093742370605469, -0.03837299346923828, -0.035808563232421875, -0.03324413299560547, -0.030679702758789062, -0.028115272521972656, -0.02555084228515625, -0.022986412048339844, -0.020421981811523438, -0.01785755157470703, -0.015293121337890625, -0.012728691101074219, -0.010164260864257812, -0.007599830627441406, -0.005035400390625, -0.0024709701538085938, 9.34600830078125e-05, 0.0026578903198242188, 0.005222320556640625, 0.007786750793457031, 0.010351181030273438, 0.012915611267089844, 0.01548004150390625, 0.018044471740722656, 0.020608901977539062, 0.02317333221435547, 0.025737762451171875, 0.02830219268798828, 0.030866622924804688, 0.033431053161621094, 0.0359954833984375, 0.038559913635253906, 0.04112434387207031, 0.04368877410888672, 0.046253204345703125, 0.04881763458251953, 0.05138206481933594, 0.053946495056152344, 0.05651092529296875, 0.059075355529785156, 0.06163978576660156, 0.06420421600341797, 0.06676864624023438, 0.06933307647705078, 0.07189750671386719, 0.0744619369506836, 0.0770263671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 9.0, 5.0, 8.0, 12.0, 17.0, 13.0, 18.0, 14.0, 27.0, 31.0, 33.0, 53.0, 67.0, 61.0, 72.0, 64.0, 63.0, 73.0, 57.0, 47.0, 47.0, 32.0, 31.0, 34.0, 20.0, 22.0, 13.0, 12.0, 10.0, 6.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0129241943359375, -0.012572526931762695, -0.01222085952758789, -0.011869192123413086, -0.011517524719238281, -0.011165857315063477, -0.010814189910888672, -0.010462522506713867, -0.010110855102539062, -0.009759187698364258, -0.009407520294189453, -0.009055852890014648, -0.008704185485839844, -0.008352518081665039, -0.008000850677490234, -0.00764918327331543, -0.007297515869140625, -0.00694584846496582, -0.006594181060791016, -0.006242513656616211, -0.005890846252441406, -0.0055391788482666016, -0.005187511444091797, -0.004835844039916992, -0.0044841766357421875, -0.004132509231567383, -0.003780841827392578, -0.0034291744232177734, -0.0030775070190429688, -0.002725839614868164, -0.0023741722106933594, -0.0020225048065185547, -0.00167083740234375, -0.0013191699981689453, -0.0009675025939941406, -0.0006158351898193359, -0.00026416778564453125, 8.749961853027344e-05, 0.0004391670227050781, 0.0007908344268798828, 0.0011425018310546875, 0.0014941692352294922, 0.0018458366394042969, 0.0021975040435791016, 0.0025491714477539062, 0.002900838851928711, 0.0032525062561035156, 0.0036041736602783203, 0.003955841064453125, 0.00430750846862793, 0.004659175872802734, 0.005010843276977539, 0.005362510681152344, 0.0057141780853271484, 0.006065845489501953, 0.006417512893676758, 0.0067691802978515625, 0.007120847702026367, 0.007472515106201172, 0.007824182510375977, 0.008175849914550781, 0.008527517318725586, 0.00887918472290039, 0.009230852127075195, 0.00958251953125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 13.0, 7.0, 11.0, 26.0, 25.0, 42.0, 43.0, 66.0, 89.0, 115.0, 114.0, 108.0, 92.0, 47.0, 48.0, 36.0, 31.0, 19.0, 8.0, 9.0, 6.0, 7.0, 2.0, 5.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.8256650567054749, -0.8052636981010437, -0.7848622798919678, -0.7644609212875366, -0.7440595626831055, -0.7236582040786743, -0.7032567858695984, -0.6828554272651672, -0.6624540090560913, -0.6420526504516602, -0.6216512322425842, -0.6012498736381531, -0.5808485150337219, -0.560447096824646, -0.5400457382202148, -0.5196443796157837, -0.49924302101135254, -0.478841632604599, -0.45844027400016785, -0.4380388855934143, -0.41763752698898315, -0.3972361385822296, -0.3768347501754761, -0.3564333915710449, -0.3360320031642914, -0.31563061475753784, -0.2952292561531067, -0.27482786774635315, -0.2544264793395996, -0.23402512073516846, -0.21362373232841492, -0.19322235882282257, -0.17282095551490784, -0.1524195820093155, -0.13201820850372314, -0.1116168200969696, -0.09121544659137726, -0.07081407308578491, -0.05041269212961197, -0.030011311173439026, -0.00960993766784668, 0.010791439563035965, 0.03119281679391861, 0.051594194024801254, 0.0719955712556839, 0.09239694476127625, 0.11279832571744919, 0.13319970667362213, 0.15360108017921448, 0.17400245368480682, 0.19440382719039917, 0.2148052155971527, 0.23520658910274506, 0.2556079626083374, 0.27600935101509094, 0.2964107394218445, 0.31681209802627563, 0.3372134864330292, 0.3576148450374603, 0.37801623344421387, 0.398417592048645, 0.41881898045539856, 0.4392203688621521, 0.45962172746658325, 0.4800231158733368]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 9.0, 8.0, 12.0, 9.0, 12.0, 20.0, 17.0, 26.0, 36.0, 24.0, 25.0, 32.0, 28.0, 42.0, 32.0, 51.0, 49.0, 52.0, 45.0, 41.0, 29.0, 40.0, 37.0, 27.0, 48.0, 29.0, 24.0, 26.0, 33.0, 17.0, 15.0, 17.0, 12.0, 15.0, 14.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 4.0, 4.0], "bins": [-0.43707090616226196, -0.4251249432563782, -0.4131790101528168, -0.40123307704925537, -0.3892871141433716, -0.3773411512374878, -0.3653952181339264, -0.353449285030365, -0.3415033221244812, -0.3295573592185974, -0.317611426115036, -0.3056654930114746, -0.2937195301055908, -0.28177356719970703, -0.26982763409614563, -0.25788170099258423, -0.24593573808670044, -0.23398979008197784, -0.22204384207725525, -0.21009789407253265, -0.19815194606781006, -0.18620599806308746, -0.17426005005836487, -0.16231410205364227, -0.15036815404891968, -0.13842220604419708, -0.1264762580394745, -0.11453031003475189, -0.1025843620300293, -0.0906384140253067, -0.0786924660205841, -0.06674651801586151, -0.054800570011138916, -0.04285462200641632, -0.030908674001693726, -0.01896272599697113, -0.007016777992248535, 0.00492917001247406, 0.016875118017196655, 0.02882106602191925, 0.040767014026641846, 0.05271296203136444, 0.06465891003608704, 0.07660485804080963, 0.08855080604553223, 0.10049675405025482, 0.11244270205497742, 0.12438865005970001, 0.1363345980644226, 0.1482805460691452, 0.1602264940738678, 0.1721724420785904, 0.184118390083313, 0.19606433808803558, 0.20801028609275818, 0.21995623409748077, 0.23190218210220337, 0.24384813010692596, 0.25579407811164856, 0.26774001121520996, 0.27968597412109375, 0.29163193702697754, 0.30357787013053894, 0.31552380323410034, 0.32746976613998413]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 8.0, 10.0, 14.0, 18.0, 38.0, 56.0, 77.0, 97.0, 123.0, 206.0, 342.0, 471.0, 734.0, 1180.0, 1848.0, 3102.0, 5420.0, 10728.0, 32728.0, 269941.0, 625557.0, 63409.0, 15432.0, 7000.0, 3819.0, 2255.0, 1367.0, 885.0, 551.0, 397.0, 240.0, 151.0, 90.0, 70.0, 58.0, 43.0, 29.0, 24.0, 9.0, 4.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.484619140625, -0.4700202941894531, -0.45542144775390625, -0.4408226013183594, -0.4262237548828125, -0.4116249084472656, -0.39702606201171875, -0.3824272155761719, -0.367828369140625, -0.3532295227050781, -0.33863067626953125, -0.3240318298339844, -0.3094329833984375, -0.2948341369628906, -0.28023529052734375, -0.2656364440917969, -0.25103759765625, -0.23643875122070312, -0.22183990478515625, -0.20724105834960938, -0.1926422119140625, -0.17804336547851562, -0.16344451904296875, -0.14884567260742188, -0.134246826171875, -0.11964797973632812, -0.10504913330078125, -0.09045028686523438, -0.0758514404296875, -0.061252593994140625, -0.04665374755859375, -0.032054901123046875, -0.0174560546875, -0.002857208251953125, 0.01174163818359375, 0.026340484619140625, 0.0409393310546875, 0.055538177490234375, 0.07013702392578125, 0.08473587036132812, 0.099334716796875, 0.11393356323242188, 0.12853240966796875, 0.14313125610351562, 0.1577301025390625, 0.17232894897460938, 0.18692779541015625, 0.20152664184570312, 0.21612548828125, 0.23072433471679688, 0.24532318115234375, 0.2599220275878906, 0.2745208740234375, 0.2891197204589844, 0.30371856689453125, 0.3183174133300781, 0.332916259765625, 0.3475151062011719, 0.36211395263671875, 0.3767127990722656, 0.3913116455078125, 0.4059104919433594, 0.42050933837890625, 0.4351081848144531, 0.44970703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 10.0, 7.0, 9.0, 9.0, 14.0, 17.0, 27.0, 17.0, 25.0, 26.0, 33.0, 22.0, 38.0, 44.0, 47.0, 50.0, 47.0, 59.0, 52.0, 47.0, 30.0, 40.0, 47.0, 32.0, 28.0, 25.0, 33.0, 27.0, 19.0, 16.0, 19.0, 17.0, 9.0, 7.0, 11.0, 7.0, 8.0, 7.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0], "bins": [-1.00390625, -0.9770126342773438, -0.9501190185546875, -0.9232254028320312, -0.896331787109375, -0.8694381713867188, -0.8425445556640625, -0.8156509399414062, -0.78875732421875, -0.7618637084960938, -0.7349700927734375, -0.7080764770507812, -0.681182861328125, -0.6542892456054688, -0.6273956298828125, -0.6005020141601562, -0.5736083984375, -0.5467147827148438, -0.5198211669921875, -0.49292755126953125, -0.466033935546875, -0.43914031982421875, -0.4122467041015625, -0.38535308837890625, -0.35845947265625, -0.33156585693359375, -0.3046722412109375, -0.27777862548828125, -0.250885009765625, -0.22399139404296875, -0.1970977783203125, -0.17020416259765625, -0.143310546875, -0.11641693115234375, -0.0895233154296875, -0.06262969970703125, -0.035736083984375, -0.00884246826171875, 0.0180511474609375, 0.04494476318359375, 0.07183837890625, 0.09873199462890625, 0.1256256103515625, 0.15251922607421875, 0.179412841796875, 0.20630645751953125, 0.2332000732421875, 0.26009368896484375, 0.2869873046875, 0.31388092041015625, 0.3407745361328125, 0.36766815185546875, 0.394561767578125, 0.42145538330078125, 0.4483489990234375, 0.47524261474609375, 0.50213623046875, 0.5290298461914062, 0.5559234619140625, 0.5828170776367188, 0.609710693359375, 0.6366043090820312, 0.6634979248046875, 0.6903915405273438, 0.71728515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 3.0, 4.0, 7.0, 2.0, 5.0, 6.0, 12.0, 14.0, 5.0, 23.0, 17.0, 23.0, 17.0, 14.0, 28.0, 28.0, 39.0, 35.0, 45.0, 64.0, 136.0, 700.0, 38981.0, 1005200.0, 2556.0, 184.0, 63.0, 56.0, 36.0, 29.0, 33.0, 24.0, 22.0, 21.0, 17.0, 19.0, 8.0, 7.0, 13.0, 5.0, 9.0, 13.0, 8.0, 6.0, 4.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41796875, -2.337921142578125, -2.25787353515625, -2.177825927734375, -2.0977783203125, -2.017730712890625, -1.93768310546875, -1.857635498046875, -1.777587890625, -1.697540283203125, -1.61749267578125, -1.537445068359375, -1.4573974609375, -1.377349853515625, -1.29730224609375, -1.217254638671875, -1.13720703125, -1.057159423828125, -0.97711181640625, -0.897064208984375, -0.8170166015625, -0.736968994140625, -0.65692138671875, -0.576873779296875, -0.496826171875, -0.416778564453125, -0.33673095703125, -0.256683349609375, -0.1766357421875, -0.096588134765625, -0.01654052734375, 0.063507080078125, 0.1435546875, 0.223602294921875, 0.30364990234375, 0.383697509765625, 0.4637451171875, 0.543792724609375, 0.62384033203125, 0.703887939453125, 0.783935546875, 0.863983154296875, 0.94403076171875, 1.024078369140625, 1.1041259765625, 1.184173583984375, 1.26422119140625, 1.344268798828125, 1.42431640625, 1.504364013671875, 1.58441162109375, 1.664459228515625, 1.7445068359375, 1.824554443359375, 1.90460205078125, 1.984649658203125, 2.064697265625, 2.144744873046875, 2.22479248046875, 2.304840087890625, 2.3848876953125, 2.464935302734375, 2.54498291015625, 2.625030517578125, 2.705078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 4.0, 4.0, 5.0, 8.0, 13.0, 11.0, 20.0, 21.0, 16.0, 21.0, 21.0, 26.0, 33.0, 36.0, 47.0, 35.0, 59.0, 51.0, 42.0, 45.0, 35.0, 64.0, 38.0, 38.0, 31.0, 40.0, 34.0, 23.0, 19.0, 23.0, 24.0, 13.0, 13.0, 14.0, 9.0, 6.0, 12.0, 10.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.72705078125, -0.70263671875, -0.67822265625, -0.65380859375, -0.62939453125, -0.60498046875, -0.58056640625, -0.55615234375, -0.53173828125, -0.50732421875, -0.48291015625, -0.45849609375, -0.43408203125, -0.40966796875, -0.38525390625, -0.36083984375, -0.33642578125, -0.31201171875, -0.28759765625, -0.26318359375, -0.23876953125, -0.21435546875, -0.18994140625, -0.16552734375, -0.14111328125, -0.11669921875, -0.09228515625, -0.06787109375, -0.04345703125, -0.01904296875, 0.00537109375, 0.02978515625, 0.05419921875, 0.07861328125, 0.10302734375, 0.12744140625, 0.15185546875, 0.17626953125, 0.20068359375, 0.22509765625, 0.24951171875, 0.27392578125, 0.29833984375, 0.32275390625, 0.34716796875, 0.37158203125, 0.39599609375, 0.42041015625, 0.44482421875, 0.46923828125, 0.49365234375, 0.51806640625, 0.54248046875, 0.56689453125, 0.59130859375, 0.61572265625, 0.64013671875, 0.66455078125, 0.68896484375, 0.71337890625, 0.73779296875, 0.76220703125, 0.78662109375, 0.81103515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 7.0, 11.0, 13.0, 27.0, 37.0, 59.0, 109.0, 152.0, 295.0, 584.0, 1136.0, 2481.0, 6147.0, 22850.0, 635212.0, 350621.0, 18586.0, 5442.0, 2293.0, 1138.0, 595.0, 340.0, 171.0, 93.0, 61.0, 26.0, 25.0, 12.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271728515625, -0.26416778564453125, -0.2566070556640625, -0.24904632568359375, -0.241485595703125, -0.23392486572265625, -0.2263641357421875, -0.21880340576171875, -0.21124267578125, -0.20368194580078125, -0.1961212158203125, -0.18856048583984375, -0.180999755859375, -0.17343902587890625, -0.1658782958984375, -0.15831756591796875, -0.1507568359375, -0.14319610595703125, -0.1356353759765625, -0.12807464599609375, -0.120513916015625, -0.11295318603515625, -0.1053924560546875, -0.09783172607421875, -0.09027099609375, -0.08271026611328125, -0.0751495361328125, -0.06758880615234375, -0.060028076171875, -0.05246734619140625, -0.0449066162109375, -0.03734588623046875, -0.02978515625, -0.02222442626953125, -0.0146636962890625, -0.00710296630859375, 0.000457763671875, 0.00801849365234375, 0.0155792236328125, 0.02313995361328125, 0.03070068359375, 0.03826141357421875, 0.0458221435546875, 0.05338287353515625, 0.060943603515625, 0.06850433349609375, 0.0760650634765625, 0.08362579345703125, 0.0911865234375, 0.09874725341796875, 0.1063079833984375, 0.11386871337890625, 0.121429443359375, 0.12899017333984375, 0.1365509033203125, 0.14411163330078125, 0.15167236328125, 0.15923309326171875, 0.1667938232421875, 0.17435455322265625, 0.181915283203125, 0.18947601318359375, 0.1970367431640625, 0.20459747314453125, 0.212158203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 3.0, 2.0, 8.0, 8.0, 23.0, 44.0, 154.0, 408.0, 210.0, 60.0, 31.0, 16.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.463029861450195e-05, -3.277510404586792e-05, -3.091990947723389e-05, -2.9064714908599854e-05, -2.720952033996582e-05, -2.5354325771331787e-05, -2.3499131202697754e-05, -2.164393663406372e-05, -1.9788742065429688e-05, -1.7933547496795654e-05, -1.607835292816162e-05, -1.4223158359527588e-05, -1.2367963790893555e-05, -1.0512769222259521e-05, -8.657574653625488e-06, -6.802380084991455e-06, -4.947185516357422e-06, -3.0919909477233887e-06, -1.2367963790893555e-06, 6.183981895446777e-07, 2.473592758178711e-06, 4.328787326812744e-06, 6.183981895446777e-06, 8.03917646408081e-06, 9.894371032714844e-06, 1.1749565601348877e-05, 1.360476016998291e-05, 1.5459954738616943e-05, 1.7315149307250977e-05, 1.917034387588501e-05, 2.1025538444519043e-05, 2.2880733013153076e-05, 2.473592758178711e-05, 2.6591122150421143e-05, 2.8446316719055176e-05, 3.030151128768921e-05, 3.215670585632324e-05, 3.4011900424957275e-05, 3.586709499359131e-05, 3.772228956222534e-05, 3.9577484130859375e-05, 4.143267869949341e-05, 4.328787326812744e-05, 4.5143067836761475e-05, 4.699826240539551e-05, 4.885345697402954e-05, 5.0708651542663574e-05, 5.256384611129761e-05, 5.441904067993164e-05, 5.6274235248565674e-05, 5.812942981719971e-05, 5.998462438583374e-05, 6.183981895446777e-05, 6.36950135231018e-05, 6.555020809173584e-05, 6.740540266036987e-05, 6.92605972290039e-05, 7.111579179763794e-05, 7.297098636627197e-05, 7.4826180934906e-05, 7.668137550354004e-05, 7.853657007217407e-05, 8.03917646408081e-05, 8.224695920944214e-05, 8.410215377807617e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 9.0, 13.0, 22.0, 23.0, 43.0, 49.0, 95.0, 119.0, 213.0, 329.0, 489.0, 849.0, 1368.0, 2337.0, 4480.0, 9882.0, 32141.0, 584514.0, 365636.0, 27049.0, 8954.0, 4193.0, 2292.0, 1265.0, 824.0, 459.0, 336.0, 177.0, 122.0, 86.0, 56.0, 35.0, 30.0, 13.0, 15.0, 9.0, 9.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2122802734375, -0.20563507080078125, -0.1989898681640625, -0.19234466552734375, -0.185699462890625, -0.17905426025390625, -0.1724090576171875, -0.16576385498046875, -0.15911865234375, -0.15247344970703125, -0.1458282470703125, -0.13918304443359375, -0.132537841796875, -0.12589263916015625, -0.1192474365234375, -0.11260223388671875, -0.10595703125, -0.09931182861328125, -0.0926666259765625, -0.08602142333984375, -0.079376220703125, -0.07273101806640625, -0.0660858154296875, -0.05944061279296875, -0.05279541015625, -0.04615020751953125, -0.0395050048828125, -0.03285980224609375, -0.026214599609375, -0.01956939697265625, -0.0129241943359375, -0.00627899169921875, 0.0003662109375, 0.00701141357421875, 0.0136566162109375, 0.02030181884765625, 0.026947021484375, 0.03359222412109375, 0.0402374267578125, 0.04688262939453125, 0.05352783203125, 0.06017303466796875, 0.0668182373046875, 0.07346343994140625, 0.080108642578125, 0.08675384521484375, 0.0933990478515625, 0.10004425048828125, 0.106689453125, 0.11333465576171875, 0.1199798583984375, 0.12662506103515625, 0.133270263671875, 0.13991546630859375, 0.1465606689453125, 0.15320587158203125, 0.15985107421875, 0.16649627685546875, 0.1731414794921875, 0.17978668212890625, 0.186431884765625, 0.19307708740234375, 0.1997222900390625, 0.20636749267578125, 0.2130126953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 8.0, 14.0, 23.0, 31.0, 50.0, 102.0, 203.0, 248.0, 120.0, 58.0, 40.0, 17.0, 17.0, 13.0, 4.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1109619140625, -0.10771656036376953, -0.10447120666503906, -0.1012258529663086, -0.09798049926757812, -0.09473514556884766, -0.09148979187011719, -0.08824443817138672, -0.08499908447265625, -0.08175373077392578, -0.07850837707519531, -0.07526302337646484, -0.07201766967773438, -0.0687723159790039, -0.06552696228027344, -0.06228160858154297, -0.0590362548828125, -0.05579090118408203, -0.05254554748535156, -0.049300193786621094, -0.046054840087890625, -0.042809486389160156, -0.03956413269042969, -0.03631877899169922, -0.03307342529296875, -0.02982807159423828, -0.026582717895507812, -0.023337364196777344, -0.020092010498046875, -0.016846656799316406, -0.013601303100585938, -0.010355949401855469, -0.007110595703125, -0.0038652420043945312, -0.0006198883056640625, 0.0026254653930664062, 0.005870819091796875, 0.009116172790527344, 0.012361526489257812, 0.015606880187988281, 0.01885223388671875, 0.02209758758544922, 0.025342941284179688, 0.028588294982910156, 0.031833648681640625, 0.035079002380371094, 0.03832435607910156, 0.04156970977783203, 0.0448150634765625, 0.04806041717529297, 0.05130577087402344, 0.054551124572753906, 0.057796478271484375, 0.061041831970214844, 0.06428718566894531, 0.06753253936767578, 0.07077789306640625, 0.07402324676513672, 0.07726860046386719, 0.08051395416259766, 0.08375930786132812, 0.0870046615600586, 0.09025001525878906, 0.09349536895751953, 0.09674072265625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 1.0, 15.0, 13.0, 19.0, 28.0, 49.0, 54.0, 91.0, 115.0, 136.0, 113.0, 115.0, 76.0, 44.0, 31.0, 27.0, 14.0, 14.0, 7.0, 7.0, 4.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9558732509613037, -1.9066932201385498, -1.857513189315796, -1.808333158493042, -1.759153127670288, -1.7099730968475342, -1.6607930660247803, -1.6116130352020264, -1.5624330043792725, -1.5132529735565186, -1.4640729427337646, -1.4148929119110107, -1.3657128810882568, -1.316532850265503, -1.267352819442749, -1.2181727886199951, -1.1689927577972412, -1.1198127269744873, -1.0706326961517334, -1.0214526653289795, -0.9722726345062256, -0.9230926036834717, -0.8739125728607178, -0.8247325420379639, -0.77555251121521, -0.726372480392456, -0.6771924495697021, -0.6280124187469482, -0.5788323879241943, -0.5296523571014404, -0.4804723262786865, -0.4312922954559326, -0.38211214542388916, -0.33293211460113525, -0.28375208377838135, -0.23457205295562744, -0.18539202213287354, -0.13621199131011963, -0.08703196048736572, -0.037851929664611816, 0.01132810115814209, 0.060508131980895996, 0.1096881628036499, 0.1588681936264038, 0.20804822444915771, 0.2572282552719116, 0.3064082860946655, 0.35558831691741943, 0.40476834774017334, 0.45394837856292725, 0.5031284093856812, 0.5523084402084351, 0.601488471031189, 0.6506685018539429, 0.6998485326766968, 0.7490285634994507, 0.7982085943222046, 0.8473886251449585, 0.8965686559677124, 0.9457486867904663, 0.9949287176132202, 1.0441087484359741, 1.093288779258728, 1.142468810081482, 1.1916488409042358]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 10.0, 13.0, 19.0, 18.0, 23.0, 30.0, 42.0, 29.0, 37.0, 46.0, 40.0, 40.0, 45.0, 51.0, 40.0, 45.0, 43.0, 42.0, 34.0, 40.0, 47.0, 35.0, 32.0, 28.0, 18.0, 22.0, 23.0, 20.0, 16.0, 5.0, 6.0, 9.0, 5.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3416337966918945, -1.2968405485153198, -1.2520473003387451, -1.2072540521621704, -1.1624608039855957, -1.1176674365997314, -1.0728741884231567, -1.028080940246582, -0.9832876920700073, -0.9384944438934326, -0.8937011957168579, -0.8489078879356384, -0.8041146397590637, -0.759321391582489, -0.7145280838012695, -0.6697348356246948, -0.6249415874481201, -0.5801483392715454, -0.5353550910949707, -0.4905617833137512, -0.4457685351371765, -0.4009752869606018, -0.3561820089817047, -0.3113887310028076, -0.2665954828262329, -0.221802219748497, -0.1770089566707611, -0.1322156935930252, -0.0874224305152893, -0.042629167437553406, 0.002164095640182495, 0.04695737361907959, 0.09175074100494385, 0.13654400408267975, 0.18133726716041565, 0.22613053023815155, 0.27092379331588745, 0.31571704149246216, 0.36051031947135925, 0.40530359745025635, 0.45009684562683105, 0.49489009380340576, 0.5396833419799805, 0.5844766497612, 0.6292698979377747, 0.6740631461143494, 0.7188564538955688, 0.7636497020721436, 0.8084429502487183, 0.853236198425293, 0.8980294466018677, 0.9428227543830872, 0.9876160025596619, 1.0324093103408813, 1.077202558517456, 1.1219958066940308, 1.1667890548706055, 1.2115823030471802, 1.2563755512237549, 1.3011687994003296, 1.3459620475769043, 1.3907554149627686, 1.4355486631393433, 1.480341911315918, 1.5251351594924927]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 8.0, 14.0, 18.0, 24.0, 41.0, 55.0, 87.0, 180.0, 338.0, 839.0, 2499.0, 10447.0, 298524.0, 3814377.0, 57758.0, 6136.0, 1687.0, 615.0, 247.0, 144.0, 75.0, 42.0, 37.0, 30.0, 15.0, 14.0, 9.0, 6.0, 3.0, 2.0, 0.0, 0.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.326171875, -2.24407958984375, -2.1619873046875, -2.07989501953125, -1.997802734375, -1.91571044921875, -1.8336181640625, -1.75152587890625, -1.66943359375, -1.58734130859375, -1.5052490234375, -1.42315673828125, -1.341064453125, -1.25897216796875, -1.1768798828125, -1.09478759765625, -1.0126953125, -0.93060302734375, -0.8485107421875, -0.76641845703125, -0.684326171875, -0.60223388671875, -0.5201416015625, -0.43804931640625, -0.35595703125, -0.27386474609375, -0.1917724609375, -0.10968017578125, -0.027587890625, 0.05450439453125, 0.1365966796875, 0.21868896484375, 0.30078125, 0.38287353515625, 0.4649658203125, 0.54705810546875, 0.629150390625, 0.71124267578125, 0.7933349609375, 0.87542724609375, 0.95751953125, 1.03961181640625, 1.1217041015625, 1.20379638671875, 1.285888671875, 1.36798095703125, 1.4500732421875, 1.53216552734375, 1.6142578125, 1.69635009765625, 1.7784423828125, 1.86053466796875, 1.942626953125, 2.02471923828125, 2.1068115234375, 2.18890380859375, 2.27099609375, 2.35308837890625, 2.4351806640625, 2.51727294921875, 2.599365234375, 2.68145751953125, 2.7635498046875, 2.84564208984375, 2.927734375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 8.0, 8.0, 6.0, 15.0, 14.0, 19.0, 22.0, 28.0, 39.0, 35.0, 38.0, 55.0, 50.0, 58.0, 59.0, 45.0, 62.0, 51.0, 56.0, 57.0, 39.0, 38.0, 38.0, 25.0, 27.0, 25.0, 23.0, 15.0, 12.0, 5.0, 8.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.705078125, -0.6843109130859375, -0.663543701171875, -0.6427764892578125, -0.62200927734375, -0.6012420654296875, -0.580474853515625, -0.5597076416015625, -0.5389404296875, -0.5181732177734375, -0.497406005859375, -0.4766387939453125, -0.45587158203125, -0.4351043701171875, -0.414337158203125, -0.3935699462890625, -0.372802734375, -0.3520355224609375, -0.331268310546875, -0.3105010986328125, -0.28973388671875, -0.2689666748046875, -0.248199462890625, -0.2274322509765625, -0.2066650390625, -0.1858978271484375, -0.165130615234375, -0.1443634033203125, -0.12359619140625, -0.1028289794921875, -0.082061767578125, -0.0612945556640625, -0.04052734375, -0.0197601318359375, 0.001007080078125, 0.0217742919921875, 0.04254150390625, 0.0633087158203125, 0.084075927734375, 0.1048431396484375, 0.1256103515625, 0.1463775634765625, 0.167144775390625, 0.1879119873046875, 0.20867919921875, 0.2294464111328125, 0.250213623046875, 0.2709808349609375, 0.291748046875, 0.3125152587890625, 0.333282470703125, 0.3540496826171875, 0.37481689453125, 0.3955841064453125, 0.416351318359375, 0.4371185302734375, 0.4578857421875, 0.4786529541015625, 0.499420166015625, 0.5201873779296875, 0.54095458984375, 0.5617218017578125, 0.582489013671875, 0.6032562255859375, 0.6240234375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 5.0, 11.0, 12.0, 15.0, 9.0, 21.0, 26.0, 50.0, 72.0, 84.0, 208.0, 467.0, 1029.0, 2839.0, 9934.0, 51272.0, 2088163.0, 1974104.0, 51169.0, 9881.0, 2929.0, 1033.0, 423.0, 190.0, 110.0, 68.0, 36.0, 31.0, 18.0, 16.0, 21.0, 4.0, 5.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1220703125, -1.08050537109375, -1.0389404296875, -0.99737548828125, -0.955810546875, -0.91424560546875, -0.8726806640625, -0.83111572265625, -0.78955078125, -0.74798583984375, -0.7064208984375, -0.66485595703125, -0.623291015625, -0.58172607421875, -0.5401611328125, -0.49859619140625, -0.45703125, -0.41546630859375, -0.3739013671875, -0.33233642578125, -0.290771484375, -0.24920654296875, -0.2076416015625, -0.16607666015625, -0.12451171875, -0.08294677734375, -0.0413818359375, 0.00018310546875, 0.041748046875, 0.08331298828125, 0.1248779296875, 0.16644287109375, 0.2080078125, 0.24957275390625, 0.2911376953125, 0.33270263671875, 0.374267578125, 0.41583251953125, 0.4573974609375, 0.49896240234375, 0.54052734375, 0.58209228515625, 0.6236572265625, 0.66522216796875, 0.706787109375, 0.74835205078125, 0.7899169921875, 0.83148193359375, 0.873046875, 0.91461181640625, 0.9561767578125, 0.99774169921875, 1.039306640625, 1.08087158203125, 1.1224365234375, 1.16400146484375, 1.20556640625, 1.24713134765625, 1.2886962890625, 1.33026123046875, 1.371826171875, 1.41339111328125, 1.4549560546875, 1.49652099609375, 1.5380859375]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 3.0, 8.0, 9.0, 19.0, 17.0, 16.0, 23.0, 29.0, 39.0, 65.0, 99.0, 114.0, 250.0, 461.0, 723.0, 820.0, 536.0, 315.0, 182.0, 94.0, 56.0, 45.0, 31.0, 23.0, 26.0, 19.0, 14.0, 5.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28076171875, -0.272308349609375, -0.26385498046875, -0.255401611328125, -0.2469482421875, -0.238494873046875, -0.23004150390625, -0.221588134765625, -0.213134765625, -0.204681396484375, -0.19622802734375, -0.187774658203125, -0.1793212890625, -0.170867919921875, -0.16241455078125, -0.153961181640625, -0.1455078125, -0.137054443359375, -0.12860107421875, -0.120147705078125, -0.1116943359375, -0.103240966796875, -0.09478759765625, -0.086334228515625, -0.077880859375, -0.069427490234375, -0.06097412109375, -0.052520751953125, -0.0440673828125, -0.035614013671875, -0.02716064453125, -0.018707275390625, -0.01025390625, -0.001800537109375, 0.00665283203125, 0.015106201171875, 0.0235595703125, 0.032012939453125, 0.04046630859375, 0.048919677734375, 0.057373046875, 0.065826416015625, 0.07427978515625, 0.082733154296875, 0.0911865234375, 0.099639892578125, 0.10809326171875, 0.116546630859375, 0.125, 0.133453369140625, 0.14190673828125, 0.150360107421875, 0.1588134765625, 0.167266845703125, 0.17572021484375, 0.184173583984375, 0.192626953125, 0.201080322265625, 0.20953369140625, 0.217987060546875, 0.2264404296875, 0.234893798828125, 0.24334716796875, 0.251800537109375, 0.26025390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 9.0, 12.0, 19.0, 17.0, 28.0, 33.0, 56.0, 70.0, 133.0, 164.0, 129.0, 89.0, 58.0, 56.0, 39.0, 30.0, 19.0, 7.0, 6.0, 9.0, 6.0, 5.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6198253631591797, -1.5801854133605957, -1.5405454635620117, -1.5009055137634277, -1.4612655639648438, -1.4216256141662598, -1.3819856643676758, -1.3423457145690918, -1.3027057647705078, -1.2630658149719238, -1.2234258651733398, -1.1837859153747559, -1.1441459655761719, -1.104506015777588, -1.064866065979004, -1.02522611618042, -0.9855862259864807, -0.9459462761878967, -0.9063063263893127, -0.8666663765907288, -0.8270264267921448, -0.7873864769935608, -0.7477465867996216, -0.7081066370010376, -0.6684666872024536, -0.6288267374038696, -0.5891867876052856, -0.5495468378067017, -0.5099068880081177, -0.4702669382095337, -0.4306270182132721, -0.3909870684146881, -0.35134708881378174, -0.31170713901519775, -0.27206718921661377, -0.23242725431919098, -0.192787304520607, -0.153147354722023, -0.11350741982460022, -0.07386747002601624, -0.03422752022743225, 0.005412425845861435, 0.04505237191915512, 0.08469231426715851, 0.12433226406574249, 0.16397221386432648, 0.20361214876174927, 0.24325209856033325, 0.28289204835891724, 0.3225319981575012, 0.3621719479560852, 0.4018118977546692, 0.4414518475532532, 0.48109179735183716, 0.5207316875457764, 0.5603716373443604, 0.6000115871429443, 0.6396515369415283, 0.6792914867401123, 0.7189314365386963, 0.7585713863372803, 0.7982113361358643, 0.8378512859344482, 0.8774912357330322, 0.9171311855316162]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 4.0, 4.0, 8.0, 12.0, 12.0, 13.0, 20.0, 19.0, 16.0, 34.0, 33.0, 43.0, 40.0, 47.0, 38.0, 45.0, 48.0, 44.0, 46.0, 43.0, 48.0, 44.0, 44.0, 49.0, 36.0, 24.0, 30.0, 31.0, 21.0, 22.0, 12.0, 17.0, 13.0, 5.0, 10.0, 9.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6572402715682983, -0.6374079585075378, -0.6175755858421326, -0.5977432727813721, -0.5779109001159668, -0.5580785870552063, -0.5382462739944458, -0.5184139013290405, -0.49858158826828003, -0.47874924540519714, -0.45891690254211426, -0.43908458948135376, -0.4192522466182709, -0.399419903755188, -0.3795875608921051, -0.3597552180290222, -0.33992287516593933, -0.32009053230285645, -0.30025818943977356, -0.2804258465766907, -0.2605935335159302, -0.2407611906528473, -0.2209288477897644, -0.2010965198278427, -0.18126417696475983, -0.16143183410167694, -0.14159950613975525, -0.12176716327667236, -0.10193482786417007, -0.08210249245166779, -0.0622701495885849, -0.04243782162666321, -0.022605478763580322, -0.002773141488432884, 0.017059195786714554, 0.03689153492450714, 0.05672387033700943, 0.07655620574951172, 0.0963885486125946, 0.1162208765745163, 0.13605321943759918, 0.15588556230068207, 0.17571789026260376, 0.19555023312568665, 0.21538257598876953, 0.23521490395069122, 0.2550472617149353, 0.2748795747756958, 0.2947119176387787, 0.3145442605018616, 0.33437660336494446, 0.35420894622802734, 0.37404125928878784, 0.3938736021518707, 0.4137059450149536, 0.4335382580757141, 0.4533706307411194, 0.47320297360420227, 0.49303531646728516, 0.5128676295280457, 0.5327000021934509, 0.5525323152542114, 0.5723646879196167, 0.5921970009803772, 0.6120293140411377]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 0.0, 4.0, 8.0, 9.0, 12.0, 22.0, 30.0, 41.0, 53.0, 114.0, 179.0, 301.0, 676.0, 1314.0, 2955.0, 7102.0, 19750.0, 65950.0, 294994.0, 489817.0, 115624.0, 30930.0, 10728.0, 4176.0, 1820.0, 888.0, 425.0, 256.0, 134.0, 75.0, 41.0, 32.0, 28.0, 15.0, 14.0, 13.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.1900634765625, -0.18521499633789062, -0.18036651611328125, -0.17551803588867188, -0.1706695556640625, -0.16582107543945312, -0.16097259521484375, -0.15612411499023438, -0.151275634765625, -0.14642715454101562, -0.14157867431640625, -0.13673019409179688, -0.1318817138671875, -0.12703323364257812, -0.12218475341796875, -0.11733627319335938, -0.11248779296875, -0.10763931274414062, -0.10279083251953125, -0.09794235229492188, -0.0930938720703125, -0.08824539184570312, -0.08339691162109375, -0.07854843139648438, -0.073699951171875, -0.06885147094726562, -0.06400299072265625, -0.059154510498046875, -0.0543060302734375, -0.049457550048828125, -0.04460906982421875, -0.039760589599609375, -0.034912109375, -0.030063629150390625, -0.02521514892578125, -0.020366668701171875, -0.0155181884765625, -0.010669708251953125, -0.00582122802734375, -0.000972747802734375, 0.003875732421875, 0.008724212646484375, 0.01357269287109375, 0.018421173095703125, 0.0232696533203125, 0.028118133544921875, 0.03296661376953125, 0.037815093994140625, 0.04266357421875, 0.047512054443359375, 0.05236053466796875, 0.057209014892578125, 0.0620574951171875, 0.06690597534179688, 0.07175445556640625, 0.07660293579101562, 0.081451416015625, 0.08629989624023438, 0.09114837646484375, 0.09599685668945312, 0.1008453369140625, 0.10569381713867188, 0.11054229736328125, 0.11539077758789062, 0.1202392578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 7.0, 9.0, 8.0, 15.0, 18.0, 18.0, 18.0, 34.0, 42.0, 42.0, 50.0, 52.0, 52.0, 58.0, 57.0, 54.0, 62.0, 50.0, 45.0, 55.0, 43.0, 29.0, 31.0, 26.0, 24.0, 17.0, 14.0, 18.0, 7.0, 4.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.489013671875, -0.4742240905761719, -0.45943450927734375, -0.4446449279785156, -0.4298553466796875, -0.4150657653808594, -0.40027618408203125, -0.3854866027832031, -0.370697021484375, -0.3559074401855469, -0.34111785888671875, -0.3263282775878906, -0.3115386962890625, -0.2967491149902344, -0.28195953369140625, -0.2671699523925781, -0.25238037109375, -0.23759078979492188, -0.22280120849609375, -0.20801162719726562, -0.1932220458984375, -0.17843246459960938, -0.16364288330078125, -0.14885330200195312, -0.134063720703125, -0.11927413940429688, -0.10448455810546875, -0.08969497680664062, -0.0749053955078125, -0.060115814208984375, -0.04532623291015625, -0.030536651611328125, -0.0157470703125, -0.000957489013671875, 0.01383209228515625, 0.028621673583984375, 0.0434112548828125, 0.058200836181640625, 0.07299041748046875, 0.08777999877929688, 0.102569580078125, 0.11735916137695312, 0.13214874267578125, 0.14693832397460938, 0.1617279052734375, 0.17651748657226562, 0.19130706787109375, 0.20609664916992188, 0.22088623046875, 0.23567581176757812, 0.25046539306640625, 0.2652549743652344, 0.2800445556640625, 0.2948341369628906, 0.30962371826171875, 0.3244132995605469, 0.339202880859375, 0.3539924621582031, 0.36878204345703125, 0.3835716247558594, 0.3983612060546875, 0.4131507873535156, 0.42794036865234375, 0.4427299499511719, 0.45751953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 17.0, 35.0, 29.0, 66.0, 104.0, 200.0, 323.0, 560.0, 1117.0, 2437.0, 5608.0, 15156.0, 46892.0, 171207.0, 476806.0, 234098.0, 61370.0, 19434.0, 7058.0, 2940.0, 1473.0, 696.0, 368.0, 212.0, 103.0, 75.0, 47.0, 36.0, 11.0, 9.0, 10.0, 4.0, 7.0, 2.0, 5.0, 0.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.12017822265625, -0.11637687683105469, -0.11257553100585938, -0.10877418518066406, -0.10497283935546875, -0.10117149353027344, -0.09737014770507812, -0.09356880187988281, -0.0897674560546875, -0.08596611022949219, -0.08216476440429688, -0.07836341857910156, -0.07456207275390625, -0.07076072692871094, -0.06695938110351562, -0.06315803527832031, -0.059356689453125, -0.05555534362792969, -0.051753997802734375, -0.04795265197753906, -0.04415130615234375, -0.04034996032714844, -0.036548614501953125, -0.03274726867675781, -0.0289459228515625, -0.025144577026367188, -0.021343231201171875, -0.017541885375976562, -0.01374053955078125, -0.009939193725585938, -0.006137847900390625, -0.0023365020751953125, 0.00146484375, 0.0052661895751953125, 0.009067535400390625, 0.012868881225585938, 0.01667022705078125, 0.020471572875976562, 0.024272918701171875, 0.028074264526367188, 0.0318756103515625, 0.03567695617675781, 0.039478302001953125, 0.04327964782714844, 0.04708099365234375, 0.05088233947753906, 0.054683685302734375, 0.05848503112792969, 0.062286376953125, 0.06608772277832031, 0.06988906860351562, 0.07369041442871094, 0.07749176025390625, 0.08129310607910156, 0.08509445190429688, 0.08889579772949219, 0.0926971435546875, 0.09649848937988281, 0.10029983520507812, 0.10410118103027344, 0.10790252685546875, 0.11170387268066406, 0.11550521850585938, 0.11930656433105469, 0.12310791015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 6.0, 11.0, 14.0, 13.0, 17.0, 22.0, 27.0, 25.0, 37.0, 35.0, 34.0, 48.0, 50.0, 54.0, 35.0, 43.0, 52.0, 55.0, 48.0, 30.0, 44.0, 40.0, 42.0, 35.0, 37.0, 23.0, 19.0, 21.0, 14.0, 11.0, 8.0, 10.0, 5.0, 9.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7099609375, -0.6864700317382812, -0.6629791259765625, -0.6394882202148438, -0.615997314453125, -0.5925064086914062, -0.5690155029296875, -0.5455245971679688, -0.52203369140625, -0.49854278564453125, -0.4750518798828125, -0.45156097412109375, -0.428070068359375, -0.40457916259765625, -0.3810882568359375, -0.35759735107421875, -0.3341064453125, -0.31061553955078125, -0.2871246337890625, -0.26363372802734375, -0.240142822265625, -0.21665191650390625, -0.1931610107421875, -0.16967010498046875, -0.14617919921875, -0.12268829345703125, -0.0991973876953125, -0.07570648193359375, -0.052215576171875, -0.02872467041015625, -0.0052337646484375, 0.01825714111328125, 0.041748046875, 0.06523895263671875, 0.0887298583984375, 0.11222076416015625, 0.135711669921875, 0.15920257568359375, 0.1826934814453125, 0.20618438720703125, 0.22967529296875, 0.25316619873046875, 0.2766571044921875, 0.30014801025390625, 0.323638916015625, 0.34712982177734375, 0.3706207275390625, 0.39411163330078125, 0.4176025390625, 0.44109344482421875, 0.4645843505859375, 0.48807525634765625, 0.511566162109375, 0.5350570678710938, 0.5585479736328125, 0.5820388793945312, 0.60552978515625, 0.6290206909179688, 0.6525115966796875, 0.6760025024414062, 0.699493408203125, 0.7229843139648438, 0.7464752197265625, 0.7699661254882812, 0.79345703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 9.0, 13.0, 10.0, 33.0, 37.0, 61.0, 143.0, 213.0, 378.0, 922.0, 2184.0, 6491.0, 23357.0, 118118.0, 594906.0, 244463.0, 41226.0, 10345.0, 3246.0, 1199.0, 579.0, 271.0, 145.0, 71.0, 46.0, 26.0, 18.0, 8.0, 5.0, 9.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051849365234375, -0.05021333694458008, -0.048577308654785156, -0.046941280364990234, -0.04530525207519531, -0.04366922378540039, -0.04203319549560547, -0.04039716720581055, -0.038761138916015625, -0.0371251106262207, -0.03548908233642578, -0.03385305404663086, -0.03221702575683594, -0.030580997467041016, -0.028944969177246094, -0.027308940887451172, -0.02567291259765625, -0.024036884307861328, -0.022400856018066406, -0.020764827728271484, -0.019128799438476562, -0.01749277114868164, -0.01585674285888672, -0.014220714569091797, -0.012584686279296875, -0.010948657989501953, -0.009312629699707031, -0.007676601409912109, -0.0060405731201171875, -0.004404544830322266, -0.0027685165405273438, -0.0011324882507324219, 0.0005035400390625, 0.002139568328857422, 0.0037755966186523438, 0.005411624908447266, 0.0070476531982421875, 0.00868368148803711, 0.010319709777832031, 0.011955738067626953, 0.013591766357421875, 0.015227794647216797, 0.01686382293701172, 0.01849985122680664, 0.020135879516601562, 0.021771907806396484, 0.023407936096191406, 0.025043964385986328, 0.02667999267578125, 0.028316020965576172, 0.029952049255371094, 0.031588077545166016, 0.03322410583496094, 0.03486013412475586, 0.03649616241455078, 0.0381321907043457, 0.039768218994140625, 0.04140424728393555, 0.04304027557373047, 0.04467630386352539, 0.04631233215332031, 0.047948360443115234, 0.049584388732910156, 0.05122041702270508, 0.0528564453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 4.0, 3.0, 7.0, 12.0, 13.0, 9.0, 17.0, 17.0, 39.0, 42.0, 68.0, 117.0, 126.0, 101.0, 127.0, 89.0, 60.0, 47.0, 31.0, 26.0, 16.0, 6.0, 10.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.552436828613281e-05, -3.464706242084503e-05, -3.376975655555725e-05, -3.289245069026947e-05, -3.201514482498169e-05, -3.113783895969391e-05, -3.0260533094406128e-05, -2.9383227229118347e-05, -2.8505921363830566e-05, -2.7628615498542786e-05, -2.6751309633255005e-05, -2.5874003767967224e-05, -2.4996697902679443e-05, -2.4119392037391663e-05, -2.3242086172103882e-05, -2.23647803068161e-05, -2.148747444152832e-05, -2.061016857624054e-05, -1.973286271095276e-05, -1.8855556845664978e-05, -1.7978250980377197e-05, -1.7100945115089417e-05, -1.6223639249801636e-05, -1.5346333384513855e-05, -1.4469027519226074e-05, -1.3591721653938293e-05, -1.2714415788650513e-05, -1.1837109923362732e-05, -1.0959804058074951e-05, -1.008249819278717e-05, -9.20519232749939e-06, -8.327886462211609e-06, -7.450580596923828e-06, -6.573274731636047e-06, -5.695968866348267e-06, -4.818663001060486e-06, -3.941357135772705e-06, -3.0640512704849243e-06, -2.1867454051971436e-06, -1.3094395399093628e-06, -4.3213367462158203e-07, 4.4517219066619873e-07, 1.3224780559539795e-06, 2.1997839212417603e-06, 3.077089786529541e-06, 3.954395651817322e-06, 4.8317015171051025e-06, 5.709007382392883e-06, 6.586313247680664e-06, 7.463619112968445e-06, 8.340924978256226e-06, 9.218230843544006e-06, 1.0095536708831787e-05, 1.0972842574119568e-05, 1.1850148439407349e-05, 1.272745430469513e-05, 1.360476016998291e-05, 1.4482066035270691e-05, 1.535937190055847e-05, 1.6236677765846252e-05, 1.7113983631134033e-05, 1.7991289496421814e-05, 1.8868595361709595e-05, 1.9745901226997375e-05, 2.0623207092285156e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 9.0, 9.0, 8.0, 21.0, 42.0, 46.0, 69.0, 124.0, 207.0, 363.0, 564.0, 935.0, 1759.0, 3390.0, 6780.0, 15876.0, 41380.0, 127518.0, 392454.0, 307847.0, 93239.0, 31555.0, 12299.0, 5637.0, 2779.0, 1524.0, 848.0, 485.0, 279.0, 201.0, 118.0, 62.0, 45.0, 34.0, 14.0, 16.0, 7.0, 4.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.037506103515625, -0.03643035888671875, -0.0353546142578125, -0.03427886962890625, -0.033203125, -0.03212738037109375, -0.0310516357421875, -0.02997589111328125, -0.028900146484375, -0.02782440185546875, -0.0267486572265625, -0.02567291259765625, -0.02459716796875, -0.02352142333984375, -0.0224456787109375, -0.02136993408203125, -0.020294189453125, -0.01921844482421875, -0.0181427001953125, -0.01706695556640625, -0.0159912109375, -0.01491546630859375, -0.0138397216796875, -0.01276397705078125, -0.011688232421875, -0.01061248779296875, -0.0095367431640625, -0.00846099853515625, -0.00738525390625, -0.00630950927734375, -0.0052337646484375, -0.00415802001953125, -0.003082275390625, -0.00200653076171875, -0.0009307861328125, 0.00014495849609375, 0.001220703125, 0.00229644775390625, 0.0033721923828125, 0.00444793701171875, 0.005523681640625, 0.00659942626953125, 0.0076751708984375, 0.00875091552734375, 0.00982666015625, 0.01090240478515625, 0.0119781494140625, 0.01305389404296875, 0.014129638671875, 0.01520538330078125, 0.0162811279296875, 0.01735687255859375, 0.0184326171875, 0.01950836181640625, 0.0205841064453125, 0.02165985107421875, 0.022735595703125, 0.02381134033203125, 0.0248870849609375, 0.02596282958984375, 0.02703857421875, 0.02811431884765625, 0.0291900634765625, 0.03026580810546875, 0.031341552734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 12.0, 21.0, 31.0, 25.0, 34.0, 70.0, 72.0, 65.0, 97.0, 75.0, 82.0, 78.0, 58.0, 63.0, 47.0, 37.0, 26.0, 16.0, 19.0, 11.0, 12.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01166534423828125, -0.011307954788208008, -0.010950565338134766, -0.010593175888061523, -0.010235786437988281, -0.009878396987915039, -0.009521007537841797, -0.009163618087768555, -0.008806228637695312, -0.00844883918762207, -0.008091449737548828, -0.007734060287475586, -0.007376670837402344, -0.0070192813873291016, -0.006661891937255859, -0.006304502487182617, -0.005947113037109375, -0.005589723587036133, -0.005232334136962891, -0.0048749446868896484, -0.004517555236816406, -0.004160165786743164, -0.003802776336669922, -0.0034453868865966797, -0.0030879974365234375, -0.0027306079864501953, -0.002373218536376953, -0.002015829086303711, -0.0016584396362304688, -0.0013010501861572266, -0.0009436607360839844, -0.0005862712860107422, -0.0002288818359375, 0.0001285076141357422, 0.0004858970642089844, 0.0008432865142822266, 0.0012006759643554688, 0.001558065414428711, 0.0019154548645019531, 0.0022728443145751953, 0.0026302337646484375, 0.0029876232147216797, 0.003345012664794922, 0.003702402114868164, 0.004059791564941406, 0.0044171810150146484, 0.004774570465087891, 0.005131959915161133, 0.005489349365234375, 0.005846738815307617, 0.006204128265380859, 0.0065615177154541016, 0.006918907165527344, 0.007276296615600586, 0.007633686065673828, 0.00799107551574707, 0.008348464965820312, 0.008705854415893555, 0.009063243865966797, 0.009420633316040039, 0.009778022766113281, 0.010135412216186523, 0.010492801666259766, 0.010850191116333008, 0.01120758056640625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 19.0, 22.0, 26.0, 53.0, 74.0, 164.0, 195.0, 167.0, 83.0, 76.0, 46.0, 21.0, 9.0, 14.0, 10.0, 3.0, 2.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4605964422225952, -1.4278874397277832, -1.3951785564422607, -1.3624695539474487, -1.3297605514526367, -1.2970515489578247, -1.2643426656723022, -1.2316336631774902, -1.1989246606826782, -1.1662156581878662, -1.1335067749023438, -1.1007977724075317, -1.0680887699127197, -1.0353797674179077, -1.0026708841323853, -0.9699618816375732, -0.937252938747406, -0.9045439958572388, -0.8718349933624268, -0.8391260504722595, -0.8064170479774475, -0.7737081050872803, -0.7409991025924683, -0.708290159702301, -0.6755812168121338, -0.6428722739219666, -0.6101632714271545, -0.5774543285369873, -0.5447453260421753, -0.5120363831520081, -0.47932741045951843, -0.4466184377670288, -0.4139094948768616, -0.38120052218437195, -0.3484915494918823, -0.3157826066017151, -0.2830736041069031, -0.25036466121673584, -0.21765568852424622, -0.1849467158317566, -0.15223774313926697, -0.11952877044677734, -0.08681980520486832, -0.05411083996295929, -0.021401867270469666, 0.011307105422019958, 0.04401606321334839, 0.07672503590583801, 0.10943400859832764, 0.14214298129081726, 0.17485195398330688, 0.20756091177463531, 0.24026988446712494, 0.27297884225845337, 0.305687814950943, 0.3383967876434326, 0.37110576033592224, 0.40381473302841187, 0.4365237057209015, 0.4692326784133911, 0.5019416213035583, 0.5346506237983704, 0.5673595666885376, 0.6000685691833496, 0.6327775120735168]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 2.0, 10.0, 4.0, 6.0, 11.0, 21.0, 17.0, 20.0, 26.0, 25.0, 39.0, 45.0, 50.0, 52.0, 46.0, 52.0, 53.0, 43.0, 55.0, 57.0, 46.0, 53.0, 51.0, 28.0, 30.0, 31.0, 28.0, 20.0, 13.0, 20.0, 11.0, 3.0, 8.0, 8.0, 5.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44822201132774353, -0.4344092905521393, -0.42059656977653503, -0.4067838490009308, -0.39297112822532654, -0.3791584074497223, -0.36534565687179565, -0.3515329360961914, -0.33772021532058716, -0.3239074945449829, -0.31009477376937866, -0.2962820529937744, -0.28246933221817017, -0.2686566114425659, -0.25484389066696167, -0.24103115499019623, -0.22721844911575317, -0.21340572834014893, -0.19959300756454468, -0.18578028678894043, -0.17196756601333618, -0.15815484523773193, -0.1443421095609665, -0.13052938878536224, -0.116716668009758, -0.10290394723415375, -0.0890912264585495, -0.07527849823236465, -0.061465777456760406, -0.04765305668115616, -0.033840328454971313, -0.020027607679367065, -0.006214916706085205, 0.007597805932164192, 0.02141052857041359, 0.035223253071308136, 0.049035973846912384, 0.06284869462251663, 0.07666142284870148, 0.09047414362430573, 0.10428686439990997, 0.11809958517551422, 0.13191230595111847, 0.1457250416278839, 0.15953776240348816, 0.1733504831790924, 0.18716320395469666, 0.2009759247303009, 0.21478864550590515, 0.2286013662815094, 0.24241408705711365, 0.2562268078327179, 0.27003952860832214, 0.2838522493839264, 0.297664999961853, 0.3114777207374573, 0.3252904415130615, 0.33910316228866577, 0.35291588306427, 0.36672860383987427, 0.3805413246154785, 0.39435404539108276, 0.408166766166687, 0.42197948694229126, 0.4357922077178955]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 10.0, 10.0, 13.0, 16.0, 23.0, 36.0, 39.0, 60.0, 64.0, 106.0, 118.0, 182.0, 254.0, 359.0, 513.0, 822.0, 1274.0, 2238.0, 4476.0, 10097.0, 35030.0, 373309.0, 551628.0, 44532.0, 11797.0, 4875.0, 2498.0, 1413.0, 840.0, 554.0, 355.0, 282.0, 198.0, 126.0, 97.0, 74.0, 56.0, 47.0, 32.0, 28.0, 20.0, 20.0, 11.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.53271484375, -0.5161056518554688, -0.4994964599609375, -0.48288726806640625, -0.466278076171875, -0.44966888427734375, -0.4330596923828125, -0.41645050048828125, -0.39984130859375, -0.38323211669921875, -0.3666229248046875, -0.35001373291015625, -0.333404541015625, -0.31679534912109375, -0.3001861572265625, -0.28357696533203125, -0.2669677734375, -0.25035858154296875, -0.2337493896484375, -0.21714019775390625, -0.200531005859375, -0.18392181396484375, -0.1673126220703125, -0.15070343017578125, -0.13409423828125, -0.11748504638671875, -0.1008758544921875, -0.08426666259765625, -0.067657470703125, -0.05104827880859375, -0.0344390869140625, -0.01782989501953125, -0.001220703125, 0.01538848876953125, 0.0319976806640625, 0.04860687255859375, 0.065216064453125, 0.08182525634765625, 0.0984344482421875, 0.11504364013671875, 0.13165283203125, 0.14826202392578125, 0.1648712158203125, 0.18148040771484375, 0.198089599609375, 0.21469879150390625, 0.2313079833984375, 0.24791717529296875, 0.2645263671875, 0.28113555908203125, 0.2977447509765625, 0.31435394287109375, 0.330963134765625, 0.34757232666015625, 0.3641815185546875, 0.38079071044921875, 0.39739990234375, 0.41400909423828125, 0.4306182861328125, 0.44722747802734375, 0.463836669921875, 0.48044586181640625, 0.4970550537109375, 0.5136642456054688, 0.5302734375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 2.0, 6.0, 17.0, 15.0, 17.0, 26.0, 24.0, 52.0, 45.0, 58.0, 57.0, 54.0, 57.0, 63.0, 65.0, 63.0, 53.0, 56.0, 64.0, 33.0, 16.0, 28.0, 30.0, 19.0, 17.0, 11.0, 9.0, 6.0, 2.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9509658813476562, -0.9199981689453125, -0.8890304565429688, -0.858062744140625, -0.8270950317382812, -0.7961273193359375, -0.7651596069335938, -0.73419189453125, -0.7032241821289062, -0.6722564697265625, -0.6412887573242188, -0.610321044921875, -0.5793533325195312, -0.5483856201171875, -0.5174179077148438, -0.4864501953125, -0.45548248291015625, -0.4245147705078125, -0.39354705810546875, -0.362579345703125, -0.33161163330078125, -0.3006439208984375, -0.26967620849609375, -0.23870849609375, -0.20774078369140625, -0.1767730712890625, -0.14580535888671875, -0.114837646484375, -0.08386993408203125, -0.0529022216796875, -0.02193450927734375, 0.009033203125, 0.04000091552734375, 0.0709686279296875, 0.10193634033203125, 0.132904052734375, 0.16387176513671875, 0.1948394775390625, 0.22580718994140625, 0.25677490234375, 0.28774261474609375, 0.3187103271484375, 0.34967803955078125, 0.380645751953125, 0.41161346435546875, 0.4425811767578125, 0.47354888916015625, 0.5045166015625, 0.5354843139648438, 0.5664520263671875, 0.5974197387695312, 0.628387451171875, 0.6593551635742188, 0.6903228759765625, 0.7212905883789062, 0.75225830078125, 0.7832260131835938, 0.8141937255859375, 0.8451614379882812, 0.876129150390625, 0.9070968627929688, 0.9380645751953125, 0.9690322875976562, 1.0]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 10.0, 7.0, 12.0, 15.0, 24.0, 40.0, 42.0, 73.0, 101.0, 136.0, 227.0, 404.0, 894.0, 2694.0, 21337.0, 990297.0, 27104.0, 2999.0, 970.0, 476.0, 232.0, 121.0, 96.0, 53.0, 45.0, 30.0, 18.0, 19.0, 14.0, 10.0, 13.0, 15.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1044921875, -1.0628662109375, -1.021240234375, -0.9796142578125, -0.93798828125, -0.8963623046875, -0.854736328125, -0.8131103515625, -0.771484375, -0.7298583984375, -0.688232421875, -0.6466064453125, -0.60498046875, -0.5633544921875, -0.521728515625, -0.4801025390625, -0.4384765625, -0.3968505859375, -0.355224609375, -0.3135986328125, -0.27197265625, -0.2303466796875, -0.188720703125, -0.1470947265625, -0.10546875, -0.0638427734375, -0.022216796875, 0.0194091796875, 0.06103515625, 0.1026611328125, 0.144287109375, 0.1859130859375, 0.2275390625, 0.2691650390625, 0.310791015625, 0.3524169921875, 0.39404296875, 0.4356689453125, 0.477294921875, 0.5189208984375, 0.560546875, 0.6021728515625, 0.643798828125, 0.6854248046875, 0.72705078125, 0.7686767578125, 0.810302734375, 0.8519287109375, 0.8935546875, 0.9351806640625, 0.976806640625, 1.0184326171875, 1.06005859375, 1.1016845703125, 1.143310546875, 1.1849365234375, 1.2265625, 1.2681884765625, 1.309814453125, 1.3514404296875, 1.39306640625, 1.4346923828125, 1.476318359375, 1.5179443359375, 1.5595703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 6.0, 3.0, 5.0, 3.0, 8.0, 15.0, 9.0, 15.0, 18.0, 17.0, 17.0, 29.0, 24.0, 23.0, 32.0, 28.0, 36.0, 32.0, 31.0, 44.0, 43.0, 34.0, 45.0, 44.0, 25.0, 38.0, 36.0, 44.0, 42.0, 22.0, 33.0, 22.0, 21.0, 23.0, 25.0, 16.0, 11.0, 10.0, 12.0, 8.0, 6.0, 14.0, 12.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.63330078125, -0.6142730712890625, -0.595245361328125, -0.5762176513671875, -0.55718994140625, -0.5381622314453125, -0.519134521484375, -0.5001068115234375, -0.4810791015625, -0.4620513916015625, -0.443023681640625, -0.4239959716796875, -0.40496826171875, -0.3859405517578125, -0.366912841796875, -0.3478851318359375, -0.328857421875, -0.3098297119140625, -0.290802001953125, -0.2717742919921875, -0.25274658203125, -0.2337188720703125, -0.214691162109375, -0.1956634521484375, -0.1766357421875, -0.1576080322265625, -0.138580322265625, -0.1195526123046875, -0.10052490234375, -0.0814971923828125, -0.062469482421875, -0.0434417724609375, -0.0244140625, -0.0053863525390625, 0.013641357421875, 0.0326690673828125, 0.05169677734375, 0.0707244873046875, 0.089752197265625, 0.1087799072265625, 0.1278076171875, 0.1468353271484375, 0.165863037109375, 0.1848907470703125, 0.20391845703125, 0.2229461669921875, 0.241973876953125, 0.2610015869140625, 0.280029296875, 0.2990570068359375, 0.318084716796875, 0.3371124267578125, 0.35614013671875, 0.3751678466796875, 0.394195556640625, 0.4132232666015625, 0.4322509765625, 0.4512786865234375, 0.470306396484375, 0.4893341064453125, 0.50836181640625, 0.5273895263671875, 0.546417236328125, 0.5654449462890625, 0.58447265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 9.0, 14.0, 8.0, 12.0, 19.0, 41.0, 74.0, 113.0, 257.0, 605.0, 1952.0, 8795.0, 75833.0, 849914.0, 97045.0, 10433.0, 2185.0, 676.0, 273.0, 121.0, 53.0, 45.0, 28.0, 10.0, 6.0, 5.0, 5.0, 6.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.203369140625, -0.19780349731445312, -0.19223785400390625, -0.18667221069335938, -0.1811065673828125, -0.17554092407226562, -0.16997528076171875, -0.16440963745117188, -0.158843994140625, -0.15327835083007812, -0.14771270751953125, -0.14214706420898438, -0.1365814208984375, -0.13101577758789062, -0.12545013427734375, -0.11988449096679688, -0.11431884765625, -0.10875320434570312, -0.10318756103515625, -0.09762191772460938, -0.0920562744140625, -0.08649063110351562, -0.08092498779296875, -0.07535934448242188, -0.069793701171875, -0.06422805786132812, -0.05866241455078125, -0.053096771240234375, -0.0475311279296875, -0.041965484619140625, -0.03639984130859375, -0.030834197998046875, -0.0252685546875, -0.019702911376953125, -0.01413726806640625, -0.008571624755859375, -0.0030059814453125, 0.002559661865234375, 0.00812530517578125, 0.013690948486328125, 0.019256591796875, 0.024822235107421875, 0.03038787841796875, 0.035953521728515625, 0.0415191650390625, 0.047084808349609375, 0.05265045166015625, 0.058216094970703125, 0.06378173828125, 0.06934738159179688, 0.07491302490234375, 0.08047866821289062, 0.0860443115234375, 0.09160995483398438, 0.09717559814453125, 0.10274124145507812, 0.108306884765625, 0.11387252807617188, 0.11943817138671875, 0.12500381469726562, 0.1305694580078125, 0.13613510131835938, 0.14170074462890625, 0.14726638793945312, 0.15283203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 9.0, 8.0, 13.0, 22.0, 22.0, 34.0, 46.0, 63.0, 80.0, 134.0, 119.0, 113.0, 129.0, 52.0, 41.0, 27.0, 24.0, 10.0, 10.0, 8.0, 4.0, 8.0, 9.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5616416931152344e-05, -1.5106983482837677e-05, -1.459755003452301e-05, -1.4088116586208344e-05, -1.3578683137893677e-05, -1.306924968957901e-05, -1.2559816241264343e-05, -1.2050382792949677e-05, -1.154094934463501e-05, -1.1031515896320343e-05, -1.0522082448005676e-05, -1.001264899969101e-05, -9.503215551376343e-06, -8.993782103061676e-06, -8.48434865474701e-06, -7.974915206432343e-06, -7.465481758117676e-06, -6.956048309803009e-06, -6.446614861488342e-06, -5.9371814131736755e-06, -5.427747964859009e-06, -4.918314516544342e-06, -4.408881068229675e-06, -3.8994476199150085e-06, -3.390014171600342e-06, -2.880580723285675e-06, -2.3711472749710083e-06, -1.8617138266563416e-06, -1.3522803783416748e-06, -8.428469300270081e-07, -3.334134817123413e-07, 1.7601996660232544e-07, 6.854534149169922e-07, 1.194886863231659e-06, 1.7043203115463257e-06, 2.2137537598609924e-06, 2.723187208175659e-06, 3.232620656490326e-06, 3.7420541048049927e-06, 4.2514875531196594e-06, 4.760921001434326e-06, 5.270354449748993e-06, 5.77978789806366e-06, 6.289221346378326e-06, 6.798654794692993e-06, 7.30808824300766e-06, 7.817521691322327e-06, 8.326955139636993e-06, 8.83638858795166e-06, 9.345822036266327e-06, 9.855255484580994e-06, 1.036468893289566e-05, 1.0874122381210327e-05, 1.1383555829524994e-05, 1.189298927783966e-05, 1.2402422726154327e-05, 1.2911856174468994e-05, 1.3421289622783661e-05, 1.3930723071098328e-05, 1.4440156519412994e-05, 1.4949589967727661e-05, 1.5459023416042328e-05, 1.5968456864356995e-05, 1.647789031267166e-05, 1.6987323760986328e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 13.0, 20.0, 21.0, 35.0, 70.0, 106.0, 160.0, 276.0, 465.0, 838.0, 1585.0, 3513.0, 9430.0, 41734.0, 594093.0, 352506.0, 29839.0, 7579.0, 2980.0, 1411.0, 738.0, 442.0, 254.0, 171.0, 107.0, 63.0, 35.0, 24.0, 14.0, 9.0, 6.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2088623046875, -0.2036285400390625, -0.198394775390625, -0.1931610107421875, -0.18792724609375, -0.1826934814453125, -0.177459716796875, -0.1722259521484375, -0.1669921875, -0.1617584228515625, -0.156524658203125, -0.1512908935546875, -0.14605712890625, -0.1408233642578125, -0.135589599609375, -0.1303558349609375, -0.1251220703125, -0.1198883056640625, -0.114654541015625, -0.1094207763671875, -0.10418701171875, -0.0989532470703125, -0.093719482421875, -0.0884857177734375, -0.083251953125, -0.0780181884765625, -0.072784423828125, -0.0675506591796875, -0.06231689453125, -0.0570831298828125, -0.051849365234375, -0.0466156005859375, -0.0413818359375, -0.0361480712890625, -0.030914306640625, -0.0256805419921875, -0.02044677734375, -0.0152130126953125, -0.009979248046875, -0.0047454833984375, 0.00048828125, 0.0057220458984375, 0.010955810546875, 0.0161895751953125, 0.02142333984375, 0.0266571044921875, 0.031890869140625, 0.0371246337890625, 0.0423583984375, 0.0475921630859375, 0.052825927734375, 0.0580596923828125, 0.06329345703125, 0.0685272216796875, 0.073760986328125, 0.0789947509765625, 0.084228515625, 0.0894622802734375, 0.094696044921875, 0.0999298095703125, 0.10516357421875, 0.1103973388671875, 0.115631103515625, 0.1208648681640625, 0.1260986328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 11.0, 3.0, 12.0, 15.0, 26.0, 21.0, 40.0, 61.0, 102.0, 101.0, 150.0, 158.0, 82.0, 85.0, 42.0, 22.0, 20.0, 7.0, 10.0, 6.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0626220703125, -0.06041908264160156, -0.058216094970703125, -0.05601310729980469, -0.05381011962890625, -0.05160713195800781, -0.049404144287109375, -0.04720115661621094, -0.0449981689453125, -0.04279518127441406, -0.040592193603515625, -0.03838920593261719, -0.03618621826171875, -0.03398323059082031, -0.031780242919921875, -0.029577255249023438, -0.027374267578125, -0.025171279907226562, -0.022968292236328125, -0.020765304565429688, -0.01856231689453125, -0.016359329223632812, -0.014156341552734375, -0.011953353881835938, -0.0097503662109375, -0.0075473785400390625, -0.005344390869140625, -0.0031414031982421875, -0.00093841552734375, 0.0012645721435546875, 0.003467559814453125, 0.0056705474853515625, 0.00787353515625, 0.010076522827148438, 0.012279510498046875, 0.014482498168945312, 0.01668548583984375, 0.018888473510742188, 0.021091461181640625, 0.023294448852539062, 0.0254974365234375, 0.027700424194335938, 0.029903411865234375, 0.03210639953613281, 0.03430938720703125, 0.03651237487792969, 0.038715362548828125, 0.04091835021972656, 0.043121337890625, 0.04532432556152344, 0.047527313232421875, 0.04973030090332031, 0.05193328857421875, 0.05413627624511719, 0.056339263916015625, 0.05854225158691406, 0.0607452392578125, 0.06294822692871094, 0.06515121459960938, 0.06735420227050781, 0.06955718994140625, 0.07176017761230469, 0.07396316528320312, 0.07616615295410156, 0.078369140625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 0.0, 8.0, 10.0, 16.0, 17.0, 38.0, 54.0, 125.0, 190.0, 200.0, 136.0, 77.0, 57.0, 32.0, 14.0, 12.0, 9.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.283629894256592, -3.2141385078430176, -3.1446471214294434, -3.07515549659729, -3.005664110183716, -2.9361727237701416, -2.8666810989379883, -2.797189712524414, -2.72769832611084, -2.6582069396972656, -2.5887155532836914, -2.519223928451538, -2.449732542037964, -2.3802411556243896, -2.3107495307922363, -2.241258144378662, -2.171766757965088, -2.1022753715515137, -2.0327839851379395, -1.9632923603057861, -1.893800973892212, -1.8243095874786377, -1.754818081855774, -1.6853265762329102, -1.615835189819336, -1.5463438034057617, -1.476852297782898, -1.4073607921600342, -1.33786940574646, -1.2683780193328857, -1.198886513710022, -1.1293950080871582, -1.0599033832550049, -0.9904119372367859, -0.9209204912185669, -0.8514290452003479, -0.7819375991821289, -0.7124461531639099, -0.6429547071456909, -0.5734632611274719, -0.5039718151092529, -0.43448036909103394, -0.36498892307281494, -0.29549747705459595, -0.22600603103637695, -0.15651458501815796, -0.08702313899993896, -0.01753169298171997, 0.05195975303649902, 0.12145119905471802, 0.190942645072937, 0.260434091091156, 0.329925537109375, 0.399416983127594, 0.468908429145813, 0.538399875164032, 0.607891321182251, 0.67738276720047, 0.746874213218689, 0.816365659236908, 0.885857105255127, 0.955348551273346, 1.024839997291565, 1.0943315029144287, 1.163822889328003]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 10.0, 8.0, 7.0, 11.0, 13.0, 13.0, 20.0, 17.0, 22.0, 36.0, 38.0, 32.0, 29.0, 51.0, 47.0, 46.0, 40.0, 47.0, 38.0, 50.0, 44.0, 53.0, 30.0, 35.0, 44.0, 39.0, 27.0, 28.0, 16.0, 29.0, 20.0, 14.0, 11.0, 2.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3882209062576294, -1.3489383459091187, -1.3096556663513184, -1.2703731060028076, -1.2310905456542969, -1.1918078660964966, -1.1525253057479858, -1.1132426261901855, -1.0739600658416748, -1.034677505493164, -0.9953948259353638, -0.956112265586853, -0.9168296456336975, -0.877547025680542, -0.8382644653320312, -0.7989818453788757, -0.7596992254257202, -0.7204166054725647, -0.6811339855194092, -0.6418514251708984, -0.6025688052177429, -0.5632861852645874, -0.5240036249160767, -0.48472100496292114, -0.4454383850097656, -0.4061557650566101, -0.366873174905777, -0.32759058475494385, -0.28830796480178833, -0.249025359749794, -0.20974275469779968, -0.17046016454696655, -0.13117754459381104, -0.09189493954181671, -0.05261233448982239, -0.013329729437828064, 0.02595287561416626, 0.06523548066616058, 0.10451808571815491, 0.14380067586898804, 0.18308329582214355, 0.22236590087413788, 0.2616485059261322, 0.30093109607696533, 0.34021371603012085, 0.37949633598327637, 0.4187789261341095, 0.4580615162849426, 0.49734413623809814, 0.5366267561912537, 0.5759093761444092, 0.6151919364929199, 0.6544745564460754, 0.693757176399231, 0.7330397367477417, 0.7723223567008972, 0.8116049766540527, 0.8508875966072083, 0.8901702165603638, 0.9294527769088745, 0.96873539686203, 1.0080180168151855, 1.0473005771636963, 1.086583137512207, 1.1258658170700073]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 25.0, 35.0, 45.0, 63.0, 92.0, 152.0, 230.0, 442.0, 959.0, 2669.0, 11402.0, 520328.0, 3621067.0, 29429.0, 4399.0, 1432.0, 581.0, 323.0, 203.0, 104.0, 69.0, 67.0, 50.0, 27.0, 17.0, 14.0, 16.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9501953125, -1.8785247802734375, -1.806854248046875, -1.7351837158203125, -1.66351318359375, -1.5918426513671875, -1.520172119140625, -1.4485015869140625, -1.3768310546875, -1.3051605224609375, -1.233489990234375, -1.1618194580078125, -1.09014892578125, -1.0184783935546875, -0.946807861328125, -0.8751373291015625, -0.803466796875, -0.7317962646484375, -0.660125732421875, -0.5884552001953125, -0.51678466796875, -0.4451141357421875, -0.373443603515625, -0.3017730712890625, -0.2301025390625, -0.1584320068359375, -0.086761474609375, -0.0150909423828125, 0.05657958984375, 0.1282501220703125, 0.199920654296875, 0.2715911865234375, 0.34326171875, 0.4149322509765625, 0.486602783203125, 0.5582733154296875, 0.62994384765625, 0.7016143798828125, 0.773284912109375, 0.8449554443359375, 0.9166259765625, 0.9882965087890625, 1.059967041015625, 1.1316375732421875, 1.20330810546875, 1.2749786376953125, 1.346649169921875, 1.4183197021484375, 1.489990234375, 1.5616607666015625, 1.633331298828125, 1.7050018310546875, 1.77667236328125, 1.8483428955078125, 1.920013427734375, 1.9916839599609375, 2.0633544921875, 2.1350250244140625, 2.206695556640625, 2.2783660888671875, 2.35003662109375, 2.4217071533203125, 2.493377685546875, 2.5650482177734375, 2.63671875]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 5.0, 5.0, 10.0, 13.0, 13.0, 11.0, 21.0, 17.0, 26.0, 30.0, 44.0, 40.0, 49.0, 57.0, 67.0, 56.0, 57.0, 55.0, 74.0, 62.0, 45.0, 53.0, 39.0, 32.0, 27.0, 17.0, 18.0, 13.0, 11.0, 4.0, 11.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5244140625, -0.5053939819335938, -0.4863739013671875, -0.46735382080078125, -0.448333740234375, -0.42931365966796875, -0.4102935791015625, -0.39127349853515625, -0.37225341796875, -0.35323333740234375, -0.3342132568359375, -0.31519317626953125, -0.296173095703125, -0.27715301513671875, -0.2581329345703125, -0.23911285400390625, -0.2200927734375, -0.20107269287109375, -0.1820526123046875, -0.16303253173828125, -0.144012451171875, -0.12499237060546875, -0.1059722900390625, -0.08695220947265625, -0.06793212890625, -0.04891204833984375, -0.0298919677734375, -0.01087188720703125, 0.008148193359375, 0.02716827392578125, 0.0461883544921875, 0.06520843505859375, 0.084228515625, 0.10324859619140625, 0.1222686767578125, 0.14128875732421875, 0.160308837890625, 0.17932891845703125, 0.1983489990234375, 0.21736907958984375, 0.23638916015625, 0.25540924072265625, 0.2744293212890625, 0.29344940185546875, 0.312469482421875, 0.33148956298828125, 0.3505096435546875, 0.36952972412109375, 0.3885498046875, 0.40756988525390625, 0.4265899658203125, 0.44561004638671875, 0.464630126953125, 0.48365020751953125, 0.5026702880859375, 0.5216903686523438, 0.54071044921875, 0.5597305297851562, 0.5787506103515625, 0.5977706909179688, 0.616790771484375, 0.6358108520507812, 0.6548309326171875, 0.6738510131835938, 0.69287109375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 10.0, 3.0, 8.0, 16.0, 20.0, 40.0, 43.0, 78.0, 121.0, 187.0, 325.0, 636.0, 1334.0, 3130.0, 8630.0, 34577.0, 472973.0, 3553691.0, 93208.0, 16378.0, 5064.0, 1854.0, 861.0, 447.0, 247.0, 121.0, 88.0, 58.0, 45.0, 30.0, 13.0, 10.0, 5.0, 5.0, 8.0, 6.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9052734375, -0.87322998046875, -0.8411865234375, -0.80914306640625, -0.777099609375, -0.74505615234375, -0.7130126953125, -0.68096923828125, -0.64892578125, -0.61688232421875, -0.5848388671875, -0.55279541015625, -0.520751953125, -0.48870849609375, -0.4566650390625, -0.42462158203125, -0.392578125, -0.36053466796875, -0.3284912109375, -0.29644775390625, -0.264404296875, -0.23236083984375, -0.2003173828125, -0.16827392578125, -0.13623046875, -0.10418701171875, -0.0721435546875, -0.04010009765625, -0.008056640625, 0.02398681640625, 0.0560302734375, 0.08807373046875, 0.1201171875, 0.15216064453125, 0.1842041015625, 0.21624755859375, 0.248291015625, 0.28033447265625, 0.3123779296875, 0.34442138671875, 0.37646484375, 0.40850830078125, 0.4405517578125, 0.47259521484375, 0.504638671875, 0.53668212890625, 0.5687255859375, 0.60076904296875, 0.6328125, 0.66485595703125, 0.6968994140625, 0.72894287109375, 0.760986328125, 0.79302978515625, 0.8250732421875, 0.85711669921875, 0.88916015625, 0.92120361328125, 0.9532470703125, 0.98529052734375, 1.017333984375, 1.04937744140625, 1.0814208984375, 1.11346435546875, 1.1455078125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 11.0, 16.0, 18.0, 28.0, 45.0, 62.0, 123.0, 277.0, 651.0, 1252.0, 824.0, 352.0, 162.0, 86.0, 56.0, 27.0, 22.0, 10.0, 12.0, 11.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285400390625, -0.2750701904296875, -0.264739990234375, -0.2544097900390625, -0.24407958984375, -0.2337493896484375, -0.223419189453125, -0.2130889892578125, -0.2027587890625, -0.1924285888671875, -0.182098388671875, -0.1717681884765625, -0.16143798828125, -0.1511077880859375, -0.140777587890625, -0.1304473876953125, -0.1201171875, -0.1097869873046875, -0.099456787109375, -0.0891265869140625, -0.07879638671875, -0.0684661865234375, -0.058135986328125, -0.0478057861328125, -0.0374755859375, -0.0271453857421875, -0.016815185546875, -0.0064849853515625, 0.00384521484375, 0.0141754150390625, 0.024505615234375, 0.0348358154296875, 0.045166015625, 0.0554962158203125, 0.065826416015625, 0.0761566162109375, 0.08648681640625, 0.0968170166015625, 0.107147216796875, 0.1174774169921875, 0.1278076171875, 0.1381378173828125, 0.148468017578125, 0.1587982177734375, 0.16912841796875, 0.1794586181640625, 0.189788818359375, 0.2001190185546875, 0.21044921875, 0.2207794189453125, 0.231109619140625, 0.2414398193359375, 0.25177001953125, 0.2621002197265625, 0.272430419921875, 0.2827606201171875, 0.2930908203125, 0.3034210205078125, 0.313751220703125, 0.3240814208984375, 0.33441162109375, 0.3447418212890625, 0.355072021484375, 0.3654022216796875, 0.375732421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 13.0, 21.0, 32.0, 44.0, 51.0, 70.0, 98.0, 116.0, 114.0, 113.0, 84.0, 45.0, 38.0, 32.0, 24.0, 23.0, 12.0, 8.0, 7.0, 7.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.154934048652649, -1.1261039972305298, -1.097273826599121, -1.068443775177002, -1.0396137237548828, -1.0107836723327637, -0.981953501701355, -0.9531234502792358, -0.9242933988571167, -0.8954632878303528, -0.8666332364082336, -0.8378031253814697, -0.8089730739593506, -0.7801429629325867, -0.7513128519058228, -0.7224828004837036, -0.6936526894569397, -0.6648225784301758, -0.6359925270080566, -0.6071624159812927, -0.5783323645591736, -0.5495022535324097, -0.5206722021102905, -0.4918420910835266, -0.4630120098590851, -0.43418192863464355, -0.405351847410202, -0.3765217661857605, -0.3476916551589966, -0.31886160373687744, -0.2900314927101135, -0.261201411485672, -0.23237133026123047, -0.20354124903678894, -0.1747111678123474, -0.1458810716867447, -0.11705099046230316, -0.08822090923786163, -0.05939081311225891, -0.030560731887817383, -0.0017306506633758545, 0.027099434286355972, 0.0559295192360878, 0.08475960791110992, 0.11358968913555145, 0.14241977035999298, 0.1712498664855957, 0.20007994771003723, 0.22891002893447876, 0.2577401101589203, 0.2865701913833618, 0.31540030241012573, 0.3442303538322449, 0.3730604648590088, 0.4018905460834503, 0.43072062730789185, 0.4595507085323334, 0.4883807897567749, 0.5172109007835388, 0.546040952205658, 0.5748710632324219, 0.603701114654541, 0.6325312256813049, 0.6613613367080688, 0.690191388130188]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 7.0, 10.0, 11.0, 21.0, 17.0, 23.0, 28.0, 38.0, 41.0, 47.0, 42.0, 50.0, 52.0, 44.0, 54.0, 59.0, 59.0, 64.0, 63.0, 44.0, 37.0, 36.0, 40.0, 24.0, 21.0, 17.0, 10.0, 14.0, 7.0, 10.0, 3.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6195239424705505, -0.5981258153915405, -0.5767276287078857, -0.5553295016288757, -0.5339313745498657, -0.5125331878662109, -0.4911350607872009, -0.46973690390586853, -0.44833874702453613, -0.42694059014320374, -0.40554243326187134, -0.38414430618286133, -0.36274614930152893, -0.34134799242019653, -0.3199498653411865, -0.2985517084598541, -0.27715355157852173, -0.25575539469718933, -0.23435725271701813, -0.21295911073684692, -0.19156095385551453, -0.17016279697418213, -0.14876465499401093, -0.12736651301383972, -0.10596835613250732, -0.08457020670175552, -0.06317205727100372, -0.04177390784025192, -0.020375758409500122, 0.0010223910212516785, 0.02242054045200348, 0.04381868243217468, 0.0652167797088623, 0.0866149291396141, 0.1080130785703659, 0.1294112205505371, 0.1508093774318695, 0.1722075343132019, 0.1936056762933731, 0.2150038182735443, 0.2364019751548767, 0.2578001320362091, 0.2791982889175415, 0.3005964159965515, 0.3219945728778839, 0.3433927297592163, 0.3647908568382263, 0.3861890137195587, 0.4075871706008911, 0.4289853274822235, 0.4503834843635559, 0.4717816114425659, 0.4931797683238983, 0.5145779252052307, 0.5359760522842407, 0.5573742389678955, 0.5787723660469055, 0.6001704931259155, 0.6215686798095703, 0.6429668068885803, 0.6643649339675903, 0.6857631206512451, 0.7071612477302551, 0.7285593748092651, 0.7499575614929199]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 10.0, 5.0, 16.0, 38.0, 30.0, 77.0, 140.0, 276.0, 564.0, 1108.0, 2955.0, 11651.0, 108605.0, 829282.0, 79221.0, 9899.0, 2617.0, 1046.0, 454.0, 235.0, 132.0, 82.0, 47.0, 30.0, 10.0, 9.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29541015625, -0.28537750244140625, -0.2753448486328125, -0.26531219482421875, -0.255279541015625, -0.24524688720703125, -0.2352142333984375, -0.22518157958984375, -0.21514892578125, -0.20511627197265625, -0.1950836181640625, -0.18505096435546875, -0.175018310546875, -0.16498565673828125, -0.1549530029296875, -0.14492034912109375, -0.1348876953125, -0.12485504150390625, -0.1148223876953125, -0.10478973388671875, -0.094757080078125, -0.08472442626953125, -0.0746917724609375, -0.06465911865234375, -0.05462646484375, -0.04459381103515625, -0.0345611572265625, -0.02452850341796875, -0.014495849609375, -0.00446319580078125, 0.0055694580078125, 0.01560211181640625, 0.025634765625, 0.03566741943359375, 0.0457000732421875, 0.05573272705078125, 0.065765380859375, 0.07579803466796875, 0.0858306884765625, 0.09586334228515625, 0.10589599609375, 0.11592864990234375, 0.1259613037109375, 0.13599395751953125, 0.146026611328125, 0.15605926513671875, 0.1660919189453125, 0.17612457275390625, 0.1861572265625, 0.19618988037109375, 0.2062225341796875, 0.21625518798828125, 0.226287841796875, 0.23632049560546875, 0.2463531494140625, 0.25638580322265625, 0.26641845703125, 0.27645111083984375, 0.2864837646484375, 0.29651641845703125, 0.306549072265625, 0.31658172607421875, 0.3266143798828125, 0.33664703369140625, 0.3466796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 3.0, 4.0, 8.0, 7.0, 14.0, 18.0, 18.0, 18.0, 34.0, 36.0, 51.0, 39.0, 48.0, 66.0, 41.0, 50.0, 70.0, 59.0, 59.0, 61.0, 63.0, 42.0, 41.0, 18.0, 36.0, 25.0, 15.0, 14.0, 15.0, 7.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33837890625, -0.32334136962890625, -0.3083038330078125, -0.29326629638671875, -0.278228759765625, -0.26319122314453125, -0.2481536865234375, -0.23311614990234375, -0.21807861328125, -0.20304107666015625, -0.1880035400390625, -0.17296600341796875, -0.157928466796875, -0.14289093017578125, -0.1278533935546875, -0.11281585693359375, -0.0977783203125, -0.08274078369140625, -0.0677032470703125, -0.05266571044921875, -0.037628173828125, -0.02259063720703125, -0.0075531005859375, 0.00748443603515625, 0.02252197265625, 0.03755950927734375, 0.0525970458984375, 0.06763458251953125, 0.082672119140625, 0.09770965576171875, 0.1127471923828125, 0.12778472900390625, 0.142822265625, 0.15785980224609375, 0.1728973388671875, 0.18793487548828125, 0.202972412109375, 0.21800994873046875, 0.2330474853515625, 0.24808502197265625, 0.26312255859375, 0.27816009521484375, 0.2931976318359375, 0.30823516845703125, 0.323272705078125, 0.33831024169921875, 0.3533477783203125, 0.36838531494140625, 0.3834228515625, 0.39846038818359375, 0.4134979248046875, 0.42853546142578125, 0.443572998046875, 0.45861053466796875, 0.4736480712890625, 0.48868560791015625, 0.50372314453125, 0.5187606811523438, 0.5337982177734375, 0.5488357543945312, 0.563873291015625, 0.5789108276367188, 0.5939483642578125, 0.6089859008789062, 0.6240234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 6.0, 6.0, 7.0, 12.0, 14.0, 7.0, 20.0, 34.0, 31.0, 52.0, 69.0, 114.0, 165.0, 223.0, 330.0, 543.0, 857.0, 1602.0, 2995.0, 6646.0, 15998.0, 46093.0, 180777.0, 517453.0, 194433.0, 49235.0, 16777.0, 6739.0, 3115.0, 1638.0, 894.0, 533.0, 344.0, 241.0, 135.0, 121.0, 83.0, 65.0, 35.0, 28.0, 25.0, 22.0, 13.0, 6.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1170654296875, -0.11322975158691406, -0.10939407348632812, -0.10555839538574219, -0.10172271728515625, -0.09788703918457031, -0.09405136108398438, -0.09021568298339844, -0.0863800048828125, -0.08254432678222656, -0.07870864868164062, -0.07487297058105469, -0.07103729248046875, -0.06720161437988281, -0.06336593627929688, -0.05953025817871094, -0.055694580078125, -0.05185890197753906, -0.048023223876953125, -0.04418754577636719, -0.04035186767578125, -0.03651618957519531, -0.032680511474609375, -0.028844833374023438, -0.0250091552734375, -0.021173477172851562, -0.017337799072265625, -0.013502120971679688, -0.00966644287109375, -0.0058307647705078125, -0.001995086669921875, 0.0018405914306640625, 0.00567626953125, 0.009511947631835938, 0.013347625732421875, 0.017183303833007812, 0.02101898193359375, 0.024854660034179688, 0.028690338134765625, 0.03252601623535156, 0.0363616943359375, 0.04019737243652344, 0.044033050537109375, 0.04786872863769531, 0.05170440673828125, 0.05554008483886719, 0.059375762939453125, 0.06321144104003906, 0.067047119140625, 0.07088279724121094, 0.07471847534179688, 0.07855415344238281, 0.08238983154296875, 0.08622550964355469, 0.09006118774414062, 0.09389686584472656, 0.0977325439453125, 0.10156822204589844, 0.10540390014648438, 0.10923957824707031, 0.11307525634765625, 0.11691093444824219, 0.12074661254882812, 0.12458229064941406, 0.12841796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 2.0, 2.0, 4.0, 4.0, 10.0, 3.0, 12.0, 11.0, 6.0, 15.0, 24.0, 8.0, 19.0, 28.0, 21.0, 30.0, 34.0, 35.0, 34.0, 42.0, 38.0, 52.0, 48.0, 42.0, 48.0, 55.0, 50.0, 39.0, 32.0, 36.0, 43.0, 17.0, 26.0, 20.0, 10.0, 23.0, 13.0, 14.0, 3.0, 8.0, 6.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.61767578125, -0.5970077514648438, -0.5763397216796875, -0.5556716918945312, -0.535003662109375, -0.5143356323242188, -0.4936676025390625, -0.47299957275390625, -0.45233154296875, -0.43166351318359375, -0.4109954833984375, -0.39032745361328125, -0.369659423828125, -0.34899139404296875, -0.3283233642578125, -0.30765533447265625, -0.2869873046875, -0.26631927490234375, -0.2456512451171875, -0.22498321533203125, -0.204315185546875, -0.18364715576171875, -0.1629791259765625, -0.14231109619140625, -0.12164306640625, -0.10097503662109375, -0.0803070068359375, -0.05963897705078125, -0.038970947265625, -0.01830291748046875, 0.0023651123046875, 0.02303314208984375, 0.043701171875, 0.06436920166015625, 0.0850372314453125, 0.10570526123046875, 0.126373291015625, 0.14704132080078125, 0.1677093505859375, 0.18837738037109375, 0.20904541015625, 0.22971343994140625, 0.2503814697265625, 0.27104949951171875, 0.291717529296875, 0.31238555908203125, 0.3330535888671875, 0.35372161865234375, 0.3743896484375, 0.39505767822265625, 0.4157257080078125, 0.43639373779296875, 0.457061767578125, 0.47772979736328125, 0.4983978271484375, 0.5190658569335938, 0.53973388671875, 0.5604019165039062, 0.5810699462890625, 0.6017379760742188, 0.622406005859375, 0.6430740356445312, 0.6637420654296875, 0.6844100952148438, 0.705078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 8.0, 11.0, 9.0, 17.0, 39.0, 59.0, 106.0, 179.0, 277.0, 538.0, 1002.0, 1874.0, 4064.0, 9535.0, 27572.0, 107252.0, 521443.0, 287043.0, 57247.0, 17446.0, 6675.0, 2976.0, 1420.0, 738.0, 453.0, 195.0, 125.0, 92.0, 56.0, 30.0, 28.0, 10.0, 8.0, 8.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04376220703125, -0.04229307174682617, -0.040823936462402344, -0.039354801177978516, -0.03788566589355469, -0.03641653060913086, -0.03494739532470703, -0.0334782600402832, -0.032009124755859375, -0.030539989471435547, -0.02907085418701172, -0.02760171890258789, -0.026132583618164062, -0.024663448333740234, -0.023194313049316406, -0.021725177764892578, -0.02025604248046875, -0.018786907196044922, -0.017317771911621094, -0.015848636627197266, -0.014379501342773438, -0.01291036605834961, -0.011441230773925781, -0.009972095489501953, -0.008502960205078125, -0.007033824920654297, -0.005564689636230469, -0.004095554351806641, -0.0026264190673828125, -0.0011572837829589844, 0.00031185150146484375, 0.0017809867858886719, 0.0032501220703125, 0.004719257354736328, 0.006188392639160156, 0.007657527923583984, 0.009126663208007812, 0.01059579849243164, 0.012064933776855469, 0.013534069061279297, 0.015003204345703125, 0.016472339630126953, 0.01794147491455078, 0.01941061019897461, 0.020879745483398438, 0.022348880767822266, 0.023818016052246094, 0.025287151336669922, 0.02675628662109375, 0.028225421905517578, 0.029694557189941406, 0.031163692474365234, 0.03263282775878906, 0.03410196304321289, 0.03557109832763672, 0.03704023361206055, 0.038509368896484375, 0.0399785041809082, 0.04144763946533203, 0.04291677474975586, 0.04438591003417969, 0.045855045318603516, 0.047324180603027344, 0.04879331588745117, 0.050262451171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 7.0, 13.0, 18.0, 16.0, 19.0, 27.0, 48.0, 75.0, 99.0, 143.0, 152.0, 126.0, 78.0, 67.0, 33.0, 15.0, 10.0, 11.0, 17.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.707408905029297e-05, -3.601983189582825e-05, -3.4965574741363525e-05, -3.3911317586898804e-05, -3.285706043243408e-05, -3.180280327796936e-05, -3.074854612350464e-05, -2.9694288969039917e-05, -2.8640031814575195e-05, -2.7585774660110474e-05, -2.6531517505645752e-05, -2.547726035118103e-05, -2.442300319671631e-05, -2.3368746042251587e-05, -2.2314488887786865e-05, -2.1260231733322144e-05, -2.0205974578857422e-05, -1.91517174243927e-05, -1.809746026992798e-05, -1.7043203115463257e-05, -1.5988945960998535e-05, -1.4934688806533813e-05, -1.3880431652069092e-05, -1.282617449760437e-05, -1.1771917343139648e-05, -1.0717660188674927e-05, -9.663403034210205e-06, -8.609145879745483e-06, -7.554888725280762e-06, -6.50063157081604e-06, -5.446374416351318e-06, -4.392117261886597e-06, -3.337860107421875e-06, -2.2836029529571533e-06, -1.2293457984924316e-06, -1.7508864402770996e-07, 8.791685104370117e-07, 1.9334256649017334e-06, 2.987682819366455e-06, 4.041939973831177e-06, 5.0961971282958984e-06, 6.15045428276062e-06, 7.204711437225342e-06, 8.258968591690063e-06, 9.313225746154785e-06, 1.0367482900619507e-05, 1.1421740055084229e-05, 1.247599720954895e-05, 1.3530254364013672e-05, 1.4584511518478394e-05, 1.5638768672943115e-05, 1.6693025827407837e-05, 1.774728298187256e-05, 1.880154013633728e-05, 1.9855797290802002e-05, 2.0910054445266724e-05, 2.1964311599731445e-05, 2.3018568754196167e-05, 2.407282590866089e-05, 2.512708306312561e-05, 2.6181340217590332e-05, 2.7235597372055054e-05, 2.8289854526519775e-05, 2.9344111680984497e-05, 3.039836883544922e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 5.0, 9.0, 12.0, 28.0, 30.0, 59.0, 93.0, 123.0, 249.0, 433.0, 760.0, 1374.0, 2689.0, 5246.0, 11301.0, 26458.0, 69848.0, 210543.0, 415106.0, 194319.0, 64238.0, 24427.0, 10600.0, 5002.0, 2455.0, 1350.0, 769.0, 386.0, 245.0, 141.0, 80.0, 58.0, 40.0, 22.0, 15.0, 14.0, 11.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290985107421875, -0.02817368507385254, -0.027248859405517578, -0.026324033737182617, -0.025399208068847656, -0.024474382400512695, -0.023549556732177734, -0.022624731063842773, -0.021699905395507812, -0.02077507972717285, -0.01985025405883789, -0.01892542839050293, -0.01800060272216797, -0.017075777053833008, -0.016150951385498047, -0.015226125717163086, -0.014301300048828125, -0.013376474380493164, -0.012451648712158203, -0.011526823043823242, -0.010601997375488281, -0.00967717170715332, -0.00875234603881836, -0.007827520370483398, -0.0069026947021484375, -0.0059778690338134766, -0.005053043365478516, -0.004128217697143555, -0.0032033920288085938, -0.002278566360473633, -0.0013537406921386719, -0.00042891502380371094, 0.00049591064453125, 0.001420736312866211, 0.002345561981201172, 0.003270387649536133, 0.004195213317871094, 0.005120038986206055, 0.006044864654541016, 0.0069696903228759766, 0.007894515991210938, 0.008819341659545898, 0.00974416732788086, 0.01066899299621582, 0.011593818664550781, 0.012518644332885742, 0.013443470001220703, 0.014368295669555664, 0.015293121337890625, 0.016217947006225586, 0.017142772674560547, 0.018067598342895508, 0.01899242401123047, 0.01991724967956543, 0.02084207534790039, 0.02176690101623535, 0.022691726684570312, 0.023616552352905273, 0.024541378021240234, 0.025466203689575195, 0.026391029357910156, 0.027315855026245117, 0.028240680694580078, 0.02916550636291504, 0.03009033203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 4.0, 10.0, 17.0, 9.0, 13.0, 13.0, 15.0, 21.0, 29.0, 24.0, 38.0, 56.0, 49.0, 53.0, 64.0, 57.0, 71.0, 60.0, 54.0, 59.0, 51.0, 47.0, 33.0, 35.0, 17.0, 21.0, 10.0, 10.0, 9.0, 9.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.00872039794921875, -0.008465349674224854, -0.008210301399230957, -0.00795525312423706, -0.007700204849243164, -0.007445156574249268, -0.007190108299255371, -0.006935060024261475, -0.006680011749267578, -0.006424963474273682, -0.006169915199279785, -0.005914866924285889, -0.005659818649291992, -0.005404770374298096, -0.005149722099304199, -0.004894673824310303, -0.004639625549316406, -0.00438457727432251, -0.004129528999328613, -0.003874480724334717, -0.0036194324493408203, -0.003364384174346924, -0.0031093358993530273, -0.002854287624359131, -0.0025992393493652344, -0.002344191074371338, -0.0020891427993774414, -0.001834094524383545, -0.0015790462493896484, -0.001323997974395752, -0.0010689496994018555, -0.000813901424407959, -0.0005588531494140625, -0.000303804874420166, -4.875659942626953e-05, 0.00020629167556762695, 0.00046133995056152344, 0.0007163882255554199, 0.0009714365005493164, 0.0012264847755432129, 0.0014815330505371094, 0.0017365813255310059, 0.0019916296005249023, 0.002246677875518799, 0.0025017261505126953, 0.002756774425506592, 0.0030118227005004883, 0.0032668709754943848, 0.0035219192504882812, 0.0037769675254821777, 0.004032015800476074, 0.004287064075469971, 0.004542112350463867, 0.004797160625457764, 0.00505220890045166, 0.005307257175445557, 0.005562305450439453, 0.00581735372543335, 0.006072402000427246, 0.006327450275421143, 0.006582498550415039, 0.0068375468254089355, 0.007092595100402832, 0.0073476433753967285, 0.007602691650390625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 11.0, 20.0, 49.0, 109.0, 232.0, 313.0, 136.0, 61.0, 35.0, 12.0, 9.0, 11.0, 2.0, 1.0, 3.0, 1.0], "bins": [-2.4478647708892822, -2.401827335357666, -2.355790138244629, -2.3097527027130127, -2.2637152671813965, -2.2176780700683594, -2.171640634536743, -2.125603199005127, -2.07956600189209, -2.0335285663604736, -1.987491250038147, -1.9414539337158203, -1.895416498184204, -1.8493791818618774, -1.8033418655395508, -1.7573044300079346, -1.7112669944763184, -1.6652296781539917, -1.6191922426223755, -1.5731549263000488, -1.5271174907684326, -1.481080174446106, -1.4350428581237793, -1.389005422592163, -1.3429681062698364, -1.2969307899475098, -1.2508933544158936, -1.204856038093567, -1.1588187217712402, -1.112781286239624, -1.0667439699172974, -1.0207066535949707, -0.9746692180633545, -0.9286318421363831, -0.8825944662094116, -0.836557149887085, -0.7905197739601135, -0.7444823980331421, -0.6984450817108154, -0.652407705783844, -0.6063703298568726, -0.5603329539299011, -0.5142955780029297, -0.468258261680603, -0.4222208857536316, -0.37618350982666016, -0.3301461637020111, -0.28410881757736206, -0.238071471452713, -0.19203411042690277, -0.14599674940109253, -0.09995938837528229, -0.053922027349472046, -0.007884666323661804, 0.03815269470214844, 0.08419004082679749, 0.13022741675376892, 0.17626477777957916, 0.2223021388053894, 0.26833951473236084, 0.3143768608570099, 0.36041420698165894, 0.40645158290863037, 0.4524889290332794, 0.49852630496025085]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 6.0, 4.0, 13.0, 15.0, 21.0, 24.0, 29.0, 34.0, 44.0, 45.0, 53.0, 53.0, 51.0, 60.0, 56.0, 70.0, 78.0, 63.0, 55.0, 41.0, 43.0, 34.0, 25.0, 19.0, 20.0, 10.0, 10.0, 9.0, 8.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42076849937438965, -0.4054759442806244, -0.39018338918685913, -0.37489083409309387, -0.3595982789993286, -0.34430569410324097, -0.3290131688117981, -0.31372058391571045, -0.2984280288219452, -0.28313547372817993, -0.2678429186344147, -0.2525503635406494, -0.23725779354572296, -0.2219652384519577, -0.20667268335819244, -0.191380113363266, -0.17608757317066193, -0.16079501807689667, -0.1455024629831314, -0.13020989298820496, -0.1149173378944397, -0.09962478280067444, -0.08433222770690918, -0.06903966516256332, -0.053747110068798065, -0.03845455124974251, -0.0231619942933321, -0.007869437336921692, 0.007423121482133865, 0.022715680301189423, 0.03800823539495468, 0.05330079793930054, 0.0685933530330658, 0.08388590812683105, 0.09917847067117691, 0.11447102576494217, 0.12976358830928802, 0.14505614340305328, 0.16034869849681854, 0.175641268491745, 0.19093382358551025, 0.2062263786792755, 0.22151893377304077, 0.23681148886680603, 0.2521040439605713, 0.26739662885665894, 0.2826891541481018, 0.29798173904418945, 0.3132742643356323, 0.3285668194293976, 0.34385937452316284, 0.3591519296169281, 0.37444448471069336, 0.389737069606781, 0.4050295948982239, 0.4203221797943115, 0.4356147348880768, 0.45090728998184204, 0.4661998450756073, 0.48149240016937256, 0.4967849552631378, 0.5120775103569031, 0.5273700952529907, 0.5426626205444336, 0.5579552054405212]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 11.0, 12.0, 20.0, 38.0, 71.0, 95.0, 188.0, 329.0, 586.0, 1222.0, 2534.0, 6624.0, 20019.0, 99461.0, 615374.0, 246921.0, 37295.0, 10243.0, 3977.0, 1683.0, 859.0, 397.0, 232.0, 120.0, 76.0, 44.0, 28.0, 24.0, 21.0, 12.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.37255859375, -0.3608131408691406, -0.34906768798828125, -0.3373222351074219, -0.3255767822265625, -0.3138313293457031, -0.30208587646484375, -0.2903404235839844, -0.278594970703125, -0.2668495178222656, -0.25510406494140625, -0.24335861206054688, -0.2316131591796875, -0.21986770629882812, -0.20812225341796875, -0.19637680053710938, -0.18463134765625, -0.17288589477539062, -0.16114044189453125, -0.14939498901367188, -0.1376495361328125, -0.12590408325195312, -0.11415863037109375, -0.10241317749023438, -0.090667724609375, -0.07892227172851562, -0.06717681884765625, -0.055431365966796875, -0.0436859130859375, -0.031940460205078125, -0.02019500732421875, -0.008449554443359375, 0.0032958984375, 0.015041351318359375, 0.02678680419921875, 0.038532257080078125, 0.0502777099609375, 0.062023162841796875, 0.07376861572265625, 0.08551406860351562, 0.097259521484375, 0.10900497436523438, 0.12075042724609375, 0.13249588012695312, 0.1442413330078125, 0.15598678588867188, 0.16773223876953125, 0.17947769165039062, 0.19122314453125, 0.20296859741210938, 0.21471405029296875, 0.22645950317382812, 0.2382049560546875, 0.24995040893554688, 0.26169586181640625, 0.2734413146972656, 0.285186767578125, 0.2969322204589844, 0.30867767333984375, 0.3204231262207031, 0.3321685791015625, 0.3439140319824219, 0.35565948486328125, 0.3674049377441406, 0.379150390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 9.0, 8.0, 22.0, 30.0, 37.0, 40.0, 47.0, 60.0, 66.0, 69.0, 85.0, 80.0, 99.0, 85.0, 62.0, 49.0, 43.0, 36.0, 20.0, 15.0, 10.0, 11.0, 7.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98583984375, -0.9449996948242188, -0.9041595458984375, -0.8633193969726562, -0.822479248046875, -0.7816390991210938, -0.7407989501953125, -0.6999588012695312, -0.65911865234375, -0.6182785034179688, -0.5774383544921875, -0.5365982055664062, -0.495758056640625, -0.45491790771484375, -0.4140777587890625, -0.37323760986328125, -0.3323974609375, -0.29155731201171875, -0.2507171630859375, -0.20987701416015625, -0.169036865234375, -0.12819671630859375, -0.0873565673828125, -0.04651641845703125, -0.00567626953125, 0.03516387939453125, 0.0760040283203125, 0.11684417724609375, 0.157684326171875, 0.19852447509765625, 0.2393646240234375, 0.28020477294921875, 0.321044921875, 0.36188507080078125, 0.4027252197265625, 0.44356536865234375, 0.484405517578125, 0.5252456665039062, 0.5660858154296875, 0.6069259643554688, 0.64776611328125, 0.6886062622070312, 0.7294464111328125, 0.7702865600585938, 0.811126708984375, 0.8519668579101562, 0.8928070068359375, 0.9336471557617188, 0.9744873046875, 1.0153274536132812, 1.0561676025390625, 1.0970077514648438, 1.137847900390625, 1.1786880493164062, 1.2195281982421875, 1.2603683471679688, 1.30120849609375, 1.3420486450195312, 1.3828887939453125, 1.4237289428710938, 1.464569091796875, 1.5054092407226562, 1.5462493896484375, 1.5870895385742188, 1.6279296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 11.0, 8.0, 13.0, 7.0, 18.0, 21.0, 27.0, 24.0, 40.0, 51.0, 70.0, 92.0, 111.0, 210.0, 450.0, 1397.0, 7774.0, 119225.0, 876392.0, 36915.0, 3872.0, 914.0, 314.0, 132.0, 94.0, 67.0, 60.0, 47.0, 43.0, 35.0, 25.0, 21.0, 17.0, 15.0, 7.0, 6.0, 5.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.62060546875, -0.6001434326171875, -0.579681396484375, -0.5592193603515625, -0.53875732421875, -0.5182952880859375, -0.497833251953125, -0.4773712158203125, -0.4569091796875, -0.4364471435546875, -0.415985107421875, -0.3955230712890625, -0.37506103515625, -0.3545989990234375, -0.334136962890625, -0.3136749267578125, -0.293212890625, -0.2727508544921875, -0.252288818359375, -0.2318267822265625, -0.21136474609375, -0.1909027099609375, -0.170440673828125, -0.1499786376953125, -0.1295166015625, -0.1090545654296875, -0.088592529296875, -0.0681304931640625, -0.04766845703125, -0.0272064208984375, -0.006744384765625, 0.0137176513671875, 0.0341796875, 0.0546417236328125, 0.075103759765625, 0.0955657958984375, 0.11602783203125, 0.1364898681640625, 0.156951904296875, 0.1774139404296875, 0.1978759765625, 0.2183380126953125, 0.238800048828125, 0.2592620849609375, 0.27972412109375, 0.3001861572265625, 0.320648193359375, 0.3411102294921875, 0.361572265625, 0.3820343017578125, 0.402496337890625, 0.4229583740234375, 0.44342041015625, 0.4638824462890625, 0.484344482421875, 0.5048065185546875, 0.5252685546875, 0.5457305908203125, 0.566192626953125, 0.5866546630859375, 0.60711669921875, 0.6275787353515625, 0.648040771484375, 0.6685028076171875, 0.68896484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 8.0, 9.0, 6.0, 7.0, 14.0, 9.0, 14.0, 21.0, 25.0, 21.0, 35.0, 29.0, 44.0, 33.0, 44.0, 52.0, 44.0, 41.0, 40.0, 56.0, 51.0, 46.0, 30.0, 43.0, 28.0, 42.0, 33.0, 26.0, 32.0, 26.0, 17.0, 17.0, 10.0, 19.0, 10.0, 4.0, 2.0, 3.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77587890625, -0.7499008178710938, -0.7239227294921875, -0.6979446411132812, -0.671966552734375, -0.6459884643554688, -0.6200103759765625, -0.5940322875976562, -0.56805419921875, -0.5420761108398438, -0.5160980224609375, -0.49011993408203125, -0.464141845703125, -0.43816375732421875, -0.4121856689453125, -0.38620758056640625, -0.3602294921875, -0.33425140380859375, -0.3082733154296875, -0.28229522705078125, -0.256317138671875, -0.23033905029296875, -0.2043609619140625, -0.17838287353515625, -0.15240478515625, -0.12642669677734375, -0.1004486083984375, -0.07447052001953125, -0.048492431640625, -0.02251434326171875, 0.0034637451171875, 0.02944183349609375, 0.055419921875, 0.08139801025390625, 0.1073760986328125, 0.13335418701171875, 0.159332275390625, 0.18531036376953125, 0.2112884521484375, 0.23726654052734375, 0.26324462890625, 0.28922271728515625, 0.3152008056640625, 0.34117889404296875, 0.367156982421875, 0.39313507080078125, 0.4191131591796875, 0.44509124755859375, 0.4710693359375, 0.49704742431640625, 0.5230255126953125, 0.5490036010742188, 0.574981689453125, 0.6009597778320312, 0.6269378662109375, 0.6529159545898438, 0.67889404296875, 0.7048721313476562, 0.7308502197265625, 0.7568283081054688, 0.782806396484375, 0.8087844848632812, 0.8347625732421875, 0.8607406616210938, 0.88671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 5.0, 3.0, 4.0, 9.0, 10.0, 11.0, 14.0, 25.0, 48.0, 122.0, 254.0, 668.0, 2547.0, 15920.0, 552025.0, 458691.0, 14703.0, 2317.0, 653.0, 268.0, 106.0, 60.0, 33.0, 20.0, 8.0, 6.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19370460510253906, -0.18562698364257812, -0.1775493621826172, -0.16947174072265625, -0.1613941192626953, -0.15331649780273438, -0.14523887634277344, -0.1371612548828125, -0.12908363342285156, -0.12100601196289062, -0.11292839050292969, -0.10485076904296875, -0.09677314758300781, -0.08869552612304688, -0.08061790466308594, -0.072540283203125, -0.06446266174316406, -0.056385040283203125, -0.04830741882324219, -0.04022979736328125, -0.03215217590332031, -0.024074554443359375, -0.015996932983398438, -0.0079193115234375, 0.0001583099365234375, 0.008235931396484375, 0.016313552856445312, 0.02439117431640625, 0.03246879577636719, 0.040546417236328125, 0.04862403869628906, 0.05670166015625, 0.06477928161621094, 0.07285690307617188, 0.08093452453613281, 0.08901214599609375, 0.09708976745605469, 0.10516738891601562, 0.11324501037597656, 0.1213226318359375, 0.12940025329589844, 0.13747787475585938, 0.1455554962158203, 0.15363311767578125, 0.1617107391357422, 0.16978836059570312, 0.17786598205566406, 0.185943603515625, 0.19402122497558594, 0.20209884643554688, 0.2101764678955078, 0.21825408935546875, 0.2263317108154297, 0.23440933227539062, 0.24248695373535156, 0.2505645751953125, 0.25864219665527344, 0.2667198181152344, 0.2747974395751953, 0.28287506103515625, 0.2909526824951172, 0.2990303039550781, 0.30710792541503906, 0.315185546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 3.0, 10.0, 10.0, 14.0, 22.0, 33.0, 45.0, 49.0, 81.0, 113.0, 150.0, 125.0, 118.0, 45.0, 54.0, 37.0, 19.0, 21.0, 5.0, 15.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.6941299438476562e-05, -2.629496157169342e-05, -2.564862370491028e-05, -2.5002285838127136e-05, -2.4355947971343994e-05, -2.3709610104560852e-05, -2.306327223777771e-05, -2.2416934370994568e-05, -2.1770596504211426e-05, -2.1124258637428284e-05, -2.047792077064514e-05, -1.9831582903862e-05, -1.9185245037078857e-05, -1.8538907170295715e-05, -1.7892569303512573e-05, -1.724623143672943e-05, -1.659989356994629e-05, -1.5953555703163147e-05, -1.5307217836380005e-05, -1.4660879969596863e-05, -1.401454210281372e-05, -1.3368204236030579e-05, -1.2721866369247437e-05, -1.2075528502464294e-05, -1.1429190635681152e-05, -1.078285276889801e-05, -1.0136514902114868e-05, -9.490177035331726e-06, -8.843839168548584e-06, -8.197501301765442e-06, -7.5511634349823e-06, -6.904825568199158e-06, -6.258487701416016e-06, -5.6121498346328735e-06, -4.9658119678497314e-06, -4.319474101066589e-06, -3.6731362342834473e-06, -3.026798367500305e-06, -2.380460500717163e-06, -1.734122633934021e-06, -1.087784767150879e-06, -4.414469003677368e-07, 2.0489096641540527e-07, 8.512288331985474e-07, 1.4975666999816895e-06, 2.1439045667648315e-06, 2.7902424335479736e-06, 3.4365803003311157e-06, 4.082918167114258e-06, 4.7292560338974e-06, 5.375593900680542e-06, 6.021931767463684e-06, 6.668269634246826e-06, 7.314607501029968e-06, 7.96094536781311e-06, 8.607283234596252e-06, 9.253621101379395e-06, 9.899958968162537e-06, 1.0546296834945679e-05, 1.119263470172882e-05, 1.1838972568511963e-05, 1.2485310435295105e-05, 1.3131648302078247e-05, 1.377798616886139e-05, 1.4424324035644531e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 9.0, 13.0, 17.0, 23.0, 24.0, 69.0, 67.0, 108.0, 192.0, 309.0, 597.0, 1224.0, 3398.0, 13280.0, 102916.0, 828731.0, 80614.0, 11268.0, 3184.0, 1208.0, 520.0, 278.0, 177.0, 109.0, 72.0, 47.0, 33.0, 23.0, 18.0, 6.0, 11.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.241455078125, -0.23500823974609375, -0.2285614013671875, -0.22211456298828125, -0.215667724609375, -0.20922088623046875, -0.2027740478515625, -0.19632720947265625, -0.18988037109375, -0.18343353271484375, -0.1769866943359375, -0.17053985595703125, -0.164093017578125, -0.15764617919921875, -0.1511993408203125, -0.14475250244140625, -0.1383056640625, -0.13185882568359375, -0.1254119873046875, -0.11896514892578125, -0.112518310546875, -0.10607147216796875, -0.0996246337890625, -0.09317779541015625, -0.08673095703125, -0.08028411865234375, -0.0738372802734375, -0.06739044189453125, -0.060943603515625, -0.05449676513671875, -0.0480499267578125, -0.04160308837890625, -0.03515625, -0.02870941162109375, -0.0222625732421875, -0.01581573486328125, -0.009368896484375, -0.00292205810546875, 0.0035247802734375, 0.00997161865234375, 0.01641845703125, 0.02286529541015625, 0.0293121337890625, 0.03575897216796875, 0.042205810546875, 0.04865264892578125, 0.0550994873046875, 0.06154632568359375, 0.0679931640625, 0.07444000244140625, 0.0808868408203125, 0.08733367919921875, 0.093780517578125, 0.10022735595703125, 0.1066741943359375, 0.11312103271484375, 0.11956787109375, 0.12601470947265625, 0.1324615478515625, 0.13890838623046875, 0.145355224609375, 0.15180206298828125, 0.1582489013671875, 0.16469573974609375, 0.171142578125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 10.0, 11.0, 17.0, 23.0, 16.0, 59.0, 52.0, 100.0, 150.0, 157.0, 113.0, 102.0, 51.0, 42.0, 29.0, 23.0, 14.0, 4.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06781005859375, -0.06533336639404297, -0.06285667419433594, -0.060379981994628906, -0.057903289794921875, -0.055426597595214844, -0.05294990539550781, -0.05047321319580078, -0.04799652099609375, -0.04551982879638672, -0.04304313659667969, -0.040566444396972656, -0.038089752197265625, -0.035613059997558594, -0.03313636779785156, -0.03065967559814453, -0.0281829833984375, -0.02570629119873047, -0.023229598999023438, -0.020752906799316406, -0.018276214599609375, -0.015799522399902344, -0.013322830200195312, -0.010846138000488281, -0.00836944580078125, -0.005892753601074219, -0.0034160614013671875, -0.0009393692016601562, 0.001537322998046875, 0.004014015197753906, 0.0064907073974609375, 0.008967399597167969, 0.011444091796875, 0.013920783996582031, 0.016397476196289062, 0.018874168395996094, 0.021350860595703125, 0.023827552795410156, 0.026304244995117188, 0.02878093719482422, 0.03125762939453125, 0.03373432159423828, 0.03621101379394531, 0.038687705993652344, 0.041164398193359375, 0.043641090393066406, 0.04611778259277344, 0.04859447479248047, 0.0510711669921875, 0.05354785919189453, 0.05602455139160156, 0.058501243591308594, 0.060977935791015625, 0.06345462799072266, 0.06593132019042969, 0.06840801239013672, 0.07088470458984375, 0.07336139678955078, 0.07583808898925781, 0.07831478118896484, 0.08079147338867188, 0.0832681655883789, 0.08574485778808594, 0.08822154998779297, 0.0906982421875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 19.0, 40.0, 84.0, 125.0, 238.0, 241.0, 105.0, 54.0, 27.0, 16.0, 13.0, 7.0, 9.0, 5.0, 1.0, 1.0, 3.0], "bins": [-3.7459495067596436, -3.673616886138916, -3.6012845039367676, -3.52895188331604, -3.4566192626953125, -3.384286880493164, -3.3119542598724365, -3.239621639251709, -3.1672892570495605, -3.094956636428833, -3.0226242542266846, -2.950291633605957, -2.8779590129852295, -2.805626392364502, -2.7332940101623535, -2.660961389541626, -2.5886287689208984, -2.516296148300171, -2.4439637660980225, -2.371631145477295, -2.2992985248565674, -2.22696590423584, -2.1546335220336914, -2.082300901412964, -2.0099682807922363, -1.9376357793807983, -1.8653031587600708, -1.7929706573486328, -1.7206380367279053, -1.6483055353164673, -1.5759730339050293, -1.5036404132843018, -1.4313082695007324, -1.3589757680892944, -1.286643147468567, -1.214310646057129, -1.1419780254364014, -1.0696455240249634, -0.9973130226135254, -0.9249804615974426, -0.8526478409767151, -0.7803152799606323, -0.7079827785491943, -0.6356502175331116, -0.5633176565170288, -0.49098509550094604, -0.41865256428718567, -0.3463200330734253, -0.27398747205734253, -0.20165492594242096, -0.1293223798274994, -0.05698983371257782, 0.01534271240234375, 0.08767527341842651, 0.1600078046321869, 0.23234033584594727, 0.30467289686203003, 0.3770054578781128, 0.44933798909187317, 0.5216705203056335, 0.5940030813217163, 0.6663356423377991, 0.7386682033538818, 0.8110007047653198, 0.8833332657814026]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 9.0, 14.0, 16.0, 12.0, 14.0, 27.0, 33.0, 33.0, 28.0, 40.0, 37.0, 37.0, 45.0, 40.0, 42.0, 35.0, 46.0, 41.0, 52.0, 34.0, 45.0, 41.0, 43.0, 20.0, 41.0, 29.0, 26.0, 16.0, 23.0, 11.0, 15.0, 8.0, 8.0, 6.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3355566263198853, -1.291715383529663, -1.247874140739441, -1.2040328979492188, -1.1601916551589966, -1.1163504123687744, -1.0725090503692627, -1.0286678075790405, -0.9848265647888184, -0.9409853219985962, -0.897144079208374, -0.8533028364181519, -0.8094615340232849, -0.7656202912330627, -0.7217790484428406, -0.6779377460479736, -0.6340965628623962, -0.5902553200721741, -0.5464140772819519, -0.502572774887085, -0.4587315320968628, -0.4148902893066406, -0.37104904651641846, -0.3272077739238739, -0.28336653113365173, -0.23952527344226837, -0.195684015750885, -0.15184277296066284, -0.10800151526927948, -0.06416025757789612, -0.02031901478767395, 0.023522257804870605, 0.06736350059509277, 0.11120475828647614, 0.1550460159778595, 0.19888725876808167, 0.24272851645946503, 0.2865697741508484, 0.33041101694107056, 0.3742522895336151, 0.4180935323238373, 0.46193477511405945, 0.505776047706604, 0.5496172904968262, 0.5934585332870483, 0.6372997760772705, 0.6811410188674927, 0.7249823212623596, 0.7688235640525818, 0.812664806842804, 0.8565060496330261, 0.9003473520278931, 0.9441885948181152, 0.9880298376083374, 1.0318710803985596, 1.0757123231887817, 1.119553565979004, 1.163394808769226, 1.2072360515594482, 1.2510772943496704, 1.2949185371398926, 1.3387598991394043, 1.382601022720337, 1.4264423847198486, 1.4702836275100708]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 9.0, 10.0, 14.0, 25.0, 39.0, 64.0, 106.0, 166.0, 339.0, 646.0, 1240.0, 3008.0, 9173.0, 304686.0, 3819075.0, 46396.0, 5381.0, 1983.0, 903.0, 404.0, 259.0, 155.0, 81.0, 41.0, 24.0, 18.0, 9.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53125, -1.470733642578125, -1.41021728515625, -1.349700927734375, -1.2891845703125, -1.228668212890625, -1.16815185546875, -1.107635498046875, -1.047119140625, -0.986602783203125, -0.92608642578125, -0.865570068359375, -0.8050537109375, -0.744537353515625, -0.68402099609375, -0.623504638671875, -0.56298828125, -0.502471923828125, -0.44195556640625, -0.381439208984375, -0.3209228515625, -0.260406494140625, -0.19989013671875, -0.139373779296875, -0.078857421875, -0.018341064453125, 0.04217529296875, 0.102691650390625, 0.1632080078125, 0.223724365234375, 0.28424072265625, 0.344757080078125, 0.4052734375, 0.465789794921875, 0.52630615234375, 0.586822509765625, 0.6473388671875, 0.707855224609375, 0.76837158203125, 0.828887939453125, 0.889404296875, 0.949920654296875, 1.01043701171875, 1.070953369140625, 1.1314697265625, 1.191986083984375, 1.25250244140625, 1.313018798828125, 1.37353515625, 1.434051513671875, 1.49456787109375, 1.555084228515625, 1.6156005859375, 1.676116943359375, 1.73663330078125, 1.797149658203125, 1.857666015625, 1.918182373046875, 1.97869873046875, 2.039215087890625, 2.0997314453125, 2.160247802734375, 2.22076416015625, 2.281280517578125, 2.341796875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 8.0, 3.0, 5.0, 8.0, 20.0, 19.0, 30.0, 29.0, 35.0, 35.0, 50.0, 52.0, 53.0, 61.0, 72.0, 70.0, 52.0, 78.0, 56.0, 64.0, 35.0, 23.0, 36.0, 30.0, 17.0, 17.0, 11.0, 6.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.5660552978515625, -0.546661376953125, -0.5272674560546875, -0.50787353515625, -0.4884796142578125, -0.469085693359375, -0.4496917724609375, -0.4302978515625, -0.4109039306640625, -0.391510009765625, -0.3721160888671875, -0.35272216796875, -0.3333282470703125, -0.313934326171875, -0.2945404052734375, -0.275146484375, -0.2557525634765625, -0.236358642578125, -0.2169647216796875, -0.19757080078125, -0.1781768798828125, -0.158782958984375, -0.1393890380859375, -0.1199951171875, -0.1006011962890625, -0.081207275390625, -0.0618133544921875, -0.04241943359375, -0.0230255126953125, -0.003631591796875, 0.0157623291015625, 0.03515625, 0.0545501708984375, 0.073944091796875, 0.0933380126953125, 0.11273193359375, 0.1321258544921875, 0.151519775390625, 0.1709136962890625, 0.1903076171875, 0.2097015380859375, 0.229095458984375, 0.2484893798828125, 0.26788330078125, 0.2872772216796875, 0.306671142578125, 0.3260650634765625, 0.345458984375, 0.3648529052734375, 0.384246826171875, 0.4036407470703125, 0.42303466796875, 0.4424285888671875, 0.461822509765625, 0.4812164306640625, 0.5006103515625, 0.5200042724609375, 0.539398193359375, 0.5587921142578125, 0.57818603515625, 0.5975799560546875, 0.616973876953125, 0.6363677978515625, 0.65576171875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 12.0, 11.0, 18.0, 38.0, 35.0, 58.0, 110.0, 147.0, 243.0, 371.0, 604.0, 1046.0, 1914.0, 3423.0, 7207.0, 19611.0, 87656.0, 2487563.0, 1483216.0, 69777.0, 17077.0, 6655.0, 3228.0, 1663.0, 991.0, 596.0, 364.0, 199.0, 138.0, 96.0, 68.0, 34.0, 31.0, 20.0, 12.0, 8.0, 15.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.71044921875, -0.6888809204101562, -0.6673126220703125, -0.6457443237304688, -0.624176025390625, -0.6026077270507812, -0.5810394287109375, -0.5594711303710938, -0.53790283203125, -0.5163345336914062, -0.4947662353515625, -0.47319793701171875, -0.451629638671875, -0.43006134033203125, -0.4084930419921875, -0.38692474365234375, -0.3653564453125, -0.34378814697265625, -0.3222198486328125, -0.30065155029296875, -0.279083251953125, -0.25751495361328125, -0.2359466552734375, -0.21437835693359375, -0.19281005859375, -0.17124176025390625, -0.1496734619140625, -0.12810516357421875, -0.106536865234375, -0.08496856689453125, -0.0634002685546875, -0.04183197021484375, -0.020263671875, 0.00130462646484375, 0.0228729248046875, 0.04444122314453125, 0.066009521484375, 0.08757781982421875, 0.1091461181640625, 0.13071441650390625, 0.15228271484375, 0.17385101318359375, 0.1954193115234375, 0.21698760986328125, 0.238555908203125, 0.26012420654296875, 0.2816925048828125, 0.30326080322265625, 0.3248291015625, 0.34639739990234375, 0.3679656982421875, 0.38953399658203125, 0.411102294921875, 0.43267059326171875, 0.4542388916015625, 0.47580718994140625, 0.49737548828125, 0.5189437866210938, 0.5405120849609375, 0.5620803833007812, 0.583648681640625, 0.6052169799804688, 0.6267852783203125, 0.6483535766601562, 0.669921875]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 5.0, 9.0, 13.0, 9.0, 13.0, 28.0, 35.0, 57.0, 110.0, 197.0, 357.0, 690.0, 987.0, 694.0, 374.0, 183.0, 91.0, 67.0, 33.0, 23.0, 11.0, 12.0, 8.0, 11.0, 3.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2161865234375, -0.2088489532470703, -0.20151138305664062, -0.19417381286621094, -0.18683624267578125, -0.17949867248535156, -0.17216110229492188, -0.1648235321044922, -0.1574859619140625, -0.1501483917236328, -0.14281082153320312, -0.13547325134277344, -0.12813568115234375, -0.12079811096191406, -0.11346054077148438, -0.10612297058105469, -0.098785400390625, -0.09144783020019531, -0.08411026000976562, -0.07677268981933594, -0.06943511962890625, -0.06209754943847656, -0.054759979248046875, -0.04742240905761719, -0.0400848388671875, -0.03274726867675781, -0.025409698486328125, -0.018072128295898438, -0.01073455810546875, -0.0033969879150390625, 0.003940582275390625, 0.011278152465820312, 0.01861572265625, 0.025953292846679688, 0.033290863037109375, 0.04062843322753906, 0.04796600341796875, 0.05530357360839844, 0.06264114379882812, 0.06997871398925781, 0.0773162841796875, 0.08465385437011719, 0.09199142456054688, 0.09932899475097656, 0.10666656494140625, 0.11400413513183594, 0.12134170532226562, 0.1286792755126953, 0.136016845703125, 0.1433544158935547, 0.15069198608398438, 0.15802955627441406, 0.16536712646484375, 0.17270469665527344, 0.18004226684570312, 0.1873798370361328, 0.1947174072265625, 0.2020549774169922, 0.20939254760742188, 0.21673011779785156, 0.22406768798828125, 0.23140525817871094, 0.23874282836914062, 0.2460803985595703, 0.25341796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 8.0, 9.0, 15.0, 25.0, 30.0, 45.0, 65.0, 104.0, 115.0, 153.0, 121.0, 73.0, 61.0, 48.0, 27.0, 21.0, 11.0, 9.0, 8.0, 8.0, 7.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.006345510482788, -0.9785889387130737, -0.9508323669433594, -0.923075795173645, -0.8953192234039307, -0.8675626516342163, -0.839806079864502, -0.8120495080947876, -0.7842929363250732, -0.7565363645553589, -0.7287797927856445, -0.7010232210159302, -0.6732666492462158, -0.6455100774765015, -0.6177535057067871, -0.5899969339370728, -0.5622404217720032, -0.5344838500022888, -0.5067272782325745, -0.4789707064628601, -0.45121413469314575, -0.4234575629234314, -0.39570102095603943, -0.3679444491863251, -0.3401878774166107, -0.31243130564689636, -0.284674733877182, -0.25691819190979004, -0.2291616052389145, -0.20140503346920013, -0.17364847660064697, -0.14589190483093262, -0.11813539266586304, -0.09037882089614868, -0.06262225657701492, -0.034865692257881165, -0.007109120488166809, 0.020647451281547546, 0.04840400815010071, 0.07616057991981506, 0.10391715168952942, 0.13167372345924377, 0.15943029522895813, 0.1871868520975113, 0.21494342386722565, 0.24269999563694, 0.27045655250549316, 0.2982131242752075, 0.3259696960449219, 0.35372626781463623, 0.3814828395843506, 0.40923941135406494, 0.4369959831237793, 0.46475255489349365, 0.4925090968608856, 0.5202656984329224, 0.5480222702026367, 0.5757788419723511, 0.6035354137420654, 0.6312919855117798, 0.6590485572814941, 0.6868051290512085, 0.7145617008209229, 0.7423182725906372, 0.7700747847557068]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 9.0, 6.0, 17.0, 24.0, 26.0, 25.0, 31.0, 31.0, 41.0, 43.0, 45.0, 52.0, 45.0, 60.0, 58.0, 60.0, 62.0, 53.0, 52.0, 44.0, 39.0, 33.0, 25.0, 26.0, 23.0, 14.0, 21.0, 11.0, 11.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5457655191421509, -0.5264434814453125, -0.5071214437484741, -0.48779940605163574, -0.46847739815711975, -0.44915536046028137, -0.429833322763443, -0.410511314868927, -0.3911892771720886, -0.37186723947525024, -0.35254520177841187, -0.3332231640815735, -0.3139011561870575, -0.2945791184902191, -0.27525708079338074, -0.25593507289886475, -0.23661300539970398, -0.2172909677028656, -0.19796894490718842, -0.17864690721035004, -0.15932488441467285, -0.14000284671783447, -0.1206808090209961, -0.10135878622531891, -0.08203674852848053, -0.06271471828222275, -0.04339268431067467, -0.024070650339126587, -0.004748620092868805, 0.014573410153388977, 0.033895447850227356, 0.05321747064590454, 0.07253950834274292, 0.0918615385890007, 0.11118356883525848, 0.13050560653209686, 0.14982762932777405, 0.16914966702461243, 0.1884717047214508, 0.207793727517128, 0.22711576521396637, 0.24643780291080475, 0.26575982570648193, 0.2850818634033203, 0.3044039011001587, 0.32372593879699707, 0.34304797649383545, 0.36236998438835144, 0.3816920220851898, 0.4010140597820282, 0.4203360974788666, 0.43965810537338257, 0.45898014307022095, 0.4783021807670593, 0.4976242184638977, 0.5169462561607361, 0.5362682938575745, 0.5555903315544128, 0.5749123692512512, 0.5942344069480896, 0.613556444644928, 0.6328784227371216, 0.65220046043396, 0.6715224981307983, 0.6908445358276367]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 6.0, 7.0, 12.0, 9.0, 19.0, 27.0, 32.0, 43.0, 58.0, 67.0, 116.0, 170.0, 254.0, 452.0, 746.0, 1424.0, 2700.0, 5500.0, 11426.0, 26122.0, 66329.0, 197824.0, 419762.0, 198922.0, 66516.0, 26680.0, 11607.0, 5531.0, 2711.0, 1411.0, 781.0, 432.0, 287.0, 176.0, 103.0, 89.0, 50.0, 40.0, 31.0, 20.0, 13.0, 11.0, 5.0, 5.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0755615234375, -0.07316303253173828, -0.07076454162597656, -0.06836605072021484, -0.06596755981445312, -0.0635690689086914, -0.06117057800292969, -0.05877208709716797, -0.05637359619140625, -0.05397510528564453, -0.05157661437988281, -0.049178123474121094, -0.046779632568359375, -0.044381141662597656, -0.04198265075683594, -0.03958415985107422, -0.0371856689453125, -0.03478717803955078, -0.03238868713378906, -0.029990196228027344, -0.027591705322265625, -0.025193214416503906, -0.022794723510742188, -0.02039623260498047, -0.01799774169921875, -0.015599250793457031, -0.013200759887695312, -0.010802268981933594, -0.008403778076171875, -0.006005287170410156, -0.0036067962646484375, -0.0012083053588867188, 0.001190185546875, 0.0035886764526367188, 0.0059871673583984375, 0.008385658264160156, 0.010784149169921875, 0.013182640075683594, 0.015581130981445312, 0.01797962188720703, 0.02037811279296875, 0.02277660369873047, 0.025175094604492188, 0.027573585510253906, 0.029972076416015625, 0.032370567321777344, 0.03476905822753906, 0.03716754913330078, 0.0395660400390625, 0.04196453094482422, 0.04436302185058594, 0.046761512756347656, 0.049160003662109375, 0.051558494567871094, 0.05395698547363281, 0.05635547637939453, 0.05875396728515625, 0.06115245819091797, 0.06355094909667969, 0.0659494400024414, 0.06834793090820312, 0.07074642181396484, 0.07314491271972656, 0.07554340362548828, 0.07794189453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 12.0, 15.0, 32.0, 28.0, 35.0, 51.0, 54.0, 65.0, 77.0, 93.0, 89.0, 92.0, 70.0, 64.0, 47.0, 35.0, 42.0, 21.0, 25.0, 16.0, 13.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42236328125, -0.4050445556640625, -0.387725830078125, -0.3704071044921875, -0.35308837890625, -0.3357696533203125, -0.318450927734375, -0.3011322021484375, -0.2838134765625, -0.2664947509765625, -0.249176025390625, -0.2318572998046875, -0.21453857421875, -0.1972198486328125, -0.179901123046875, -0.1625823974609375, -0.145263671875, -0.1279449462890625, -0.110626220703125, -0.0933074951171875, -0.07598876953125, -0.0586700439453125, -0.041351318359375, -0.0240325927734375, -0.0067138671875, 0.0106048583984375, 0.027923583984375, 0.0452423095703125, 0.06256103515625, 0.0798797607421875, 0.097198486328125, 0.1145172119140625, 0.1318359375, 0.1491546630859375, 0.166473388671875, 0.1837921142578125, 0.20111083984375, 0.2184295654296875, 0.235748291015625, 0.2530670166015625, 0.2703857421875, 0.2877044677734375, 0.305023193359375, 0.3223419189453125, 0.33966064453125, 0.3569793701171875, 0.374298095703125, 0.3916168212890625, 0.408935546875, 0.4262542724609375, 0.443572998046875, 0.4608917236328125, 0.47821044921875, 0.4955291748046875, 0.512847900390625, 0.5301666259765625, 0.5474853515625, 0.5648040771484375, 0.582122802734375, 0.5994415283203125, 0.61676025390625, 0.6340789794921875, 0.651397705078125, 0.6687164306640625, 0.68603515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 7.0, 19.0, 13.0, 18.0, 33.0, 46.0, 46.0, 105.0, 153.0, 248.0, 349.0, 634.0, 1089.0, 1856.0, 3389.0, 6196.0, 12906.0, 27814.0, 65877.0, 168063.0, 344421.0, 241246.0, 96810.0, 39893.0, 18068.0, 8680.0, 4504.0, 2505.0, 1403.0, 787.0, 493.0, 295.0, 178.0, 140.0, 77.0, 50.0, 47.0, 29.0, 26.0, 11.0, 10.0, 5.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055755615234375, -0.0538783073425293, -0.052000999450683594, -0.05012369155883789, -0.04824638366699219, -0.046369075775146484, -0.04449176788330078, -0.04261445999145508, -0.040737152099609375, -0.03885984420776367, -0.03698253631591797, -0.035105228424072266, -0.03322792053222656, -0.03135061264038086, -0.029473304748535156, -0.027595996856689453, -0.02571868896484375, -0.023841381072998047, -0.021964073181152344, -0.02008676528930664, -0.018209457397460938, -0.016332149505615234, -0.014454841613769531, -0.012577533721923828, -0.010700225830078125, -0.008822917938232422, -0.006945610046386719, -0.005068302154541016, -0.0031909942626953125, -0.0013136863708496094, 0.0005636215209960938, 0.002440929412841797, 0.0043182373046875, 0.006195545196533203, 0.008072853088378906, 0.00995016098022461, 0.011827468872070312, 0.013704776763916016, 0.015582084655761719, 0.017459392547607422, 0.019336700439453125, 0.021214008331298828, 0.02309131622314453, 0.024968624114990234, 0.026845932006835938, 0.02872323989868164, 0.030600547790527344, 0.03247785568237305, 0.03435516357421875, 0.03623247146606445, 0.038109779357910156, 0.03998708724975586, 0.04186439514160156, 0.043741703033447266, 0.04561901092529297, 0.04749631881713867, 0.049373626708984375, 0.05125093460083008, 0.05312824249267578, 0.055005550384521484, 0.05688285827636719, 0.05876016616821289, 0.060637474060058594, 0.0625147819519043, 0.06439208984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 5.0, 8.0, 11.0, 7.0, 11.0, 11.0, 9.0, 16.0, 17.0, 23.0, 31.0, 20.0, 30.0, 48.0, 38.0, 41.0, 46.0, 56.0, 43.0, 42.0, 47.0, 41.0, 44.0, 41.0, 36.0, 34.0, 29.0, 22.0, 22.0, 22.0, 24.0, 24.0, 14.0, 8.0, 14.0, 12.0, 9.0, 6.0, 11.0, 3.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.57763671875, -0.5601806640625, -0.542724609375, -0.5252685546875, -0.5078125, -0.4903564453125, -0.472900390625, -0.4554443359375, -0.43798828125, -0.4205322265625, -0.403076171875, -0.3856201171875, -0.3681640625, -0.3507080078125, -0.333251953125, -0.3157958984375, -0.29833984375, -0.2808837890625, -0.263427734375, -0.2459716796875, -0.228515625, -0.2110595703125, -0.193603515625, -0.1761474609375, -0.15869140625, -0.1412353515625, -0.123779296875, -0.1063232421875, -0.0888671875, -0.0714111328125, -0.053955078125, -0.0364990234375, -0.01904296875, -0.0015869140625, 0.015869140625, 0.0333251953125, 0.05078125, 0.0682373046875, 0.085693359375, 0.1031494140625, 0.12060546875, 0.1380615234375, 0.155517578125, 0.1729736328125, 0.1904296875, 0.2078857421875, 0.225341796875, 0.2427978515625, 0.26025390625, 0.2777099609375, 0.295166015625, 0.3126220703125, 0.330078125, 0.3475341796875, 0.364990234375, 0.3824462890625, 0.39990234375, 0.4173583984375, 0.434814453125, 0.4522705078125, 0.4697265625, 0.4871826171875, 0.504638671875, 0.5220947265625, 0.53955078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 2.0, 14.0, 19.0, 28.0, 38.0, 55.0, 124.0, 229.0, 448.0, 850.0, 2068.0, 5245.0, 16776.0, 72480.0, 459626.0, 403635.0, 63116.0, 15177.0, 4865.0, 1988.0, 886.0, 423.0, 181.0, 105.0, 73.0, 43.0, 18.0, 13.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0443115234375, -0.04314422607421875, -0.0419769287109375, -0.04080963134765625, -0.039642333984375, -0.03847503662109375, -0.0373077392578125, -0.03614044189453125, -0.03497314453125, -0.03380584716796875, -0.0326385498046875, -0.03147125244140625, -0.030303955078125, -0.02913665771484375, -0.0279693603515625, -0.02680206298828125, -0.025634765625, -0.02446746826171875, -0.0233001708984375, -0.02213287353515625, -0.020965576171875, -0.01979827880859375, -0.0186309814453125, -0.01746368408203125, -0.01629638671875, -0.01512908935546875, -0.0139617919921875, -0.01279449462890625, -0.011627197265625, -0.01045989990234375, -0.0092926025390625, -0.00812530517578125, -0.0069580078125, -0.00579071044921875, -0.0046234130859375, -0.00345611572265625, -0.002288818359375, -0.00112152099609375, 4.57763671875e-05, 0.00121307373046875, 0.00238037109375, 0.00354766845703125, 0.0047149658203125, 0.00588226318359375, 0.007049560546875, 0.00821685791015625, 0.0093841552734375, 0.01055145263671875, 0.01171875, 0.01288604736328125, 0.0140533447265625, 0.01522064208984375, 0.016387939453125, 0.01755523681640625, 0.0187225341796875, 0.01988983154296875, 0.02105712890625, 0.02222442626953125, 0.0233917236328125, 0.02455902099609375, 0.025726318359375, 0.02689361572265625, 0.0280609130859375, 0.02922821044921875, 0.0303955078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 8.0, 10.0, 20.0, 20.0, 20.0, 41.0, 55.0, 96.0, 104.0, 129.0, 148.0, 92.0, 78.0, 50.0, 32.0, 26.0, 17.0, 14.0, 6.0, 6.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7583370208740234e-05, -1.690257340669632e-05, -1.6221776604652405e-05, -1.554097980260849e-05, -1.4860183000564575e-05, -1.417938619852066e-05, -1.3498589396476746e-05, -1.281779259443283e-05, -1.2136995792388916e-05, -1.1456198990345001e-05, -1.0775402188301086e-05, -1.0094605386257172e-05, -9.413808584213257e-06, -8.733011782169342e-06, -8.052214980125427e-06, -7.3714181780815125e-06, -6.690621376037598e-06, -6.009824573993683e-06, -5.329027771949768e-06, -4.648230969905853e-06, -3.9674341678619385e-06, -3.2866373658180237e-06, -2.605840563774109e-06, -1.925043761730194e-06, -1.2442469596862793e-06, -5.634501576423645e-07, 1.1734664440155029e-07, 7.981434464454651e-07, 1.4789402484893799e-06, 2.1597370505332947e-06, 2.8405338525772095e-06, 3.5213306546211243e-06, 4.202127456665039e-06, 4.882924258708954e-06, 5.563721060752869e-06, 6.2445178627967834e-06, 6.925314664840698e-06, 7.606111466884613e-06, 8.286908268928528e-06, 8.967705070972443e-06, 9.648501873016357e-06, 1.0329298675060272e-05, 1.1010095477104187e-05, 1.1690892279148102e-05, 1.2371689081192017e-05, 1.3052485883235931e-05, 1.3733282685279846e-05, 1.4414079487323761e-05, 1.5094876289367676e-05, 1.577567309141159e-05, 1.6456469893455505e-05, 1.713726669549942e-05, 1.7818063497543335e-05, 1.849886029958725e-05, 1.9179657101631165e-05, 1.986045390367508e-05, 2.0541250705718994e-05, 2.122204750776291e-05, 2.1902844309806824e-05, 2.258364111185074e-05, 2.3264437913894653e-05, 2.3945234715938568e-05, 2.4626031517982483e-05, 2.5306828320026398e-05, 2.5987625122070312e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 6.0, 5.0, 10.0, 17.0, 16.0, 30.0, 37.0, 55.0, 88.0, 119.0, 221.0, 332.0, 605.0, 1058.0, 1968.0, 3654.0, 7472.0, 16687.0, 41348.0, 112174.0, 319239.0, 341410.0, 123158.0, 44183.0, 17858.0, 8037.0, 3926.0, 2087.0, 1114.0, 647.0, 401.0, 223.0, 119.0, 76.0, 53.0, 43.0, 19.0, 22.0, 11.0, 10.0, 6.0, 4.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0227508544921875, -0.022062301635742188, -0.021373748779296875, -0.020685195922851562, -0.01999664306640625, -0.019308090209960938, -0.018619537353515625, -0.017930984497070312, -0.017242431640625, -0.016553878784179688, -0.015865325927734375, -0.015176773071289062, -0.01448822021484375, -0.013799667358398438, -0.013111114501953125, -0.012422561645507812, -0.0117340087890625, -0.011045455932617188, -0.010356903076171875, -0.009668350219726562, -0.00897979736328125, -0.008291244506835938, -0.007602691650390625, -0.0069141387939453125, -0.0062255859375, -0.0055370330810546875, -0.004848480224609375, -0.0041599273681640625, -0.00347137451171875, -0.0027828216552734375, -0.002094268798828125, -0.0014057159423828125, -0.0007171630859375, -2.86102294921875e-05, 0.000659942626953125, 0.0013484954833984375, 0.00203704833984375, 0.0027256011962890625, 0.003414154052734375, 0.0041027069091796875, 0.004791259765625, 0.0054798126220703125, 0.006168365478515625, 0.0068569183349609375, 0.00754547119140625, 0.008234024047851562, 0.008922576904296875, 0.009611129760742188, 0.0102996826171875, 0.010988235473632812, 0.011676788330078125, 0.012365341186523438, 0.01305389404296875, 0.013742446899414062, 0.014430999755859375, 0.015119552612304688, 0.01580810546875, 0.016496658325195312, 0.017185211181640625, 0.017873764038085938, 0.01856231689453125, 0.019250869750976562, 0.019939422607421875, 0.020627975463867188, 0.0213165283203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 7.0, 8.0, 15.0, 6.0, 16.0, 21.0, 21.0, 28.0, 43.0, 46.0, 50.0, 53.0, 56.0, 85.0, 65.0, 60.0, 66.0, 70.0, 55.0, 48.0, 32.0, 30.0, 20.0, 24.0, 18.0, 17.0, 11.0, 4.0, 7.0, 2.0, 3.0, 7.0, 0.0, 5.0, 1.0, 1.0], "bins": [-0.010040283203125, -0.009804010391235352, -0.009567737579345703, -0.009331464767456055, -0.009095191955566406, -0.008858919143676758, -0.00862264633178711, -0.008386373519897461, -0.008150100708007812, -0.007913827896118164, -0.007677555084228516, -0.007441282272338867, -0.007205009460449219, -0.00696873664855957, -0.006732463836669922, -0.0064961910247802734, -0.006259918212890625, -0.0060236454010009766, -0.005787372589111328, -0.00555109977722168, -0.005314826965332031, -0.005078554153442383, -0.004842281341552734, -0.004606008529663086, -0.0043697357177734375, -0.004133462905883789, -0.0038971900939941406, -0.003660917282104492, -0.0034246444702148438, -0.0031883716583251953, -0.002952098846435547, -0.0027158260345458984, -0.00247955322265625, -0.0022432804107666016, -0.002007007598876953, -0.0017707347869873047, -0.0015344619750976562, -0.0012981891632080078, -0.0010619163513183594, -0.0008256435394287109, -0.0005893707275390625, -0.00035309791564941406, -0.00011682510375976562, 0.00011944770812988281, 0.00035572052001953125, 0.0005919933319091797, 0.0008282661437988281, 0.0010645389556884766, 0.001300811767578125, 0.0015370845794677734, 0.0017733573913574219, 0.0020096302032470703, 0.0022459030151367188, 0.002482175827026367, 0.0027184486389160156, 0.002954721450805664, 0.0031909942626953125, 0.003427267074584961, 0.0036635398864746094, 0.003899812698364258, 0.004136085510253906, 0.004372358322143555, 0.004608631134033203, 0.0048449039459228516, 0.0050811767578125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 12.0, 15.0, 43.0, 98.0, 275.0, 335.0, 137.0, 35.0, 23.0, 11.0, 13.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-2.4358296394348145, -2.389970541000366, -2.344111204147339, -2.2982521057128906, -2.2523930072784424, -2.206533670425415, -2.160674571990967, -2.1148154735565186, -2.0689563751220703, -2.023097276687622, -1.9772380590438843, -1.9313788414001465, -1.8855197429656982, -1.8396605253219604, -1.7938013076782227, -1.7479422092437744, -1.702082872390747, -1.6562236547470093, -1.610364556312561, -1.5645053386688232, -1.518646240234375, -1.4727870225906372, -1.4269278049468994, -1.3810687065124512, -1.3352094888687134, -1.2893502712249756, -1.2434911727905273, -1.1976319551467896, -1.1517727375030518, -1.1059136390686035, -1.0600544214248657, -1.014195203781128, -0.9683359861373901, -0.9224768280982971, -0.8766176700592041, -0.8307584524154663, -0.7848992943763733, -0.7390401363372803, -0.6931809186935425, -0.6473217606544495, -0.6014626026153564, -0.5556034445762634, -0.5097442865371704, -0.4638850688934326, -0.4180259108543396, -0.3721667528152466, -0.3263075649738312, -0.28044837713241577, -0.23458921909332275, -0.18873004615306854, -0.14287087321281433, -0.09701170027256012, -0.05115252733230591, -0.005293354392051697, 0.040565818548202515, 0.08642500638961792, 0.13228416442871094, 0.17814333736896515, 0.22400251030921936, 0.26986169815063477, 0.3157208561897278, 0.3615800142288208, 0.4074392020702362, 0.4532983899116516, 0.49915754795074463]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 14.0, 23.0, 23.0, 21.0, 37.0, 40.0, 37.0, 52.0, 52.0, 64.0, 66.0, 68.0, 69.0, 72.0, 57.0, 62.0, 42.0, 38.0, 36.0, 27.0, 17.0, 20.0, 16.0, 13.0, 6.0, 3.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3846094310283661, -0.37079745531082153, -0.35698550939559937, -0.3431735336780548, -0.32936158776283264, -0.3155496120452881, -0.3017376661300659, -0.28792569041252136, -0.2741137146949768, -0.26030173897743225, -0.24648979306221008, -0.23267781734466553, -0.21886587142944336, -0.2050538957118988, -0.19124193489551544, -0.17742997407913208, -0.1636180281639099, -0.14980606734752655, -0.1359941065311432, -0.12218213826417923, -0.10837017744779587, -0.0945582166314125, -0.08074624836444855, -0.06693428754806519, -0.053122326731681824, -0.03931036591529846, -0.0254984013736248, -0.011686436831951141, 0.0021255239844322205, 0.015937484800815582, 0.02974945306777954, 0.0435614138841629, 0.057373374700546265, 0.07118533551692963, 0.08499729633331299, 0.09880926460027695, 0.11262122541666031, 0.12643319368362427, 0.14024515450000763, 0.154057115316391, 0.16786907613277435, 0.18168103694915771, 0.19549299776554108, 0.20930495858192444, 0.223116934299469, 0.23692888021469116, 0.2507408559322357, 0.2645528316497803, 0.27836477756500244, 0.292176753282547, 0.30598869919776917, 0.3198006749153137, 0.3336126208305359, 0.34742459654808044, 0.361236572265625, 0.37504851818084717, 0.38886046409606934, 0.4026724398136139, 0.41648438572883606, 0.4302963614463806, 0.4441083073616028, 0.45792028307914734, 0.4717322587966919, 0.48554420471191406, 0.4993561804294586]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 7.0, 19.0, 23.0, 35.0, 48.0, 75.0, 126.0, 241.0, 375.0, 723.0, 1237.0, 2643.0, 6032.0, 16155.0, 59343.0, 378934.0, 477513.0, 73438.0, 18814.0, 6755.0, 2816.0, 1381.0, 715.0, 434.0, 236.0, 156.0, 89.0, 64.0, 26.0, 29.0, 18.0, 12.0, 12.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2734375, -0.26369476318359375, -0.2539520263671875, -0.24420928955078125, -0.234466552734375, -0.22472381591796875, -0.2149810791015625, -0.20523834228515625, -0.19549560546875, -0.18575286865234375, -0.1760101318359375, -0.16626739501953125, -0.156524658203125, -0.14678192138671875, -0.1370391845703125, -0.12729644775390625, -0.1175537109375, -0.10781097412109375, -0.0980682373046875, -0.08832550048828125, -0.078582763671875, -0.06884002685546875, -0.0590972900390625, -0.04935455322265625, -0.03961181640625, -0.02986907958984375, -0.0201263427734375, -0.01038360595703125, -0.000640869140625, 0.00910186767578125, 0.0188446044921875, 0.02858734130859375, 0.038330078125, 0.04807281494140625, 0.0578155517578125, 0.06755828857421875, 0.077301025390625, 0.08704376220703125, 0.0967864990234375, 0.10652923583984375, 0.11627197265625, 0.12601470947265625, 0.1357574462890625, 0.14550018310546875, 0.155242919921875, 0.16498565673828125, 0.1747283935546875, 0.18447113037109375, 0.1942138671875, 0.20395660400390625, 0.2136993408203125, 0.22344207763671875, 0.233184814453125, 0.24292755126953125, 0.2526702880859375, 0.26241302490234375, 0.27215576171875, 0.28189849853515625, 0.2916412353515625, 0.30138397216796875, 0.311126708984375, 0.32086944580078125, 0.3306121826171875, 0.34035491943359375, 0.35009765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 1.0, 5.0, 14.0, 15.0, 28.0, 21.0, 25.0, 41.0, 44.0, 42.0, 63.0, 74.0, 72.0, 67.0, 70.0, 84.0, 55.0, 61.0, 46.0, 38.0, 26.0, 19.0, 24.0, 16.0, 15.0, 9.0, 8.0, 2.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8662109375, -0.836090087890625, -0.80596923828125, -0.775848388671875, -0.7457275390625, -0.715606689453125, -0.68548583984375, -0.655364990234375, -0.625244140625, -0.595123291015625, -0.56500244140625, -0.534881591796875, -0.5047607421875, -0.474639892578125, -0.44451904296875, -0.414398193359375, -0.38427734375, -0.354156494140625, -0.32403564453125, -0.293914794921875, -0.2637939453125, -0.233673095703125, -0.20355224609375, -0.173431396484375, -0.143310546875, -0.113189697265625, -0.08306884765625, -0.052947998046875, -0.0228271484375, 0.007293701171875, 0.03741455078125, 0.067535400390625, 0.09765625, 0.127777099609375, 0.15789794921875, 0.188018798828125, 0.2181396484375, 0.248260498046875, 0.27838134765625, 0.308502197265625, 0.338623046875, 0.368743896484375, 0.39886474609375, 0.428985595703125, 0.4591064453125, 0.489227294921875, 0.51934814453125, 0.549468994140625, 0.57958984375, 0.609710693359375, 0.63983154296875, 0.669952392578125, 0.7000732421875, 0.730194091796875, 0.76031494140625, 0.790435791015625, 0.820556640625, 0.850677490234375, 0.88079833984375, 0.910919189453125, 0.9410400390625, 0.971160888671875, 1.00128173828125, 1.031402587890625, 1.0615234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 16.0, 20.0, 18.0, 30.0, 36.0, 65.0, 105.0, 159.0, 249.0, 562.0, 2199.0, 17864.0, 678809.0, 334272.0, 11391.0, 1598.0, 513.0, 228.0, 123.0, 82.0, 68.0, 41.0, 30.0, 19.0, 8.0, 8.0, 5.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.673828125, -0.6545257568359375, -0.635223388671875, -0.6159210205078125, -0.59661865234375, -0.5773162841796875, -0.558013916015625, -0.5387115478515625, -0.5194091796875, -0.5001068115234375, -0.480804443359375, -0.4615020751953125, -0.44219970703125, -0.4228973388671875, -0.403594970703125, -0.3842926025390625, -0.364990234375, -0.3456878662109375, -0.326385498046875, -0.3070831298828125, -0.28778076171875, -0.2684783935546875, -0.249176025390625, -0.2298736572265625, -0.2105712890625, -0.1912689208984375, -0.171966552734375, -0.1526641845703125, -0.13336181640625, -0.1140594482421875, -0.094757080078125, -0.0754547119140625, -0.05615234375, -0.0368499755859375, -0.017547607421875, 0.0017547607421875, 0.02105712890625, 0.0403594970703125, 0.059661865234375, 0.0789642333984375, 0.0982666015625, 0.1175689697265625, 0.136871337890625, 0.1561737060546875, 0.17547607421875, 0.1947784423828125, 0.214080810546875, 0.2333831787109375, 0.252685546875, 0.2719879150390625, 0.291290283203125, 0.3105926513671875, 0.32989501953125, 0.3491973876953125, 0.368499755859375, 0.3878021240234375, 0.4071044921875, 0.4264068603515625, 0.445709228515625, 0.4650115966796875, 0.48431396484375, 0.5036163330078125, 0.522918701171875, 0.5422210693359375, 0.5615234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 5.0, 7.0, 8.0, 8.0, 12.0, 20.0, 19.0, 20.0, 26.0, 29.0, 26.0, 29.0, 44.0, 40.0, 48.0, 38.0, 33.0, 44.0, 40.0, 60.0, 48.0, 52.0, 54.0, 35.0, 47.0, 25.0, 23.0, 16.0, 24.0, 15.0, 14.0, 16.0, 14.0, 7.0, 10.0, 5.0, 6.0, 10.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.67431640625, -0.6527099609375, -0.631103515625, -0.6094970703125, -0.587890625, -0.5662841796875, -0.544677734375, -0.5230712890625, -0.50146484375, -0.4798583984375, -0.458251953125, -0.4366455078125, -0.4150390625, -0.3934326171875, -0.371826171875, -0.3502197265625, -0.32861328125, -0.3070068359375, -0.285400390625, -0.2637939453125, -0.2421875, -0.2205810546875, -0.198974609375, -0.1773681640625, -0.15576171875, -0.1341552734375, -0.112548828125, -0.0909423828125, -0.0693359375, -0.0477294921875, -0.026123046875, -0.0045166015625, 0.01708984375, 0.0386962890625, 0.060302734375, 0.0819091796875, 0.103515625, 0.1251220703125, 0.146728515625, 0.1683349609375, 0.18994140625, 0.2115478515625, 0.233154296875, 0.2547607421875, 0.2763671875, 0.2979736328125, 0.319580078125, 0.3411865234375, 0.36279296875, 0.3843994140625, 0.406005859375, 0.4276123046875, 0.44921875, 0.4708251953125, 0.492431640625, 0.5140380859375, 0.53564453125, 0.5572509765625, 0.578857421875, 0.6004638671875, 0.6220703125, 0.6436767578125, 0.665283203125, 0.6868896484375, 0.70849609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 10.0, 10.0, 16.0, 15.0, 26.0, 37.0, 82.0, 125.0, 251.0, 756.0, 2417.0, 12286.0, 192757.0, 803654.0, 29661.0, 4487.0, 1175.0, 403.0, 158.0, 95.0, 35.0, 23.0, 21.0, 10.0, 6.0, 10.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.239501953125, -0.2318267822265625, -0.224151611328125, -0.2164764404296875, -0.20880126953125, -0.2011260986328125, -0.193450927734375, -0.1857757568359375, -0.1781005859375, -0.1704254150390625, -0.162750244140625, -0.1550750732421875, -0.14739990234375, -0.1397247314453125, -0.132049560546875, -0.1243743896484375, -0.11669921875, -0.1090240478515625, -0.101348876953125, -0.0936737060546875, -0.08599853515625, -0.0783233642578125, -0.070648193359375, -0.0629730224609375, -0.0552978515625, -0.0476226806640625, -0.039947509765625, -0.0322723388671875, -0.02459716796875, -0.0169219970703125, -0.009246826171875, -0.0015716552734375, 0.006103515625, 0.0137786865234375, 0.021453857421875, 0.0291290283203125, 0.03680419921875, 0.0444793701171875, 0.052154541015625, 0.0598297119140625, 0.0675048828125, 0.0751800537109375, 0.082855224609375, 0.0905303955078125, 0.09820556640625, 0.1058807373046875, 0.113555908203125, 0.1212310791015625, 0.12890625, 0.1365814208984375, 0.144256591796875, 0.1519317626953125, 0.15960693359375, 0.1672821044921875, 0.174957275390625, 0.1826324462890625, 0.1903076171875, 0.1979827880859375, 0.205657958984375, 0.2133331298828125, 0.22100830078125, 0.2286834716796875, 0.236358642578125, 0.2440338134765625, 0.251708984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 7.0, 18.0, 14.0, 29.0, 25.0, 40.0, 67.0, 89.0, 129.0, 136.0, 120.0, 96.0, 55.0, 43.0, 27.0, 17.0, 20.0, 12.0, 8.0, 8.0, 6.0, 7.0, 2.0, 7.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.2351741790771484e-05, -2.1683983504772186e-05, -2.1016225218772888e-05, -2.034846693277359e-05, -1.9680708646774292e-05, -1.9012950360774994e-05, -1.8345192074775696e-05, -1.7677433788776398e-05, -1.70096755027771e-05, -1.63419172167778e-05, -1.5674158930778503e-05, -1.5006400644779205e-05, -1.4338642358779907e-05, -1.3670884072780609e-05, -1.3003125786781311e-05, -1.2335367500782013e-05, -1.1667609214782715e-05, -1.0999850928783417e-05, -1.0332092642784119e-05, -9.66433435678482e-06, -8.996576070785522e-06, -8.328817784786224e-06, -7.661059498786926e-06, -6.993301212787628e-06, -6.32554292678833e-06, -5.657784640789032e-06, -4.990026354789734e-06, -4.322268068790436e-06, -3.6545097827911377e-06, -2.9867514967918396e-06, -2.3189932107925415e-06, -1.6512349247932434e-06, -9.834766387939453e-07, -3.157183527946472e-07, 3.520399332046509e-07, 1.019798219203949e-06, 1.687556505203247e-06, 2.355314791202545e-06, 3.0230730772018433e-06, 3.6908313632011414e-06, 4.3585896492004395e-06, 5.0263479351997375e-06, 5.694106221199036e-06, 6.361864507198334e-06, 7.029622793197632e-06, 7.69738107919693e-06, 8.365139365196228e-06, 9.032897651195526e-06, 9.700655937194824e-06, 1.0368414223194122e-05, 1.103617250919342e-05, 1.1703930795192719e-05, 1.2371689081192017e-05, 1.3039447367191315e-05, 1.3707205653190613e-05, 1.4374963939189911e-05, 1.5042722225189209e-05, 1.5710480511188507e-05, 1.6378238797187805e-05, 1.7045997083187103e-05, 1.77137553691864e-05, 1.83815136551857e-05, 1.9049271941184998e-05, 1.9717030227184296e-05, 2.0384788513183594e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 10.0, 5.0, 11.0, 17.0, 23.0, 32.0, 50.0, 48.0, 99.0, 144.0, 201.0, 336.0, 601.0, 1318.0, 3053.0, 9340.0, 50008.0, 719223.0, 230976.0, 23065.0, 5612.0, 2136.0, 944.0, 521.0, 262.0, 166.0, 108.0, 84.0, 54.0, 34.0, 29.0, 13.0, 11.0, 8.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.238037109375, -0.2319011688232422, -0.22576522827148438, -0.21962928771972656, -0.21349334716796875, -0.20735740661621094, -0.20122146606445312, -0.1950855255126953, -0.1889495849609375, -0.1828136444091797, -0.17667770385742188, -0.17054176330566406, -0.16440582275390625, -0.15826988220214844, -0.15213394165039062, -0.1459980010986328, -0.139862060546875, -0.1337261199951172, -0.12759017944335938, -0.12145423889160156, -0.11531829833984375, -0.10918235778808594, -0.10304641723632812, -0.09691047668457031, -0.0907745361328125, -0.08463859558105469, -0.07850265502929688, -0.07236671447753906, -0.06623077392578125, -0.06009483337402344, -0.053958892822265625, -0.04782295227050781, -0.04168701171875, -0.03555107116699219, -0.029415130615234375, -0.023279190063476562, -0.01714324951171875, -0.011007308959960938, -0.004871368408203125, 0.0012645721435546875, 0.0074005126953125, 0.013536453247070312, 0.019672393798828125, 0.025808334350585938, 0.03194427490234375, 0.03808021545410156, 0.044216156005859375, 0.05035209655761719, 0.056488037109375, 0.06262397766113281, 0.06875991821289062, 0.07489585876464844, 0.08103179931640625, 0.08716773986816406, 0.09330368041992188, 0.09943962097167969, 0.1055755615234375, 0.11171150207519531, 0.11784744262695312, 0.12398338317871094, 0.13011932373046875, 0.13625526428222656, 0.14239120483398438, 0.1485271453857422, 0.1546630859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 11.0, 11.0, 20.0, 23.0, 29.0, 39.0, 65.0, 118.0, 154.0, 142.0, 121.0, 78.0, 54.0, 37.0, 25.0, 18.0, 8.0, 7.0, 5.0, 11.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05908203125, -0.05674266815185547, -0.05440330505371094, -0.052063941955566406, -0.049724578857421875, -0.047385215759277344, -0.04504585266113281, -0.04270648956298828, -0.04036712646484375, -0.03802776336669922, -0.03568840026855469, -0.033349037170410156, -0.031009674072265625, -0.028670310974121094, -0.026330947875976562, -0.02399158477783203, -0.0216522216796875, -0.01931285858154297, -0.016973495483398438, -0.014634132385253906, -0.012294769287109375, -0.009955406188964844, -0.0076160430908203125, -0.005276679992675781, -0.00293731689453125, -0.0005979537963867188, 0.0017414093017578125, 0.004080772399902344, 0.006420135498046875, 0.008759498596191406, 0.011098861694335938, 0.013438224792480469, 0.015777587890625, 0.01811695098876953, 0.020456314086914062, 0.022795677185058594, 0.025135040283203125, 0.027474403381347656, 0.029813766479492188, 0.03215312957763672, 0.03449249267578125, 0.03683185577392578, 0.03917121887207031, 0.041510581970214844, 0.043849945068359375, 0.046189308166503906, 0.04852867126464844, 0.05086803436279297, 0.0532073974609375, 0.05554676055908203, 0.05788612365722656, 0.060225486755371094, 0.06256484985351562, 0.06490421295166016, 0.06724357604980469, 0.06958293914794922, 0.07192230224609375, 0.07426166534423828, 0.07660102844238281, 0.07894039154052734, 0.08127975463867188, 0.0836191177368164, 0.08595848083496094, 0.08829784393310547, 0.09063720703125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 14.0, 22.0, 66.0, 169.0, 350.0, 210.0, 88.0, 35.0, 16.0, 10.0, 10.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1026254892349243, -1.0155296325683594, -0.9284337162971497, -0.8413378000259399, -0.754241943359375, -0.6671460866928101, -0.5800501704216003, -0.4929542541503906, -0.4058583974838257, -0.31876251101493835, -0.23166662454605103, -0.1445707380771637, -0.05747485160827637, 0.029621034860610962, 0.11671692132949829, 0.203812837600708, 0.29090869426727295, 0.3780045807361603, 0.4651004672050476, 0.5521963834762573, 0.6392922401428223, 0.7263880968093872, 0.8134840130805969, 0.9005799293518066, 0.9876757860183716, 1.0747716426849365, 1.161867618560791, 1.248963475227356, 1.336059331893921, 1.4231551885604858, 1.5102510452270508, 1.5973470211029053, 1.6844429969787598, 1.7715388536453247, 1.8586347103118896, 1.9457306861877441, 2.0328264236450195, 2.119922399520874, 2.2070183753967285, 2.294114112854004, 2.3812100887298584, 2.468306064605713, 2.5554018020629883, 2.6424977779388428, 2.7295937538146973, 2.8166894912719727, 2.903785467147827, 2.9908814430236816, 3.077977180480957, 3.1650731563568115, 3.252168893814087, 3.3392648696899414, 3.426360607147217, 3.5134565830230713, 3.600552558898926, 3.687648296356201, 3.7747442722320557, 3.86184024810791, 3.9489359855651855, 4.036031723022461, 4.1231279373168945, 4.21022367477417, 4.297319412231445, 4.384415626525879, 4.471511363983154]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 5.0, 9.0, 9.0, 17.0, 12.0, 30.0, 14.0, 25.0, 17.0, 31.0, 31.0, 17.0, 39.0, 33.0, 43.0, 47.0, 41.0, 35.0, 41.0, 46.0, 46.0, 34.0, 31.0, 39.0, 35.0, 32.0, 29.0, 32.0, 15.0, 21.0, 15.0, 14.0, 21.0, 24.0, 12.0, 9.0, 8.0, 11.0, 3.0, 4.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.1144568920135498, -1.0803848505020142, -1.046312928199768, -1.0122408866882324, -0.9781688451766968, -0.9440968632698059, -0.910024881362915, -0.8759528398513794, -0.8418807983398438, -0.8078088164329529, -0.7737367749214172, -0.7396647930145264, -0.7055927515029907, -0.6715207695960999, -0.637448787689209, -0.6033767461776733, -0.5693047642707825, -0.5352327823638916, -0.501160740852356, -0.4670887589454651, -0.43301671743392944, -0.3989447355270386, -0.3648727238178253, -0.33080071210861206, -0.2967287003993988, -0.26265668869018555, -0.2285846769809723, -0.19451268017292023, -0.16044066846370697, -0.1263686567544937, -0.09229665994644165, -0.058224648237228394, -0.024152636528015137, 0.009919371455907822, 0.04399137943983078, 0.07806338369846344, 0.1121353954076767, 0.14620740711688995, 0.18027940392494202, 0.21435141563415527, 0.24842342734336853, 0.2824954390525818, 0.31656745076179504, 0.3506394624710083, 0.38471144437789917, 0.4187834858894348, 0.4528554677963257, 0.48692747950553894, 0.5209994912147522, 0.5550714731216431, 0.5891435146331787, 0.6232154965400696, 0.6572875380516052, 0.6913595199584961, 0.7254315614700317, 0.7595035433769226, 0.7935755252838135, 0.8276475071907043, 0.86171954870224, 0.8957915306091309, 0.9298635721206665, 0.9639355540275574, 0.9980075359344482, 1.0320795774459839, 1.0661516189575195]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 12.0, 11.0, 17.0, 12.0, 18.0, 11.0, 27.0, 35.0, 49.0, 73.0, 108.0, 130.0, 188.0, 302.0, 399.0, 669.0, 984.0, 1971.0, 3945.0, 11594.0, 161677.0, 3706916.0, 278504.0, 16602.0, 4627.0, 2113.0, 1197.0, 659.0, 458.0, 268.0, 206.0, 138.0, 113.0, 74.0, 40.0, 35.0, 36.0, 20.0, 16.0, 5.0, 1.0, 6.0, 9.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.27734375, -1.239288330078125, -1.20123291015625, -1.163177490234375, -1.1251220703125, -1.087066650390625, -1.04901123046875, -1.010955810546875, -0.972900390625, -0.934844970703125, -0.89678955078125, -0.858734130859375, -0.8206787109375, -0.782623291015625, -0.74456787109375, -0.706512451171875, -0.66845703125, -0.630401611328125, -0.59234619140625, -0.554290771484375, -0.5162353515625, -0.478179931640625, -0.44012451171875, -0.402069091796875, -0.364013671875, -0.325958251953125, -0.28790283203125, -0.249847412109375, -0.2117919921875, -0.173736572265625, -0.13568115234375, -0.097625732421875, -0.0595703125, -0.021514892578125, 0.01654052734375, 0.054595947265625, 0.0926513671875, 0.130706787109375, 0.16876220703125, 0.206817626953125, 0.244873046875, 0.282928466796875, 0.32098388671875, 0.359039306640625, 0.3970947265625, 0.435150146484375, 0.47320556640625, 0.511260986328125, 0.54931640625, 0.587371826171875, 0.62542724609375, 0.663482666015625, 0.7015380859375, 0.739593505859375, 0.77764892578125, 0.815704345703125, 0.853759765625, 0.891815185546875, 0.92987060546875, 0.967926025390625, 1.0059814453125, 1.044036865234375, 1.08209228515625, 1.120147705078125, 1.158203125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 4.0, 2.0, 8.0, 11.0, 14.0, 20.0, 28.0, 25.0, 27.0, 36.0, 36.0, 46.0, 48.0, 43.0, 57.0, 63.0, 78.0, 66.0, 57.0, 63.0, 54.0, 43.0, 31.0, 28.0, 24.0, 18.0, 17.0, 6.0, 10.0, 15.0, 5.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.53466796875, -0.5202560424804688, -0.5058441162109375, -0.49143218994140625, -0.477020263671875, -0.46260833740234375, -0.4481964111328125, -0.43378448486328125, -0.41937255859375, -0.40496063232421875, -0.3905487060546875, -0.37613677978515625, -0.361724853515625, -0.34731292724609375, -0.3329010009765625, -0.31848907470703125, -0.3040771484375, -0.28966522216796875, -0.2752532958984375, -0.26084136962890625, -0.246429443359375, -0.23201751708984375, -0.2176055908203125, -0.20319366455078125, -0.18878173828125, -0.17436981201171875, -0.1599578857421875, -0.14554595947265625, -0.131134033203125, -0.11672210693359375, -0.1023101806640625, -0.08789825439453125, -0.073486328125, -0.05907440185546875, -0.0446624755859375, -0.03025054931640625, -0.015838623046875, -0.00142669677734375, 0.0129852294921875, 0.02739715576171875, 0.04180908203125, 0.05622100830078125, 0.0706329345703125, 0.08504486083984375, 0.099456787109375, 0.11386871337890625, 0.1282806396484375, 0.14269256591796875, 0.1571044921875, 0.17151641845703125, 0.1859283447265625, 0.20034027099609375, 0.214752197265625, 0.22916412353515625, 0.2435760498046875, 0.25798797607421875, 0.27239990234375, 0.28681182861328125, 0.3012237548828125, 0.31563568115234375, 0.330047607421875, 0.34445953369140625, 0.3588714599609375, 0.37328338623046875, 0.3876953125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 10.0, 10.0, 29.0, 24.0, 50.0, 77.0, 132.0, 196.0, 361.0, 685.0, 1281.0, 3132.0, 9888.0, 58161.0, 3548501.0, 535264.0, 25930.0, 6062.0, 2179.0, 1043.0, 512.0, 308.0, 180.0, 105.0, 62.0, 34.0, 27.0, 17.0, 3.0, 9.0, 3.0, 2.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.1892471313476562, -1.1577911376953125, -1.1263351440429688, -1.094879150390625, -1.0634231567382812, -1.0319671630859375, -1.0005111694335938, -0.96905517578125, -0.9375991821289062, -0.9061431884765625, -0.8746871948242188, -0.843231201171875, -0.8117752075195312, -0.7803192138671875, -0.7488632202148438, -0.7174072265625, -0.6859512329101562, -0.6544952392578125, -0.6230392456054688, -0.591583251953125, -0.5601272583007812, -0.5286712646484375, -0.49721527099609375, -0.46575927734375, -0.43430328369140625, -0.4028472900390625, -0.37139129638671875, -0.339935302734375, -0.30847930908203125, -0.2770233154296875, -0.24556732177734375, -0.214111328125, -0.18265533447265625, -0.1511993408203125, -0.11974334716796875, -0.088287353515625, -0.05683135986328125, -0.0253753662109375, 0.00608062744140625, 0.03753662109375, 0.06899261474609375, 0.1004486083984375, 0.13190460205078125, 0.163360595703125, 0.19481658935546875, 0.2262725830078125, 0.25772857666015625, 0.2891845703125, 0.32064056396484375, 0.3520965576171875, 0.38355255126953125, 0.415008544921875, 0.44646453857421875, 0.4779205322265625, 0.5093765258789062, 0.54083251953125, 0.5722885131835938, 0.6037445068359375, 0.6352005004882812, 0.666656494140625, 0.6981124877929688, 0.7295684814453125, 0.7610244750976562, 0.79248046875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 8.0, 8.0, 11.0, 29.0, 39.0, 52.0, 107.0, 253.0, 544.0, 1075.0, 999.0, 469.0, 206.0, 86.0, 46.0, 50.0, 18.0, 17.0, 9.0, 8.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2783203125, -0.2698707580566406, -0.26142120361328125, -0.2529716491699219, -0.2445220947265625, -0.23607254028320312, -0.22762298583984375, -0.21917343139648438, -0.210723876953125, -0.20227432250976562, -0.19382476806640625, -0.18537521362304688, -0.1769256591796875, -0.16847610473632812, -0.16002655029296875, -0.15157699584960938, -0.14312744140625, -0.13467788696289062, -0.12622833251953125, -0.11777877807617188, -0.1093292236328125, -0.10087966918945312, -0.09243011474609375, -0.08398056030273438, -0.075531005859375, -0.06708145141601562, -0.05863189697265625, -0.050182342529296875, -0.0417327880859375, -0.033283233642578125, -0.02483367919921875, -0.016384124755859375, -0.0079345703125, 0.000514984130859375, 0.00896453857421875, 0.017414093017578125, 0.0258636474609375, 0.034313201904296875, 0.04276275634765625, 0.051212310791015625, 0.059661865234375, 0.06811141967773438, 0.07656097412109375, 0.08501052856445312, 0.0934600830078125, 0.10190963745117188, 0.11035919189453125, 0.11880874633789062, 0.12725830078125, 0.13570785522460938, 0.14415740966796875, 0.15260696411132812, 0.1610565185546875, 0.16950607299804688, 0.17795562744140625, 0.18640518188476562, 0.194854736328125, 0.20330429077148438, 0.21175384521484375, 0.22020339965820312, 0.2286529541015625, 0.23710250854492188, 0.24555206298828125, 0.2540016174316406, 0.262451171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 11.0, 8.0, 20.0, 14.0, 34.0, 43.0, 65.0, 85.0, 133.0, 149.0, 125.0, 86.0, 59.0, 56.0, 35.0, 23.0, 13.0, 7.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0908448696136475, -1.0625654458999634, -1.0342860221862793, -1.0060065984725952, -0.9777271151542664, -0.9494476914405823, -0.9211682677268982, -0.8928887844085693, -0.8646093606948853, -0.8363299369812012, -0.8080505132675171, -0.7797710299491882, -0.7514916062355042, -0.7232121825218201, -0.694932758808136, -0.6666532754898071, -0.638373851776123, -0.610094428062439, -0.5818150043487549, -0.553535521030426, -0.5252560973167419, -0.49697667360305786, -0.4686972498893738, -0.4404177963733673, -0.4121384024620056, -0.38385897874832153, -0.35557952523231506, -0.327300101518631, -0.2990206480026245, -0.27074122428894043, -0.24246178567409515, -0.21418234705924988, -0.1859028935432434, -0.15762345492839813, -0.12934401631355286, -0.10106458514928818, -0.0727851465344429, -0.04450571537017822, -0.016226276755332947, 0.012053161859512329, 0.040332600474357605, 0.06861203908920288, 0.09689147770404816, 0.12517091631889343, 0.15345034003257751, 0.1817297786474228, 0.21000921726226807, 0.23828865587711334, 0.2665680944919586, 0.2948475182056427, 0.32312697172164917, 0.35140639543533325, 0.3796858489513397, 0.4079652726650238, 0.4362447261810303, 0.46452414989471436, 0.49280357360839844, 0.5210829973220825, 0.5493624210357666, 0.5776419043540955, 0.6059213280677795, 0.6342007517814636, 0.6624801754951477, 0.6907596588134766, 0.7190390825271606]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 9.0, 8.0, 5.0, 6.0, 22.0, 21.0, 21.0, 27.0, 43.0, 28.0, 42.0, 35.0, 43.0, 51.0, 54.0, 55.0, 56.0, 52.0, 48.0, 38.0, 43.0, 46.0, 41.0, 27.0, 38.0, 20.0, 23.0, 17.0, 13.0, 15.0, 12.0, 7.0, 10.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.510971188545227, -0.49620920419692993, -0.4814472198486328, -0.4666852355003357, -0.4519232511520386, -0.43716126680374146, -0.42239928245544434, -0.4076372981071472, -0.3928753137588501, -0.378113329410553, -0.36335134506225586, -0.34858936071395874, -0.3338273763656616, -0.3190653920173645, -0.3043034076690674, -0.28954142332077026, -0.27477943897247314, -0.260017454624176, -0.2452554702758789, -0.2304934859275818, -0.21573150157928467, -0.20096951723098755, -0.18620753288269043, -0.1714455485343933, -0.1566835641860962, -0.14192157983779907, -0.12715959548950195, -0.11239761114120483, -0.09763562679290771, -0.0828736424446106, -0.06811165809631348, -0.05334967374801636, -0.03858768939971924, -0.02382570505142212, -0.009063720703125, 0.005698263645172119, 0.02046024799346924, 0.03522223234176636, 0.04998421669006348, 0.0647462010383606, 0.07950818538665771, 0.09427016973495483, 0.10903215408325195, 0.12379413843154907, 0.1385561227798462, 0.1533181071281433, 0.16808009147644043, 0.18284207582473755, 0.19760406017303467, 0.2123660445213318, 0.2271280288696289, 0.24189001321792603, 0.25665199756622314, 0.27141398191452026, 0.2861759662628174, 0.3009379506111145, 0.3156999349594116, 0.33046191930770874, 0.34522390365600586, 0.359985888004303, 0.3747478723526001, 0.3895098567008972, 0.40427184104919434, 0.41903382539749146, 0.4337958097457886]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 10.0, 18.0, 19.0, 28.0, 43.0, 57.0, 88.0, 119.0, 193.0, 299.0, 498.0, 850.0, 1458.0, 2708.0, 5178.0, 10694.0, 24983.0, 65598.0, 200869.0, 425952.0, 197335.0, 64584.0, 24813.0, 10737.0, 4995.0, 2709.0, 1434.0, 796.0, 528.0, 317.0, 208.0, 130.0, 83.0, 60.0, 42.0, 26.0, 27.0, 12.0, 8.0, 8.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.09173583984375, -0.08899688720703125, -0.0862579345703125, -0.08351898193359375, -0.080780029296875, -0.07804107666015625, -0.0753021240234375, -0.07256317138671875, -0.06982421875, -0.06708526611328125, -0.0643463134765625, -0.06160736083984375, -0.058868408203125, -0.05612945556640625, -0.0533905029296875, -0.05065155029296875, -0.04791259765625, -0.04517364501953125, -0.0424346923828125, -0.03969573974609375, -0.036956787109375, -0.03421783447265625, -0.0314788818359375, -0.02873992919921875, -0.0260009765625, -0.02326202392578125, -0.0205230712890625, -0.01778411865234375, -0.015045166015625, -0.01230621337890625, -0.0095672607421875, -0.00682830810546875, -0.00408935546875, -0.00135040283203125, 0.0013885498046875, 0.00412750244140625, 0.006866455078125, 0.00960540771484375, 0.0123443603515625, 0.01508331298828125, 0.017822265625, 0.02056121826171875, 0.0233001708984375, 0.02603912353515625, 0.028778076171875, 0.03151702880859375, 0.0342559814453125, 0.03699493408203125, 0.03973388671875, 0.04247283935546875, 0.0452117919921875, 0.04795074462890625, 0.050689697265625, 0.05342864990234375, 0.0561676025390625, 0.05890655517578125, 0.0616455078125, 0.06438446044921875, 0.0671234130859375, 0.06986236572265625, 0.072601318359375, 0.07534027099609375, 0.0780792236328125, 0.08081817626953125, 0.08355712890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 4.0, 4.0, 7.0, 4.0, 11.0, 9.0, 23.0, 18.0, 22.0, 31.0, 32.0, 36.0, 42.0, 46.0, 50.0, 59.0, 51.0, 62.0, 65.0, 71.0, 36.0, 45.0, 51.0, 33.0, 29.0, 28.0, 21.0, 25.0, 16.0, 13.0, 15.0, 10.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340576171875, -0.32952880859375, -0.3184814453125, -0.30743408203125, -0.29638671875, -0.28533935546875, -0.2742919921875, -0.26324462890625, -0.252197265625, -0.24114990234375, -0.2301025390625, -0.21905517578125, -0.2080078125, -0.19696044921875, -0.1859130859375, -0.17486572265625, -0.163818359375, -0.15277099609375, -0.1417236328125, -0.13067626953125, -0.11962890625, -0.10858154296875, -0.0975341796875, -0.08648681640625, -0.075439453125, -0.06439208984375, -0.0533447265625, -0.04229736328125, -0.03125, -0.02020263671875, -0.0091552734375, 0.00189208984375, 0.012939453125, 0.02398681640625, 0.0350341796875, 0.04608154296875, 0.05712890625, 0.06817626953125, 0.0792236328125, 0.09027099609375, 0.101318359375, 0.11236572265625, 0.1234130859375, 0.13446044921875, 0.1455078125, 0.15655517578125, 0.1676025390625, 0.17864990234375, 0.189697265625, 0.20074462890625, 0.2117919921875, 0.22283935546875, 0.23388671875, 0.24493408203125, 0.2559814453125, 0.26702880859375, 0.278076171875, 0.28912353515625, 0.3001708984375, 0.31121826171875, 0.322265625, 0.33331298828125, 0.3443603515625, 0.35540771484375, 0.366455078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 10.0, 22.0, 28.0, 45.0, 35.0, 70.0, 93.0, 123.0, 193.0, 284.0, 460.0, 697.0, 1096.0, 1924.0, 3184.0, 5631.0, 10427.0, 19500.0, 39308.0, 83136.0, 188957.0, 322460.0, 197202.0, 86987.0, 40860.0, 20457.0, 10717.0, 5939.0, 3355.0, 1942.0, 1211.0, 724.0, 485.0, 307.0, 197.0, 150.0, 99.0, 78.0, 52.0, 30.0, 14.0, 15.0, 15.0, 9.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.05401611328125, -0.052186012268066406, -0.05035591125488281, -0.04852581024169922, -0.046695709228515625, -0.04486560821533203, -0.04303550720214844, -0.041205406188964844, -0.03937530517578125, -0.037545204162597656, -0.03571510314941406, -0.03388500213623047, -0.032054901123046875, -0.03022480010986328, -0.028394699096679688, -0.026564598083496094, -0.0247344970703125, -0.022904396057128906, -0.021074295043945312, -0.01924419403076172, -0.017414093017578125, -0.015583992004394531, -0.013753890991210938, -0.011923789978027344, -0.01009368896484375, -0.008263587951660156, -0.0064334869384765625, -0.004603385925292969, -0.002773284912109375, -0.0009431838989257812, 0.0008869171142578125, 0.0027170181274414062, 0.004547119140625, 0.006377220153808594, 0.008207321166992188, 0.010037422180175781, 0.011867523193359375, 0.013697624206542969, 0.015527725219726562, 0.017357826232910156, 0.01918792724609375, 0.021018028259277344, 0.022848129272460938, 0.02467823028564453, 0.026508331298828125, 0.02833843231201172, 0.030168533325195312, 0.031998634338378906, 0.0338287353515625, 0.035658836364746094, 0.03748893737792969, 0.03931903839111328, 0.041149139404296875, 0.04297924041748047, 0.04480934143066406, 0.046639442443847656, 0.04846954345703125, 0.050299644470214844, 0.05212974548339844, 0.05395984649658203, 0.055789947509765625, 0.05762004852294922, 0.05945014953613281, 0.061280250549316406, 0.0631103515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 5.0, 14.0, 6.0, 9.0, 13.0, 16.0, 13.0, 18.0, 22.0, 19.0, 17.0, 28.0, 23.0, 34.0, 39.0, 32.0, 32.0, 44.0, 45.0, 48.0, 50.0, 54.0, 40.0, 47.0, 33.0, 32.0, 34.0, 21.0, 36.0, 21.0, 21.0, 22.0, 20.0, 22.0, 14.0, 10.0, 4.0, 9.0, 6.0, 7.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5400390625, -0.523040771484375, -0.50604248046875, -0.489044189453125, -0.4720458984375, -0.455047607421875, -0.43804931640625, -0.421051025390625, -0.404052734375, -0.387054443359375, -0.37005615234375, -0.353057861328125, -0.3360595703125, -0.319061279296875, -0.30206298828125, -0.285064697265625, -0.26806640625, -0.251068115234375, -0.23406982421875, -0.217071533203125, -0.2000732421875, -0.183074951171875, -0.16607666015625, -0.149078369140625, -0.132080078125, -0.115081787109375, -0.09808349609375, -0.081085205078125, -0.0640869140625, -0.047088623046875, -0.03009033203125, -0.013092041015625, 0.00390625, 0.020904541015625, 0.03790283203125, 0.054901123046875, 0.0718994140625, 0.088897705078125, 0.10589599609375, 0.122894287109375, 0.139892578125, 0.156890869140625, 0.17388916015625, 0.190887451171875, 0.2078857421875, 0.224884033203125, 0.24188232421875, 0.258880615234375, 0.27587890625, 0.292877197265625, 0.30987548828125, 0.326873779296875, 0.3438720703125, 0.360870361328125, 0.37786865234375, 0.394866943359375, 0.411865234375, 0.428863525390625, 0.44586181640625, 0.462860107421875, 0.4798583984375, 0.496856689453125, 0.51385498046875, 0.530853271484375, 0.5478515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 11.0, 17.0, 19.0, 25.0, 33.0, 65.0, 112.0, 202.0, 390.0, 721.0, 1561.0, 3669.0, 9399.0, 29132.0, 116315.0, 517442.0, 283745.0, 58674.0, 16482.0, 5946.0, 2287.0, 1077.0, 513.0, 281.0, 189.0, 76.0, 68.0, 33.0, 26.0, 14.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.048828125, -0.04760026931762695, -0.046372413635253906, -0.04514455795288086, -0.04391670227050781, -0.042688846588134766, -0.04146099090576172, -0.04023313522338867, -0.039005279541015625, -0.03777742385864258, -0.03654956817626953, -0.035321712493896484, -0.03409385681152344, -0.03286600112915039, -0.031638145446777344, -0.030410289764404297, -0.02918243408203125, -0.027954578399658203, -0.026726722717285156, -0.02549886703491211, -0.024271011352539062, -0.023043155670166016, -0.02181529998779297, -0.020587444305419922, -0.019359588623046875, -0.018131732940673828, -0.01690387725830078, -0.015676021575927734, -0.014448165893554688, -0.01322031021118164, -0.011992454528808594, -0.010764598846435547, -0.0095367431640625, -0.008308887481689453, -0.007081031799316406, -0.005853176116943359, -0.0046253204345703125, -0.0033974647521972656, -0.0021696090698242188, -0.0009417533874511719, 0.000286102294921875, 0.0015139579772949219, 0.0027418136596679688, 0.003969669342041016, 0.0051975250244140625, 0.006425380706787109, 0.007653236389160156, 0.008881092071533203, 0.01010894775390625, 0.011336803436279297, 0.012564659118652344, 0.01379251480102539, 0.015020370483398438, 0.016248226165771484, 0.01747608184814453, 0.018703937530517578, 0.019931793212890625, 0.021159648895263672, 0.02238750457763672, 0.023615360260009766, 0.024843215942382812, 0.02607107162475586, 0.027298927307128906, 0.028526782989501953, 0.029754638671875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 8.0, 10.0, 16.0, 24.0, 40.0, 62.0, 98.0, 107.0, 136.0, 146.0, 111.0, 64.0, 44.0, 33.0, 32.0, 9.0, 12.0, 7.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.159046173095703e-05, -3.07764858007431e-05, -2.9962509870529175e-05, -2.9148533940315247e-05, -2.833455801010132e-05, -2.752058207988739e-05, -2.6706606149673462e-05, -2.5892630219459534e-05, -2.5078654289245605e-05, -2.4264678359031677e-05, -2.345070242881775e-05, -2.263672649860382e-05, -2.1822750568389893e-05, -2.1008774638175964e-05, -2.0194798707962036e-05, -1.9380822777748108e-05, -1.856684684753418e-05, -1.775287091732025e-05, -1.6938894987106323e-05, -1.6124919056892395e-05, -1.5310943126678467e-05, -1.4496967196464539e-05, -1.368299126625061e-05, -1.2869015336036682e-05, -1.2055039405822754e-05, -1.1241063475608826e-05, -1.0427087545394897e-05, -9.61311161518097e-06, -8.799135684967041e-06, -7.985159754753113e-06, -7.1711838245391846e-06, -6.357207894325256e-06, -5.543231964111328e-06, -4.7292560338974e-06, -3.915280103683472e-06, -3.1013041734695435e-06, -2.2873282432556152e-06, -1.473352313041687e-06, -6.593763828277588e-07, 1.5459954738616943e-07, 9.685754776000977e-07, 1.7825514078140259e-06, 2.596527338027954e-06, 3.4105032682418823e-06, 4.2244791984558105e-06, 5.038455128669739e-06, 5.852431058883667e-06, 6.666406989097595e-06, 7.4803829193115234e-06, 8.294358849525452e-06, 9.10833477973938e-06, 9.922310709953308e-06, 1.0736286640167236e-05, 1.1550262570381165e-05, 1.2364238500595093e-05, 1.3178214430809021e-05, 1.399219036102295e-05, 1.4806166291236877e-05, 1.5620142221450806e-05, 1.6434118151664734e-05, 1.7248094081878662e-05, 1.806207001209259e-05, 1.887604594230652e-05, 1.9690021872520447e-05, 2.0503997802734375e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 7.0, 6.0, 13.0, 24.0, 28.0, 31.0, 59.0, 88.0, 143.0, 229.0, 377.0, 568.0, 983.0, 1588.0, 2869.0, 5558.0, 11076.0, 23334.0, 53624.0, 136157.0, 323894.0, 287083.0, 114624.0, 45520.0, 20048.0, 9336.0, 4809.0, 2685.0, 1522.0, 845.0, 539.0, 322.0, 208.0, 124.0, 90.0, 56.0, 33.0, 23.0, 15.0, 11.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0244140625, -0.02369403839111328, -0.022974014282226562, -0.022253990173339844, -0.021533966064453125, -0.020813941955566406, -0.020093917846679688, -0.01937389373779297, -0.01865386962890625, -0.01793384552001953, -0.017213821411132812, -0.016493797302246094, -0.015773773193359375, -0.015053749084472656, -0.014333724975585938, -0.013613700866699219, -0.0128936767578125, -0.012173652648925781, -0.011453628540039062, -0.010733604431152344, -0.010013580322265625, -0.009293556213378906, -0.008573532104492188, -0.007853507995605469, -0.00713348388671875, -0.006413459777832031, -0.0056934356689453125, -0.004973411560058594, -0.004253387451171875, -0.0035333633422851562, -0.0028133392333984375, -0.0020933151245117188, -0.001373291015625, -0.0006532669067382812, 6.67572021484375e-05, 0.0007867813110351562, 0.001506805419921875, 0.0022268295288085938, 0.0029468536376953125, 0.0036668777465820312, 0.00438690185546875, 0.005106925964355469, 0.0058269500732421875, 0.006546974182128906, 0.007266998291015625, 0.007987022399902344, 0.008707046508789062, 0.009427070617675781, 0.0101470947265625, 0.010867118835449219, 0.011587142944335938, 0.012307167053222656, 0.013027191162109375, 0.013747215270996094, 0.014467239379882812, 0.015187263488769531, 0.01590728759765625, 0.01662731170654297, 0.017347335815429688, 0.018067359924316406, 0.018787384033203125, 0.019507408142089844, 0.020227432250976562, 0.02094745635986328, 0.02166748046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 4.0, 3.0, 13.0, 14.0, 15.0, 10.0, 15.0, 22.0, 34.0, 28.0, 37.0, 42.0, 46.0, 47.0, 54.0, 60.0, 67.0, 64.0, 44.0, 48.0, 57.0, 48.0, 31.0, 36.0, 27.0, 24.0, 16.0, 14.0, 18.0, 11.0, 13.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0079498291015625, -0.007714807987213135, -0.0074797868728637695, -0.007244765758514404, -0.007009744644165039, -0.006774723529815674, -0.006539702415466309, -0.006304681301116943, -0.006069660186767578, -0.005834639072418213, -0.005599617958068848, -0.005364596843719482, -0.005129575729370117, -0.004894554615020752, -0.004659533500671387, -0.0044245123863220215, -0.004189491271972656, -0.003954470157623291, -0.0037194490432739258, -0.0034844279289245605, -0.0032494068145751953, -0.00301438570022583, -0.002779364585876465, -0.0025443434715270996, -0.0023093223571777344, -0.002074301242828369, -0.001839280128479004, -0.0016042590141296387, -0.0013692378997802734, -0.0011342167854309082, -0.000899195671081543, -0.0006641745567321777, -0.0004291534423828125, -0.00019413232803344727, 4.088878631591797e-05, 0.0002759099006652832, 0.0005109310150146484, 0.0007459521293640137, 0.000980973243713379, 0.0012159943580627441, 0.0014510154724121094, 0.0016860365867614746, 0.0019210577011108398, 0.002156078815460205, 0.0023910999298095703, 0.0026261210441589355, 0.0028611421585083008, 0.003096163272857666, 0.0033311843872070312, 0.0035662055015563965, 0.0038012266159057617, 0.004036247730255127, 0.004271268844604492, 0.004506289958953857, 0.004741311073303223, 0.004976332187652588, 0.005211353302001953, 0.005446374416351318, 0.005681395530700684, 0.005916416645050049, 0.006151437759399414, 0.006386458873748779, 0.0066214799880981445, 0.00685650110244751, 0.007091522216796875]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 4.0, 4.0, 4.0, 12.0, 24.0, 38.0, 89.0, 145.0, 236.0, 191.0, 105.0, 63.0, 41.0, 19.0, 11.0, 5.0, 2.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2030118703842163, -1.174246072769165, -1.1454803943634033, -1.1167147159576416, -1.0879489183425903, -1.059183120727539, -1.0304174423217773, -1.0016517639160156, -0.9728859663009644, -0.9441202282905579, -0.9153544902801514, -0.8865887522697449, -0.8578230142593384, -0.8290572762489319, -0.8002915382385254, -0.7715258002281189, -0.7427600622177124, -0.7139943242073059, -0.6852285861968994, -0.6564628481864929, -0.6276971101760864, -0.5989313721656799, -0.5701656341552734, -0.5413998961448669, -0.5126341581344604, -0.48386842012405396, -0.45510268211364746, -0.42633694410324097, -0.3975712060928345, -0.368805468082428, -0.3400397300720215, -0.311273992061615, -0.2825081944465637, -0.2537424564361572, -0.22497671842575073, -0.19621098041534424, -0.16744524240493774, -0.13867950439453125, -0.10991376638412476, -0.08114802837371826, -0.05238229036331177, -0.023616552352905273, 0.005149185657501221, 0.033914923667907715, 0.06268066167831421, 0.0914463996887207, 0.1202121376991272, 0.1489778757095337, 0.17774361371994019, 0.20650935173034668, 0.23527508974075317, 0.26404082775115967, 0.29280656576156616, 0.32157230377197266, 0.35033804178237915, 0.37910377979278564, 0.40786951780319214, 0.43663525581359863, 0.4654009938240051, 0.4941667318344116, 0.5229324698448181, 0.5516982078552246, 0.5804639458656311, 0.6092296838760376, 0.6379954218864441]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 9.0, 10.0, 9.0, 20.0, 17.0, 29.0, 30.0, 28.0, 41.0, 35.0, 42.0, 48.0, 53.0, 52.0, 62.0, 68.0, 37.0, 55.0, 43.0, 43.0, 50.0, 25.0, 37.0, 29.0, 23.0, 16.0, 15.0, 10.0, 6.0, 10.0, 12.0, 7.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3230491578578949, -0.31289345026016235, -0.3027377128601074, -0.2925819754600525, -0.28242626786231995, -0.2722705602645874, -0.26211482286453247, -0.25195908546447754, -0.241803377866745, -0.23164765536785126, -0.22149193286895752, -0.21133621037006378, -0.20118048787117004, -0.1910247653722763, -0.18086904287338257, -0.17071332037448883, -0.1605575978755951, -0.15040187537670135, -0.14024615287780762, -0.13009043037891388, -0.11993470788002014, -0.1097789853811264, -0.09962326288223267, -0.08946754038333893, -0.07931181788444519, -0.06915609538555145, -0.059000372886657715, -0.04884465038776398, -0.03868892788887024, -0.0285332053899765, -0.018377482891082764, -0.008221760392189026, 0.0019339919090270996, 0.012089714407920837, 0.022245436906814575, 0.03240115940570831, 0.04255688190460205, 0.05271260440349579, 0.06286832690238953, 0.07302404940128326, 0.083179771900177, 0.09333549439907074, 0.10349121689796448, 0.11364693939685822, 0.12380266189575195, 0.1339583843946457, 0.14411410689353943, 0.15426982939243317, 0.1644255518913269, 0.17458127439022064, 0.18473699688911438, 0.19489271938800812, 0.20504844188690186, 0.2152041643857956, 0.22535988688468933, 0.23551560938358307, 0.2456713318824768, 0.25582706928253174, 0.2659827768802643, 0.2761384844779968, 0.28629422187805176, 0.2964499592781067, 0.30660566687583923, 0.3167613744735718, 0.3269171118736267]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 5.0, 4.0, 1.0, 7.0, 12.0, 17.0, 18.0, 27.0, 42.0, 52.0, 65.0, 101.0, 143.0, 228.0, 412.0, 591.0, 947.0, 1690.0, 3206.0, 6810.0, 20802.0, 166446.0, 761878.0, 61500.0, 12616.0, 4857.0, 2511.0, 1321.0, 789.0, 480.0, 301.0, 210.0, 134.0, 92.0, 76.0, 45.0, 29.0, 16.0, 19.0, 18.0, 12.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.358154296875, -0.3467140197753906, -0.33527374267578125, -0.3238334655761719, -0.3123931884765625, -0.3009529113769531, -0.28951263427734375, -0.2780723571777344, -0.266632080078125, -0.2551918029785156, -0.24375152587890625, -0.23231124877929688, -0.2208709716796875, -0.20943069458007812, -0.19799041748046875, -0.18655014038085938, -0.17510986328125, -0.16366958618164062, -0.15222930908203125, -0.14078903198242188, -0.1293487548828125, -0.11790847778320312, -0.10646820068359375, -0.09502792358398438, -0.083587646484375, -0.07214736938476562, -0.06070709228515625, -0.049266815185546875, -0.0378265380859375, -0.026386260986328125, -0.01494598388671875, -0.003505706787109375, 0.0079345703125, 0.019374847412109375, 0.03081512451171875, 0.042255401611328125, 0.0536956787109375, 0.06513595581054688, 0.07657623291015625, 0.08801651000976562, 0.099456787109375, 0.11089706420898438, 0.12233734130859375, 0.13377761840820312, 0.1452178955078125, 0.15665817260742188, 0.16809844970703125, 0.17953872680664062, 0.19097900390625, 0.20241928100585938, 0.21385955810546875, 0.22529983520507812, 0.2367401123046875, 0.24818038940429688, 0.25962066650390625, 0.2710609436035156, 0.282501220703125, 0.2939414978027344, 0.30538177490234375, 0.3168220520019531, 0.3282623291015625, 0.3397026062011719, 0.35114288330078125, 0.3625831604003906, 0.3740234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 6.0, 10.0, 9.0, 8.0, 11.0, 12.0, 22.0, 33.0, 36.0, 32.0, 44.0, 64.0, 47.0, 56.0, 51.0, 76.0, 68.0, 58.0, 59.0, 49.0, 54.0, 38.0, 36.0, 28.0, 18.0, 21.0, 12.0, 9.0, 13.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73828125, -0.7150039672851562, -0.6917266845703125, -0.6684494018554688, -0.645172119140625, -0.6218948364257812, -0.5986175537109375, -0.5753402709960938, -0.55206298828125, -0.5287857055664062, -0.5055084228515625, -0.48223114013671875, -0.458953857421875, -0.43567657470703125, -0.4123992919921875, -0.38912200927734375, -0.3658447265625, -0.34256744384765625, -0.3192901611328125, -0.29601287841796875, -0.272735595703125, -0.24945831298828125, -0.2261810302734375, -0.20290374755859375, -0.17962646484375, -0.15634918212890625, -0.1330718994140625, -0.10979461669921875, -0.086517333984375, -0.06324005126953125, -0.0399627685546875, -0.01668548583984375, 0.006591796875, 0.02986907958984375, 0.0531463623046875, 0.07642364501953125, 0.099700927734375, 0.12297821044921875, 0.1462554931640625, 0.16953277587890625, 0.19281005859375, 0.21608734130859375, 0.2393646240234375, 0.26264190673828125, 0.285919189453125, 0.30919647216796875, 0.3324737548828125, 0.35575103759765625, 0.3790283203125, 0.40230560302734375, 0.4255828857421875, 0.44886016845703125, 0.472137451171875, 0.49541473388671875, 0.5186920166015625, 0.5419692993164062, 0.56524658203125, 0.5885238647460938, 0.6118011474609375, 0.6350784301757812, 0.658355712890625, 0.6816329956054688, 0.7049102783203125, 0.7281875610351562, 0.75146484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 9.0, 7.0, 8.0, 21.0, 28.0, 55.0, 115.0, 266.0, 812.0, 3481.0, 67036.0, 965316.0, 9074.0, 1501.0, 478.0, 178.0, 86.0, 36.0, 22.0, 13.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0888671875, -1.0540008544921875, -1.019134521484375, -0.9842681884765625, -0.94940185546875, -0.9145355224609375, -0.879669189453125, -0.8448028564453125, -0.8099365234375, -0.7750701904296875, -0.740203857421875, -0.7053375244140625, -0.67047119140625, -0.6356048583984375, -0.600738525390625, -0.5658721923828125, -0.531005859375, -0.4961395263671875, -0.461273193359375, -0.4264068603515625, -0.39154052734375, -0.3566741943359375, -0.321807861328125, -0.2869415283203125, -0.2520751953125, -0.2172088623046875, -0.182342529296875, -0.1474761962890625, -0.11260986328125, -0.0777435302734375, -0.042877197265625, -0.0080108642578125, 0.02685546875, 0.0617218017578125, 0.096588134765625, 0.1314544677734375, 0.16632080078125, 0.2011871337890625, 0.236053466796875, 0.2709197998046875, 0.3057861328125, 0.3406524658203125, 0.375518798828125, 0.4103851318359375, 0.44525146484375, 0.4801177978515625, 0.514984130859375, 0.5498504638671875, 0.584716796875, 0.6195831298828125, 0.654449462890625, 0.6893157958984375, 0.72418212890625, 0.7590484619140625, 0.793914794921875, 0.8287811279296875, 0.8636474609375, 0.8985137939453125, 0.933380126953125, 0.9682464599609375, 1.00311279296875, 1.0379791259765625, 1.072845458984375, 1.1077117919921875, 1.142578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 4.0, 5.0, 13.0, 8.0, 8.0, 12.0, 15.0, 19.0, 24.0, 15.0, 27.0, 28.0, 32.0, 33.0, 31.0, 39.0, 34.0, 29.0, 55.0, 42.0, 50.0, 38.0, 44.0, 48.0, 37.0, 43.0, 35.0, 30.0, 13.0, 36.0, 19.0, 20.0, 24.0, 18.0, 8.0, 9.0, 6.0, 5.0, 8.0, 7.0, 4.0, 3.0, 9.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5345077514648438, -0.5157928466796875, -0.49707794189453125, -0.478363037109375, -0.45964813232421875, -0.4409332275390625, -0.42221832275390625, -0.40350341796875, -0.38478851318359375, -0.3660736083984375, -0.34735870361328125, -0.328643798828125, -0.30992889404296875, -0.2912139892578125, -0.27249908447265625, -0.2537841796875, -0.23506927490234375, -0.2163543701171875, -0.19763946533203125, -0.178924560546875, -0.16020965576171875, -0.1414947509765625, -0.12277984619140625, -0.10406494140625, -0.08535003662109375, -0.0666351318359375, -0.04792022705078125, -0.029205322265625, -0.01049041748046875, 0.0082244873046875, 0.02693939208984375, 0.045654296875, 0.06436920166015625, 0.0830841064453125, 0.10179901123046875, 0.120513916015625, 0.13922882080078125, 0.1579437255859375, 0.17665863037109375, 0.19537353515625, 0.21408843994140625, 0.2328033447265625, 0.25151824951171875, 0.270233154296875, 0.28894805908203125, 0.3076629638671875, 0.32637786865234375, 0.3450927734375, 0.36380767822265625, 0.3825225830078125, 0.40123748779296875, 0.419952392578125, 0.43866729736328125, 0.4573822021484375, 0.47609710693359375, 0.49481201171875, 0.5135269165039062, 0.5322418212890625, 0.5509567260742188, 0.569671630859375, 0.5883865356445312, 0.6071014404296875, 0.6258163452148438, 0.64453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 10.0, 24.0, 34.0, 83.0, 230.0, 674.0, 3352.0, 118792.0, 914863.0, 8783.0, 1133.0, 331.0, 124.0, 48.0, 30.0, 17.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2568359375, -0.24860382080078125, -0.2403717041015625, -0.23213958740234375, -0.223907470703125, -0.21567535400390625, -0.2074432373046875, -0.19921112060546875, -0.19097900390625, -0.18274688720703125, -0.1745147705078125, -0.16628265380859375, -0.158050537109375, -0.14981842041015625, -0.1415863037109375, -0.13335418701171875, -0.1251220703125, -0.11688995361328125, -0.1086578369140625, -0.10042572021484375, -0.092193603515625, -0.08396148681640625, -0.0757293701171875, -0.06749725341796875, -0.05926513671875, -0.05103302001953125, -0.0428009033203125, -0.03456878662109375, -0.026336669921875, -0.01810455322265625, -0.0098724365234375, -0.00164031982421875, 0.006591796875, 0.01482391357421875, 0.0230560302734375, 0.03128814697265625, 0.039520263671875, 0.04775238037109375, 0.0559844970703125, 0.06421661376953125, 0.07244873046875, 0.08068084716796875, 0.0889129638671875, 0.09714508056640625, 0.105377197265625, 0.11360931396484375, 0.1218414306640625, 0.13007354736328125, 0.1383056640625, 0.14653778076171875, 0.1547698974609375, 0.16300201416015625, 0.171234130859375, 0.17946624755859375, 0.1876983642578125, 0.19593048095703125, 0.20416259765625, 0.21239471435546875, 0.2206268310546875, 0.22885894775390625, 0.237091064453125, 0.24532318115234375, 0.2535552978515625, 0.26178741455078125, 0.27001953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 4.0, 2.0, 9.0, 16.0, 34.0, 31.0, 95.0, 178.0, 266.0, 163.0, 75.0, 55.0, 31.0, 13.0, 11.0, 10.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9265880584716797e-05, -2.8505921363830566e-05, -2.7745962142944336e-05, -2.6986002922058105e-05, -2.6226043701171875e-05, -2.5466084480285645e-05, -2.4706125259399414e-05, -2.3946166038513184e-05, -2.3186206817626953e-05, -2.2426247596740723e-05, -2.1666288375854492e-05, -2.0906329154968262e-05, -2.014636993408203e-05, -1.93864107131958e-05, -1.862645149230957e-05, -1.786649227142334e-05, -1.710653305053711e-05, -1.634657382965088e-05, -1.558661460876465e-05, -1.4826655387878418e-05, -1.4066696166992188e-05, -1.3306736946105957e-05, -1.2546777725219727e-05, -1.1786818504333496e-05, -1.1026859283447266e-05, -1.0266900062561035e-05, -9.506940841674805e-06, -8.746981620788574e-06, -7.987022399902344e-06, -7.227063179016113e-06, -6.467103958129883e-06, -5.707144737243652e-06, -4.947185516357422e-06, -4.187226295471191e-06, -3.427267074584961e-06, -2.6673078536987305e-06, -1.9073486328125e-06, -1.1473894119262695e-06, -3.8743019104003906e-07, 3.725290298461914e-07, 1.1324882507324219e-06, 1.8924474716186523e-06, 2.652406692504883e-06, 3.4123659133911133e-06, 4.172325134277344e-06, 4.932284355163574e-06, 5.692243576049805e-06, 6.452202796936035e-06, 7.212162017822266e-06, 7.972121238708496e-06, 8.732080459594727e-06, 9.492039680480957e-06, 1.0251998901367188e-05, 1.1011958122253418e-05, 1.1771917343139648e-05, 1.2531876564025879e-05, 1.329183578491211e-05, 1.405179500579834e-05, 1.481175422668457e-05, 1.55717134475708e-05, 1.633167266845703e-05, 1.7091631889343262e-05, 1.7851591110229492e-05, 1.8611550331115723e-05, 1.9371509552001953e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 8.0, 11.0, 25.0, 38.0, 61.0, 129.0, 209.0, 443.0, 969.0, 2794.0, 12670.0, 356866.0, 653338.0, 15736.0, 3187.0, 1107.0, 429.0, 219.0, 127.0, 81.0, 45.0, 19.0, 19.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2376708984375, -0.2317371368408203, -0.22580337524414062, -0.21986961364746094, -0.21393585205078125, -0.20800209045410156, -0.20206832885742188, -0.1961345672607422, -0.1902008056640625, -0.1842670440673828, -0.17833328247070312, -0.17239952087402344, -0.16646575927734375, -0.16053199768066406, -0.15459823608398438, -0.1486644744873047, -0.142730712890625, -0.1367969512939453, -0.13086318969726562, -0.12492942810058594, -0.11899566650390625, -0.11306190490722656, -0.10712814331054688, -0.10119438171386719, -0.0952606201171875, -0.08932685852050781, -0.08339309692382812, -0.07745933532714844, -0.07152557373046875, -0.06559181213378906, -0.059658050537109375, -0.05372428894042969, -0.04779052734375, -0.04185676574707031, -0.035923004150390625, -0.029989242553710938, -0.02405548095703125, -0.018121719360351562, -0.012187957763671875, -0.0062541961669921875, -0.0003204345703125, 0.0056133270263671875, 0.011547088623046875, 0.017480850219726562, 0.02341461181640625, 0.029348373413085938, 0.035282135009765625, 0.04121589660644531, 0.047149658203125, 0.05308341979980469, 0.059017181396484375, 0.06495094299316406, 0.07088470458984375, 0.07681846618652344, 0.08275222778320312, 0.08868598937988281, 0.0946197509765625, 0.10055351257324219, 0.10648727416992188, 0.11242103576660156, 0.11835479736328125, 0.12428855895996094, 0.13022232055664062, 0.1361560821533203, 0.14208984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 4.0, 9.0, 4.0, 7.0, 21.0, 27.0, 24.0, 38.0, 45.0, 69.0, 76.0, 149.0, 160.0, 91.0, 74.0, 55.0, 42.0, 26.0, 13.0, 15.0, 9.0, 8.0, 10.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02728271484375, -0.0260467529296875, -0.024810791015625, -0.0235748291015625, -0.0223388671875, -0.0211029052734375, -0.019866943359375, -0.0186309814453125, -0.01739501953125, -0.0161590576171875, -0.014923095703125, -0.0136871337890625, -0.012451171875, -0.0112152099609375, -0.009979248046875, -0.0087432861328125, -0.00750732421875, -0.0062713623046875, -0.005035400390625, -0.0037994384765625, -0.0025634765625, -0.0013275146484375, -9.1552734375e-05, 0.0011444091796875, 0.00238037109375, 0.0036163330078125, 0.004852294921875, 0.0060882568359375, 0.00732421875, 0.0085601806640625, 0.009796142578125, 0.0110321044921875, 0.01226806640625, 0.0135040283203125, 0.014739990234375, 0.0159759521484375, 0.0172119140625, 0.0184478759765625, 0.019683837890625, 0.0209197998046875, 0.02215576171875, 0.0233917236328125, 0.024627685546875, 0.0258636474609375, 0.027099609375, 0.0283355712890625, 0.029571533203125, 0.0308074951171875, 0.03204345703125, 0.0332794189453125, 0.034515380859375, 0.0357513427734375, 0.0369873046875, 0.0382232666015625, 0.039459228515625, 0.0406951904296875, 0.04193115234375, 0.0431671142578125, 0.044403076171875, 0.0456390380859375, 0.046875, 0.0481109619140625, 0.049346923828125, 0.0505828857421875, 0.05181884765625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 1.0, 7.0, 15.0, 13.0, 37.0, 83.0, 137.0, 203.0, 207.0, 113.0, 72.0, 50.0, 23.0, 13.0, 7.0, 5.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4265085458755493, -1.3737664222717285, -1.3210242986679077, -1.268282175064087, -1.2155400514602661, -1.1627979278564453, -1.110055685043335, -1.0573135614395142, -1.0045714378356934, -0.9518293142318726, -0.8990871906280518, -0.846345067024231, -0.7936028838157654, -0.7408607602119446, -0.6881186366081238, -0.6353764533996582, -0.5826343894004822, -0.5298922657966614, -0.4771501123905182, -0.4244079887866974, -0.3716658353805542, -0.3189237117767334, -0.2661815881729126, -0.2134394347667694, -0.1606973111629486, -0.10795517265796661, -0.055213041603565216, -0.0024709105491638184, 0.050271227955818176, 0.10301336646080017, 0.15575549006462097, 0.20849764347076416, 0.26123976707458496, 0.31398189067840576, 0.36672404408454895, 0.41946616768836975, 0.47220832109451294, 0.5249504446983337, 0.5776925683021545, 0.6304347515106201, 0.6831768751144409, 0.7359189987182617, 0.7886611223220825, 0.8414032459259033, 0.8941454291343689, 0.9468875527381897, 0.9996296763420105, 1.052371859550476, 1.1051139831542969, 1.1578561067581177, 1.2105982303619385, 1.2633403539657593, 1.31608247756958, 1.3688247203826904, 1.4215667247772217, 1.474308967590332, 1.5270509719848633, 1.579793095588684, 1.6325352191925049, 1.6852773427963257, 1.7380194664001465, 1.7907617092132568, 1.843503713607788, 1.8962459564208984, 1.9489880800247192]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 13.0, 3.0, 9.0, 11.0, 11.0, 9.0, 16.0, 10.0, 14.0, 16.0, 11.0, 28.0, 21.0, 22.0, 28.0, 22.0, 25.0, 32.0, 45.0, 29.0, 35.0, 34.0, 37.0, 31.0, 41.0, 40.0, 35.0, 28.0, 31.0, 32.0, 24.0, 29.0, 40.0, 30.0, 16.0, 20.0, 11.0, 18.0, 12.0, 14.0, 7.0, 16.0, 19.0, 7.0, 2.0, 7.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8438077569007874, -0.815995991230011, -0.7881841659545898, -0.7603724002838135, -0.7325605750083923, -0.704748809337616, -0.6769369840621948, -0.6491252183914185, -0.6213134527206421, -0.5935016870498657, -0.5656898617744446, -0.5378780961036682, -0.5100662708282471, -0.4822545051574707, -0.45444270968437195, -0.4266309142112732, -0.39881908893585205, -0.3710072934627533, -0.34319549798965454, -0.3153837323188782, -0.28757190704345703, -0.25976014137268066, -0.2319483458995819, -0.20413655042648315, -0.1763247549533844, -0.14851295948028564, -0.12070117145776749, -0.09288938343524933, -0.06507758796215057, -0.03726579248905182, -0.009454011917114258, 0.018357783555984497, 0.04616951942443848, 0.07398131489753723, 0.10179310292005539, 0.12960489094257355, 0.1574166864156723, 0.18522848188877106, 0.21304026246070862, 0.24085205793380737, 0.26866385340690613, 0.2964756488800049, 0.32428744435310364, 0.3520992398262024, 0.37991100549697876, 0.4077228307723999, 0.43553459644317627, 0.463346391916275, 0.4911581873893738, 0.5189699530601501, 0.5467817783355713, 0.5745935440063477, 0.6024053692817688, 0.6302171349525452, 0.6580289602279663, 0.6858407258987427, 0.713652491569519, 0.7414642572402954, 0.7692760825157166, 0.7970878481864929, 0.8248996734619141, 0.8527114391326904, 0.8805232048034668, 0.9083350300788879, 0.9361468553543091]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 16.0, 11.0, 16.0, 22.0, 19.0, 29.0, 35.0, 36.0, 46.0, 67.0, 126.0, 153.0, 243.0, 422.0, 650.0, 1095.0, 2235.0, 5718.0, 31711.0, 1835508.0, 2266340.0, 38438.0, 5955.0, 2293.0, 1201.0, 664.0, 397.0, 214.0, 184.0, 107.0, 82.0, 48.0, 53.0, 30.0, 28.0, 16.0, 20.0, 12.0, 9.0, 9.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96923828125, -0.9358444213867188, -0.9024505615234375, -0.8690567016601562, -0.835662841796875, -0.8022689819335938, -0.7688751220703125, -0.7354812622070312, -0.70208740234375, -0.6686935424804688, -0.6352996826171875, -0.6019058227539062, -0.568511962890625, -0.5351181030273438, -0.5017242431640625, -0.46833038330078125, -0.4349365234375, -0.40154266357421875, -0.3681488037109375, -0.33475494384765625, -0.301361083984375, -0.26796722412109375, -0.2345733642578125, -0.20117950439453125, -0.16778564453125, -0.13439178466796875, -0.1009979248046875, -0.06760406494140625, -0.034210205078125, -0.00081634521484375, 0.0325775146484375, 0.06597137451171875, 0.099365234375, 0.13275909423828125, 0.1661529541015625, 0.19954681396484375, 0.232940673828125, 0.26633453369140625, 0.2997283935546875, 0.33312225341796875, 0.36651611328125, 0.39990997314453125, 0.4333038330078125, 0.46669769287109375, 0.500091552734375, 0.5334854125976562, 0.5668792724609375, 0.6002731323242188, 0.6336669921875, 0.6670608520507812, 0.7004547119140625, 0.7338485717773438, 0.767242431640625, 0.8006362915039062, 0.8340301513671875, 0.8674240112304688, 0.90081787109375, 0.9342117309570312, 0.9676055908203125, 1.0009994506835938, 1.034393310546875, 1.0677871704101562, 1.1011810302734375, 1.1345748901367188, 1.16796875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 7.0, 5.0, 7.0, 14.0, 14.0, 17.0, 19.0, 26.0, 24.0, 23.0, 34.0, 45.0, 41.0, 62.0, 53.0, 52.0, 50.0, 51.0, 53.0, 68.0, 48.0, 46.0, 42.0, 41.0, 19.0, 32.0, 26.0, 12.0, 17.0, 8.0, 9.0, 11.0, 3.0, 8.0, 5.0, 4.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340087890625, -0.3283653259277344, -0.31664276123046875, -0.3049201965332031, -0.2931976318359375, -0.2814750671386719, -0.26975250244140625, -0.2580299377441406, -0.246307373046875, -0.23458480834960938, -0.22286224365234375, -0.21113967895507812, -0.1994171142578125, -0.18769454956054688, -0.17597198486328125, -0.16424942016601562, -0.15252685546875, -0.14080429077148438, -0.12908172607421875, -0.11735916137695312, -0.1056365966796875, -0.09391403198242188, -0.08219146728515625, -0.07046890258789062, -0.058746337890625, -0.047023773193359375, -0.03530120849609375, -0.023578643798828125, -0.0118560791015625, -0.000133514404296875, 0.01158905029296875, 0.023311614990234375, 0.0350341796875, 0.046756744384765625, 0.05847930908203125, 0.07020187377929688, 0.0819244384765625, 0.09364700317382812, 0.10536956787109375, 0.11709213256835938, 0.128814697265625, 0.14053726196289062, 0.15225982666015625, 0.16398239135742188, 0.1757049560546875, 0.18742752075195312, 0.19915008544921875, 0.21087265014648438, 0.22259521484375, 0.23431777954101562, 0.24604034423828125, 0.2577629089355469, 0.2694854736328125, 0.2812080383300781, 0.29293060302734375, 0.3046531677246094, 0.316375732421875, 0.3280982971191406, 0.33982086181640625, 0.3515434265136719, 0.3632659912109375, 0.3749885559082031, 0.38671112060546875, 0.3984336853027344, 0.41015625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 7.0, 10.0, 15.0, 23.0, 45.0, 45.0, 81.0, 147.0, 250.0, 543.0, 1119.0, 2638.0, 8344.0, 44778.0, 3008414.0, 1086484.0, 30774.0, 6609.0, 2135.0, 862.0, 412.0, 232.0, 105.0, 67.0, 42.0, 28.0, 22.0, 16.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9650344848632812, -0.9373931884765625, -0.9097518920898438, -0.882110595703125, -0.8544692993164062, -0.8268280029296875, -0.7991867065429688, -0.77154541015625, -0.7439041137695312, -0.7162628173828125, -0.6886215209960938, -0.660980224609375, -0.6333389282226562, -0.6056976318359375, -0.5780563354492188, -0.5504150390625, -0.5227737426757812, -0.4951324462890625, -0.46749114990234375, -0.439849853515625, -0.41220855712890625, -0.3845672607421875, -0.35692596435546875, -0.32928466796875, -0.30164337158203125, -0.2740020751953125, -0.24636077880859375, -0.218719482421875, -0.19107818603515625, -0.1634368896484375, -0.13579559326171875, -0.108154296875, -0.08051300048828125, -0.0528717041015625, -0.02523040771484375, 0.002410888671875, 0.03005218505859375, 0.0576934814453125, 0.08533477783203125, 0.11297607421875, 0.14061737060546875, 0.1682586669921875, 0.19589996337890625, 0.223541259765625, 0.25118255615234375, 0.2788238525390625, 0.30646514892578125, 0.3341064453125, 0.36174774169921875, 0.3893890380859375, 0.41703033447265625, 0.444671630859375, 0.47231292724609375, 0.4999542236328125, 0.5275955200195312, 0.55523681640625, 0.5828781127929688, 0.6105194091796875, 0.6381607055664062, 0.665802001953125, 0.6934432983398438, 0.7210845947265625, 0.7487258911132812, 0.7763671875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 10.0, 22.0, 16.0, 15.0, 49.0, 69.0, 157.0, 296.0, 574.0, 988.0, 877.0, 415.0, 241.0, 114.0, 66.0, 37.0, 27.0, 23.0, 15.0, 12.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1683349609375, -0.1618175506591797, -0.15530014038085938, -0.14878273010253906, -0.14226531982421875, -0.13574790954589844, -0.12923049926757812, -0.12271308898925781, -0.1161956787109375, -0.10967826843261719, -0.10316085815429688, -0.09664344787597656, -0.09012603759765625, -0.08360862731933594, -0.07709121704101562, -0.07057380676269531, -0.064056396484375, -0.05753898620605469, -0.051021575927734375, -0.04450416564941406, -0.03798675537109375, -0.03146934509277344, -0.024951934814453125, -0.018434524536132812, -0.0119171142578125, -0.0053997039794921875, 0.001117706298828125, 0.0076351165771484375, 0.01415252685546875, 0.020669937133789062, 0.027187347412109375, 0.03370475769042969, 0.04022216796875, 0.04673957824707031, 0.053256988525390625, 0.05977439880371094, 0.06629180908203125, 0.07280921936035156, 0.07932662963867188, 0.08584403991699219, 0.0923614501953125, 0.09887886047363281, 0.10539627075195312, 0.11191368103027344, 0.11843109130859375, 0.12494850158691406, 0.13146591186523438, 0.1379833221435547, 0.144500732421875, 0.1510181427001953, 0.15753555297851562, 0.16405296325683594, 0.17057037353515625, 0.17708778381347656, 0.18360519409179688, 0.1901226043701172, 0.1966400146484375, 0.2031574249267578, 0.20967483520507812, 0.21619224548339844, 0.22270965576171875, 0.22922706604003906, 0.23574447631835938, 0.2422618865966797, 0.248779296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 10.0, 15.0, 13.0, 44.0, 52.0, 139.0, 189.0, 185.0, 136.0, 92.0, 58.0, 31.0, 15.0, 7.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4539974927902222, -1.416054368019104, -1.3781112432479858, -1.3401682376861572, -1.302225112915039, -1.264281988143921, -1.2263388633728027, -1.1883957386016846, -1.1504526138305664, -1.1125094890594482, -1.07456636428833, -1.036623239517212, -0.9986801743507385, -0.9607371091842651, -0.922793984413147, -0.8848508596420288, -0.8469077944755554, -0.8089646697044373, -0.7710216045379639, -0.7330784797668457, -0.6951353549957275, -0.6571922302246094, -0.619249165058136, -0.5813060402870178, -0.5433629751205444, -0.5054198503494263, -0.4674767553806305, -0.4295336604118347, -0.39159053564071655, -0.3536474406719208, -0.315704345703125, -0.27776122093200684, -0.23981809616088867, -0.2018749862909317, -0.16393187642097473, -0.12598878145217896, -0.08804567158222198, -0.050102561712265015, -0.012159466743469238, 0.025783658027648926, 0.0637267529964447, 0.10166986286640167, 0.13961297273635864, 0.17755606770515442, 0.2154991775751114, 0.25344228744506836, 0.29138538241386414, 0.3293285071849823, 0.3672716021537781, 0.40521469712257385, 0.443157821893692, 0.4811009168624878, 0.519044041633606, 0.5569871664047241, 0.5949302315711975, 0.6328733563423157, 0.6708164215087891, 0.7087595462799072, 0.7467026114463806, 0.7846457362174988, 0.8225888609886169, 0.8605319261550903, 0.8984750509262085, 0.9364181756973267, 0.9743613004684448]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 2.0, 9.0, 3.0, 10.0, 11.0, 11.0, 13.0, 10.0, 18.0, 12.0, 20.0, 21.0, 22.0, 29.0, 40.0, 46.0, 41.0, 42.0, 35.0, 39.0, 44.0, 41.0, 34.0, 41.0, 42.0, 45.0, 47.0, 35.0, 35.0, 26.0, 31.0, 23.0, 31.0, 18.0, 11.0, 9.0, 10.0, 11.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3959617614746094, -0.3849647045135498, -0.37396761775016785, -0.3629705607891083, -0.3519735038280487, -0.34097644686698914, -0.3299793601036072, -0.3189823031425476, -0.30798524618148804, -0.29698818922042847, -0.2859911024570465, -0.27499404549598694, -0.26399698853492737, -0.2529999315738678, -0.24200284481048584, -0.23100578784942627, -0.2200087159872055, -0.20901164412498474, -0.19801458716392517, -0.1870175153017044, -0.17602045834064484, -0.16502338647842407, -0.1540263295173645, -0.14302925765514374, -0.13203218579292297, -0.1210351213812828, -0.11003805696964264, -0.09904098510742188, -0.0880439281463623, -0.07704685628414154, -0.06604979187250137, -0.055052727460861206, -0.044055670499801636, -0.03305860608816147, -0.022061539813876152, -0.011064473539590836, -6.740912795066833e-05, 0.010929655283689499, 0.021926723420619965, 0.03292378783226013, 0.0439208522439003, 0.054917916655540466, 0.06591498106718063, 0.0769120454788208, 0.08790911734104156, 0.09890617430210114, 0.1099032461643219, 0.12090031057596207, 0.13189737498760223, 0.142894446849823, 0.15389150381088257, 0.16488857567310333, 0.1758856326341629, 0.18688270449638367, 0.19787976145744324, 0.208876833319664, 0.21987390518188477, 0.23087097704410553, 0.2418680340051651, 0.25286510586738586, 0.26386216282844543, 0.274859219789505, 0.28585630655288696, 0.29685336351394653, 0.3078504204750061]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 9.0, 15.0, 23.0, 32.0, 59.0, 102.0, 181.0, 339.0, 677.0, 1483.0, 4088.0, 14162.0, 80342.0, 663418.0, 242384.0, 29971.0, 6967.0, 2318.0, 942.0, 443.0, 218.0, 131.0, 96.0, 44.0, 34.0, 14.0, 14.0, 8.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.1441783905029297, -0.13857650756835938, -0.13297462463378906, -0.12737274169921875, -0.12177085876464844, -0.11616897583007812, -0.11056709289550781, -0.1049652099609375, -0.09936332702636719, -0.09376144409179688, -0.08815956115722656, -0.08255767822265625, -0.07695579528808594, -0.07135391235351562, -0.06575202941894531, -0.060150146484375, -0.05454826354980469, -0.048946380615234375, -0.04334449768066406, -0.03774261474609375, -0.03214073181152344, -0.026538848876953125, -0.020936965942382812, -0.0153350830078125, -0.009733200073242188, -0.004131317138671875, 0.0014705657958984375, 0.00707244873046875, 0.012674331665039062, 0.018276214599609375, 0.023878097534179688, 0.02947998046875, 0.03508186340332031, 0.040683746337890625, 0.04628562927246094, 0.05188751220703125, 0.05748939514160156, 0.06309127807617188, 0.06869316101074219, 0.0742950439453125, 0.07989692687988281, 0.08549880981445312, 0.09110069274902344, 0.09670257568359375, 0.10230445861816406, 0.10790634155273438, 0.11350822448730469, 0.119110107421875, 0.12471199035644531, 0.13031387329101562, 0.13591575622558594, 0.14151763916015625, 0.14711952209472656, 0.15272140502929688, 0.1583232879638672, 0.1639251708984375, 0.1695270538330078, 0.17512893676757812, 0.18073081970214844, 0.18633270263671875, 0.19193458557128906, 0.19753646850585938, 0.2031383514404297, 0.208740234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 9.0, 7.0, 12.0, 11.0, 14.0, 9.0, 18.0, 30.0, 25.0, 38.0, 48.0, 53.0, 47.0, 54.0, 53.0, 63.0, 55.0, 58.0, 60.0, 43.0, 56.0, 38.0, 32.0, 36.0, 35.0, 28.0, 15.0, 10.0, 14.0, 4.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.286865234375, -0.2773017883300781, -0.26773834228515625, -0.2581748962402344, -0.2486114501953125, -0.23904800415039062, -0.22948455810546875, -0.21992111206054688, -0.210357666015625, -0.20079421997070312, -0.19123077392578125, -0.18166732788085938, -0.1721038818359375, -0.16254043579101562, -0.15297698974609375, -0.14341354370117188, -0.13385009765625, -0.12428665161132812, -0.11472320556640625, -0.10515975952148438, -0.0955963134765625, -0.08603286743164062, -0.07646942138671875, -0.06690597534179688, -0.057342529296875, -0.047779083251953125, -0.03821563720703125, -0.028652191162109375, -0.0190887451171875, -0.009525299072265625, 3.814697265625e-05, 0.009601593017578125, 0.0191650390625, 0.028728485107421875, 0.03829193115234375, 0.047855377197265625, 0.0574188232421875, 0.06698226928710938, 0.07654571533203125, 0.08610916137695312, 0.095672607421875, 0.10523605346679688, 0.11479949951171875, 0.12436294555664062, 0.1339263916015625, 0.14348983764648438, 0.15305328369140625, 0.16261672973632812, 0.17218017578125, 0.18174362182617188, 0.19130706787109375, 0.20087051391601562, 0.2104339599609375, 0.21999740600585938, 0.22956085205078125, 0.23912429809570312, 0.248687744140625, 0.2582511901855469, 0.26781463623046875, 0.2773780822753906, 0.2869415283203125, 0.2965049743652344, 0.30606842041015625, 0.3156318664550781, 0.3251953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 7.0, 14.0, 19.0, 25.0, 26.0, 53.0, 82.0, 100.0, 140.0, 183.0, 320.0, 514.0, 799.0, 1380.0, 2535.0, 5544.0, 14214.0, 47166.0, 210498.0, 534732.0, 166962.0, 39489.0, 12687.0, 5100.0, 2407.0, 1367.0, 763.0, 428.0, 310.0, 200.0, 142.0, 112.0, 66.0, 55.0, 25.0, 25.0, 19.0, 10.0, 12.0, 5.0, 1.0, 2.0, 5.0, 4.0, 3.0, 1.0], "bins": [-0.11151123046875, -0.10853195190429688, -0.10555267333984375, -0.10257339477539062, -0.0995941162109375, -0.09661483764648438, -0.09363555908203125, -0.09065628051757812, -0.087677001953125, -0.08469772338867188, -0.08171844482421875, -0.07873916625976562, -0.0757598876953125, -0.07278060913085938, -0.06980133056640625, -0.06682205200195312, -0.0638427734375, -0.060863494873046875, -0.05788421630859375, -0.054904937744140625, -0.0519256591796875, -0.048946380615234375, -0.04596710205078125, -0.042987823486328125, -0.040008544921875, -0.037029266357421875, -0.03404998779296875, -0.031070709228515625, -0.0280914306640625, -0.025112152099609375, -0.02213287353515625, -0.019153594970703125, -0.01617431640625, -0.013195037841796875, -0.01021575927734375, -0.007236480712890625, -0.0042572021484375, -0.001277923583984375, 0.00170135498046875, 0.004680633544921875, 0.007659912109375, 0.010639190673828125, 0.01361846923828125, 0.016597747802734375, 0.0195770263671875, 0.022556304931640625, 0.02553558349609375, 0.028514862060546875, 0.031494140625, 0.034473419189453125, 0.03745269775390625, 0.040431976318359375, 0.0434112548828125, 0.046390533447265625, 0.04936981201171875, 0.052349090576171875, 0.055328369140625, 0.058307647705078125, 0.06128692626953125, 0.06426620483398438, 0.0672454833984375, 0.07022476196289062, 0.07320404052734375, 0.07618331909179688, 0.07916259765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 4.0, 10.0, 7.0, 10.0, 19.0, 18.0, 27.0, 25.0, 28.0, 40.0, 36.0, 35.0, 37.0, 45.0, 59.0, 48.0, 53.0, 55.0, 52.0, 47.0, 51.0, 39.0, 39.0, 38.0, 31.0, 23.0, 18.0, 23.0, 10.0, 18.0, 8.0, 5.0, 10.0, 5.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4663810729980469, -0.45058441162109375, -0.4347877502441406, -0.4189910888671875, -0.4031944274902344, -0.38739776611328125, -0.3716011047363281, -0.355804443359375, -0.3400077819824219, -0.32421112060546875, -0.3084144592285156, -0.2926177978515625, -0.2768211364746094, -0.26102447509765625, -0.24522781372070312, -0.22943115234375, -0.21363449096679688, -0.19783782958984375, -0.18204116821289062, -0.1662445068359375, -0.15044784545898438, -0.13465118408203125, -0.11885452270507812, -0.103057861328125, -0.08726119995117188, -0.07146453857421875, -0.055667877197265625, -0.0398712158203125, -0.024074554443359375, -0.00827789306640625, 0.007518768310546875, 0.0233154296875, 0.039112091064453125, 0.05490875244140625, 0.07070541381835938, 0.0865020751953125, 0.10229873657226562, 0.11809539794921875, 0.13389205932617188, 0.149688720703125, 0.16548538208007812, 0.18128204345703125, 0.19707870483398438, 0.2128753662109375, 0.22867202758789062, 0.24446868896484375, 0.2602653503417969, 0.27606201171875, 0.2918586730957031, 0.30765533447265625, 0.3234519958496094, 0.3392486572265625, 0.3550453186035156, 0.37084197998046875, 0.3866386413574219, 0.402435302734375, 0.4182319641113281, 0.43402862548828125, 0.4498252868652344, 0.4656219482421875, 0.4814186096191406, 0.49721527099609375, 0.5130119323730469, 0.52880859375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 17.0, 17.0, 28.0, 44.0, 52.0, 101.0, 162.0, 258.0, 478.0, 998.0, 2073.0, 4651.0, 12838.0, 45234.0, 230089.0, 557710.0, 144950.0, 31728.0, 9828.0, 3766.0, 1625.0, 833.0, 425.0, 216.0, 155.0, 86.0, 53.0, 36.0, 28.0, 10.0, 12.0, 14.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03021240234375, -0.029249191284179688, -0.028285980224609375, -0.027322769165039062, -0.02635955810546875, -0.025396347045898438, -0.024433135986328125, -0.023469924926757812, -0.0225067138671875, -0.021543502807617188, -0.020580291748046875, -0.019617080688476562, -0.01865386962890625, -0.017690658569335938, -0.016727447509765625, -0.015764236450195312, -0.014801025390625, -0.013837814331054688, -0.012874603271484375, -0.011911392211914062, -0.01094818115234375, -0.009984970092773438, -0.009021759033203125, -0.008058547973632812, -0.0070953369140625, -0.0061321258544921875, -0.005168914794921875, -0.0042057037353515625, -0.00324249267578125, -0.0022792816162109375, -0.001316070556640625, -0.0003528594970703125, 0.0006103515625, 0.0015735626220703125, 0.002536773681640625, 0.0034999847412109375, 0.00446319580078125, 0.0054264068603515625, 0.006389617919921875, 0.0073528289794921875, 0.0083160400390625, 0.009279251098632812, 0.010242462158203125, 0.011205673217773438, 0.01216888427734375, 0.013132095336914062, 0.014095306396484375, 0.015058517456054688, 0.016021728515625, 0.016984939575195312, 0.017948150634765625, 0.018911361694335938, 0.01987457275390625, 0.020837783813476562, 0.021800994873046875, 0.022764205932617188, 0.0237274169921875, 0.024690628051757812, 0.025653839111328125, 0.026617050170898438, 0.02758026123046875, 0.028543472290039062, 0.029506683349609375, 0.030469894409179688, 0.03143310546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 1.0, 5.0, 8.0, 7.0, 22.0, 12.0, 32.0, 38.0, 49.0, 65.0, 94.0, 112.0, 110.0, 110.0, 71.0, 69.0, 52.0, 31.0, 30.0, 20.0, 18.0, 7.0, 9.0, 7.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.4781951904296875e-05, -1.4241784811019897e-05, -1.370161771774292e-05, -1.3161450624465942e-05, -1.2621283531188965e-05, -1.2081116437911987e-05, -1.154094934463501e-05, -1.1000782251358032e-05, -1.0460615158081055e-05, -9.920448064804077e-06, -9.3802809715271e-06, -8.840113878250122e-06, -8.299946784973145e-06, -7.759779691696167e-06, -7.2196125984191895e-06, -6.679445505142212e-06, -6.139278411865234e-06, -5.599111318588257e-06, -5.058944225311279e-06, -4.518777132034302e-06, -3.978610038757324e-06, -3.4384429454803467e-06, -2.898275852203369e-06, -2.3581087589263916e-06, -1.817941665649414e-06, -1.2777745723724365e-06, -7.37607479095459e-07, -1.9744038581848145e-07, 3.427267074584961e-07, 8.828938007354736e-07, 1.4230608940124512e-06, 1.9632279872894287e-06, 2.5033950805664062e-06, 3.043562173843384e-06, 3.5837292671203613e-06, 4.123896360397339e-06, 4.664063453674316e-06, 5.204230546951294e-06, 5.7443976402282715e-06, 6.284564733505249e-06, 6.8247318267822266e-06, 7.364898920059204e-06, 7.905066013336182e-06, 8.44523310661316e-06, 8.985400199890137e-06, 9.525567293167114e-06, 1.0065734386444092e-05, 1.060590147972107e-05, 1.1146068572998047e-05, 1.1686235666275024e-05, 1.2226402759552002e-05, 1.276656985282898e-05, 1.3306736946105957e-05, 1.3846904039382935e-05, 1.4387071132659912e-05, 1.492723822593689e-05, 1.5467405319213867e-05, 1.6007572412490845e-05, 1.6547739505767822e-05, 1.70879065990448e-05, 1.7628073692321777e-05, 1.8168240785598755e-05, 1.8708407878875732e-05, 1.924857497215271e-05, 1.9788742065429688e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 13.0, 15.0, 18.0, 37.0, 46.0, 84.0, 121.0, 160.0, 287.0, 466.0, 766.0, 1242.0, 2375.0, 4582.0, 8882.0, 19570.0, 46646.0, 123927.0, 304241.0, 314509.0, 130991.0, 49634.0, 20278.0, 9289.0, 4528.0, 2439.0, 1314.0, 780.0, 463.0, 302.0, 182.0, 112.0, 74.0, 57.0, 42.0, 27.0, 19.0, 8.0, 7.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017547607421875, -0.016921520233154297, -0.016295433044433594, -0.01566934585571289, -0.015043258666992188, -0.014417171478271484, -0.013791084289550781, -0.013164997100830078, -0.012538909912109375, -0.011912822723388672, -0.011286735534667969, -0.010660648345947266, -0.010034561157226562, -0.00940847396850586, -0.008782386779785156, -0.008156299591064453, -0.00753021240234375, -0.006904125213623047, -0.006278038024902344, -0.005651950836181641, -0.0050258636474609375, -0.004399776458740234, -0.0037736892700195312, -0.003147602081298828, -0.002521514892578125, -0.0018954277038574219, -0.0012693405151367188, -0.0006432533264160156, -1.71661376953125e-05, 0.0006089210510253906, 0.0012350082397460938, 0.0018610954284667969, 0.0024871826171875, 0.003113269805908203, 0.0037393569946289062, 0.004365444183349609, 0.0049915313720703125, 0.005617618560791016, 0.006243705749511719, 0.006869792938232422, 0.007495880126953125, 0.008121967315673828, 0.008748054504394531, 0.009374141693115234, 0.010000228881835938, 0.01062631607055664, 0.011252403259277344, 0.011878490447998047, 0.01250457763671875, 0.013130664825439453, 0.013756752014160156, 0.01438283920288086, 0.015008926391601562, 0.015635013580322266, 0.01626110076904297, 0.016887187957763672, 0.017513275146484375, 0.018139362335205078, 0.01876544952392578, 0.019391536712646484, 0.020017623901367188, 0.02064371109008789, 0.021269798278808594, 0.021895885467529297, 0.02252197265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 7.0, 6.0, 14.0, 18.0, 14.0, 20.0, 23.0, 31.0, 35.0, 40.0, 59.0, 54.0, 77.0, 79.0, 51.0, 69.0, 74.0, 52.0, 48.0, 51.0, 24.0, 38.0, 30.0, 24.0, 12.0, 10.0, 8.0, 9.0, 7.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00891876220703125, -0.008684635162353516, -0.008450508117675781, -0.008216381072998047, -0.007982254028320312, -0.007748126983642578, -0.007513999938964844, -0.007279872894287109, -0.007045745849609375, -0.006811618804931641, -0.006577491760253906, -0.006343364715576172, -0.0061092376708984375, -0.005875110626220703, -0.005640983581542969, -0.005406856536865234, -0.0051727294921875, -0.004938602447509766, -0.004704475402832031, -0.004470348358154297, -0.0042362213134765625, -0.004002094268798828, -0.0037679672241210938, -0.0035338401794433594, -0.003299713134765625, -0.0030655860900878906, -0.0028314590454101562, -0.002597332000732422, -0.0023632049560546875, -0.002129077911376953, -0.0018949508666992188, -0.0016608238220214844, -0.00142669677734375, -0.0011925697326660156, -0.0009584426879882812, -0.0007243156433105469, -0.0004901885986328125, -0.0002560615539550781, -2.193450927734375e-05, 0.00021219253540039062, 0.000446319580078125, 0.0006804466247558594, 0.0009145736694335938, 0.0011487007141113281, 0.0013828277587890625, 0.0016169548034667969, 0.0018510818481445312, 0.0020852088928222656, 0.0023193359375, 0.0025534629821777344, 0.0027875900268554688, 0.003021717071533203, 0.0032558441162109375, 0.003489971160888672, 0.0037240982055664062, 0.003958225250244141, 0.004192352294921875, 0.004426479339599609, 0.004660606384277344, 0.004894733428955078, 0.0051288604736328125, 0.005362987518310547, 0.005597114562988281, 0.005831241607666016, 0.00606536865234375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 13.0, 44.0, 51.0, 104.0, 159.0, 174.0, 157.0, 104.0, 61.0, 43.0, 19.0, 19.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.8640743494033813, -0.8442875146865845, -0.8245007395744324, -0.8047139048576355, -0.7849271297454834, -0.7651402950286865, -0.7453534603118896, -0.7255666255950928, -0.7057798504829407, -0.6859930157661438, -0.6662062406539917, -0.6464194059371948, -0.626632571220398, -0.6068457961082458, -0.587058961391449, -0.5672721862792969, -0.5474853515625, -0.5276985168457031, -0.507911741733551, -0.48812490701675415, -0.46833810210227966, -0.4485512971878052, -0.4287644624710083, -0.4089776575565338, -0.3891908526420593, -0.36940404772758484, -0.34961724281311035, -0.3298304080963135, -0.310043603181839, -0.2902567982673645, -0.2704699635505676, -0.25068315863609314, -0.23089641332626343, -0.21110960841178894, -0.19132278859615326, -0.17153596878051758, -0.1517491638660431, -0.1319623589515686, -0.11217553913593292, -0.09238871932029724, -0.07260191440582275, -0.05281510204076767, -0.033028289675712585, -0.013241477310657501, 0.006545335054397583, 0.026332147419452667, 0.04611895978450775, 0.06590577960014343, 0.08569258451461792, 0.105479396879673, 0.1252662092447281, 0.14505302906036377, 0.16483983397483826, 0.18462663888931274, 0.20441345870494843, 0.2242002785205841, 0.2439870834350586, 0.2637738883495331, 0.28356069326400757, 0.30334752798080444, 0.32313433289527893, 0.3429211378097534, 0.3627079725265503, 0.3824947774410248, 0.40228158235549927]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 10.0, 6.0, 3.0, 10.0, 7.0, 16.0, 11.0, 15.0, 15.0, 19.0, 27.0, 28.0, 35.0, 46.0, 42.0, 60.0, 53.0, 41.0, 50.0, 43.0, 62.0, 53.0, 57.0, 43.0, 48.0, 32.0, 43.0, 33.0, 22.0, 17.0, 12.0, 14.0, 8.0, 6.0, 4.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2526215612888336, -0.24417267739772797, -0.23572379350662231, -0.22727490961551666, -0.218826025724411, -0.21037714183330536, -0.2019282579421997, -0.19347938895225525, -0.1850304901599884, -0.17658160626888275, -0.1681327223777771, -0.15968383848667145, -0.1512349545955658, -0.14278607070446014, -0.1343371868133545, -0.12588831782341003, -0.11743943393230438, -0.10899055004119873, -0.10054166615009308, -0.09209278225898743, -0.08364389836788177, -0.07519501447677612, -0.06674613803625107, -0.058297254145145416, -0.049848370254039764, -0.04139948636293411, -0.03295060247182846, -0.024501722306013107, -0.016052838414907455, -0.007603954523801804, 0.0008449256420135498, 0.009293809533119202, 0.017742693424224854, 0.026191577315330505, 0.03464046120643616, 0.04308934137225151, 0.05153822526335716, 0.059987109154462814, 0.06843598932027817, 0.07688487321138382, 0.08533375710248947, 0.09378264099359512, 0.10223152488470078, 0.11068040132522583, 0.11912928521633148, 0.12757816910743713, 0.13602705299854279, 0.14447593688964844, 0.1529248207807541, 0.16137370467185974, 0.1698225885629654, 0.17827147245407104, 0.1867203563451767, 0.19516924023628235, 0.2036181092262268, 0.21206700801849365, 0.2205158770084381, 0.22896476089954376, 0.23741364479064941, 0.24586252868175507, 0.2543114125728607, 0.2627602815628052, 0.271209180355072, 0.2796580493450165, 0.2881069481372833]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 12.0, 11.0, 18.0, 23.0, 28.0, 50.0, 69.0, 88.0, 118.0, 202.0, 273.0, 448.0, 699.0, 1246.0, 2173.0, 4392.0, 8942.0, 21255.0, 56364.0, 244036.0, 559658.0, 92269.0, 30941.0, 12612.0, 5724.0, 2887.0, 1552.0, 834.0, 548.0, 308.0, 229.0, 160.0, 107.0, 76.0, 50.0, 32.0, 26.0, 24.0, 23.0, 12.0, 9.0, 3.0, 5.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.196044921875, -0.19031333923339844, -0.18458175659179688, -0.1788501739501953, -0.17311859130859375, -0.1673870086669922, -0.16165542602539062, -0.15592384338378906, -0.1501922607421875, -0.14446067810058594, -0.13872909545898438, -0.1329975128173828, -0.12726593017578125, -0.12153434753417969, -0.11580276489257812, -0.11007118225097656, -0.104339599609375, -0.09860801696777344, -0.09287643432617188, -0.08714485168457031, -0.08141326904296875, -0.07568168640136719, -0.06995010375976562, -0.06421852111816406, -0.0584869384765625, -0.05275535583496094, -0.047023773193359375, -0.04129219055175781, -0.03556060791015625, -0.029829025268554688, -0.024097442626953125, -0.018365859985351562, -0.01263427734375, -0.0069026947021484375, -0.001171112060546875, 0.0045604705810546875, 0.01029205322265625, 0.016023635864257812, 0.021755218505859375, 0.027486801147460938, 0.0332183837890625, 0.03894996643066406, 0.044681549072265625, 0.05041313171386719, 0.05614471435546875, 0.06187629699707031, 0.06760787963867188, 0.07333946228027344, 0.079071044921875, 0.08480262756347656, 0.09053421020507812, 0.09626579284667969, 0.10199737548828125, 0.10772895812988281, 0.11346054077148438, 0.11919212341308594, 0.1249237060546875, 0.13065528869628906, 0.13638687133789062, 0.1421184539794922, 0.14785003662109375, 0.1535816192626953, 0.15931320190429688, 0.16504478454589844, 0.1707763671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 5.0, 6.0, 8.0, 11.0, 14.0, 10.0, 18.0, 17.0, 18.0, 28.0, 34.0, 54.0, 50.0, 66.0, 47.0, 56.0, 66.0, 50.0, 58.0, 60.0, 63.0, 50.0, 29.0, 44.0, 24.0, 34.0, 18.0, 14.0, 13.0, 5.0, 6.0, 3.0, 6.0, 2.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.5216445922851562, -0.5027618408203125, -0.48387908935546875, -0.464996337890625, -0.44611358642578125, -0.4272308349609375, -0.40834808349609375, -0.38946533203125, -0.37058258056640625, -0.3516998291015625, -0.33281707763671875, -0.313934326171875, -0.29505157470703125, -0.2761688232421875, -0.25728607177734375, -0.2384033203125, -0.21952056884765625, -0.2006378173828125, -0.18175506591796875, -0.162872314453125, -0.14398956298828125, -0.1251068115234375, -0.10622406005859375, -0.08734130859375, -0.06845855712890625, -0.0495758056640625, -0.03069305419921875, -0.011810302734375, 0.00707244873046875, 0.0259552001953125, 0.04483795166015625, 0.063720703125, 0.08260345458984375, 0.1014862060546875, 0.12036895751953125, 0.139251708984375, 0.15813446044921875, 0.1770172119140625, 0.19589996337890625, 0.21478271484375, 0.23366546630859375, 0.2525482177734375, 0.27143096923828125, 0.290313720703125, 0.30919647216796875, 0.3280792236328125, 0.34696197509765625, 0.3658447265625, 0.38472747802734375, 0.4036102294921875, 0.42249298095703125, 0.441375732421875, 0.46025848388671875, 0.4791412353515625, 0.49802398681640625, 0.51690673828125, 0.5357894897460938, 0.5546722412109375, 0.5735549926757812, 0.592437744140625, 0.6113204956054688, 0.6302032470703125, 0.6490859985351562, 0.66796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 9.0, 8.0, 8.0, 12.0, 10.0, 22.0, 17.0, 20.0, 37.0, 49.0, 66.0, 80.0, 139.0, 404.0, 2014.0, 46598.0, 970749.0, 25869.0, 1553.0, 382.0, 140.0, 93.0, 49.0, 42.0, 34.0, 34.0, 15.0, 20.0, 24.0, 16.0, 8.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.80517578125, -0.7824478149414062, -0.7597198486328125, -0.7369918823242188, -0.714263916015625, -0.6915359497070312, -0.6688079833984375, -0.6460800170898438, -0.62335205078125, -0.6006240844726562, -0.5778961181640625, -0.5551681518554688, -0.532440185546875, -0.5097122192382812, -0.4869842529296875, -0.46425628662109375, -0.4415283203125, -0.41880035400390625, -0.3960723876953125, -0.37334442138671875, -0.350616455078125, -0.32788848876953125, -0.3051605224609375, -0.28243255615234375, -0.25970458984375, -0.23697662353515625, -0.2142486572265625, -0.19152069091796875, -0.168792724609375, -0.14606475830078125, -0.1233367919921875, -0.10060882568359375, -0.077880859375, -0.05515289306640625, -0.0324249267578125, -0.00969696044921875, 0.013031005859375, 0.03575897216796875, 0.0584869384765625, 0.08121490478515625, 0.10394287109375, 0.12667083740234375, 0.1493988037109375, 0.17212677001953125, 0.194854736328125, 0.21758270263671875, 0.2403106689453125, 0.26303863525390625, 0.2857666015625, 0.30849456787109375, 0.3312225341796875, 0.35395050048828125, 0.376678466796875, 0.39940643310546875, 0.4221343994140625, 0.44486236572265625, 0.46759033203125, 0.49031829833984375, 0.5130462646484375, 0.5357742309570312, 0.558502197265625, 0.5812301635742188, 0.6039581298828125, 0.6266860961914062, 0.6494140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 6.0, 7.0, 13.0, 5.0, 10.0, 6.0, 15.0, 12.0, 14.0, 23.0, 28.0, 39.0, 34.0, 47.0, 45.0, 51.0, 64.0, 60.0, 53.0, 54.0, 57.0, 51.0, 44.0, 53.0, 39.0, 26.0, 22.0, 25.0, 19.0, 24.0, 13.0, 12.0, 9.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61279296875, -0.59356689453125, -0.5743408203125, -0.55511474609375, -0.535888671875, -0.51666259765625, -0.4974365234375, -0.47821044921875, -0.458984375, -0.43975830078125, -0.4205322265625, -0.40130615234375, -0.382080078125, -0.36285400390625, -0.3436279296875, -0.32440185546875, -0.30517578125, -0.28594970703125, -0.2667236328125, -0.24749755859375, -0.228271484375, -0.20904541015625, -0.1898193359375, -0.17059326171875, -0.1513671875, -0.13214111328125, -0.1129150390625, -0.09368896484375, -0.074462890625, -0.05523681640625, -0.0360107421875, -0.01678466796875, 0.00244140625, 0.02166748046875, 0.0408935546875, 0.06011962890625, 0.079345703125, 0.09857177734375, 0.1177978515625, 0.13702392578125, 0.15625, 0.17547607421875, 0.1947021484375, 0.21392822265625, 0.233154296875, 0.25238037109375, 0.2716064453125, 0.29083251953125, 0.31005859375, 0.32928466796875, 0.3485107421875, 0.36773681640625, 0.386962890625, 0.40618896484375, 0.4254150390625, 0.44464111328125, 0.4638671875, 0.48309326171875, 0.5023193359375, 0.52154541015625, 0.540771484375, 0.55999755859375, 0.5792236328125, 0.59844970703125, 0.61767578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 7.0, 8.0, 15.0, 25.0, 45.0, 99.0, 212.0, 552.0, 1684.0, 9674.0, 318866.0, 702227.0, 12258.0, 1840.0, 566.0, 261.0, 87.0, 58.0, 19.0, 21.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.14550018310546875, -0.1389007568359375, -0.13230133056640625, -0.125701904296875, -0.11910247802734375, -0.1125030517578125, -0.10590362548828125, -0.09930419921875, -0.09270477294921875, -0.0861053466796875, -0.07950592041015625, -0.072906494140625, -0.06630706787109375, -0.0597076416015625, -0.05310821533203125, -0.0465087890625, -0.03990936279296875, -0.0333099365234375, -0.02671051025390625, -0.020111083984375, -0.01351165771484375, -0.0069122314453125, -0.00031280517578125, 0.00628662109375, 0.01288604736328125, 0.0194854736328125, 0.02608489990234375, 0.032684326171875, 0.03928375244140625, 0.0458831787109375, 0.05248260498046875, 0.05908203125, 0.06568145751953125, 0.0722808837890625, 0.07888031005859375, 0.085479736328125, 0.09207916259765625, 0.0986785888671875, 0.10527801513671875, 0.11187744140625, 0.11847686767578125, 0.1250762939453125, 0.13167572021484375, 0.138275146484375, 0.14487457275390625, 0.1514739990234375, 0.15807342529296875, 0.1646728515625, 0.17127227783203125, 0.1778717041015625, 0.18447113037109375, 0.191070556640625, 0.19766998291015625, 0.2042694091796875, 0.21086883544921875, 0.21746826171875, 0.22406768798828125, 0.2306671142578125, 0.23726654052734375, 0.243865966796875, 0.25046539306640625, 0.2570648193359375, 0.26366424560546875, 0.270263671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 7.0, 2.0, 8.0, 15.0, 19.0, 20.0, 30.0, 41.0, 76.0, 212.0, 291.0, 98.0, 50.0, 41.0, 19.0, 16.0, 20.0, 14.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4497509002685547e-05, -2.3801811039447784e-05, -2.3106113076210022e-05, -2.241041511297226e-05, -2.1714717149734497e-05, -2.1019019186496735e-05, -2.0323321223258972e-05, -1.962762326002121e-05, -1.8931925296783447e-05, -1.8236227333545685e-05, -1.7540529370307922e-05, -1.684483140707016e-05, -1.6149133443832397e-05, -1.5453435480594635e-05, -1.4757737517356873e-05, -1.406203955411911e-05, -1.3366341590881348e-05, -1.2670643627643585e-05, -1.1974945664405823e-05, -1.127924770116806e-05, -1.0583549737930298e-05, -9.887851774692535e-06, -9.192153811454773e-06, -8.49645584821701e-06, -7.800757884979248e-06, -7.105059921741486e-06, -6.409361958503723e-06, -5.713663995265961e-06, -5.017966032028198e-06, -4.322268068790436e-06, -3.6265701055526733e-06, -2.930872142314911e-06, -2.2351741790771484e-06, -1.539476215839386e-06, -8.437782526016235e-07, -1.4808028936386108e-07, 5.476176738739014e-07, 1.2433156371116638e-06, 1.9390136003494263e-06, 2.6347115635871887e-06, 3.330409526824951e-06, 4.026107490062714e-06, 4.721805453300476e-06, 5.4175034165382385e-06, 6.113201379776001e-06, 6.8088993430137634e-06, 7.504597306251526e-06, 8.200295269489288e-06, 8.89599323272705e-06, 9.591691195964813e-06, 1.0287389159202576e-05, 1.0983087122440338e-05, 1.16787850856781e-05, 1.2374483048915863e-05, 1.3070181012153625e-05, 1.3765878975391388e-05, 1.446157693862915e-05, 1.5157274901866913e-05, 1.5852972865104675e-05, 1.6548670828342438e-05, 1.72443687915802e-05, 1.7940066754817963e-05, 1.8635764718055725e-05, 1.9331462681293488e-05, 2.002716064453125e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 7.0, 12.0, 18.0, 36.0, 42.0, 63.0, 72.0, 139.0, 195.0, 318.0, 559.0, 1172.0, 3501.0, 24299.0, 855156.0, 149600.0, 9192.0, 2107.0, 779.0, 470.0, 257.0, 179.0, 119.0, 77.0, 64.0, 43.0, 19.0, 18.0, 13.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.26708984375, -0.2606983184814453, -0.2543067932128906, -0.24791526794433594, -0.24152374267578125, -0.23513221740722656, -0.22874069213867188, -0.2223491668701172, -0.2159576416015625, -0.2095661163330078, -0.20317459106445312, -0.19678306579589844, -0.19039154052734375, -0.18400001525878906, -0.17760848999023438, -0.1712169647216797, -0.164825439453125, -0.1584339141845703, -0.15204238891601562, -0.14565086364746094, -0.13925933837890625, -0.13286781311035156, -0.12647628784179688, -0.12008476257324219, -0.1136932373046875, -0.10730171203613281, -0.10091018676757812, -0.09451866149902344, -0.08812713623046875, -0.08173561096191406, -0.07534408569335938, -0.06895256042480469, -0.06256103515625, -0.05616950988769531, -0.049777984619140625, -0.04338645935058594, -0.03699493408203125, -0.030603408813476562, -0.024211883544921875, -0.017820358276367188, -0.0114288330078125, -0.0050373077392578125, 0.001354217529296875, 0.0077457427978515625, 0.01413726806640625, 0.020528793334960938, 0.026920318603515625, 0.03331184387207031, 0.039703369140625, 0.04609489440917969, 0.052486419677734375, 0.05887794494628906, 0.06526947021484375, 0.07166099548339844, 0.07805252075195312, 0.08444404602050781, 0.0908355712890625, 0.09722709655761719, 0.10361862182617188, 0.11001014709472656, 0.11640167236328125, 0.12279319763183594, 0.12918472290039062, 0.1355762481689453, 0.1419677734375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 8.0, 13.0, 20.0, 25.0, 36.0, 48.0, 66.0, 114.0, 311.0, 107.0, 64.0, 47.0, 32.0, 28.0, 21.0, 9.0, 8.0, 9.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0455322265625, -0.04398965835571289, -0.04244709014892578, -0.04090452194213867, -0.03936195373535156, -0.03781938552856445, -0.036276817321777344, -0.034734249114990234, -0.033191680908203125, -0.031649112701416016, -0.030106544494628906, -0.028563976287841797, -0.027021408081054688, -0.025478839874267578, -0.02393627166748047, -0.02239370346069336, -0.02085113525390625, -0.01930856704711914, -0.01776599884033203, -0.016223430633544922, -0.014680862426757812, -0.013138294219970703, -0.011595726013183594, -0.010053157806396484, -0.008510589599609375, -0.006968021392822266, -0.005425453186035156, -0.003882884979248047, -0.0023403167724609375, -0.0007977485656738281, 0.0007448196411132812, 0.0022873878479003906, 0.0038299560546875, 0.005372524261474609, 0.006915092468261719, 0.008457660675048828, 0.010000228881835938, 0.011542797088623047, 0.013085365295410156, 0.014627933502197266, 0.016170501708984375, 0.017713069915771484, 0.019255638122558594, 0.020798206329345703, 0.022340774536132812, 0.023883342742919922, 0.02542591094970703, 0.02696847915649414, 0.02851104736328125, 0.03005361557006836, 0.03159618377685547, 0.03313875198364258, 0.03468132019042969, 0.0362238883972168, 0.037766456604003906, 0.039309024810791016, 0.040851593017578125, 0.042394161224365234, 0.043936729431152344, 0.04547929763793945, 0.04702186584472656, 0.04856443405151367, 0.05010700225830078, 0.05164957046508789, 0.053192138671875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 11.0, 19.0, 35.0, 85.0, 199.0, 253.0, 203.0, 92.0, 53.0, 25.0, 11.0, 9.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.837075710296631, -2.7774691581726074, -2.717862606048584, -2.6582562923431396, -2.598649740219116, -2.5390431880950928, -2.4794368743896484, -2.419830322265625, -2.3602237701416016, -2.300617218017578, -2.2410106658935547, -2.1814043521881104, -2.121797800064087, -2.0621912479400635, -2.002584934234619, -1.9429783821105957, -1.8833718299865723, -1.8237652778625488, -1.764158844947815, -1.704552412033081, -1.6449458599090576, -1.5853393077850342, -1.5257328748703003, -1.4661264419555664, -1.406519889831543, -1.3469133377075195, -1.2873069047927856, -1.2277004718780518, -1.1680939197540283, -1.1084873676300049, -1.048880934715271, -0.9892744421958923, -0.9296679496765137, -0.870061457157135, -0.8104549646377563, -0.7508484721183777, -0.691241979598999, -0.6316354870796204, -0.5720289945602417, -0.512422502040863, -0.4528160095214844, -0.3932095170021057, -0.33360302448272705, -0.2739965319633484, -0.21439003944396973, -0.15478354692459106, -0.0951770544052124, -0.03557056188583374, 0.024035930633544922, 0.08364242315292358, 0.14324891567230225, 0.2028554081916809, 0.26246190071105957, 0.32206839323043823, 0.3816748857498169, 0.44128137826919556, 0.5008878707885742, 0.5604943633079529, 0.6201008558273315, 0.6797073483467102, 0.7393138408660889, 0.7989203333854675, 0.8585268259048462, 0.9181333184242249, 0.9777398109436035]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 10.0, 10.0, 6.0, 12.0, 13.0, 13.0, 30.0, 16.0, 18.0, 26.0, 30.0, 27.0, 35.0, 32.0, 28.0, 37.0, 41.0, 37.0, 48.0, 40.0, 42.0, 55.0, 45.0, 37.0, 31.0, 32.0, 34.0, 30.0, 21.0, 19.0, 23.0, 17.0, 21.0, 12.0, 9.0, 15.0, 12.0, 8.0, 8.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7865099310874939, -0.7614437937736511, -0.7363776564598083, -0.7113115191459656, -0.6862453818321228, -0.66117924451828, -0.6361130475997925, -0.6110469102859497, -0.5859807729721069, -0.5609146356582642, -0.5358484983444214, -0.5107823610305786, -0.48571622371673584, -0.46065008640289307, -0.4355839192867279, -0.41051778197288513, -0.38545167446136475, -0.360385537147522, -0.3353193998336792, -0.3102532625198364, -0.28518712520599365, -0.2601209878921509, -0.23505482077598572, -0.20998868346214294, -0.18492254614830017, -0.1598564088344574, -0.13479027152061462, -0.10972411930561066, -0.08465798199176788, -0.05959184467792511, -0.03452569246292114, -0.00945955514907837, 0.01560664176940918, 0.04067278280854225, 0.06573892384767532, 0.0908050686120987, 0.11587120592594147, 0.14093734323978424, 0.1660034954547882, 0.19106963276863098, 0.21613577008247375, 0.24120190739631653, 0.2662680447101593, 0.29133421182632446, 0.31640034914016724, 0.34146648645401, 0.3665326237678528, 0.39159876108169556, 0.41666489839553833, 0.4417310357093811, 0.4667971730232239, 0.49186331033706665, 0.5169294476509094, 0.5419955849647522, 0.5670617818832397, 0.5921279191970825, 0.6171940565109253, 0.6422601938247681, 0.6673263311386108, 0.6923924684524536, 0.7174586057662964, 0.7425247430801392, 0.7675908803939819, 0.7926570177078247, 0.8177231550216675]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 10.0, 5.0, 11.0, 22.0, 18.0, 27.0, 37.0, 55.0, 81.0, 117.0, 172.0, 257.0, 393.0, 598.0, 1036.0, 2005.0, 4166.0, 14365.0, 147184.0, 3508166.0, 478432.0, 25545.0, 5891.0, 2398.0, 1238.0, 743.0, 417.0, 270.0, 196.0, 122.0, 88.0, 68.0, 47.0, 19.0, 24.0, 10.0, 10.0, 9.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.6826171875, -0.6587905883789062, -0.6349639892578125, -0.6111373901367188, -0.587310791015625, -0.5634841918945312, -0.5396575927734375, -0.5158309936523438, -0.49200439453125, -0.46817779541015625, -0.4443511962890625, -0.42052459716796875, -0.396697998046875, -0.37287139892578125, -0.3490447998046875, -0.32521820068359375, -0.3013916015625, -0.27756500244140625, -0.2537384033203125, -0.22991180419921875, -0.206085205078125, -0.18225860595703125, -0.1584320068359375, -0.13460540771484375, -0.11077880859375, -0.08695220947265625, -0.0631256103515625, -0.03929901123046875, -0.015472412109375, 0.00835418701171875, 0.0321807861328125, 0.05600738525390625, 0.079833984375, 0.10366058349609375, 0.1274871826171875, 0.15131378173828125, 0.175140380859375, 0.19896697998046875, 0.2227935791015625, 0.24662017822265625, 0.27044677734375, 0.29427337646484375, 0.3180999755859375, 0.34192657470703125, 0.365753173828125, 0.38957977294921875, 0.4134063720703125, 0.43723297119140625, 0.4610595703125, 0.48488616943359375, 0.5087127685546875, 0.5325393676757812, 0.556365966796875, 0.5801925659179688, 0.6040191650390625, 0.6278457641601562, 0.65167236328125, 0.6754989624023438, 0.6993255615234375, 0.7231521606445312, 0.746978759765625, 0.7708053588867188, 0.7946319580078125, 0.8184585571289062, 0.84228515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 11.0, 5.0, 3.0, 8.0, 6.0, 20.0, 22.0, 18.0, 36.0, 33.0, 36.0, 40.0, 42.0, 56.0, 53.0, 63.0, 65.0, 70.0, 74.0, 51.0, 53.0, 55.0, 37.0, 47.0, 25.0, 13.0, 18.0, 10.0, 8.0, 10.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370361328125, -0.3595390319824219, -0.34871673583984375, -0.3378944396972656, -0.3270721435546875, -0.3162498474121094, -0.30542755126953125, -0.2946052551269531, -0.283782958984375, -0.2729606628417969, -0.26213836669921875, -0.2513160705566406, -0.2404937744140625, -0.22967147827148438, -0.21884918212890625, -0.20802688598632812, -0.19720458984375, -0.18638229370117188, -0.17555999755859375, -0.16473770141601562, -0.1539154052734375, -0.14309310913085938, -0.13227081298828125, -0.12144851684570312, -0.110626220703125, -0.09980392456054688, -0.08898162841796875, -0.07815933227539062, -0.0673370361328125, -0.056514739990234375, -0.04569244384765625, -0.034870147705078125, -0.0240478515625, -0.013225555419921875, -0.00240325927734375, 0.008419036865234375, 0.0192413330078125, 0.030063629150390625, 0.04088592529296875, 0.051708221435546875, 0.062530517578125, 0.07335281372070312, 0.08417510986328125, 0.09499740600585938, 0.1058197021484375, 0.11664199829101562, 0.12746429443359375, 0.13828659057617188, 0.14910888671875, 0.15993118286132812, 0.17075347900390625, 0.18157577514648438, 0.1923980712890625, 0.20322036743164062, 0.21404266357421875, 0.22486495971679688, 0.235687255859375, 0.24650955200195312, 0.25733184814453125, 0.2681541442871094, 0.2789764404296875, 0.2897987365722656, 0.30062103271484375, 0.3114433288574219, 0.322265625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 13.0, 14.0, 21.0, 28.0, 28.0, 60.0, 116.0, 174.0, 354.0, 801.0, 2048.0, 6818.0, 41918.0, 3486077.0, 627117.0, 21514.0, 4472.0, 1479.0, 618.0, 235.0, 146.0, 84.0, 59.0, 23.0, 17.0, 11.0, 9.0, 12.0, 10.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.076171875, -1.046966552734375, -1.01776123046875, -0.988555908203125, -0.9593505859375, -0.930145263671875, -0.90093994140625, -0.871734619140625, -0.842529296875, -0.813323974609375, -0.78411865234375, -0.754913330078125, -0.7257080078125, -0.696502685546875, -0.66729736328125, -0.638092041015625, -0.60888671875, -0.579681396484375, -0.55047607421875, -0.521270751953125, -0.4920654296875, -0.462860107421875, -0.43365478515625, -0.404449462890625, -0.375244140625, -0.346038818359375, -0.31683349609375, -0.287628173828125, -0.2584228515625, -0.229217529296875, -0.20001220703125, -0.170806884765625, -0.1416015625, -0.112396240234375, -0.08319091796875, -0.053985595703125, -0.0247802734375, 0.004425048828125, 0.03363037109375, 0.062835693359375, 0.092041015625, 0.121246337890625, 0.15045166015625, 0.179656982421875, 0.2088623046875, 0.238067626953125, 0.26727294921875, 0.296478271484375, 0.32568359375, 0.354888916015625, 0.38409423828125, 0.413299560546875, 0.4425048828125, 0.471710205078125, 0.50091552734375, 0.530120849609375, 0.559326171875, 0.588531494140625, 0.61773681640625, 0.646942138671875, 0.6761474609375, 0.705352783203125, 0.73455810546875, 0.763763427734375, 0.79296875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 4.0, 4.0, 8.0, 13.0, 13.0, 19.0, 21.0, 32.0, 62.0, 141.0, 290.0, 764.0, 1202.0, 791.0, 330.0, 155.0, 85.0, 39.0, 28.0, 35.0, 10.0, 9.0, 11.0, 1.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1534423828125, -0.1463298797607422, -0.13921737670898438, -0.13210487365722656, -0.12499237060546875, -0.11787986755371094, -0.11076736450195312, -0.10365486145019531, -0.0965423583984375, -0.08942985534667969, -0.08231735229492188, -0.07520484924316406, -0.06809234619140625, -0.06097984313964844, -0.053867340087890625, -0.04675483703613281, -0.039642333984375, -0.03252983093261719, -0.025417327880859375, -0.018304824829101562, -0.01119232177734375, -0.0040798187255859375, 0.003032684326171875, 0.010145187377929688, 0.0172576904296875, 0.024370193481445312, 0.031482696533203125, 0.03859519958496094, 0.04570770263671875, 0.05282020568847656, 0.059932708740234375, 0.06704521179199219, 0.07415771484375, 0.08127021789550781, 0.08838272094726562, 0.09549522399902344, 0.10260772705078125, 0.10972023010253906, 0.11683273315429688, 0.12394523620605469, 0.1310577392578125, 0.1381702423095703, 0.14528274536132812, 0.15239524841308594, 0.15950775146484375, 0.16662025451660156, 0.17373275756835938, 0.1808452606201172, 0.187957763671875, 0.1950702667236328, 0.20218276977539062, 0.20929527282714844, 0.21640777587890625, 0.22352027893066406, 0.23063278198242188, 0.2377452850341797, 0.2448577880859375, 0.2519702911376953, 0.2590827941894531, 0.26619529724121094, 0.27330780029296875, 0.28042030334472656, 0.2875328063964844, 0.2946453094482422, 0.3017578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 12.0, 37.0, 76.0, 108.0, 170.0, 216.0, 152.0, 95.0, 48.0, 36.0, 14.0, 15.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3474003076553345, -1.3131623268127441, -1.2789243459701538, -1.2446863651275635, -1.2104483842849731, -1.1762104034423828, -1.1419724225997925, -1.1077344417572021, -1.0734963417053223, -1.039258360862732, -1.0050203800201416, -0.9707823991775513, -0.9365444183349609, -0.9023064374923706, -0.8680683970451355, -0.8338304162025452, -0.7995924949645996, -0.7653545141220093, -0.731116533279419, -0.6968785524368286, -0.6626405715942383, -0.628402590751648, -0.5941645503044128, -0.5599265694618225, -0.5256885886192322, -0.49145060777664185, -0.4572126269340515, -0.4229746162891388, -0.38873663544654846, -0.35449865460395813, -0.3202606439590454, -0.2860226631164551, -0.2517847418785095, -0.2175467610359192, -0.18330876529216766, -0.14907076954841614, -0.1148327887058258, -0.08059480786323547, -0.04635681211948395, -0.012118816375732422, 0.02211916446685791, 0.05635715276002884, 0.09059514105319977, 0.1248331293463707, 0.15907111763954163, 0.19330909848213196, 0.22754709422588348, 0.261785089969635, 0.29602307081222534, 0.3302610516548157, 0.364499032497406, 0.3987370431423187, 0.43297502398490906, 0.4672130048274994, 0.5014510154724121, 0.5356889963150024, 0.5699269771575928, 0.6041649580001831, 0.6384029388427734, 0.6726409196853638, 0.7068789005279541, 0.7411168813705444, 0.7753549218177795, 0.8095929026603699, 0.8438308835029602]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 8.0, 12.0, 17.0, 12.0, 11.0, 26.0, 20.0, 22.0, 27.0, 26.0, 28.0, 33.0, 38.0, 44.0, 33.0, 43.0, 51.0, 39.0, 52.0, 44.0, 42.0, 51.0, 30.0, 32.0, 45.0, 45.0, 25.0, 20.0, 23.0, 21.0, 20.0, 14.0, 14.0, 5.0, 4.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3229515254497528, -0.31225916743278503, -0.3015667796134949, -0.2908744215965271, -0.2801820635795593, -0.26948967576026917, -0.2587973177433014, -0.24810494482517242, -0.23741257190704346, -0.2267201989889145, -0.21602782607078552, -0.20533546805381775, -0.19464309513568878, -0.18395072221755981, -0.17325836420059204, -0.16256599128246307, -0.1518736183643341, -0.14118124544620514, -0.13048887252807617, -0.1197965145111084, -0.10910414159297943, -0.09841176867485046, -0.0877194032073021, -0.07702703773975372, -0.06633466482162476, -0.05564229562878609, -0.04494992643594742, -0.03425755724310875, -0.02356518805027008, -0.012872818857431412, -0.002180449664592743, 0.008511915802955627, 0.019204288721084595, 0.029896657913923264, 0.04058902710676193, 0.0512813962996006, 0.06197376549243927, 0.07266613841056824, 0.08335850387811661, 0.09405086934566498, 0.10474324226379395, 0.11543561518192291, 0.12612798810005188, 0.13682034611701965, 0.14751271903514862, 0.1582050919532776, 0.16889744997024536, 0.17958982288837433, 0.1902821958065033, 0.20097456872463226, 0.21166694164276123, 0.222359299659729, 0.23305167257785797, 0.24374404549598694, 0.2544364035129547, 0.2651287913322449, 0.27582114934921265, 0.2865135073661804, 0.2972058951854706, 0.30789825320243835, 0.3185906410217285, 0.3292829990386963, 0.33997535705566406, 0.35066771507263184, 0.361360102891922]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 9.0, 9.0, 19.0, 21.0, 25.0, 34.0, 57.0, 116.0, 186.0, 384.0, 750.0, 1617.0, 3582.0, 9799.0, 36458.0, 391295.0, 539358.0, 45711.0, 11466.0, 4125.0, 1749.0, 838.0, 388.0, 217.0, 139.0, 69.0, 39.0, 33.0, 19.0, 14.0, 9.0, 9.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.265869140625, -0.25806427001953125, -0.2502593994140625, -0.24245452880859375, -0.234649658203125, -0.22684478759765625, -0.2190399169921875, -0.21123504638671875, -0.20343017578125, -0.19562530517578125, -0.1878204345703125, -0.18001556396484375, -0.172210693359375, -0.16440582275390625, -0.1566009521484375, -0.14879608154296875, -0.1409912109375, -0.13318634033203125, -0.1253814697265625, -0.11757659912109375, -0.109771728515625, -0.10196685791015625, -0.0941619873046875, -0.08635711669921875, -0.07855224609375, -0.07074737548828125, -0.0629425048828125, -0.05513763427734375, -0.047332763671875, -0.03952789306640625, -0.0317230224609375, -0.02391815185546875, -0.01611328125, -0.00830841064453125, -0.0005035400390625, 0.00730133056640625, 0.015106201171875, 0.02291107177734375, 0.0307159423828125, 0.03852081298828125, 0.04632568359375, 0.05413055419921875, 0.0619354248046875, 0.06974029541015625, 0.077545166015625, 0.08535003662109375, 0.0931549072265625, 0.10095977783203125, 0.1087646484375, 0.11656951904296875, 0.1243743896484375, 0.13217926025390625, 0.139984130859375, 0.14778900146484375, 0.1555938720703125, 0.16339874267578125, 0.17120361328125, 0.17900848388671875, 0.1868133544921875, 0.19461822509765625, 0.202423095703125, 0.21022796630859375, 0.2180328369140625, 0.22583770751953125, 0.233642578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 5.0, 12.0, 22.0, 18.0, 20.0, 20.0, 19.0, 31.0, 34.0, 39.0, 32.0, 46.0, 37.0, 42.0, 52.0, 41.0, 46.0, 53.0, 50.0, 31.0, 29.0, 45.0, 35.0, 39.0, 37.0, 15.0, 22.0, 23.0, 15.0, 17.0, 13.0, 15.0, 5.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2283935546875, -0.22100448608398438, -0.21361541748046875, -0.20622634887695312, -0.1988372802734375, -0.19144821166992188, -0.18405914306640625, -0.17667007446289062, -0.169281005859375, -0.16189193725585938, -0.15450286865234375, -0.14711380004882812, -0.1397247314453125, -0.13233566284179688, -0.12494659423828125, -0.11755752563476562, -0.11016845703125, -0.10277938842773438, -0.09539031982421875, -0.08800125122070312, -0.0806121826171875, -0.07322311401367188, -0.06583404541015625, -0.058444976806640625, -0.051055908203125, -0.043666839599609375, -0.03627777099609375, -0.028888702392578125, -0.0214996337890625, -0.014110565185546875, -0.00672149658203125, 0.000667572021484375, 0.008056640625, 0.015445709228515625, 0.02283477783203125, 0.030223846435546875, 0.0376129150390625, 0.045001983642578125, 0.05239105224609375, 0.059780120849609375, 0.067169189453125, 0.07455825805664062, 0.08194732666015625, 0.08933639526367188, 0.0967254638671875, 0.10411453247070312, 0.11150360107421875, 0.11889266967773438, 0.12628173828125, 0.13367080688476562, 0.14105987548828125, 0.14844894409179688, 0.1558380126953125, 0.16322708129882812, 0.17061614990234375, 0.17800521850585938, 0.185394287109375, 0.19278335571289062, 0.20017242431640625, 0.20756149291992188, 0.2149505615234375, 0.22233963012695312, 0.22972869873046875, 0.23711776733398438, 0.2445068359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 7.0, 11.0, 20.0, 28.0, 37.0, 68.0, 85.0, 120.0, 170.0, 279.0, 448.0, 691.0, 1181.0, 1945.0, 3568.0, 6779.0, 14572.0, 35874.0, 114657.0, 422093.0, 312213.0, 81087.0, 27549.0, 11791.0, 5752.0, 3030.0, 1722.0, 1043.0, 618.0, 391.0, 225.0, 150.0, 128.0, 75.0, 53.0, 30.0, 16.0, 14.0, 12.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09893798828125, -0.09583282470703125, -0.0927276611328125, -0.08962249755859375, -0.086517333984375, -0.08341217041015625, -0.0803070068359375, -0.07720184326171875, -0.0740966796875, -0.07099151611328125, -0.0678863525390625, -0.06478118896484375, -0.061676025390625, -0.05857086181640625, -0.0554656982421875, -0.05236053466796875, -0.04925537109375, -0.04615020751953125, -0.0430450439453125, -0.03993988037109375, -0.036834716796875, -0.03372955322265625, -0.0306243896484375, -0.02751922607421875, -0.0244140625, -0.02130889892578125, -0.0182037353515625, -0.01509857177734375, -0.011993408203125, -0.00888824462890625, -0.0057830810546875, -0.00267791748046875, 0.00042724609375, 0.00353240966796875, 0.0066375732421875, 0.00974273681640625, 0.012847900390625, 0.01595306396484375, 0.0190582275390625, 0.02216339111328125, 0.0252685546875, 0.02837371826171875, 0.0314788818359375, 0.03458404541015625, 0.037689208984375, 0.04079437255859375, 0.0438995361328125, 0.04700469970703125, 0.05010986328125, 0.05321502685546875, 0.0563201904296875, 0.05942535400390625, 0.062530517578125, 0.06563568115234375, 0.0687408447265625, 0.07184600830078125, 0.074951171875, 0.07805633544921875, 0.0811614990234375, 0.08426666259765625, 0.087371826171875, 0.09047698974609375, 0.0935821533203125, 0.09668731689453125, 0.09979248046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 7.0, 8.0, 5.0, 5.0, 13.0, 22.0, 14.0, 29.0, 25.0, 31.0, 25.0, 28.0, 41.0, 46.0, 59.0, 49.0, 62.0, 52.0, 55.0, 48.0, 55.0, 41.0, 34.0, 32.0, 32.0, 32.0, 37.0, 23.0, 12.0, 15.0, 9.0, 13.0, 9.0, 12.0, 7.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52783203125, -0.5111312866210938, -0.4944305419921875, -0.47772979736328125, -0.461029052734375, -0.44432830810546875, -0.4276275634765625, -0.41092681884765625, -0.39422607421875, -0.37752532958984375, -0.3608245849609375, -0.34412384033203125, -0.327423095703125, -0.31072235107421875, -0.2940216064453125, -0.27732086181640625, -0.2606201171875, -0.24391937255859375, -0.2272186279296875, -0.21051788330078125, -0.193817138671875, -0.17711639404296875, -0.1604156494140625, -0.14371490478515625, -0.12701416015625, -0.11031341552734375, -0.0936126708984375, -0.07691192626953125, -0.060211181640625, -0.04351043701171875, -0.0268096923828125, -0.01010894775390625, 0.006591796875, 0.02329254150390625, 0.0399932861328125, 0.05669403076171875, 0.073394775390625, 0.09009552001953125, 0.1067962646484375, 0.12349700927734375, 0.14019775390625, 0.15689849853515625, 0.1735992431640625, 0.19029998779296875, 0.207000732421875, 0.22370147705078125, 0.2404022216796875, 0.25710296630859375, 0.2738037109375, 0.29050445556640625, 0.3072052001953125, 0.32390594482421875, 0.340606689453125, 0.35730743408203125, 0.3740081787109375, 0.39070892333984375, 0.40740966796875, 0.42411041259765625, 0.4408111572265625, 0.45751190185546875, 0.474212646484375, 0.49091339111328125, 0.5076141357421875, 0.5243148803710938, 0.541015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 8.0, 5.0, 12.0, 10.0, 25.0, 27.0, 75.0, 99.0, 182.0, 334.0, 607.0, 1370.0, 3362.0, 9684.0, 35866.0, 181399.0, 567005.0, 194186.0, 37909.0, 10132.0, 3474.0, 1347.0, 643.0, 345.0, 188.0, 100.0, 53.0, 42.0, 22.0, 19.0, 12.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0241241455078125, -0.023247480392456055, -0.02237081527709961, -0.021494150161743164, -0.02061748504638672, -0.019740819931030273, -0.018864154815673828, -0.017987489700317383, -0.017110824584960938, -0.016234159469604492, -0.015357494354248047, -0.014480829238891602, -0.013604164123535156, -0.012727499008178711, -0.011850833892822266, -0.01097416877746582, -0.010097503662109375, -0.00922083854675293, -0.008344173431396484, -0.007467508316040039, -0.006590843200683594, -0.0057141780853271484, -0.004837512969970703, -0.003960847854614258, -0.0030841827392578125, -0.002207517623901367, -0.0013308525085449219, -0.00045418739318847656, 0.00042247772216796875, 0.001299142837524414, 0.0021758079528808594, 0.0030524730682373047, 0.00392913818359375, 0.004805803298950195, 0.005682468414306641, 0.006559133529663086, 0.007435798645019531, 0.008312463760375977, 0.009189128875732422, 0.010065793991088867, 0.010942459106445312, 0.011819124221801758, 0.012695789337158203, 0.013572454452514648, 0.014449119567871094, 0.015325784683227539, 0.016202449798583984, 0.01707911491394043, 0.017955780029296875, 0.01883244514465332, 0.019709110260009766, 0.02058577537536621, 0.021462440490722656, 0.0223391056060791, 0.023215770721435547, 0.024092435836791992, 0.024969100952148438, 0.025845766067504883, 0.026722431182861328, 0.027599096298217773, 0.02847576141357422, 0.029352426528930664, 0.03022909164428711, 0.031105756759643555, 0.031982421875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 10.0, 9.0, 16.0, 11.0, 27.0, 29.0, 36.0, 61.0, 42.0, 83.0, 82.0, 107.0, 83.0, 84.0, 67.0, 66.0, 41.0, 38.0, 21.0, 22.0, 18.0, 6.0, 8.0, 3.0, 2.0, 7.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0788440704345703e-05, -1.0398216545581818e-05, -1.0007992386817932e-05, -9.617768228054047e-06, -9.227544069290161e-06, -8.837319910526276e-06, -8.44709575176239e-06, -8.056871592998505e-06, -7.666647434234619e-06, -7.276423275470734e-06, -6.886199116706848e-06, -6.495974957942963e-06, -6.105750799179077e-06, -5.715526640415192e-06, -5.325302481651306e-06, -4.935078322887421e-06, -4.544854164123535e-06, -4.15463000535965e-06, -3.764405846595764e-06, -3.3741816878318787e-06, -2.983957529067993e-06, -2.5937333703041077e-06, -2.203509211540222e-06, -1.8132850527763367e-06, -1.4230608940124512e-06, -1.0328367352485657e-06, -6.426125764846802e-07, -2.523884177207947e-07, 1.3783574104309082e-07, 5.280598998069763e-07, 9.182840585708618e-07, 1.3085082173347473e-06, 1.6987323760986328e-06, 2.0889565348625183e-06, 2.479180693626404e-06, 2.8694048523902893e-06, 3.259629011154175e-06, 3.6498531699180603e-06, 4.040077328681946e-06, 4.430301487445831e-06, 4.820525646209717e-06, 5.210749804973602e-06, 5.600973963737488e-06, 5.991198122501373e-06, 6.381422281265259e-06, 6.771646440029144e-06, 7.16187059879303e-06, 7.552094757556915e-06, 7.9423189163208e-06, 8.332543075084686e-06, 8.722767233848572e-06, 9.112991392612457e-06, 9.503215551376343e-06, 9.893439710140228e-06, 1.0283663868904114e-05, 1.0673888027668e-05, 1.1064112186431885e-05, 1.145433634519577e-05, 1.1844560503959656e-05, 1.2234784662723541e-05, 1.2625008821487427e-05, 1.3015232980251312e-05, 1.3405457139015198e-05, 1.3795681297779083e-05, 1.4185905456542969e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 7.0, 11.0, 9.0, 19.0, 29.0, 38.0, 62.0, 78.0, 104.0, 197.0, 279.0, 495.0, 903.0, 1738.0, 3275.0, 7195.0, 16942.0, 45026.0, 129020.0, 318710.0, 319082.0, 128580.0, 45373.0, 16915.0, 7134.0, 3276.0, 1751.0, 878.0, 533.0, 297.0, 205.0, 120.0, 83.0, 57.0, 41.0, 20.0, 26.0, 16.0, 8.0, 4.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0204010009765625, -0.019763469696044922, -0.019125938415527344, -0.018488407135009766, -0.017850875854492188, -0.01721334457397461, -0.01657581329345703, -0.015938282012939453, -0.015300750732421875, -0.014663219451904297, -0.014025688171386719, -0.01338815689086914, -0.012750625610351562, -0.012113094329833984, -0.011475563049316406, -0.010838031768798828, -0.01020050048828125, -0.009562969207763672, -0.008925437927246094, -0.008287906646728516, -0.0076503753662109375, -0.007012844085693359, -0.006375312805175781, -0.005737781524658203, -0.005100250244140625, -0.004462718963623047, -0.0038251876831054688, -0.0031876564025878906, -0.0025501251220703125, -0.0019125938415527344, -0.0012750625610351562, -0.0006375312805175781, 0.0, 0.0006375312805175781, 0.0012750625610351562, 0.0019125938415527344, 0.0025501251220703125, 0.0031876564025878906, 0.0038251876831054688, 0.004462718963623047, 0.005100250244140625, 0.005737781524658203, 0.006375312805175781, 0.007012844085693359, 0.0076503753662109375, 0.008287906646728516, 0.008925437927246094, 0.009562969207763672, 0.01020050048828125, 0.010838031768798828, 0.011475563049316406, 0.012113094329833984, 0.012750625610351562, 0.01338815689086914, 0.014025688171386719, 0.014663219451904297, 0.015300750732421875, 0.015938282012939453, 0.01657581329345703, 0.01721334457397461, 0.017850875854492188, 0.018488407135009766, 0.019125938415527344, 0.019763469696044922, 0.0204010009765625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 2.0, 7.0, 4.0, 7.0, 8.0, 12.0, 18.0, 13.0, 18.0, 23.0, 13.0, 29.0, 31.0, 42.0, 44.0, 39.0, 55.0, 47.0, 53.0, 60.0, 49.0, 59.0, 27.0, 56.0, 39.0, 38.0, 23.0, 24.0, 31.0, 18.0, 16.0, 23.0, 15.0, 15.0, 7.0, 8.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005664825439453125, -0.005479335784912109, -0.005293846130371094, -0.005108356475830078, -0.0049228668212890625, -0.004737377166748047, -0.004551887512207031, -0.004366397857666016, -0.004180908203125, -0.003995418548583984, -0.0038099288940429688, -0.003624439239501953, -0.0034389495849609375, -0.003253459930419922, -0.0030679702758789062, -0.0028824806213378906, -0.002696990966796875, -0.0025115013122558594, -0.0023260116577148438, -0.002140522003173828, -0.0019550323486328125, -0.0017695426940917969, -0.0015840530395507812, -0.0013985633850097656, -0.00121307373046875, -0.0010275840759277344, -0.0008420944213867188, -0.0006566047668457031, -0.0004711151123046875, -0.0002856254577636719, -0.00010013580322265625, 8.535385131835938e-05, 0.000270843505859375, 0.0004563331604003906, 0.0006418228149414062, 0.0008273124694824219, 0.0010128021240234375, 0.0011982917785644531, 0.0013837814331054688, 0.0015692710876464844, 0.0017547607421875, 0.0019402503967285156, 0.0021257400512695312, 0.002311229705810547, 0.0024967193603515625, 0.002682209014892578, 0.0028676986694335938, 0.0030531883239746094, 0.003238677978515625, 0.0034241676330566406, 0.0036096572875976562, 0.003795146942138672, 0.0039806365966796875, 0.004166126251220703, 0.004351615905761719, 0.004537105560302734, 0.00472259521484375, 0.004908084869384766, 0.005093574523925781, 0.005279064178466797, 0.0054645538330078125, 0.005650043487548828, 0.005835533142089844, 0.006021022796630859, 0.006206512451171875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 8.0, 13.0, 29.0, 49.0, 80.0, 137.0, 202.0, 185.0, 124.0, 74.0, 37.0, 16.0, 19.0, 11.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7547540664672852, -0.7331125736236572, -0.7114710807800293, -0.6898295879364014, -0.6681880950927734, -0.6465466022491455, -0.6249051094055176, -0.6032635569572449, -0.5816220641136169, -0.559980571269989, -0.5383390784263611, -0.5166975855827332, -0.49505606293678284, -0.4734145700931549, -0.451773077249527, -0.43013155460357666, -0.4084900915622711, -0.3868485987186432, -0.36520710587501526, -0.34356558322906494, -0.321924090385437, -0.3002825975418091, -0.27864110469818115, -0.2569996118545532, -0.2353581041097641, -0.21371661126613617, -0.19207510352134705, -0.17043361067771912, -0.1487921178340912, -0.12715061008930206, -0.10550911724567413, -0.08386760950088501, -0.06222611665725708, -0.04058461636304855, -0.018943119794130325, 0.002698376774787903, 0.02433987706899643, 0.045981377363204956, 0.06762287020683289, 0.08926437795162201, 0.11090587079524994, 0.13254736363887787, 0.154188871383667, 0.17583036422729492, 0.19747185707092285, 0.21911336481571198, 0.2407548576593399, 0.26239636540412903, 0.28403785824775696, 0.3056793510913849, 0.3273208439350128, 0.34896236658096313, 0.37060385942459106, 0.392245352268219, 0.4138868451118469, 0.43552833795547485, 0.4571698307991028, 0.4788113236427307, 0.5004528164863586, 0.5220943093299866, 0.5437358021736145, 0.5653773546218872, 0.5870188474655151, 0.6086603403091431, 0.630301833152771]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 13.0, 13.0, 10.0, 13.0, 16.0, 23.0, 20.0, 26.0, 21.0, 28.0, 41.0, 39.0, 40.0, 36.0, 38.0, 48.0, 36.0, 49.0, 45.0, 56.0, 44.0, 32.0, 43.0, 37.0, 47.0, 24.0, 20.0, 31.0, 21.0, 21.0, 14.0, 15.0, 8.0, 6.0, 5.0, 2.0, 5.0, 1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22479639947414398, -0.21756847202777863, -0.21034054458141327, -0.2031126171350479, -0.19588468968868256, -0.1886567622423172, -0.18142881989479065, -0.1742008924484253, -0.16697296500205994, -0.15974503755569458, -0.15251711010932922, -0.14528918266296387, -0.1380612552165985, -0.13083332777023315, -0.1236053928732872, -0.11637746542692184, -0.10914954543113708, -0.10192161798477173, -0.09469369053840637, -0.08746576309204102, -0.08023783564567566, -0.0730099081993103, -0.06578197330236435, -0.05855404585599899, -0.051326118409633636, -0.04409819096326828, -0.036870263516902924, -0.02964233234524727, -0.022414404898881912, -0.015186477452516556, -0.007958546280860901, -0.0007306188344955444, 0.006497308611869812, 0.013725236989557743, 0.020953165367245674, 0.02818109467625618, 0.035409022122621536, 0.04263694956898689, 0.04986488074064255, 0.057092808187007904, 0.06432073563337326, 0.07154866307973862, 0.07877659052610397, 0.08600452542304993, 0.09323245286941528, 0.10046038031578064, 0.107688307762146, 0.11491623520851135, 0.12214416265487671, 0.12937209010124207, 0.13660001754760742, 0.14382794499397278, 0.15105587244033813, 0.1582837998867035, 0.16551172733306885, 0.1727396547794342, 0.17996758222579956, 0.18719550967216492, 0.19442343711853027, 0.20165136456489563, 0.208879292011261, 0.21610721945762634, 0.2233351469039917, 0.23056307435035706, 0.2377910166978836]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 18.0, 8.0, 20.0, 31.0, 31.0, 45.0, 80.0, 112.0, 152.0, 240.0, 400.0, 767.0, 1277.0, 2590.0, 7216.0, 26726.0, 163875.0, 704753.0, 109247.0, 19914.0, 5934.0, 2303.0, 1104.0, 628.0, 356.0, 244.0, 157.0, 96.0, 50.0, 48.0, 35.0, 27.0, 19.0, 13.0, 7.0, 3.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29833984375, -0.28745269775390625, -0.2765655517578125, -0.26567840576171875, -0.254791259765625, -0.24390411376953125, -0.2330169677734375, -0.22212982177734375, -0.21124267578125, -0.20035552978515625, -0.1894683837890625, -0.17858123779296875, -0.167694091796875, -0.15680694580078125, -0.1459197998046875, -0.13503265380859375, -0.1241455078125, -0.11325836181640625, -0.1023712158203125, -0.09148406982421875, -0.080596923828125, -0.06970977783203125, -0.0588226318359375, -0.04793548583984375, -0.03704833984375, -0.02616119384765625, -0.0152740478515625, -0.00438690185546875, 0.006500244140625, 0.01738739013671875, 0.0282745361328125, 0.03916168212890625, 0.050048828125, 0.06093597412109375, 0.0718231201171875, 0.08271026611328125, 0.093597412109375, 0.10448455810546875, 0.1153717041015625, 0.12625885009765625, 0.13714599609375, 0.14803314208984375, 0.1589202880859375, 0.16980743408203125, 0.180694580078125, 0.19158172607421875, 0.2024688720703125, 0.21335601806640625, 0.2242431640625, 0.23513031005859375, 0.2460174560546875, 0.25690460205078125, 0.267791748046875, 0.27867889404296875, 0.2895660400390625, 0.30045318603515625, 0.31134033203125, 0.32222747802734375, 0.3331146240234375, 0.34400177001953125, 0.354888916015625, 0.36577606201171875, 0.3766632080078125, 0.38755035400390625, 0.3984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 10.0, 14.0, 9.0, 16.0, 12.0, 29.0, 20.0, 38.0, 33.0, 52.0, 38.0, 50.0, 53.0, 51.0, 53.0, 40.0, 47.0, 58.0, 56.0, 48.0, 43.0, 37.0, 26.0, 35.0, 26.0, 21.0, 14.0, 17.0, 8.0, 9.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45556640625, -0.43991851806640625, -0.4242706298828125, -0.40862274169921875, -0.392974853515625, -0.37732696533203125, -0.3616790771484375, -0.34603118896484375, -0.33038330078125, -0.31473541259765625, -0.2990875244140625, -0.28343963623046875, -0.267791748046875, -0.25214385986328125, -0.2364959716796875, -0.22084808349609375, -0.2052001953125, -0.18955230712890625, -0.1739044189453125, -0.15825653076171875, -0.142608642578125, -0.12696075439453125, -0.1113128662109375, -0.09566497802734375, -0.08001708984375, -0.06436920166015625, -0.0487213134765625, -0.03307342529296875, -0.017425537109375, -0.00177764892578125, 0.0138702392578125, 0.02951812744140625, 0.045166015625, 0.06081390380859375, 0.0764617919921875, 0.09210968017578125, 0.107757568359375, 0.12340545654296875, 0.1390533447265625, 0.15470123291015625, 0.17034912109375, 0.18599700927734375, 0.2016448974609375, 0.21729278564453125, 0.232940673828125, 0.24858856201171875, 0.2642364501953125, 0.27988433837890625, 0.2955322265625, 0.31118011474609375, 0.3268280029296875, 0.34247589111328125, 0.358123779296875, 0.37377166748046875, 0.3894195556640625, 0.40506744384765625, 0.42071533203125, 0.43636322021484375, 0.4520111083984375, 0.46765899658203125, 0.483306884765625, 0.49895477294921875, 0.5146026611328125, 0.5302505493164062, 0.5458984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 4.0, 6.0, 15.0, 9.0, 11.0, 17.0, 29.0, 30.0, 43.0, 50.0, 112.0, 236.0, 646.0, 3289.0, 110254.0, 923446.0, 8400.0, 1210.0, 341.0, 138.0, 72.0, 39.0, 33.0, 26.0, 28.0, 13.0, 14.0, 9.0, 8.0, 9.0, 4.0, 7.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3251953125, -1.2895736694335938, -1.2539520263671875, -1.2183303833007812, -1.182708740234375, -1.1470870971679688, -1.1114654541015625, -1.0758438110351562, -1.04022216796875, -1.0046005249023438, -0.9689788818359375, -0.9333572387695312, -0.897735595703125, -0.8621139526367188, -0.8264923095703125, -0.7908706665039062, -0.7552490234375, -0.7196273803710938, -0.6840057373046875, -0.6483840942382812, -0.612762451171875, -0.5771408081054688, -0.5415191650390625, -0.5058975219726562, -0.47027587890625, -0.43465423583984375, -0.3990325927734375, -0.36341094970703125, -0.327789306640625, -0.29216766357421875, -0.2565460205078125, -0.22092437744140625, -0.185302734375, -0.14968109130859375, -0.1140594482421875, -0.07843780517578125, -0.042816162109375, -0.00719451904296875, 0.0284271240234375, 0.06404876708984375, 0.09967041015625, 0.13529205322265625, 0.1709136962890625, 0.20653533935546875, 0.242156982421875, 0.27777862548828125, 0.3134002685546875, 0.34902191162109375, 0.3846435546875, 0.42026519775390625, 0.4558868408203125, 0.49150848388671875, 0.527130126953125, 0.5627517700195312, 0.5983734130859375, 0.6339950561523438, 0.66961669921875, 0.7052383422851562, 0.7408599853515625, 0.7764816284179688, 0.812103271484375, 0.8477249145507812, 0.8833465576171875, 0.9189682006835938, 0.95458984375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 9.0, 7.0, 12.0, 19.0, 30.0, 31.0, 35.0, 30.0, 56.0, 54.0, 42.0, 52.0, 58.0, 63.0, 68.0, 63.0, 61.0, 55.0, 43.0, 24.0, 30.0, 27.0, 26.0, 18.0, 12.0, 11.0, 10.0, 11.0, 8.0, 5.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.73046875, -0.7108688354492188, -0.6912689208984375, -0.6716690063476562, -0.652069091796875, -0.6324691772460938, -0.6128692626953125, -0.5932693481445312, -0.57366943359375, -0.5540695190429688, -0.5344696044921875, -0.5148696899414062, -0.495269775390625, -0.47566986083984375, -0.4560699462890625, -0.43647003173828125, -0.4168701171875, -0.39727020263671875, -0.3776702880859375, -0.35807037353515625, -0.338470458984375, -0.31887054443359375, -0.2992706298828125, -0.27967071533203125, -0.26007080078125, -0.24047088623046875, -0.2208709716796875, -0.20127105712890625, -0.181671142578125, -0.16207122802734375, -0.1424713134765625, -0.12287139892578125, -0.103271484375, -0.08367156982421875, -0.0640716552734375, -0.04447174072265625, -0.024871826171875, -0.00527191162109375, 0.0143280029296875, 0.03392791748046875, 0.05352783203125, 0.07312774658203125, 0.0927276611328125, 0.11232757568359375, 0.131927490234375, 0.15152740478515625, 0.1711273193359375, 0.19072723388671875, 0.2103271484375, 0.22992706298828125, 0.2495269775390625, 0.26912689208984375, 0.288726806640625, 0.30832672119140625, 0.3279266357421875, 0.34752655029296875, 0.36712646484375, 0.38672637939453125, 0.4063262939453125, 0.42592620849609375, 0.445526123046875, 0.46512603759765625, 0.4847259521484375, 0.5043258666992188, 0.52392578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 12.0, 15.0, 23.0, 21.0, 46.0, 63.0, 100.0, 177.0, 366.0, 776.0, 2459.0, 9830.0, 60643.0, 791727.0, 158488.0, 17575.0, 3980.0, 1181.0, 472.0, 204.0, 117.0, 71.0, 47.0, 29.0, 25.0, 14.0, 19.0, 15.0, 13.0, 5.0, 8.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.1466064453125, -0.14225387573242188, -0.13790130615234375, -0.13354873657226562, -0.1291961669921875, -0.12484359741210938, -0.12049102783203125, -0.11613845825195312, -0.111785888671875, -0.10743331909179688, -0.10308074951171875, -0.09872817993164062, -0.0943756103515625, -0.09002304077148438, -0.08567047119140625, -0.08131790161132812, -0.07696533203125, -0.07261276245117188, -0.06826019287109375, -0.06390762329101562, -0.0595550537109375, -0.055202484130859375, -0.05084991455078125, -0.046497344970703125, -0.042144775390625, -0.037792205810546875, -0.03343963623046875, -0.029087066650390625, -0.0247344970703125, -0.020381927490234375, -0.01602935791015625, -0.011676788330078125, -0.00732421875, -0.002971649169921875, 0.00138092041015625, 0.005733489990234375, 0.0100860595703125, 0.014438629150390625, 0.01879119873046875, 0.023143768310546875, 0.027496337890625, 0.031848907470703125, 0.03620147705078125, 0.040554046630859375, 0.0449066162109375, 0.049259185791015625, 0.05361175537109375, 0.057964324951171875, 0.06231689453125, 0.06666946411132812, 0.07102203369140625, 0.07537460327148438, 0.0797271728515625, 0.08407974243164062, 0.08843231201171875, 0.09278488159179688, 0.097137451171875, 0.10149002075195312, 0.10584259033203125, 0.11019515991210938, 0.1145477294921875, 0.11890029907226562, 0.12325286865234375, 0.12760543823242188, 0.1319580078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 7.0, 6.0, 10.0, 12.0, 23.0, 31.0, 41.0, 54.0, 72.0, 127.0, 144.0, 127.0, 100.0, 68.0, 46.0, 35.0, 23.0, 15.0, 18.0, 7.0, 5.0, 4.0, 6.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7762184143066406e-05, -1.7202459275722504e-05, -1.66427344083786e-05, -1.60830095410347e-05, -1.5523284673690796e-05, -1.4963559806346893e-05, -1.440383493900299e-05, -1.3844110071659088e-05, -1.3284385204315186e-05, -1.2724660336971283e-05, -1.216493546962738e-05, -1.1605210602283478e-05, -1.1045485734939575e-05, -1.0485760867595673e-05, -9.92603600025177e-06, -9.366311132907867e-06, -8.806586265563965e-06, -8.246861398220062e-06, -7.68713653087616e-06, -7.127411663532257e-06, -6.5676867961883545e-06, -6.007961928844452e-06, -5.448237061500549e-06, -4.888512194156647e-06, -4.328787326812744e-06, -3.7690624594688416e-06, -3.209337592124939e-06, -2.6496127247810364e-06, -2.089887857437134e-06, -1.5301629900932312e-06, -9.704381227493286e-07, -4.10713255405426e-07, 1.4901161193847656e-07, 7.087364792823792e-07, 1.2684613466262817e-06, 1.8281862139701843e-06, 2.387911081314087e-06, 2.9476359486579895e-06, 3.507360816001892e-06, 4.067085683345795e-06, 4.626810550689697e-06, 5.1865354180336e-06, 5.7462602853775024e-06, 6.305985152721405e-06, 6.865710020065308e-06, 7.42543488740921e-06, 7.985159754753113e-06, 8.544884622097015e-06, 9.104609489440918e-06, 9.66433435678482e-06, 1.0224059224128723e-05, 1.0783784091472626e-05, 1.1343508958816528e-05, 1.1903233826160431e-05, 1.2462958693504333e-05, 1.3022683560848236e-05, 1.3582408428192139e-05, 1.4142133295536041e-05, 1.4701858162879944e-05, 1.5261583030223846e-05, 1.582130789756775e-05, 1.638103276491165e-05, 1.6940757632255554e-05, 1.7500482499599457e-05, 1.806020736694336e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 8.0, 16.0, 27.0, 44.0, 47.0, 63.0, 114.0, 168.0, 267.0, 492.0, 1093.0, 3180.0, 16029.0, 311102.0, 684747.0, 24267.0, 4068.0, 1328.0, 590.0, 329.0, 219.0, 134.0, 78.0, 58.0, 34.0, 12.0, 12.0, 4.0, 10.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.224609375, -0.21871376037597656, -0.21281814575195312, -0.2069225311279297, -0.20102691650390625, -0.1951313018798828, -0.18923568725585938, -0.18334007263183594, -0.1774444580078125, -0.17154884338378906, -0.16565322875976562, -0.1597576141357422, -0.15386199951171875, -0.1479663848876953, -0.14207077026367188, -0.13617515563964844, -0.130279541015625, -0.12438392639160156, -0.11848831176757812, -0.11259269714355469, -0.10669708251953125, -0.10080146789550781, -0.09490585327148438, -0.08901023864746094, -0.0831146240234375, -0.07721900939941406, -0.07132339477539062, -0.06542778015136719, -0.05953216552734375, -0.05363655090332031, -0.047740936279296875, -0.04184532165527344, -0.03594970703125, -0.030054092407226562, -0.024158477783203125, -0.018262863159179688, -0.01236724853515625, -0.0064716339111328125, -0.000576019287109375, 0.0053195953369140625, 0.0112152099609375, 0.017110824584960938, 0.023006439208984375, 0.028902053833007812, 0.03479766845703125, 0.04069328308105469, 0.046588897705078125, 0.05248451232910156, 0.058380126953125, 0.06427574157714844, 0.07017135620117188, 0.07606697082519531, 0.08196258544921875, 0.08785820007324219, 0.09375381469726562, 0.09964942932128906, 0.1055450439453125, 0.11144065856933594, 0.11733627319335938, 0.12323188781738281, 0.12912750244140625, 0.1350231170654297, 0.14091873168945312, 0.14681434631347656, 0.1527099609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 10.0, 17.0, 19.0, 16.0, 22.0, 53.0, 72.0, 121.0, 192.0, 161.0, 110.0, 67.0, 51.0, 24.0, 19.0, 13.0, 16.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053070068359375, -0.051023006439208984, -0.04897594451904297, -0.04692888259887695, -0.04488182067871094, -0.04283475875854492, -0.040787696838378906, -0.03874063491821289, -0.036693572998046875, -0.03464651107788086, -0.032599449157714844, -0.030552387237548828, -0.028505325317382812, -0.026458263397216797, -0.02441120147705078, -0.022364139556884766, -0.02031707763671875, -0.018270015716552734, -0.01622295379638672, -0.014175891876220703, -0.012128829956054688, -0.010081768035888672, -0.008034706115722656, -0.005987644195556641, -0.003940582275390625, -0.0018935203552246094, 0.00015354156494140625, 0.002200603485107422, 0.0042476654052734375, 0.006294727325439453, 0.008341789245605469, 0.010388851165771484, 0.0124359130859375, 0.014482975006103516, 0.01653003692626953, 0.018577098846435547, 0.020624160766601562, 0.022671222686767578, 0.024718284606933594, 0.02676534652709961, 0.028812408447265625, 0.03085947036743164, 0.032906532287597656, 0.03495359420776367, 0.03700065612792969, 0.0390477180480957, 0.04109477996826172, 0.043141841888427734, 0.04518890380859375, 0.047235965728759766, 0.04928302764892578, 0.0513300895690918, 0.05337715148925781, 0.05542421340942383, 0.057471275329589844, 0.05951833724975586, 0.061565399169921875, 0.06361246109008789, 0.0656595230102539, 0.06770658493041992, 0.06975364685058594, 0.07180070877075195, 0.07384777069091797, 0.07589483261108398, 0.07794189453125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 10.0, 14.0, 28.0, 24.0, 63.0, 90.0, 151.0, 158.0, 169.0, 114.0, 77.0, 36.0, 28.0, 15.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4249154329299927, -1.3880575895309448, -1.351199746131897, -1.3143419027328491, -1.2774841785430908, -1.240626335144043, -1.2037684917449951, -1.1669106483459473, -1.1300528049468994, -1.0931949615478516, -1.0563371181488037, -1.0194792747497559, -0.9826214909553528, -0.9457636475563049, -0.9089058637619019, -0.872048020362854, -0.8351901769638062, -0.7983323335647583, -0.7614744901657104, -0.7246167063713074, -0.6877588629722595, -0.6509010195732117, -0.6140432357788086, -0.5771853923797607, -0.5403275489807129, -0.503469705581665, -0.4666118919849396, -0.4297540783882141, -0.39289623498916626, -0.3560383915901184, -0.31918057799339294, -0.2823227643966675, -0.24546504020690918, -0.20860721170902252, -0.17174938321113586, -0.1348915547132492, -0.09803372621536255, -0.06117589771747589, -0.024318069219589233, 0.01253974437713623, 0.04939758777618408, 0.08625541627407074, 0.1231132447719574, 0.15997107326984406, 0.1968289017677307, 0.23368673026561737, 0.27054455876350403, 0.3074023723602295, 0.34426021575927734, 0.3811180591583252, 0.41797587275505066, 0.4548336863517761, 0.491691529750824, 0.5285493731498718, 0.5654071569442749, 0.6022650003433228, 0.6391228437423706, 0.6759806871414185, 0.7128385305404663, 0.7496963143348694, 0.7865541577339172, 0.8234120011329651, 0.8602697849273682, 0.897127628326416, 0.9339854717254639]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 13.0, 20.0, 12.0, 15.0, 13.0, 14.0, 21.0, 35.0, 37.0, 23.0, 30.0, 29.0, 38.0, 39.0, 41.0, 41.0, 42.0, 36.0, 36.0, 43.0, 34.0, 35.0, 44.0, 37.0, 30.0, 26.0, 32.0, 33.0, 19.0, 13.0, 18.0, 15.0, 21.0, 6.0, 9.0, 9.0, 6.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.8621527552604675, -0.8366901874542236, -0.8112276196479797, -0.7857650518417358, -0.7603024840354919, -0.734839916229248, -0.7093773484230042, -0.6839147806167603, -0.6584522128105164, -0.6329896450042725, -0.6075270771980286, -0.5820645093917847, -0.5566019415855408, -0.5311393737792969, -0.505676805973053, -0.4802142381668091, -0.4547517001628876, -0.4292891323566437, -0.4038265645503998, -0.3783639967441559, -0.352901428937912, -0.3274388909339905, -0.3019763231277466, -0.2765137553215027, -0.2510511875152588, -0.2255886197090149, -0.200126051902771, -0.1746634840965271, -0.1492009162902832, -0.1237383633852005, -0.0982757955789566, -0.07281322777271271, -0.04735064506530762, -0.02188807912170887, 0.0035744868218898773, 0.029037050902843475, 0.05449961870908737, 0.07996217906475067, 0.10542474687099457, 0.13088731467723846, 0.15634988248348236, 0.18181245028972626, 0.20727501809597015, 0.23273757100105286, 0.25820013880729675, 0.28366270661354065, 0.30912527441978455, 0.33458784222602844, 0.36005041003227234, 0.38551297783851624, 0.41097554564476013, 0.43643811345100403, 0.4619006812572479, 0.48736321926116943, 0.5128257870674133, 0.5382883548736572, 0.5637509226799011, 0.589213490486145, 0.6146760582923889, 0.6401386260986328, 0.6656011939048767, 0.6910637617111206, 0.7165263295173645, 0.7419888973236084, 0.7674514651298523]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 10.0, 3.0, 5.0, 8.0, 8.0, 13.0, 23.0, 35.0, 34.0, 42.0, 85.0, 127.0, 216.0, 316.0, 538.0, 1035.0, 2078.0, 5484.0, 34678.0, 1549681.0, 2533678.0, 53223.0, 7802.0, 2492.0, 1086.0, 581.0, 345.0, 229.0, 131.0, 93.0, 61.0, 49.0, 22.0, 24.0, 13.0, 11.0, 10.0, 11.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.890625, -0.8666000366210938, -0.8425750732421875, -0.8185501098632812, -0.794525146484375, -0.7705001831054688, -0.7464752197265625, -0.7224502563476562, -0.69842529296875, -0.6744003295898438, -0.6503753662109375, -0.6263504028320312, -0.602325439453125, -0.5783004760742188, -0.5542755126953125, -0.5302505493164062, -0.5062255859375, -0.48220062255859375, -0.4581756591796875, -0.43415069580078125, -0.410125732421875, -0.38610076904296875, -0.3620758056640625, -0.33805084228515625, -0.31402587890625, -0.29000091552734375, -0.2659759521484375, -0.24195098876953125, -0.217926025390625, -0.19390106201171875, -0.1698760986328125, -0.14585113525390625, -0.121826171875, -0.09780120849609375, -0.0737762451171875, -0.04975128173828125, -0.025726318359375, -0.00170135498046875, 0.0223236083984375, 0.04634857177734375, 0.07037353515625, 0.09439849853515625, 0.1184234619140625, 0.14244842529296875, 0.166473388671875, 0.19049835205078125, 0.2145233154296875, 0.23854827880859375, 0.2625732421875, 0.28659820556640625, 0.3106231689453125, 0.33464813232421875, 0.358673095703125, 0.38269805908203125, 0.4067230224609375, 0.43074798583984375, 0.45477294921875, 0.47879791259765625, 0.5028228759765625, 0.5268478393554688, 0.550872802734375, 0.5748977661132812, 0.5989227294921875, 0.6229476928710938, 0.64697265625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 11.0, 14.0, 18.0, 18.0, 27.0, 17.0, 26.0, 35.0, 43.0, 41.0, 46.0, 35.0, 64.0, 69.0, 60.0, 53.0, 51.0, 66.0, 34.0, 50.0, 33.0, 33.0, 28.0, 28.0, 21.0, 21.0, 11.0, 9.0, 8.0, 8.0, 7.0, 2.0, 6.0, 4.0, 0.0, 1.0, 3.0], "bins": [-0.413330078125, -0.4033489227294922, -0.3933677673339844, -0.38338661193847656, -0.37340545654296875, -0.36342430114746094, -0.3534431457519531, -0.3434619903564453, -0.3334808349609375, -0.3234996795654297, -0.3135185241699219, -0.30353736877441406, -0.29355621337890625, -0.28357505798339844, -0.2735939025878906, -0.2636127471923828, -0.253631591796875, -0.2436504364013672, -0.23366928100585938, -0.22368812561035156, -0.21370697021484375, -0.20372581481933594, -0.19374465942382812, -0.1837635040283203, -0.1737823486328125, -0.1638011932373047, -0.15382003784179688, -0.14383888244628906, -0.13385772705078125, -0.12387657165527344, -0.11389541625976562, -0.10391426086425781, -0.09393310546875, -0.08395195007324219, -0.07397079467773438, -0.06398963928222656, -0.05400848388671875, -0.04402732849121094, -0.034046173095703125, -0.024065017700195312, -0.0140838623046875, -0.0041027069091796875, 0.005878448486328125, 0.015859603881835938, 0.02584075927734375, 0.03582191467285156, 0.045803070068359375, 0.05578422546386719, 0.065765380859375, 0.07574653625488281, 0.08572769165039062, 0.09570884704589844, 0.10569000244140625, 0.11567115783691406, 0.12565231323242188, 0.1356334686279297, 0.1456146240234375, 0.1555957794189453, 0.16557693481445312, 0.17555809020996094, 0.18553924560546875, 0.19552040100097656, 0.20550155639648438, 0.2154827117919922, 0.2254638671875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 8.0, 13.0, 16.0, 21.0, 42.0, 54.0, 138.0, 259.0, 469.0, 1027.0, 2764.0, 9440.0, 67206.0, 3656740.0, 426244.0, 22098.0, 4744.0, 1601.0, 619.0, 330.0, 178.0, 98.0, 63.0, 30.0, 19.0, 19.0, 11.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8544921875, -0.8299026489257812, -0.8053131103515625, -0.7807235717773438, -0.756134033203125, -0.7315444946289062, -0.7069549560546875, -0.6823654174804688, -0.65777587890625, -0.6331863403320312, -0.6085968017578125, -0.5840072631835938, -0.559417724609375, -0.5348281860351562, -0.5102386474609375, -0.48564910888671875, -0.4610595703125, -0.43647003173828125, -0.4118804931640625, -0.38729095458984375, -0.362701416015625, -0.33811187744140625, -0.3135223388671875, -0.28893280029296875, -0.26434326171875, -0.23975372314453125, -0.2151641845703125, -0.19057464599609375, -0.165985107421875, -0.14139556884765625, -0.1168060302734375, -0.09221649169921875, -0.067626953125, -0.04303741455078125, -0.0184478759765625, 0.00614166259765625, 0.030731201171875, 0.05532073974609375, 0.0799102783203125, 0.10449981689453125, 0.12908935546875, 0.15367889404296875, 0.1782684326171875, 0.20285797119140625, 0.227447509765625, 0.25203704833984375, 0.2766265869140625, 0.30121612548828125, 0.3258056640625, 0.35039520263671875, 0.3749847412109375, 0.39957427978515625, 0.424163818359375, 0.44875335693359375, 0.4733428955078125, 0.49793243408203125, 0.52252197265625, 0.5471115112304688, 0.5717010498046875, 0.5962905883789062, 0.620880126953125, 0.6454696655273438, 0.6700592041015625, 0.6946487426757812, 0.71923828125]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 8.0, 6.0, 3.0, 11.0, 12.0, 15.0, 33.0, 22.0, 44.0, 94.0, 142.0, 341.0, 593.0, 906.0, 779.0, 498.0, 239.0, 128.0, 72.0, 42.0, 24.0, 14.0, 15.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.1684112548828125, -0.162750244140625, -0.1570892333984375, -0.15142822265625, -0.1457672119140625, -0.140106201171875, -0.1344451904296875, -0.1287841796875, -0.1231231689453125, -0.117462158203125, -0.1118011474609375, -0.10614013671875, -0.1004791259765625, -0.094818115234375, -0.0891571044921875, -0.08349609375, -0.0778350830078125, -0.072174072265625, -0.0665130615234375, -0.06085205078125, -0.0551910400390625, -0.049530029296875, -0.0438690185546875, -0.0382080078125, -0.0325469970703125, -0.026885986328125, -0.0212249755859375, -0.01556396484375, -0.0099029541015625, -0.004241943359375, 0.0014190673828125, 0.007080078125, 0.0127410888671875, 0.018402099609375, 0.0240631103515625, 0.02972412109375, 0.0353851318359375, 0.041046142578125, 0.0467071533203125, 0.0523681640625, 0.0580291748046875, 0.063690185546875, 0.0693511962890625, 0.07501220703125, 0.0806732177734375, 0.086334228515625, 0.0919952392578125, 0.09765625, 0.1033172607421875, 0.108978271484375, 0.1146392822265625, 0.12030029296875, 0.1259613037109375, 0.131622314453125, 0.1372833251953125, 0.1429443359375, 0.1486053466796875, 0.154266357421875, 0.1599273681640625, 0.16558837890625, 0.1712493896484375, 0.176910400390625, 0.1825714111328125, 0.188232421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 13.0, 13.0, 23.0, 22.0, 35.0, 43.0, 62.0, 81.0, 117.0, 100.0, 107.0, 87.0, 86.0, 65.0, 35.0, 34.0, 21.0, 11.0, 14.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6039164662361145, -0.5869348645210266, -0.5699533224105835, -0.5529717206954956, -0.5359901785850525, -0.5190085768699646, -0.5020270347595215, -0.4850454330444336, -0.4680638313293457, -0.4510822594165802, -0.4341006875038147, -0.4171190857887268, -0.4001375138759613, -0.3831559419631958, -0.3661743700504303, -0.3491927981376648, -0.3322112262248993, -0.3152296543121338, -0.2982480823993683, -0.2812665104866028, -0.2642849087715149, -0.2473033368587494, -0.2303217649459839, -0.21334019303321838, -0.1963586062192917, -0.17937703430652618, -0.1623954474925995, -0.14541387557983398, -0.12843230366706848, -0.11145071685314178, -0.09446914494037628, -0.07748756557703018, -0.06050598621368408, -0.04352440685033798, -0.02654283121228218, -0.00956125557422638, 0.0074203237891197205, 0.02440190315246582, 0.04138347506523132, 0.05836505442857742, 0.07534663379192352, 0.09232821315526962, 0.10930979251861572, 0.12629136443138123, 0.14327293634414673, 0.16025452315807343, 0.17723609507083893, 0.19421768188476562, 0.21119925379753113, 0.22818082571029663, 0.24516241252422333, 0.26214396953582764, 0.2791255712509155, 0.29610714316368103, 0.31308871507644653, 0.33007028698921204, 0.34705185890197754, 0.36403343081474304, 0.38101500272750854, 0.39799660444259644, 0.41497817635536194, 0.43195974826812744, 0.44894132018089294, 0.46592289209365845, 0.48290449380874634]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 2.0, 6.0, 5.0, 9.0, 7.0, 5.0, 13.0, 11.0, 22.0, 20.0, 23.0, 26.0, 31.0, 33.0, 32.0, 26.0, 34.0, 24.0, 38.0, 49.0, 40.0, 41.0, 48.0, 37.0, 44.0, 36.0, 35.0, 40.0, 24.0, 22.0, 28.0, 28.0, 28.0, 20.0, 18.0, 15.0, 14.0, 12.0, 19.0, 6.0, 8.0, 6.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23238198459148407, -0.22363820672035217, -0.21489444375038147, -0.20615066587924957, -0.19740688800811768, -0.18866312503814697, -0.17991934716701508, -0.17117556929588318, -0.16243180632591248, -0.15368802845478058, -0.14494426548480988, -0.13620048761367798, -0.12745672464370728, -0.11871294677257538, -0.10996916890144348, -0.10122539848089218, -0.09248162806034088, -0.08373785763978958, -0.07499408721923828, -0.06625030934810638, -0.057506538927555084, -0.048762768507003784, -0.040018994361162186, -0.03127522021532059, -0.022531449794769287, -0.013787677511572838, -0.0050439052283763885, 0.0036998670548200607, 0.01244363933801651, 0.02118740975856781, 0.02993118390440941, 0.03867495805025101, 0.04741871356964111, 0.05616248399019241, 0.06490625441074371, 0.07365003228187561, 0.08239380270242691, 0.09113757312297821, 0.09988135099411011, 0.10862512141466141, 0.11736889183521271, 0.1261126697063446, 0.1348564326763153, 0.1436002105474472, 0.1523439884185791, 0.1610877513885498, 0.1698315292596817, 0.1785753071308136, 0.1873190701007843, 0.1960628479719162, 0.2048066109418869, 0.2135503888130188, 0.2222941517829895, 0.2310379296541214, 0.2397817075252533, 0.248525470495224, 0.2572692632675171, 0.2660130262374878, 0.2747568190097809, 0.2835005819797516, 0.2922443449497223, 0.3009881377220154, 0.3097319006919861, 0.3184756636619568, 0.3272194266319275]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 10.0, 13.0, 20.0, 27.0, 39.0, 73.0, 84.0, 118.0, 214.0, 312.0, 460.0, 759.0, 1270.0, 2170.0, 4156.0, 9171.0, 24218.0, 98379.0, 586832.0, 248921.0, 43965.0, 14166.0, 5990.0, 2918.0, 1600.0, 933.0, 591.0, 389.0, 262.0, 170.0, 106.0, 62.0, 45.0, 36.0, 20.0, 15.0, 9.0, 5.0, 12.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1444091796875, -0.13955307006835938, -0.13469696044921875, -0.12984085083007812, -0.1249847412109375, -0.12012863159179688, -0.11527252197265625, -0.11041641235351562, -0.105560302734375, -0.10070419311523438, -0.09584808349609375, -0.09099197387695312, -0.0861358642578125, -0.08127975463867188, -0.07642364501953125, -0.07156753540039062, -0.06671142578125, -0.061855316162109375, -0.05699920654296875, -0.052143096923828125, -0.0472869873046875, -0.042430877685546875, -0.03757476806640625, -0.032718658447265625, -0.027862548828125, -0.023006439208984375, -0.01815032958984375, -0.013294219970703125, -0.0084381103515625, -0.003582000732421875, 0.00127410888671875, 0.006130218505859375, 0.010986328125, 0.015842437744140625, 0.02069854736328125, 0.025554656982421875, 0.0304107666015625, 0.035266876220703125, 0.04012298583984375, 0.044979095458984375, 0.049835205078125, 0.054691314697265625, 0.05954742431640625, 0.06440353393554688, 0.0692596435546875, 0.07411575317382812, 0.07897186279296875, 0.08382797241210938, 0.08868408203125, 0.09354019165039062, 0.09839630126953125, 0.10325241088867188, 0.1081085205078125, 0.11296463012695312, 0.11782073974609375, 0.12267684936523438, 0.127532958984375, 0.13238906860351562, 0.13724517822265625, 0.14210128784179688, 0.1469573974609375, 0.15181350708007812, 0.15666961669921875, 0.16152572631835938, 0.1663818359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 11.0, 10.0, 13.0, 16.0, 15.0, 23.0, 27.0, 22.0, 37.0, 26.0, 33.0, 33.0, 37.0, 40.0, 42.0, 50.0, 47.0, 46.0, 47.0, 54.0, 46.0, 35.0, 41.0, 31.0, 33.0, 25.0, 32.0, 17.0, 19.0, 13.0, 17.0, 10.0, 6.0, 7.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163330078125, -0.15766334533691406, -0.15199661254882812, -0.1463298797607422, -0.14066314697265625, -0.1349964141845703, -0.12932968139648438, -0.12366294860839844, -0.1179962158203125, -0.11232948303222656, -0.10666275024414062, -0.10099601745605469, -0.09532928466796875, -0.08966255187988281, -0.08399581909179688, -0.07832908630371094, -0.072662353515625, -0.06699562072753906, -0.061328887939453125, -0.05566215515136719, -0.04999542236328125, -0.04432868957519531, -0.038661956787109375, -0.03299522399902344, -0.0273284912109375, -0.021661758422851562, -0.015995025634765625, -0.010328292846679688, -0.00466156005859375, 0.0010051727294921875, 0.006671905517578125, 0.012338638305664062, 0.01800537109375, 0.023672103881835938, 0.029338836669921875, 0.03500556945800781, 0.04067230224609375, 0.04633903503417969, 0.052005767822265625, 0.05767250061035156, 0.0633392333984375, 0.06900596618652344, 0.07467269897460938, 0.08033943176269531, 0.08600616455078125, 0.09167289733886719, 0.09733963012695312, 0.10300636291503906, 0.108673095703125, 0.11433982849121094, 0.12000656127929688, 0.1256732940673828, 0.13134002685546875, 0.1370067596435547, 0.14267349243164062, 0.14834022521972656, 0.1540069580078125, 0.15967369079589844, 0.16534042358398438, 0.1710071563720703, 0.17667388916015625, 0.1823406219482422, 0.18800735473632812, 0.19367408752441406, 0.1993408203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 15.0, 12.0, 18.0, 29.0, 36.0, 57.0, 64.0, 122.0, 171.0, 243.0, 386.0, 551.0, 914.0, 1617.0, 2973.0, 5527.0, 11247.0, 24351.0, 59996.0, 167231.0, 394070.0, 235657.0, 81571.0, 32087.0, 14017.0, 6841.0, 3598.0, 2021.0, 1147.0, 668.0, 437.0, 303.0, 168.0, 112.0, 85.0, 61.0, 52.0, 35.0, 17.0, 9.0, 9.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.0687255859375, -0.06668376922607422, -0.06464195251464844, -0.06260013580322266, -0.060558319091796875, -0.058516502380371094, -0.05647468566894531, -0.05443286895751953, -0.05239105224609375, -0.05034923553466797, -0.04830741882324219, -0.046265602111816406, -0.044223785400390625, -0.042181968688964844, -0.04014015197753906, -0.03809833526611328, -0.0360565185546875, -0.03401470184326172, -0.03197288513183594, -0.029931068420410156, -0.027889251708984375, -0.025847434997558594, -0.023805618286132812, -0.02176380157470703, -0.01972198486328125, -0.01768016815185547, -0.015638351440429688, -0.013596534729003906, -0.011554718017578125, -0.009512901306152344, -0.0074710845947265625, -0.005429267883300781, -0.003387451171875, -0.0013456344604492188, 0.0006961822509765625, 0.0027379989624023438, 0.004779815673828125, 0.006821632385253906, 0.008863449096679688, 0.010905265808105469, 0.01294708251953125, 0.014988899230957031, 0.017030715942382812, 0.019072532653808594, 0.021114349365234375, 0.023156166076660156, 0.025197982788085938, 0.02723979949951172, 0.0292816162109375, 0.03132343292236328, 0.03336524963378906, 0.035407066345214844, 0.037448883056640625, 0.039490699768066406, 0.04153251647949219, 0.04357433319091797, 0.04561614990234375, 0.04765796661376953, 0.04969978332519531, 0.051741600036621094, 0.053783416748046875, 0.055825233459472656, 0.05786705017089844, 0.05990886688232422, 0.06195068359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 7.0, 6.0, 9.0, 28.0, 8.0, 17.0, 22.0, 27.0, 15.0, 25.0, 37.0, 37.0, 35.0, 45.0, 40.0, 44.0, 39.0, 34.0, 64.0, 46.0, 37.0, 41.0, 29.0, 45.0, 36.0, 35.0, 21.0, 21.0, 14.0, 18.0, 17.0, 18.0, 16.0, 11.0, 13.0, 7.0, 5.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.3994140625, -0.387939453125, -0.37646484375, -0.364990234375, -0.353515625, -0.342041015625, -0.33056640625, -0.319091796875, -0.3076171875, -0.296142578125, -0.28466796875, -0.273193359375, -0.26171875, -0.250244140625, -0.23876953125, -0.227294921875, -0.2158203125, -0.204345703125, -0.19287109375, -0.181396484375, -0.169921875, -0.158447265625, -0.14697265625, -0.135498046875, -0.1240234375, -0.112548828125, -0.10107421875, -0.089599609375, -0.078125, -0.066650390625, -0.05517578125, -0.043701171875, -0.0322265625, -0.020751953125, -0.00927734375, 0.002197265625, 0.013671875, 0.025146484375, 0.03662109375, 0.048095703125, 0.0595703125, 0.071044921875, 0.08251953125, 0.093994140625, 0.10546875, 0.116943359375, 0.12841796875, 0.139892578125, 0.1513671875, 0.162841796875, 0.17431640625, 0.185791015625, 0.197265625, 0.208740234375, 0.22021484375, 0.231689453125, 0.2431640625, 0.254638671875, 0.26611328125, 0.277587890625, 0.2890625, 0.300537109375, 0.31201171875, 0.323486328125, 0.3349609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 8.0, 13.0, 12.0, 20.0, 25.0, 43.0, 74.0, 108.0, 191.0, 301.0, 527.0, 1107.0, 2395.0, 6390.0, 21525.0, 109799.0, 570345.0, 273751.0, 44278.0, 10650.0, 3658.0, 1579.0, 773.0, 376.0, 214.0, 126.0, 88.0, 59.0, 31.0, 32.0, 15.0, 8.0, 10.0, 2.0, 6.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031890869140625, -0.030818462371826172, -0.029746055603027344, -0.028673648834228516, -0.027601242065429688, -0.02652883529663086, -0.02545642852783203, -0.024384021759033203, -0.023311614990234375, -0.022239208221435547, -0.02116680145263672, -0.02009439468383789, -0.019021987915039062, -0.017949581146240234, -0.016877174377441406, -0.015804767608642578, -0.01473236083984375, -0.013659954071044922, -0.012587547302246094, -0.011515140533447266, -0.010442733764648438, -0.00937032699584961, -0.008297920227050781, -0.007225513458251953, -0.006153106689453125, -0.005080699920654297, -0.004008293151855469, -0.0029358863830566406, -0.0018634796142578125, -0.0007910728454589844, 0.00028133392333984375, 0.0013537406921386719, 0.0024261474609375, 0.003498554229736328, 0.004570960998535156, 0.005643367767333984, 0.0067157745361328125, 0.007788181304931641, 0.008860588073730469, 0.009932994842529297, 0.011005401611328125, 0.012077808380126953, 0.013150215148925781, 0.01422262191772461, 0.015295028686523438, 0.016367435455322266, 0.017439842224121094, 0.018512248992919922, 0.01958465576171875, 0.020657062530517578, 0.021729469299316406, 0.022801876068115234, 0.023874282836914062, 0.02494668960571289, 0.02601909637451172, 0.027091503143310547, 0.028163909912109375, 0.029236316680908203, 0.03030872344970703, 0.03138113021850586, 0.03245353698730469, 0.033525943756103516, 0.034598350524902344, 0.03567075729370117, 0.0367431640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 2.0, 6.0, 7.0, 10.0, 9.0, 16.0, 16.0, 25.0, 27.0, 31.0, 53.0, 65.0, 77.0, 99.0, 91.0, 105.0, 85.0, 56.0, 60.0, 40.0, 24.0, 27.0, 11.0, 16.0, 8.0, 7.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0788440704345703e-05, -1.0347925126552582e-05, -9.90740954875946e-06, -9.466893970966339e-06, -9.026378393173218e-06, -8.585862815380096e-06, -8.145347237586975e-06, -7.704831659793854e-06, -7.264316082000732e-06, -6.823800504207611e-06, -6.38328492641449e-06, -5.942769348621368e-06, -5.502253770828247e-06, -5.061738193035126e-06, -4.621222615242004e-06, -4.180707037448883e-06, -3.7401914596557617e-06, -3.2996758818626404e-06, -2.859160304069519e-06, -2.4186447262763977e-06, -1.9781291484832764e-06, -1.537613570690155e-06, -1.0970979928970337e-06, -6.565824151039124e-07, -2.1606683731079102e-07, 2.2444874048233032e-07, 6.649643182754517e-07, 1.105479896068573e-06, 1.5459954738616943e-06, 1.9865110516548157e-06, 2.427026629447937e-06, 2.8675422072410583e-06, 3.3080577850341797e-06, 3.748573362827301e-06, 4.189088940620422e-06, 4.629604518413544e-06, 5.070120096206665e-06, 5.510635673999786e-06, 5.951151251792908e-06, 6.391666829586029e-06, 6.83218240737915e-06, 7.272697985172272e-06, 7.713213562965393e-06, 8.153729140758514e-06, 8.594244718551636e-06, 9.034760296344757e-06, 9.475275874137878e-06, 9.915791451931e-06, 1.0356307029724121e-05, 1.0796822607517242e-05, 1.1237338185310364e-05, 1.1677853763103485e-05, 1.2118369340896606e-05, 1.2558884918689728e-05, 1.2999400496482849e-05, 1.343991607427597e-05, 1.3880431652069092e-05, 1.4320947229862213e-05, 1.4761462807655334e-05, 1.5201978385448456e-05, 1.5642493963241577e-05, 1.60830095410347e-05, 1.652352511882782e-05, 1.696404069662094e-05, 1.7404556274414062e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 5.0, 7.0, 11.0, 13.0, 24.0, 24.0, 52.0, 77.0, 129.0, 216.0, 391.0, 614.0, 1201.0, 2307.0, 4991.0, 11319.0, 27877.0, 75350.0, 209710.0, 380238.0, 209781.0, 75007.0, 27908.0, 11228.0, 4973.0, 2362.0, 1213.0, 630.0, 358.0, 215.0, 124.0, 79.0, 47.0, 20.0, 24.0, 9.0, 7.0, 4.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0277862548828125, -0.02700352668762207, -0.02622079849243164, -0.02543807029724121, -0.02465534210205078, -0.02387261390686035, -0.023089885711669922, -0.022307157516479492, -0.021524429321289062, -0.020741701126098633, -0.019958972930908203, -0.019176244735717773, -0.018393516540527344, -0.017610788345336914, -0.016828060150146484, -0.016045331954956055, -0.015262603759765625, -0.014479875564575195, -0.013697147369384766, -0.012914419174194336, -0.012131690979003906, -0.011348962783813477, -0.010566234588623047, -0.009783506393432617, -0.009000778198242188, -0.008218050003051758, -0.007435321807861328, -0.0066525936126708984, -0.005869865417480469, -0.005087137222290039, -0.004304409027099609, -0.0035216808319091797, -0.00273895263671875, -0.0019562244415283203, -0.0011734962463378906, -0.00039076805114746094, 0.00039196014404296875, 0.0011746883392333984, 0.001957416534423828, 0.002740144729614258, 0.0035228729248046875, 0.004305601119995117, 0.005088329315185547, 0.0058710575103759766, 0.006653785705566406, 0.007436513900756836, 0.008219242095947266, 0.009001970291137695, 0.009784698486328125, 0.010567426681518555, 0.011350154876708984, 0.012132883071899414, 0.012915611267089844, 0.013698339462280273, 0.014481067657470703, 0.015263795852661133, 0.016046524047851562, 0.016829252243041992, 0.017611980438232422, 0.01839470863342285, 0.01917743682861328, 0.01996016502380371, 0.02074289321899414, 0.02152562141418457, 0.022308349609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 5.0, 6.0, 5.0, 8.0, 9.0, 15.0, 14.0, 25.0, 21.0, 22.0, 26.0, 38.0, 33.0, 61.0, 58.0, 56.0, 59.0, 56.0, 66.0, 63.0, 48.0, 54.0, 44.0, 35.0, 32.0, 40.0, 33.0, 10.0, 9.0, 12.0, 12.0, 9.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005947113037109375, -0.005723774433135986, -0.005500435829162598, -0.005277097225189209, -0.00505375862121582, -0.004830420017242432, -0.004607081413269043, -0.004383742809295654, -0.004160404205322266, -0.003937065601348877, -0.0037137269973754883, -0.0034903883934020996, -0.003267049789428711, -0.0030437111854553223, -0.0028203725814819336, -0.002597033977508545, -0.0023736953735351562, -0.0021503567695617676, -0.001927018165588379, -0.0017036795616149902, -0.0014803409576416016, -0.0012570023536682129, -0.0010336637496948242, -0.0008103251457214355, -0.0005869865417480469, -0.0003636479377746582, -0.00014030933380126953, 8.302927017211914e-05, 0.0003063678741455078, 0.0005297064781188965, 0.0007530450820922852, 0.0009763836860656738, 0.0011997222900390625, 0.0014230608940124512, 0.0016463994979858398, 0.0018697381019592285, 0.002093076705932617, 0.002316415309906006, 0.0025397539138793945, 0.002763092517852783, 0.002986431121826172, 0.0032097697257995605, 0.0034331083297729492, 0.003656446933746338, 0.0038797855377197266, 0.004103124141693115, 0.004326462745666504, 0.004549801349639893, 0.004773139953613281, 0.00499647855758667, 0.005219817161560059, 0.005443155765533447, 0.005666494369506836, 0.005889832973480225, 0.006113171577453613, 0.006336510181427002, 0.006559848785400391, 0.006783187389373779, 0.007006525993347168, 0.007229864597320557, 0.007453203201293945, 0.007676541805267334, 0.007899880409240723, 0.008123219013214111, 0.0083465576171875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 14.0, 14.0, 23.0, 36.0, 61.0, 63.0, 98.0, 109.0, 145.0, 129.0, 78.0, 75.0, 42.0, 45.0, 18.0, 14.0, 11.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.373170405626297, -0.3620213270187378, -0.3508722484111786, -0.3397231698036194, -0.32857412099838257, -0.31742504239082336, -0.30627596378326416, -0.29512688517570496, -0.28397780656814575, -0.27282872796058655, -0.26167964935302734, -0.2505306005477905, -0.23938152194023132, -0.22823244333267212, -0.21708336472511292, -0.2059342861175537, -0.1947852373123169, -0.1836361587047577, -0.17248709499835968, -0.16133801639080048, -0.15018895268440247, -0.13903987407684326, -0.12789079546928406, -0.11674172431230545, -0.10559265315532684, -0.09444358199834824, -0.08329451084136963, -0.07214543223381042, -0.06099636107683182, -0.04984728991985321, -0.038698211312294006, -0.0275491401553154, -0.016400068998336792, -0.005250995978713036, 0.005898077040910721, 0.017047151923179626, 0.028196223080158234, 0.03934529423713684, 0.050494372844696045, 0.06164344400167465, 0.07279251515865326, 0.08394158631563187, 0.09509065747261047, 0.10623973608016968, 0.11738880723714828, 0.1285378783941269, 0.1396869570016861, 0.1508360207080841, 0.1619850993156433, 0.17313417792320251, 0.18428324162960052, 0.19543232023715973, 0.20658138394355774, 0.21773046255111694, 0.22887954115867615, 0.24002861976623535, 0.25117766857147217, 0.26232674717903137, 0.2734758257865906, 0.2846248745918274, 0.2957739531993866, 0.3069230318069458, 0.318072110414505, 0.3292211890220642, 0.3403702676296234]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 13.0, 9.0, 14.0, 22.0, 21.0, 35.0, 31.0, 42.0, 33.0, 42.0, 42.0, 48.0, 54.0, 54.0, 62.0, 52.0, 48.0, 49.0, 44.0, 38.0, 35.0, 40.0, 30.0, 33.0, 17.0, 14.0, 12.0, 18.0, 15.0, 5.0, 5.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.22568418085575104, -0.21931801736354828, -0.2129518687725067, -0.20658570528030396, -0.2002195417881012, -0.19385339319705963, -0.18748722970485687, -0.1811210811138153, -0.17475491762161255, -0.1683887541294098, -0.16202260553836823, -0.15565644204616547, -0.1492902785539627, -0.14292412996292114, -0.13655796647071838, -0.13019180297851562, -0.12382564693689346, -0.1174594908952713, -0.11109332740306854, -0.10472717136144638, -0.09836101531982422, -0.09199485182762146, -0.0856286957859993, -0.07926253974437714, -0.07289637625217438, -0.06653022021055222, -0.060164060443639755, -0.053797900676727295, -0.04743174463510513, -0.04106558486819267, -0.03469942510128021, -0.02833326905965805, -0.02196711301803589, -0.015600955113768578, -0.009234796278178692, -0.002868637442588806, 0.003497520461678505, 0.009863678365945816, 0.016229838132858276, 0.022595994174480438, 0.0289621539413929, 0.03532831370830536, 0.04169446974992752, 0.04806062951683998, 0.05442678928375244, 0.0607929453253746, 0.06715910136699677, 0.07352526485919952, 0.07989142090082169, 0.08625757694244385, 0.0926237404346466, 0.09898989647626877, 0.10535605251789093, 0.11172221601009369, 0.11808837205171585, 0.12445452809333801, 0.13082069158554077, 0.13718685507774353, 0.1435530036687851, 0.14991916716098785, 0.1562853306531906, 0.16265147924423218, 0.16901764273643494, 0.1753838062286377, 0.18174995481967926]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 5.0, 17.0, 14.0, 17.0, 21.0, 40.0, 68.0, 79.0, 135.0, 229.0, 315.0, 435.0, 766.0, 1268.0, 2184.0, 3842.0, 7524.0, 15444.0, 36895.0, 110461.0, 471382.0, 277656.0, 68769.0, 25994.0, 11590.0, 5701.0, 3065.0, 1735.0, 1045.0, 644.0, 411.0, 275.0, 170.0, 107.0, 85.0, 50.0, 31.0, 19.0, 19.0, 15.0, 7.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27685546875, -0.2678680419921875, -0.258880615234375, -0.2498931884765625, -0.24090576171875, -0.2319183349609375, -0.222930908203125, -0.2139434814453125, -0.2049560546875, -0.1959686279296875, -0.186981201171875, -0.1779937744140625, -0.16900634765625, -0.1600189208984375, -0.151031494140625, -0.1420440673828125, -0.133056640625, -0.1240692138671875, -0.115081787109375, -0.1060943603515625, -0.09710693359375, -0.0881195068359375, -0.079132080078125, -0.0701446533203125, -0.0611572265625, -0.0521697998046875, -0.043182373046875, -0.0341949462890625, -0.02520751953125, -0.0162200927734375, -0.007232666015625, 0.0017547607421875, 0.0107421875, 0.0197296142578125, 0.028717041015625, 0.0377044677734375, 0.04669189453125, 0.0556793212890625, 0.064666748046875, 0.0736541748046875, 0.0826416015625, 0.0916290283203125, 0.100616455078125, 0.1096038818359375, 0.11859130859375, 0.1275787353515625, 0.136566162109375, 0.1455535888671875, 0.154541015625, 0.1635284423828125, 0.172515869140625, 0.1815032958984375, 0.19049072265625, 0.1994781494140625, 0.208465576171875, 0.2174530029296875, 0.2264404296875, 0.2354278564453125, 0.244415283203125, 0.2534027099609375, 0.26239013671875, 0.2713775634765625, 0.280364990234375, 0.2893524169921875, 0.29833984375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 4.0, 12.0, 8.0, 15.0, 21.0, 20.0, 24.0, 24.0, 23.0, 37.0, 41.0, 44.0, 44.0, 46.0, 44.0, 41.0, 52.0, 58.0, 64.0, 41.0, 52.0, 28.0, 43.0, 37.0, 25.0, 27.0, 22.0, 16.0, 18.0, 16.0, 8.0, 12.0, 9.0, 6.0, 5.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.437255859375, -0.4253082275390625, -0.413360595703125, -0.4014129638671875, -0.38946533203125, -0.3775177001953125, -0.365570068359375, -0.3536224365234375, -0.3416748046875, -0.3297271728515625, -0.317779541015625, -0.3058319091796875, -0.29388427734375, -0.2819366455078125, -0.269989013671875, -0.2580413818359375, -0.24609375, -0.2341461181640625, -0.222198486328125, -0.2102508544921875, -0.19830322265625, -0.1863555908203125, -0.174407958984375, -0.1624603271484375, -0.1505126953125, -0.1385650634765625, -0.126617431640625, -0.1146697998046875, -0.10272216796875, -0.0907745361328125, -0.078826904296875, -0.0668792724609375, -0.054931640625, -0.0429840087890625, -0.031036376953125, -0.0190887451171875, -0.00714111328125, 0.0048065185546875, 0.016754150390625, 0.0287017822265625, 0.0406494140625, 0.0525970458984375, 0.064544677734375, 0.0764923095703125, 0.08843994140625, 0.1003875732421875, 0.112335205078125, 0.1242828369140625, 0.13623046875, 0.1481781005859375, 0.160125732421875, 0.1720733642578125, 0.18402099609375, 0.1959686279296875, 0.207916259765625, 0.2198638916015625, 0.2318115234375, 0.2437591552734375, 0.255706787109375, 0.2676544189453125, 0.27960205078125, 0.2915496826171875, 0.303497314453125, 0.3154449462890625, 0.327392578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 15.0, 15.0, 18.0, 21.0, 27.0, 42.0, 76.0, 101.0, 161.0, 368.0, 782.0, 2165.0, 8315.0, 42808.0, 537312.0, 409296.0, 36514.0, 7090.0, 2018.0, 665.0, 300.0, 147.0, 113.0, 64.0, 33.0, 18.0, 20.0, 14.0, 10.0, 4.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.489990234375, -0.4724617004394531, -0.45493316650390625, -0.4374046325683594, -0.4198760986328125, -0.4023475646972656, -0.38481903076171875, -0.3672904968261719, -0.349761962890625, -0.3322334289550781, -0.31470489501953125, -0.2971763610839844, -0.2796478271484375, -0.2621192932128906, -0.24459075927734375, -0.22706222534179688, -0.20953369140625, -0.19200515747070312, -0.17447662353515625, -0.15694808959960938, -0.1394195556640625, -0.12189102172851562, -0.10436248779296875, -0.08683395385742188, -0.069305419921875, -0.051776885986328125, -0.03424835205078125, -0.016719818115234375, 0.0008087158203125, 0.018337249755859375, 0.03586578369140625, 0.053394317626953125, 0.0709228515625, 0.08845138549804688, 0.10597991943359375, 0.12350845336914062, 0.1410369873046875, 0.15856552124023438, 0.17609405517578125, 0.19362258911132812, 0.211151123046875, 0.22867965698242188, 0.24620819091796875, 0.2637367248535156, 0.2812652587890625, 0.2987937927246094, 0.31632232666015625, 0.3338508605957031, 0.35137939453125, 0.3689079284667969, 0.38643646240234375, 0.4039649963378906, 0.4214935302734375, 0.4390220642089844, 0.45655059814453125, 0.4740791320800781, 0.491607666015625, 0.5091361999511719, 0.5266647338867188, 0.5441932678222656, 0.5617218017578125, 0.5792503356933594, 0.5967788696289062, 0.6143074035644531, 0.6318359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 6.0, 6.0, 7.0, 9.0, 12.0, 11.0, 12.0, 11.0, 22.0, 20.0, 26.0, 41.0, 36.0, 48.0, 48.0, 41.0, 50.0, 43.0, 65.0, 54.0, 51.0, 57.0, 48.0, 51.0, 35.0, 30.0, 29.0, 33.0, 23.0, 12.0, 15.0, 9.0, 13.0, 8.0, 5.0, 6.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51171875, -0.4971504211425781, -0.48258209228515625, -0.4680137634277344, -0.4534454345703125, -0.4388771057128906, -0.42430877685546875, -0.4097404479980469, -0.395172119140625, -0.3806037902832031, -0.36603546142578125, -0.3514671325683594, -0.3368988037109375, -0.3223304748535156, -0.30776214599609375, -0.2931938171386719, -0.27862548828125, -0.2640571594238281, -0.24948883056640625, -0.23492050170898438, -0.2203521728515625, -0.20578384399414062, -0.19121551513671875, -0.17664718627929688, -0.162078857421875, -0.14751052856445312, -0.13294219970703125, -0.11837387084960938, -0.1038055419921875, -0.08923721313476562, -0.07466888427734375, -0.060100555419921875, -0.0455322265625, -0.030963897705078125, -0.01639556884765625, -0.001827239990234375, 0.0127410888671875, 0.027309417724609375, 0.04187774658203125, 0.056446075439453125, 0.071014404296875, 0.08558273315429688, 0.10015106201171875, 0.11471939086914062, 0.1292877197265625, 0.14385604858398438, 0.15842437744140625, 0.17299270629882812, 0.18756103515625, 0.20212936401367188, 0.21669769287109375, 0.23126602172851562, 0.2458343505859375, 0.2604026794433594, 0.27497100830078125, 0.2895393371582031, 0.304107666015625, 0.3186759948730469, 0.33324432373046875, 0.3478126525878906, 0.3623809814453125, 0.3769493103027344, 0.39151763916015625, 0.4060859680175781, 0.420654296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 6.0, 13.0, 14.0, 17.0, 33.0, 57.0, 155.0, 397.0, 1425.0, 8287.0, 141495.0, 853355.0, 38279.0, 3683.0, 804.0, 263.0, 119.0, 47.0, 41.0, 13.0, 7.0, 11.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1829833984375, -0.17731857299804688, -0.17165374755859375, -0.16598892211914062, -0.1603240966796875, -0.15465927124023438, -0.14899444580078125, -0.14332962036132812, -0.137664794921875, -0.13199996948242188, -0.12633514404296875, -0.12067031860351562, -0.1150054931640625, -0.10934066772460938, -0.10367584228515625, -0.09801101684570312, -0.09234619140625, -0.08668136596679688, -0.08101654052734375, -0.07535171508789062, -0.0696868896484375, -0.06402206420898438, -0.05835723876953125, -0.052692413330078125, -0.047027587890625, -0.041362762451171875, -0.03569793701171875, -0.030033111572265625, -0.0243682861328125, -0.018703460693359375, -0.01303863525390625, -0.007373809814453125, -0.001708984375, 0.003955841064453125, 0.00962066650390625, 0.015285491943359375, 0.0209503173828125, 0.026615142822265625, 0.03227996826171875, 0.037944793701171875, 0.043609619140625, 0.049274444580078125, 0.05493927001953125, 0.060604095458984375, 0.0662689208984375, 0.07193374633789062, 0.07759857177734375, 0.08326339721679688, 0.08892822265625, 0.09459304809570312, 0.10025787353515625, 0.10592269897460938, 0.1115875244140625, 0.11725234985351562, 0.12291717529296875, 0.12858200073242188, 0.134246826171875, 0.13991165161132812, 0.14557647705078125, 0.15124130249023438, 0.1569061279296875, 0.16257095336914062, 0.16823577880859375, 0.17390060424804688, 0.1795654296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 8.0, 8.0, 9.0, 18.0, 30.0, 27.0, 69.0, 79.0, 102.0, 191.0, 155.0, 88.0, 70.0, 39.0, 30.0, 19.0, 11.0, 12.0, 8.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2576580047607422e-05, -1.2024305760860443e-05, -1.1472031474113464e-05, -1.0919757187366486e-05, -1.0367482900619507e-05, -9.815208613872528e-06, -9.26293432712555e-06, -8.71066004037857e-06, -8.158385753631592e-06, -7.606111466884613e-06, -7.053837180137634e-06, -6.5015628933906555e-06, -5.949288606643677e-06, -5.397014319896698e-06, -4.844740033149719e-06, -4.2924657464027405e-06, -3.7401914596557617e-06, -3.187917172908783e-06, -2.635642886161804e-06, -2.0833685994148254e-06, -1.5310943126678467e-06, -9.78820025920868e-07, -4.2654573917388916e-07, 1.257285475730896e-07, 6.780028343200684e-07, 1.2302771210670471e-06, 1.7825514078140259e-06, 2.3348256945610046e-06, 2.8870999813079834e-06, 3.439374268054962e-06, 3.991648554801941e-06, 4.54392284154892e-06, 5.0961971282958984e-06, 5.648471415042877e-06, 6.200745701789856e-06, 6.753019988536835e-06, 7.3052942752838135e-06, 7.857568562030792e-06, 8.409842848777771e-06, 8.96211713552475e-06, 9.514391422271729e-06, 1.0066665709018707e-05, 1.0618939995765686e-05, 1.1171214282512665e-05, 1.1723488569259644e-05, 1.2275762856006622e-05, 1.2828037142753601e-05, 1.338031142950058e-05, 1.3932585716247559e-05, 1.4484860002994537e-05, 1.5037134289741516e-05, 1.5589408576488495e-05, 1.6141682863235474e-05, 1.6693957149982452e-05, 1.724623143672943e-05, 1.779850572347641e-05, 1.835078001022339e-05, 1.8903054296970367e-05, 1.9455328583717346e-05, 2.0007602870464325e-05, 2.0559877157211304e-05, 2.1112151443958282e-05, 2.166442573070526e-05, 2.221670001745224e-05, 2.276897430419922e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 21.0, 40.0, 60.0, 110.0, 210.0, 425.0, 826.0, 1726.0, 4588.0, 19135.0, 193150.0, 753078.0, 60098.0, 9558.0, 2974.0, 1238.0, 609.0, 338.0, 146.0, 75.0, 53.0, 29.0, 10.0, 15.0, 9.0, 5.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1558837890625, -0.151336669921875, -0.14678955078125, -0.142242431640625, -0.1376953125, -0.133148193359375, -0.12860107421875, -0.124053955078125, -0.1195068359375, -0.114959716796875, -0.11041259765625, -0.105865478515625, -0.101318359375, -0.096771240234375, -0.09222412109375, -0.087677001953125, -0.0831298828125, -0.078582763671875, -0.07403564453125, -0.069488525390625, -0.06494140625, -0.060394287109375, -0.05584716796875, -0.051300048828125, -0.0467529296875, -0.042205810546875, -0.03765869140625, -0.033111572265625, -0.028564453125, -0.024017333984375, -0.01947021484375, -0.014923095703125, -0.0103759765625, -0.005828857421875, -0.00128173828125, 0.003265380859375, 0.0078125, 0.012359619140625, 0.01690673828125, 0.021453857421875, 0.0260009765625, 0.030548095703125, 0.03509521484375, 0.039642333984375, 0.044189453125, 0.048736572265625, 0.05328369140625, 0.057830810546875, 0.0623779296875, 0.066925048828125, 0.07147216796875, 0.076019287109375, 0.08056640625, 0.085113525390625, 0.08966064453125, 0.094207763671875, 0.0987548828125, 0.103302001953125, 0.10784912109375, 0.112396240234375, 0.116943359375, 0.121490478515625, 0.12603759765625, 0.130584716796875, 0.1351318359375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 4.0, 10.0, 13.0, 10.0, 29.0, 51.0, 73.0, 104.0, 118.0, 178.0, 128.0, 95.0, 51.0, 41.0, 25.0, 18.0, 12.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0643310546875, -0.062290191650390625, -0.06024932861328125, -0.058208465576171875, -0.0561676025390625, -0.054126739501953125, -0.05208587646484375, -0.050045013427734375, -0.048004150390625, -0.045963287353515625, -0.04392242431640625, -0.041881561279296875, -0.0398406982421875, -0.037799835205078125, -0.03575897216796875, -0.033718109130859375, -0.03167724609375, -0.029636383056640625, -0.02759552001953125, -0.025554656982421875, -0.0235137939453125, -0.021472930908203125, -0.01943206787109375, -0.017391204833984375, -0.015350341796875, -0.013309478759765625, -0.01126861572265625, -0.009227752685546875, -0.0071868896484375, -0.005146026611328125, -0.00310516357421875, -0.001064300537109375, 0.0009765625, 0.003017425537109375, 0.00505828857421875, 0.007099151611328125, 0.0091400146484375, 0.011180877685546875, 0.01322174072265625, 0.015262603759765625, 0.017303466796875, 0.019344329833984375, 0.02138519287109375, 0.023426055908203125, 0.0254669189453125, 0.027507781982421875, 0.02954864501953125, 0.031589508056640625, 0.03363037109375, 0.035671234130859375, 0.03771209716796875, 0.039752960205078125, 0.0417938232421875, 0.043834686279296875, 0.04587554931640625, 0.047916412353515625, 0.049957275390625, 0.051998138427734375, 0.05403900146484375, 0.056079864501953125, 0.0581207275390625, 0.060161590576171875, 0.06220245361328125, 0.06424331665039062, 0.0662841796875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [19.0, 112.0, 500.0, 333.0, 45.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33184677362442017, -0.2141825258731842, -0.09651826322078705, 0.021145999431610107, 0.13881024718284607, 0.25647449493408203, 0.3741387724876404, 0.49180299043655396, 0.6094672679901123, 0.7271315455436707, 0.8447957634925842, 0.9624600410461426, 1.0801242589950562, 1.1977884769439697, 1.3154528141021729, 1.4331170320510864, 1.55078125, 1.6684454679489136, 1.7861098051071167, 1.9037740230560303, 2.0214383602142334, 2.1391024589538574, 2.2567667961120605, 2.3744311332702637, 2.492095470428467, 2.60975980758667, 2.727423906326294, 2.845088243484497, 2.9627525806427, 3.080416679382324, 3.1980810165405273, 3.3157453536987305, 3.4334094524383545, 3.5510737895965576, 3.6687378883361816, 3.7864022254943848, 3.904066562652588, 4.021730899810791, 4.139394760131836, 4.257059097290039, 4.374723434448242, 4.492387771606445, 4.610052108764648, 4.727716445922852, 4.8453803062438965, 4.9630446434021, 5.080708980560303, 5.198373317718506, 5.316037654876709, 5.433701992034912, 5.551366329193115, 5.66903018951416, 5.786694526672363, 5.904358863830566, 6.0220232009887695, 6.139687538146973, 6.257351398468018, 6.375015735626221, 6.492680072784424, 6.610343933105469, 6.728008270263672, 6.845672607421875, 6.963336944580078, 7.081001281738281, 7.198665618896484]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 2.0, 6.0, 7.0, 2.0, 5.0, 9.0, 10.0, 24.0, 17.0, 14.0, 13.0, 21.0, 23.0, 26.0, 38.0, 26.0, 38.0, 33.0, 41.0, 48.0, 49.0, 40.0, 37.0, 36.0, 47.0, 42.0, 42.0, 37.0, 28.0, 25.0, 33.0, 34.0, 20.0, 24.0, 11.0, 18.0, 17.0, 13.0, 11.0, 6.0, 6.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5970219373703003, -0.5782413482666016, -0.5594608187675476, -0.5406802296638489, -0.5218996405601501, -0.5031190514564514, -0.48433852195739746, -0.46555793285369873, -0.44677734375, -0.42799678444862366, -0.4092161953449249, -0.3904356360435486, -0.37165504693984985, -0.3528744876384735, -0.33409392833709717, -0.31531333923339844, -0.2965327799320221, -0.27775222063064575, -0.258971631526947, -0.24019107222557068, -0.22141048312187195, -0.2026299238204956, -0.18384934961795807, -0.16506877541542053, -0.146288201212883, -0.12750762701034546, -0.10872705280780792, -0.08994648605585098, -0.07116591185331345, -0.05238533765077591, -0.03360477089881897, -0.014824196696281433, 0.0039563775062561035, 0.02273694984614849, 0.04151752218604088, 0.060298092663288116, 0.07907866686582565, 0.09785924106836319, 0.11663980782032013, 0.13542038202285767, 0.1542009562253952, 0.17298153042793274, 0.19176210463047028, 0.2105426788330078, 0.22932323813438416, 0.24810382723808289, 0.26688438653945923, 0.28566497564315796, 0.3044455349445343, 0.32322609424591064, 0.3420066833496094, 0.3607872426509857, 0.37956783175468445, 0.3983483910560608, 0.4171289801597595, 0.43590953946113586, 0.4546900987625122, 0.47347065806388855, 0.4922512471675873, 0.5110318064689636, 0.5298123955726624, 0.5485929846763611, 0.567373514175415, 0.5861541032791138, 0.6049346923828125]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 7.0, 13.0, 16.0, 27.0, 31.0, 61.0, 100.0, 172.0, 319.0, 516.0, 973.0, 1792.0, 3760.0, 10696.0, 85813.0, 3086244.0, 961500.0, 29456.0, 6998.0, 2727.0, 1274.0, 713.0, 425.0, 251.0, 126.0, 90.0, 55.0, 50.0, 26.0, 21.0, 11.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48095703125, -0.4630126953125, -0.445068359375, -0.4271240234375, -0.4091796875, -0.3912353515625, -0.373291015625, -0.3553466796875, -0.33740234375, -0.3194580078125, -0.301513671875, -0.2835693359375, -0.265625, -0.2476806640625, -0.229736328125, -0.2117919921875, -0.19384765625, -0.1759033203125, -0.157958984375, -0.1400146484375, -0.1220703125, -0.1041259765625, -0.086181640625, -0.0682373046875, -0.05029296875, -0.0323486328125, -0.014404296875, 0.0035400390625, 0.021484375, 0.0394287109375, 0.057373046875, 0.0753173828125, 0.09326171875, 0.1112060546875, 0.129150390625, 0.1470947265625, 0.1650390625, 0.1829833984375, 0.200927734375, 0.2188720703125, 0.23681640625, 0.2547607421875, 0.272705078125, 0.2906494140625, 0.30859375, 0.3265380859375, 0.344482421875, 0.3624267578125, 0.38037109375, 0.3983154296875, 0.416259765625, 0.4342041015625, 0.4521484375, 0.4700927734375, 0.488037109375, 0.5059814453125, 0.52392578125, 0.5418701171875, 0.559814453125, 0.5777587890625, 0.595703125, 0.6136474609375, 0.631591796875, 0.6495361328125, 0.66748046875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 8.0, 13.0, 17.0, 15.0, 26.0, 30.0, 41.0, 34.0, 47.0, 61.0, 65.0, 68.0, 57.0, 67.0, 49.0, 47.0, 50.0, 50.0, 42.0, 37.0, 35.0, 32.0, 24.0, 16.0, 13.0, 8.0, 9.0, 15.0, 4.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2706260681152344, -0.26317596435546875, -0.2557258605957031, -0.2482757568359375, -0.24082565307617188, -0.23337554931640625, -0.22592544555664062, -0.218475341796875, -0.21102523803710938, -0.20357513427734375, -0.19612503051757812, -0.1886749267578125, -0.18122482299804688, -0.17377471923828125, -0.16632461547851562, -0.15887451171875, -0.15142440795898438, -0.14397430419921875, -0.13652420043945312, -0.1290740966796875, -0.12162399291992188, -0.11417388916015625, -0.10672378540039062, -0.099273681640625, -0.09182357788085938, -0.08437347412109375, -0.07692337036132812, -0.0694732666015625, -0.062023162841796875, -0.05457305908203125, -0.047122955322265625, -0.0396728515625, -0.032222747802734375, -0.02477264404296875, -0.017322540283203125, -0.0098724365234375, -0.002422332763671875, 0.00502777099609375, 0.012477874755859375, 0.019927978515625, 0.027378082275390625, 0.03482818603515625, 0.042278289794921875, 0.0497283935546875, 0.057178497314453125, 0.06462860107421875, 0.07207870483398438, 0.07952880859375, 0.08697891235351562, 0.09442901611328125, 0.10187911987304688, 0.1093292236328125, 0.11677932739257812, 0.12422943115234375, 0.13167953491210938, 0.139129638671875, 0.14657974243164062, 0.15402984619140625, 0.16147994995117188, 0.1689300537109375, 0.17638015747070312, 0.18383026123046875, 0.19128036499023438, 0.19873046875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 6.0, 4.0, 6.0, 8.0, 6.0, 9.0, 8.0, 16.0, 23.0, 30.0, 38.0, 66.0, 92.0, 202.0, 407.0, 802.0, 1862.0, 4985.0, 17688.0, 124414.0, 3458518.0, 535635.0, 36028.0, 8119.0, 2907.0, 1196.0, 536.0, 270.0, 141.0, 79.0, 49.0, 38.0, 18.0, 13.0, 10.0, 10.0, 8.0, 6.0, 4.0, 4.0, 6.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.478515625, -0.4629364013671875, -0.447357177734375, -0.4317779541015625, -0.41619873046875, -0.4006195068359375, -0.385040283203125, -0.3694610595703125, -0.3538818359375, -0.3383026123046875, -0.322723388671875, -0.3071441650390625, -0.29156494140625, -0.2759857177734375, -0.260406494140625, -0.2448272705078125, -0.229248046875, -0.2136688232421875, -0.198089599609375, -0.1825103759765625, -0.16693115234375, -0.1513519287109375, -0.135772705078125, -0.1201934814453125, -0.1046142578125, -0.0890350341796875, -0.073455810546875, -0.0578765869140625, -0.04229736328125, -0.0267181396484375, -0.011138916015625, 0.0044403076171875, 0.02001953125, 0.0355987548828125, 0.051177978515625, 0.0667572021484375, 0.08233642578125, 0.0979156494140625, 0.113494873046875, 0.1290740966796875, 0.1446533203125, 0.1602325439453125, 0.175811767578125, 0.1913909912109375, 0.20697021484375, 0.2225494384765625, 0.238128662109375, 0.2537078857421875, 0.269287109375, 0.2848663330078125, 0.300445556640625, 0.3160247802734375, 0.33160400390625, 0.3471832275390625, 0.362762451171875, 0.3783416748046875, 0.3939208984375, 0.4095001220703125, 0.425079345703125, 0.4406585693359375, 0.45623779296875, 0.4718170166015625, 0.487396240234375, 0.5029754638671875, 0.5185546875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 5.0, 5.0, 3.0, 9.0, 12.0, 6.0, 19.0, 22.0, 38.0, 44.0, 69.0, 124.0, 188.0, 284.0, 484.0, 588.0, 653.0, 509.0, 355.0, 219.0, 131.0, 87.0, 56.0, 44.0, 26.0, 18.0, 14.0, 14.0, 7.0, 10.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.12042236328125, -0.11680030822753906, -0.11317825317382812, -0.10955619812011719, -0.10593414306640625, -0.10231208801269531, -0.09869003295898438, -0.09506797790527344, -0.0914459228515625, -0.08782386779785156, -0.08420181274414062, -0.08057975769042969, -0.07695770263671875, -0.07333564758300781, -0.06971359252929688, -0.06609153747558594, -0.062469482421875, -0.05884742736816406, -0.055225372314453125, -0.05160331726074219, -0.04798126220703125, -0.04435920715332031, -0.040737152099609375, -0.03711509704589844, -0.0334930419921875, -0.029870986938476562, -0.026248931884765625, -0.022626876831054688, -0.01900482177734375, -0.015382766723632812, -0.011760711669921875, -0.008138656616210938, -0.0045166015625, -0.0008945465087890625, 0.002727508544921875, 0.0063495635986328125, 0.00997161865234375, 0.013593673706054688, 0.017215728759765625, 0.020837783813476562, 0.0244598388671875, 0.028081893920898438, 0.031703948974609375, 0.03532600402832031, 0.03894805908203125, 0.04257011413574219, 0.046192169189453125, 0.04981422424316406, 0.053436279296875, 0.05705833435058594, 0.060680389404296875, 0.06430244445800781, 0.06792449951171875, 0.07154655456542969, 0.07516860961914062, 0.07879066467285156, 0.0824127197265625, 0.08603477478027344, 0.08965682983398438, 0.09327888488769531, 0.09690093994140625, 0.10052299499511719, 0.10414505004882812, 0.10776710510253906, 0.11138916015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 12.0, 3.0, 12.0, 13.0, 20.0, 21.0, 17.0, 23.0, 42.0, 36.0, 60.0, 67.0, 66.0, 67.0, 87.0, 72.0, 73.0, 50.0, 62.0, 43.0, 30.0, 25.0, 25.0, 21.0, 13.0, 4.0, 5.0, 7.0, 5.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20238716900348663, -0.19300851225852966, -0.1836298406124115, -0.17425118386745453, -0.16487252712249756, -0.1554938554763794, -0.14611519873142242, -0.13673654198646545, -0.1273578703403473, -0.11797920614480972, -0.10860054939985275, -0.09922188520431519, -0.08984322845935822, -0.08046456426382065, -0.07108590006828308, -0.06170724332332611, -0.05232858657836914, -0.04294992610812187, -0.0335712656378746, -0.024192601442337036, -0.014813940972089767, -0.005435280501842499, 0.003943383693695068, 0.013322040438652039, 0.022700704634189606, 0.032079365104436874, 0.04145802557468414, 0.05083668977022171, 0.06021535024046898, 0.06959401071071625, 0.07897267490625381, 0.08835133165121078, 0.09773001074790955, 0.10710867494344711, 0.11648733168840408, 0.12586599588394165, 0.13524465262889862, 0.1446233093738556, 0.15400198101997375, 0.16338063776493073, 0.1727592945098877, 0.18213795125484467, 0.19151662290096283, 0.2008952796459198, 0.21027393639087677, 0.21965259313583374, 0.2290312647819519, 0.23840992152690887, 0.24778859317302704, 0.257167249917984, 0.2665459215641022, 0.27592456340789795, 0.2853032350540161, 0.2946819067001343, 0.30406057834625244, 0.3134392201900482, 0.3228178918361664, 0.33219656348228455, 0.3415752053260803, 0.3509538769721985, 0.36033254861831665, 0.3697111904621124, 0.3790898621082306, 0.38846850395202637, 0.39784717559814453]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 4.0, 9.0, 9.0, 4.0, 12.0, 10.0, 18.0, 18.0, 19.0, 25.0, 30.0, 36.0, 30.0, 36.0, 33.0, 35.0, 34.0, 44.0, 40.0, 33.0, 41.0, 44.0, 51.0, 37.0, 32.0, 33.0, 37.0, 39.0, 39.0, 18.0, 19.0, 17.0, 19.0, 18.0, 25.0, 12.0, 13.0, 5.0, 8.0, 11.0, 1.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2659854292869568, -0.25872915983200073, -0.2514728903770447, -0.24421659111976624, -0.23696032166481018, -0.22970405220985413, -0.22244776785373688, -0.21519148349761963, -0.20793521404266357, -0.20067894458770752, -0.19342266023159027, -0.18616637587547302, -0.17891010642051697, -0.1716538369655609, -0.16439755260944366, -0.15714126825332642, -0.14988499879837036, -0.1426287293434143, -0.13537244498729706, -0.1281161606311798, -0.12085989117622375, -0.1136036142706871, -0.10634733736515045, -0.0990910604596138, -0.09183478355407715, -0.0845785066485405, -0.07732222974300385, -0.0700659528374672, -0.06280967593193054, -0.05555339902639389, -0.04829712212085724, -0.04104084521532059, -0.033784568309783936, -0.026528291404247284, -0.019272014498710632, -0.01201573759317398, -0.004759460687637329, 0.0024968162178993225, 0.009753093123435974, 0.017009370028972626, 0.024265646934509277, 0.03152192384004593, 0.03877820074558258, 0.04603447765111923, 0.053290754556655884, 0.060547031462192535, 0.06780330836772919, 0.07505958527326584, 0.08231586217880249, 0.08957213908433914, 0.0968284159898758, 0.10408469289541245, 0.1113409698009491, 0.11859724670648575, 0.1258535236120224, 0.13310980796813965, 0.1403660774230957, 0.14762234687805176, 0.154878631234169, 0.16213491559028625, 0.1693911850452423, 0.17664745450019836, 0.1839037388563156, 0.19116002321243286, 0.19841629266738892]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 10.0, 19.0, 18.0, 34.0, 52.0, 90.0, 129.0, 179.0, 304.0, 418.0, 773.0, 1115.0, 1853.0, 3273.0, 5801.0, 11487.0, 28428.0, 114740.0, 574439.0, 229119.0, 43601.0, 15247.0, 7480.0, 3943.0, 2185.0, 1382.0, 866.0, 543.0, 365.0, 225.0, 121.0, 95.0, 71.0, 51.0, 29.0, 20.0, 17.0, 10.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08251953125, -0.07953834533691406, -0.07655715942382812, -0.07357597351074219, -0.07059478759765625, -0.06761360168457031, -0.06463241577148438, -0.06165122985839844, -0.0586700439453125, -0.05568885803222656, -0.052707672119140625, -0.04972648620605469, -0.04674530029296875, -0.04376411437988281, -0.040782928466796875, -0.03780174255371094, -0.034820556640625, -0.03183937072753906, -0.028858184814453125, -0.025876998901367188, -0.02289581298828125, -0.019914627075195312, -0.016933441162109375, -0.013952255249023438, -0.0109710693359375, -0.007989883422851562, -0.005008697509765625, -0.0020275115966796875, 0.00095367431640625, 0.0039348602294921875, 0.006916046142578125, 0.009897232055664062, 0.01287841796875, 0.015859603881835938, 0.018840789794921875, 0.021821975708007812, 0.02480316162109375, 0.027784347534179688, 0.030765533447265625, 0.03374671936035156, 0.0367279052734375, 0.03970909118652344, 0.042690277099609375, 0.04567146301269531, 0.04865264892578125, 0.05163383483886719, 0.054615020751953125, 0.05759620666503906, 0.060577392578125, 0.06355857849121094, 0.06653976440429688, 0.06952095031738281, 0.07250213623046875, 0.07548332214355469, 0.07846450805664062, 0.08144569396972656, 0.0844268798828125, 0.08740806579589844, 0.09038925170898438, 0.09337043762207031, 0.09635162353515625, 0.09933280944824219, 0.10231399536132812, 0.10529518127441406, 0.1082763671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 14.0, 15.0, 5.0, 5.0, 19.0, 21.0, 22.0, 26.0, 30.0, 35.0, 32.0, 46.0, 43.0, 41.0, 45.0, 41.0, 46.0, 35.0, 40.0, 41.0, 49.0, 41.0, 29.0, 28.0, 43.0, 44.0, 15.0, 22.0, 19.0, 17.0, 19.0, 18.0, 9.0, 13.0, 9.0, 4.0, 5.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.19140625, -0.1866168975830078, -0.18182754516601562, -0.17703819274902344, -0.17224884033203125, -0.16745948791503906, -0.16267013549804688, -0.1578807830810547, -0.1530914306640625, -0.1483020782470703, -0.14351272583007812, -0.13872337341308594, -0.13393402099609375, -0.12914466857910156, -0.12435531616210938, -0.11956596374511719, -0.114776611328125, -0.10998725891113281, -0.10519790649414062, -0.10040855407714844, -0.09561920166015625, -0.09082984924316406, -0.08604049682617188, -0.08125114440917969, -0.0764617919921875, -0.07167243957519531, -0.06688308715820312, -0.06209373474121094, -0.05730438232421875, -0.05251502990722656, -0.047725677490234375, -0.04293632507324219, -0.03814697265625, -0.03335762023925781, -0.028568267822265625, -0.023778915405273438, -0.01898956298828125, -0.014200210571289062, -0.009410858154296875, -0.0046215057373046875, 0.0001678466796875, 0.0049571990966796875, 0.009746551513671875, 0.014535903930664062, 0.01932525634765625, 0.024114608764648438, 0.028903961181640625, 0.03369331359863281, 0.038482666015625, 0.04327201843261719, 0.048061370849609375, 0.05285072326660156, 0.05764007568359375, 0.06242942810058594, 0.06721878051757812, 0.07200813293457031, 0.0767974853515625, 0.08158683776855469, 0.08637619018554688, 0.09116554260253906, 0.09595489501953125, 0.10074424743652344, 0.10553359985351562, 0.11032295227050781, 0.1151123046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 4.0, 13.0, 21.0, 22.0, 24.0, 57.0, 99.0, 171.0, 328.0, 565.0, 1197.0, 2599.0, 5967.0, 15438.0, 49752.0, 223505.0, 546030.0, 145001.0, 36168.0, 12377.0, 4911.0, 2184.0, 985.0, 497.0, 262.0, 161.0, 87.0, 47.0, 30.0, 25.0, 7.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.08016490936279297, -0.07768821716308594, -0.0752115249633789, -0.07273483276367188, -0.07025814056396484, -0.06778144836425781, -0.06530475616455078, -0.06282806396484375, -0.06035137176513672, -0.05787467956542969, -0.055397987365722656, -0.052921295166015625, -0.050444602966308594, -0.04796791076660156, -0.04549121856689453, -0.0430145263671875, -0.04053783416748047, -0.03806114196777344, -0.035584449768066406, -0.033107757568359375, -0.030631065368652344, -0.028154373168945312, -0.02567768096923828, -0.02320098876953125, -0.02072429656982422, -0.018247604370117188, -0.015770912170410156, -0.013294219970703125, -0.010817527770996094, -0.008340835571289062, -0.005864143371582031, -0.003387451171875, -0.0009107589721679688, 0.0015659332275390625, 0.004042625427246094, 0.006519317626953125, 0.008996009826660156, 0.011472702026367188, 0.013949394226074219, 0.01642608642578125, 0.01890277862548828, 0.021379470825195312, 0.023856163024902344, 0.026332855224609375, 0.028809547424316406, 0.03128623962402344, 0.03376293182373047, 0.0362396240234375, 0.03871631622314453, 0.04119300842285156, 0.043669700622558594, 0.046146392822265625, 0.048623085021972656, 0.05109977722167969, 0.05357646942138672, 0.05605316162109375, 0.05852985382080078, 0.06100654602050781, 0.06348323822021484, 0.06595993041992188, 0.0684366226196289, 0.07091331481933594, 0.07339000701904297, 0.07586669921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 5.0, 4.0, 5.0, 8.0, 9.0, 10.0, 20.0, 22.0, 15.0, 32.0, 45.0, 30.0, 37.0, 35.0, 47.0, 44.0, 48.0, 56.0, 42.0, 54.0, 44.0, 35.0, 47.0, 34.0, 40.0, 31.0, 34.0, 31.0, 19.0, 24.0, 29.0, 10.0, 18.0, 4.0, 7.0, 4.0, 3.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3564453125, -0.3443489074707031, -0.33225250244140625, -0.3201560974121094, -0.3080596923828125, -0.2959632873535156, -0.28386688232421875, -0.2717704772949219, -0.259674072265625, -0.24757766723632812, -0.23548126220703125, -0.22338485717773438, -0.2112884521484375, -0.19919204711914062, -0.18709564208984375, -0.17499923706054688, -0.16290283203125, -0.15080642700195312, -0.13871002197265625, -0.12661361694335938, -0.1145172119140625, -0.10242080688476562, -0.09032440185546875, -0.07822799682617188, -0.066131591796875, -0.054035186767578125, -0.04193878173828125, -0.029842376708984375, -0.0177459716796875, -0.005649566650390625, 0.00644683837890625, 0.018543243408203125, 0.0306396484375, 0.042736053466796875, 0.05483245849609375, 0.06692886352539062, 0.0790252685546875, 0.09112167358398438, 0.10321807861328125, 0.11531448364257812, 0.127410888671875, 0.13950729370117188, 0.15160369873046875, 0.16370010375976562, 0.1757965087890625, 0.18789291381835938, 0.19998931884765625, 0.21208572387695312, 0.22418212890625, 0.23627853393554688, 0.24837493896484375, 0.2604713439941406, 0.2725677490234375, 0.2846641540527344, 0.29676055908203125, 0.3088569641113281, 0.320953369140625, 0.3330497741699219, 0.34514617919921875, 0.3572425842285156, 0.3693389892578125, 0.3814353942871094, 0.39353179931640625, 0.4056282043457031, 0.417724609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 13.0, 16.0, 22.0, 22.0, 30.0, 38.0, 68.0, 129.0, 193.0, 344.0, 568.0, 1093.0, 2389.0, 5629.0, 16717.0, 75272.0, 487436.0, 380813.0, 54924.0, 13451.0, 4867.0, 2117.0, 1002.0, 567.0, 292.0, 180.0, 132.0, 63.0, 54.0, 33.0, 23.0, 13.0, 13.0, 7.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035400390625, -0.03435659408569336, -0.03331279754638672, -0.03226900100708008, -0.031225204467773438, -0.030181407928466797, -0.029137611389160156, -0.028093814849853516, -0.027050018310546875, -0.026006221771240234, -0.024962425231933594, -0.023918628692626953, -0.022874832153320312, -0.021831035614013672, -0.02078723907470703, -0.01974344253540039, -0.01869964599609375, -0.01765584945678711, -0.01661205291748047, -0.015568256378173828, -0.014524459838867188, -0.013480663299560547, -0.012436866760253906, -0.011393070220947266, -0.010349273681640625, -0.009305477142333984, -0.008261680603027344, -0.007217884063720703, -0.0061740875244140625, -0.005130290985107422, -0.004086494445800781, -0.0030426979064941406, -0.0019989013671875, -0.0009551048278808594, 8.869171142578125e-05, 0.0011324882507324219, 0.0021762847900390625, 0.003220081329345703, 0.004263877868652344, 0.005307674407958984, 0.006351470947265625, 0.007395267486572266, 0.008439064025878906, 0.009482860565185547, 0.010526657104492188, 0.011570453643798828, 0.012614250183105469, 0.01365804672241211, 0.01470184326171875, 0.01574563980102539, 0.01678943634033203, 0.017833232879638672, 0.018877029418945312, 0.019920825958251953, 0.020964622497558594, 0.022008419036865234, 0.023052215576171875, 0.024096012115478516, 0.025139808654785156, 0.026183605194091797, 0.027227401733398438, 0.028271198272705078, 0.02931499481201172, 0.03035879135131836, 0.031402587890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 1.0, 2.0, 9.0, 10.0, 20.0, 22.0, 35.0, 46.0, 54.0, 106.0, 107.0, 117.0, 113.0, 92.0, 100.0, 53.0, 46.0, 19.0, 11.0, 9.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2040138244628906e-05, -1.1427327990531921e-05, -1.0814517736434937e-05, -1.0201707482337952e-05, -9.588897228240967e-06, -8.976086974143982e-06, -8.363276720046997e-06, -7.750466465950012e-06, -7.137656211853027e-06, -6.5248459577560425e-06, -5.912035703659058e-06, -5.299225449562073e-06, -4.686415195465088e-06, -4.073604941368103e-06, -3.460794687271118e-06, -2.8479844331741333e-06, -2.2351741790771484e-06, -1.6223639249801636e-06, -1.0095536708831787e-06, -3.9674341678619385e-07, 2.1606683731079102e-07, 8.288770914077759e-07, 1.4416873455047607e-06, 2.0544975996017456e-06, 2.6673078536987305e-06, 3.2801181077957153e-06, 3.8929283618927e-06, 4.505738615989685e-06, 5.11854887008667e-06, 5.731359124183655e-06, 6.34416937828064e-06, 6.9569796323776245e-06, 7.569789886474609e-06, 8.182600140571594e-06, 8.795410394668579e-06, 9.408220648765564e-06, 1.0021030902862549e-05, 1.0633841156959534e-05, 1.1246651411056519e-05, 1.1859461665153503e-05, 1.2472271919250488e-05, 1.3085082173347473e-05, 1.3697892427444458e-05, 1.4310702681541443e-05, 1.4923512935638428e-05, 1.5536323189735413e-05, 1.6149133443832397e-05, 1.6761943697929382e-05, 1.7374753952026367e-05, 1.7987564206123352e-05, 1.8600374460220337e-05, 1.9213184714317322e-05, 1.9825994968414307e-05, 2.043880522251129e-05, 2.1051615476608276e-05, 2.166442573070526e-05, 2.2277235984802246e-05, 2.289004623889923e-05, 2.3502856492996216e-05, 2.41156667470932e-05, 2.4728477001190186e-05, 2.534128725528717e-05, 2.5954097509384155e-05, 2.656690776348114e-05, 2.7179718017578125e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 9.0, 13.0, 19.0, 19.0, 43.0, 44.0, 60.0, 89.0, 105.0, 199.0, 282.0, 348.0, 500.0, 744.0, 1144.0, 1693.0, 2571.0, 4011.0, 6581.0, 11892.0, 22024.0, 45239.0, 98604.0, 201733.0, 274090.0, 190721.0, 92569.0, 42840.0, 21263.0, 11322.0, 6342.0, 3860.0, 2412.0, 1595.0, 1064.0, 667.0, 478.0, 357.0, 262.0, 177.0, 137.0, 109.0, 86.0, 66.0, 38.0, 35.0, 31.0, 17.0, 15.0, 9.0, 6.0, 8.0, 7.0, 1.0, 0.0, 1.0], "bins": [-0.0149078369140625, -0.014448404312133789, -0.013988971710205078, -0.013529539108276367, -0.013070106506347656, -0.012610673904418945, -0.012151241302490234, -0.011691808700561523, -0.011232376098632812, -0.010772943496704102, -0.01031351089477539, -0.00985407829284668, -0.009394645690917969, -0.008935213088989258, -0.008475780487060547, -0.008016347885131836, -0.007556915283203125, -0.007097482681274414, -0.006638050079345703, -0.006178617477416992, -0.005719184875488281, -0.00525975227355957, -0.004800319671630859, -0.0043408870697021484, -0.0038814544677734375, -0.0034220218658447266, -0.0029625892639160156, -0.0025031566619873047, -0.0020437240600585938, -0.0015842914581298828, -0.0011248588562011719, -0.0006654262542724609, -0.00020599365234375, 0.00025343894958496094, 0.0007128715515136719, 0.0011723041534423828, 0.0016317367553710938, 0.0020911693572998047, 0.0025506019592285156, 0.0030100345611572266, 0.0034694671630859375, 0.0039288997650146484, 0.004388332366943359, 0.00484776496887207, 0.005307197570800781, 0.005766630172729492, 0.006226062774658203, 0.006685495376586914, 0.007144927978515625, 0.007604360580444336, 0.008063793182373047, 0.008523225784301758, 0.008982658386230469, 0.00944209098815918, 0.00990152359008789, 0.010360956192016602, 0.010820388793945312, 0.011279821395874023, 0.011739253997802734, 0.012198686599731445, 0.012658119201660156, 0.013117551803588867, 0.013576984405517578, 0.014036417007446289, 0.014495849609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 7.0, 6.0, 5.0, 6.0, 8.0, 13.0, 16.0, 16.0, 23.0, 22.0, 39.0, 43.0, 59.0, 57.0, 67.0, 66.0, 67.0, 56.0, 65.0, 64.0, 41.0, 46.0, 35.0, 28.0, 29.0, 20.0, 19.0, 12.0, 9.0, 9.0, 12.0, 5.0, 4.0, 4.0, 5.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006160736083984375, -0.005951225757598877, -0.005741715431213379, -0.005532205104827881, -0.005322694778442383, -0.005113184452056885, -0.004903674125671387, -0.004694163799285889, -0.004484653472900391, -0.004275143146514893, -0.0040656328201293945, -0.0038561224937438965, -0.0036466121673583984, -0.0034371018409729004, -0.0032275915145874023, -0.0030180811882019043, -0.0028085708618164062, -0.002599060535430908, -0.00238955020904541, -0.002180039882659912, -0.001970529556274414, -0.001761019229888916, -0.001551508903503418, -0.00134199857711792, -0.0011324882507324219, -0.0009229779243469238, -0.0007134675979614258, -0.0005039572715759277, -0.0002944469451904297, -8.493661880493164e-05, 0.0001245737075805664, 0.00033408403396606445, 0.0005435943603515625, 0.0007531046867370605, 0.0009626150131225586, 0.0011721253395080566, 0.0013816356658935547, 0.0015911459922790527, 0.0018006563186645508, 0.002010166645050049, 0.002219676971435547, 0.002429187297821045, 0.002638697624206543, 0.002848207950592041, 0.003057718276977539, 0.003267228603363037, 0.003476738929748535, 0.003686249256134033, 0.0038957595825195312, 0.004105269908905029, 0.004314780235290527, 0.004524290561676025, 0.0047338008880615234, 0.0049433112144470215, 0.0051528215408325195, 0.005362331867218018, 0.005571842193603516, 0.005781352519989014, 0.005990862846374512, 0.00620037317276001, 0.006409883499145508, 0.006619393825531006, 0.006828904151916504, 0.007038414478302002, 0.0072479248046875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 5.0, 9.0, 8.0, 13.0, 15.0, 39.0, 38.0, 34.0, 70.0, 73.0, 80.0, 93.0, 78.0, 96.0, 72.0, 75.0, 50.0, 34.0, 34.0, 20.0, 12.0, 13.0, 15.0, 8.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22945018112659454, -0.2225847691297531, -0.21571935713291168, -0.20885394513607025, -0.20198851823806763, -0.1951231062412262, -0.18825769424438477, -0.18139228224754333, -0.1745268702507019, -0.16766145825386047, -0.16079604625701904, -0.1539306342601776, -0.14706522226333618, -0.14019981026649475, -0.13333438336849213, -0.1264689713716507, -0.11960355937480927, -0.11273814737796783, -0.1058727353811264, -0.09900731593370438, -0.09214190393686295, -0.08527649194002151, -0.07841107249259949, -0.07154566049575806, -0.06468024849891663, -0.057814836502075195, -0.050949420779943466, -0.04408400505781174, -0.037218593060970306, -0.030353181064128876, -0.023487765341997147, -0.016622349619865417, -0.00975695252418518, -0.0028915386646986008, 0.003973875194787979, 0.010839289054274559, 0.01770470291376114, 0.02457011491060257, 0.0314355306327343, 0.03830094635486603, 0.04516635835170746, 0.05203177034854889, 0.05889718607068062, 0.06576260179281235, 0.07262801378965378, 0.07949342578649521, 0.08635884523391724, 0.09322425723075867, 0.1000896692276001, 0.10695508122444153, 0.11382049322128296, 0.12068591266870499, 0.12755131721496582, 0.13441672921180725, 0.14128215610980988, 0.1481475681066513, 0.15501298010349274, 0.16187839210033417, 0.1687438040971756, 0.17560921609401703, 0.18247464299201965, 0.18934005498886108, 0.19620546698570251, 0.20307087898254395, 0.20993629097938538]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 4.0, 3.0, 7.0, 6.0, 18.0, 9.0, 10.0, 10.0, 10.0, 30.0, 34.0, 25.0, 29.0, 36.0, 32.0, 36.0, 36.0, 36.0, 42.0, 37.0, 36.0, 40.0, 47.0, 36.0, 44.0, 36.0, 46.0, 35.0, 38.0, 31.0, 21.0, 17.0, 18.0, 17.0, 28.0, 15.0, 15.0, 8.0, 11.0, 6.0, 3.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16031111776828766, -0.15586137771606445, -0.15141162276268005, -0.14696188271045685, -0.14251214265823364, -0.13806240260601044, -0.13361266255378723, -0.12916290760040283, -0.12471316754817963, -0.12026342749595642, -0.11581367999315262, -0.11136393249034882, -0.10691419243812561, -0.1024644523859024, -0.0980147048830986, -0.0935649573802948, -0.0891152173280716, -0.08466547727584839, -0.08021572977304459, -0.07576598227024078, -0.07131624221801758, -0.06686650216579437, -0.06241675466299057, -0.057967010885477066, -0.05351726710796356, -0.04906752333045006, -0.044617779552936554, -0.04016803577542305, -0.035718291997909546, -0.03126854822039604, -0.026818804442882538, -0.022369060665369034, -0.017919331789016724, -0.01346958801150322, -0.009019844233989716, -0.0045701004564762115, -0.00012035667896270752, 0.0043293870985507965, 0.0087791308760643, 0.013228874653577805, 0.01767861843109131, 0.022128362208604813, 0.026578105986118317, 0.03102784976363182, 0.035477593541145325, 0.03992733731865883, 0.04437708109617233, 0.04882682487368584, 0.05327656865119934, 0.057726312428712845, 0.06217605620622635, 0.06662580370903015, 0.07107554376125336, 0.07552528381347656, 0.07997503131628036, 0.08442477881908417, 0.08887451887130737, 0.09332425892353058, 0.09777400642633438, 0.10222375392913818, 0.10667349398136139, 0.1111232340335846, 0.1155729815363884, 0.1200227290391922, 0.1244724690914154]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 14.0, 14.0, 17.0, 30.0, 37.0, 62.0, 100.0, 154.0, 268.0, 411.0, 744.0, 1389.0, 2810.0, 6139.0, 14752.0, 38698.0, 118393.0, 378727.0, 329570.0, 99067.0, 33253.0, 12937.0, 5363.0, 2515.0, 1335.0, 715.0, 382.0, 244.0, 135.0, 79.0, 50.0, 37.0, 32.0, 25.0, 12.0, 9.0, 9.0, 8.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.292236328125, -0.28386878967285156, -0.2755012512207031, -0.2671337127685547, -0.25876617431640625, -0.2503986358642578, -0.24203109741210938, -0.23366355895996094, -0.2252960205078125, -0.21692848205566406, -0.20856094360351562, -0.2001934051513672, -0.19182586669921875, -0.1834583282470703, -0.17509078979492188, -0.16672325134277344, -0.158355712890625, -0.14998817443847656, -0.14162063598632812, -0.1332530975341797, -0.12488555908203125, -0.11651802062988281, -0.10815048217773438, -0.09978294372558594, -0.0914154052734375, -0.08304786682128906, -0.07468032836914062, -0.06631278991699219, -0.05794525146484375, -0.04957771301269531, -0.041210174560546875, -0.03284263610839844, -0.02447509765625, -0.016107559204101562, -0.007740020751953125, 0.0006275177001953125, 0.00899505615234375, 0.017362594604492188, 0.025730133056640625, 0.03409767150878906, 0.0424652099609375, 0.05083274841308594, 0.059200286865234375, 0.06756782531738281, 0.07593536376953125, 0.08430290222167969, 0.09267044067382812, 0.10103797912597656, 0.109405517578125, 0.11777305603027344, 0.12614059448242188, 0.1345081329345703, 0.14287567138671875, 0.1512432098388672, 0.15961074829101562, 0.16797828674316406, 0.1763458251953125, 0.18471336364746094, 0.19308090209960938, 0.2014484405517578, 0.20981597900390625, 0.2181835174560547, 0.22655105590820312, 0.23491859436035156, 0.2432861328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 12.0, 3.0, 7.0, 13.0, 21.0, 13.0, 21.0, 27.0, 29.0, 27.0, 38.0, 23.0, 32.0, 38.0, 44.0, 40.0, 45.0, 37.0, 39.0, 51.0, 47.0, 37.0, 40.0, 41.0, 39.0, 33.0, 26.0, 32.0, 15.0, 13.0, 17.0, 19.0, 17.0, 10.0, 16.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.2841796875, -0.27631568908691406, -0.2684516906738281, -0.2605876922607422, -0.25272369384765625, -0.2448596954345703, -0.23699569702148438, -0.22913169860839844, -0.2212677001953125, -0.21340370178222656, -0.20553970336914062, -0.1976757049560547, -0.18981170654296875, -0.1819477081298828, -0.17408370971679688, -0.16621971130371094, -0.158355712890625, -0.15049171447753906, -0.14262771606445312, -0.1347637176513672, -0.12689971923828125, -0.11903572082519531, -0.11117172241210938, -0.10330772399902344, -0.0954437255859375, -0.08757972717285156, -0.07971572875976562, -0.07185173034667969, -0.06398773193359375, -0.05612373352050781, -0.048259735107421875, -0.04039573669433594, -0.03253173828125, -0.024667739868164062, -0.016803741455078125, -0.008939743041992188, -0.00107574462890625, 0.0067882537841796875, 0.014652252197265625, 0.022516250610351562, 0.0303802490234375, 0.03824424743652344, 0.046108245849609375, 0.05397224426269531, 0.06183624267578125, 0.06970024108886719, 0.07756423950195312, 0.08542823791503906, 0.093292236328125, 0.10115623474121094, 0.10902023315429688, 0.11688423156738281, 0.12474822998046875, 0.1326122283935547, 0.14047622680664062, 0.14834022521972656, 0.1562042236328125, 0.16406822204589844, 0.17193222045898438, 0.1797962188720703, 0.18766021728515625, 0.1955242156982422, 0.20338821411132812, 0.21125221252441406, 0.2191162109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 0.0, 4.0, 4.0, 5.0, 9.0, 9.0, 21.0, 22.0, 19.0, 31.0, 45.0, 56.0, 82.0, 112.0, 156.0, 246.0, 466.0, 871.0, 1654.0, 3908.0, 10491.0, 30112.0, 97532.0, 342546.0, 389966.0, 114590.0, 35145.0, 11808.0, 4508.0, 1867.0, 879.0, 480.0, 286.0, 173.0, 120.0, 86.0, 68.0, 43.0, 27.0, 31.0, 19.0, 13.0, 18.0, 6.0, 5.0, 5.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.35302734375, -0.34323883056640625, -0.3334503173828125, -0.32366180419921875, -0.313873291015625, -0.30408477783203125, -0.2942962646484375, -0.28450775146484375, -0.27471923828125, -0.26493072509765625, -0.2551422119140625, -0.24535369873046875, -0.235565185546875, -0.22577667236328125, -0.2159881591796875, -0.20619964599609375, -0.1964111328125, -0.18662261962890625, -0.1768341064453125, -0.16704559326171875, -0.157257080078125, -0.14746856689453125, -0.1376800537109375, -0.12789154052734375, -0.11810302734375, -0.10831451416015625, -0.0985260009765625, -0.08873748779296875, -0.078948974609375, -0.06916046142578125, -0.0593719482421875, -0.04958343505859375, -0.039794921875, -0.03000640869140625, -0.0202178955078125, -0.01042938232421875, -0.000640869140625, 0.00914764404296875, 0.0189361572265625, 0.02872467041015625, 0.03851318359375, 0.04830169677734375, 0.0580902099609375, 0.06787872314453125, 0.077667236328125, 0.08745574951171875, 0.0972442626953125, 0.10703277587890625, 0.1168212890625, 0.12660980224609375, 0.1363983154296875, 0.14618682861328125, 0.155975341796875, 0.16576385498046875, 0.1755523681640625, 0.18534088134765625, 0.19512939453125, 0.20491790771484375, 0.2147064208984375, 0.22449493408203125, 0.234283447265625, 0.24407196044921875, 0.2538604736328125, 0.26364898681640625, 0.2734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 10.0, 9.0, 8.0, 8.0, 7.0, 11.0, 17.0, 15.0, 21.0, 23.0, 23.0, 31.0, 43.0, 37.0, 35.0, 42.0, 49.0, 41.0, 53.0, 41.0, 46.0, 49.0, 40.0, 49.0, 40.0, 38.0, 28.0, 27.0, 24.0, 19.0, 28.0, 19.0, 16.0, 10.0, 10.0, 11.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.3115234375, -0.3027076721191406, -0.29389190673828125, -0.2850761413574219, -0.2762603759765625, -0.2674446105957031, -0.25862884521484375, -0.24981307983398438, -0.240997314453125, -0.23218154907226562, -0.22336578369140625, -0.21455001831054688, -0.2057342529296875, -0.19691848754882812, -0.18810272216796875, -0.17928695678710938, -0.17047119140625, -0.16165542602539062, -0.15283966064453125, -0.14402389526367188, -0.1352081298828125, -0.12639236450195312, -0.11757659912109375, -0.10876083374023438, -0.099945068359375, -0.09112930297851562, -0.08231353759765625, -0.07349777221679688, -0.0646820068359375, -0.055866241455078125, -0.04705047607421875, -0.038234710693359375, -0.0294189453125, -0.020603179931640625, -0.01178741455078125, -0.002971649169921875, 0.0058441162109375, 0.014659881591796875, 0.02347564697265625, 0.032291412353515625, 0.041107177734375, 0.049922943115234375, 0.05873870849609375, 0.06755447387695312, 0.0763702392578125, 0.08518600463867188, 0.09400177001953125, 0.10281753540039062, 0.11163330078125, 0.12044906616210938, 0.12926483154296875, 0.13808059692382812, 0.1468963623046875, 0.15571212768554688, 0.16452789306640625, 0.17334365844726562, 0.182159423828125, 0.19097518920898438, 0.19979095458984375, 0.20860671997070312, 0.2174224853515625, 0.22623825073242188, 0.23505401611328125, 0.24386978149414062, 0.252685546875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 4.0, 5.0, 7.0, 10.0, 22.0, 46.0, 65.0, 127.0, 245.0, 622.0, 1580.0, 5052.0, 24667.0, 224744.0, 690497.0, 83476.0, 12304.0, 3158.0, 1045.0, 445.0, 181.0, 106.0, 51.0, 36.0, 17.0, 14.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0909423828125, -0.08803653717041016, -0.08513069152832031, -0.08222484588623047, -0.07931900024414062, -0.07641315460205078, -0.07350730895996094, -0.0706014633178711, -0.06769561767578125, -0.0647897720336914, -0.06188392639160156, -0.05897808074951172, -0.056072235107421875, -0.05316638946533203, -0.05026054382324219, -0.047354698181152344, -0.0444488525390625, -0.041543006896972656, -0.03863716125488281, -0.03573131561279297, -0.032825469970703125, -0.02991962432861328, -0.027013778686523438, -0.024107933044433594, -0.02120208740234375, -0.018296241760253906, -0.015390396118164062, -0.012484550476074219, -0.009578704833984375, -0.006672859191894531, -0.0037670135498046875, -0.0008611679077148438, 0.002044677734375, 0.004950523376464844, 0.007856369018554688, 0.010762214660644531, 0.013668060302734375, 0.01657390594482422, 0.019479751586914062, 0.022385597229003906, 0.02529144287109375, 0.028197288513183594, 0.031103134155273438, 0.03400897979736328, 0.036914825439453125, 0.03982067108154297, 0.04272651672363281, 0.045632362365722656, 0.0485382080078125, 0.051444053649902344, 0.05434989929199219, 0.05725574493408203, 0.060161590576171875, 0.06306743621826172, 0.06597328186035156, 0.0688791275024414, 0.07178497314453125, 0.0746908187866211, 0.07759666442871094, 0.08050251007080078, 0.08340835571289062, 0.08631420135498047, 0.08922004699707031, 0.09212589263916016, 0.09503173828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 3.0, 3.0, 10.0, 9.0, 16.0, 12.0, 31.0, 37.0, 54.0, 55.0, 89.0, 84.0, 128.0, 132.0, 79.0, 69.0, 39.0, 45.0, 36.0, 18.0, 16.0, 6.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.404254913330078e-06, -8.063390851020813e-06, -7.722526788711548e-06, -7.381662726402283e-06, -7.040798664093018e-06, -6.6999346017837524e-06, -6.359070539474487e-06, -6.018206477165222e-06, -5.677342414855957e-06, -5.336478352546692e-06, -4.995614290237427e-06, -4.654750227928162e-06, -4.3138861656188965e-06, -3.973022103309631e-06, -3.632158041000366e-06, -3.291293978691101e-06, -2.950429916381836e-06, -2.609565854072571e-06, -2.2687017917633057e-06, -1.9278377294540405e-06, -1.5869736671447754e-06, -1.2461096048355103e-06, -9.052455425262451e-07, -5.6438148021698e-07, -2.2351741790771484e-07, 1.1734664440155029e-07, 4.5821070671081543e-07, 7.990747690200806e-07, 1.1399388313293457e-06, 1.4808028936386108e-06, 1.821666955947876e-06, 2.162531018257141e-06, 2.5033950805664062e-06, 2.8442591428756714e-06, 3.1851232051849365e-06, 3.5259872674942017e-06, 3.866851329803467e-06, 4.207715392112732e-06, 4.548579454421997e-06, 4.889443516731262e-06, 5.230307579040527e-06, 5.5711716413497925e-06, 5.912035703659058e-06, 6.252899765968323e-06, 6.593763828277588e-06, 6.934627890586853e-06, 7.275491952896118e-06, 7.616356015205383e-06, 7.957220077514648e-06, 8.298084139823914e-06, 8.638948202133179e-06, 8.979812264442444e-06, 9.320676326751709e-06, 9.661540389060974e-06, 1.000240445137024e-05, 1.0343268513679504e-05, 1.068413257598877e-05, 1.1024996638298035e-05, 1.13658607006073e-05, 1.1706724762916565e-05, 1.204758882522583e-05, 1.2388452887535095e-05, 1.272931694984436e-05, 1.3070181012153625e-05, 1.341104507446289e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 7.0, 18.0, 14.0, 27.0, 33.0, 56.0, 61.0, 97.0, 135.0, 191.0, 328.0, 480.0, 814.0, 1340.0, 2402.0, 4478.0, 8968.0, 21609.0, 67303.0, 276748.0, 486810.0, 117863.0, 32819.0, 12601.0, 5998.0, 3001.0, 1646.0, 915.0, 610.0, 382.0, 257.0, 162.0, 109.0, 83.0, 53.0, 36.0, 21.0, 23.0, 12.0, 3.0, 15.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.058563232421875, -0.0566864013671875, -0.0548095703125, -0.0529327392578125, -0.051055908203125, -0.0491790771484375, -0.04730224609375, -0.0454254150390625, -0.043548583984375, -0.0416717529296875, -0.039794921875, -0.0379180908203125, -0.036041259765625, -0.0341644287109375, -0.03228759765625, -0.0304107666015625, -0.028533935546875, -0.0266571044921875, -0.0247802734375, -0.0229034423828125, -0.021026611328125, -0.0191497802734375, -0.01727294921875, -0.0153961181640625, -0.013519287109375, -0.0116424560546875, -0.009765625, -0.0078887939453125, -0.006011962890625, -0.0041351318359375, -0.00225830078125, -0.0003814697265625, 0.001495361328125, 0.0033721923828125, 0.0052490234375, 0.0071258544921875, 0.009002685546875, 0.0108795166015625, 0.01275634765625, 0.0146331787109375, 0.016510009765625, 0.0183868408203125, 0.020263671875, 0.0221405029296875, 0.024017333984375, 0.0258941650390625, 0.02777099609375, 0.0296478271484375, 0.031524658203125, 0.0334014892578125, 0.0352783203125, 0.0371551513671875, 0.039031982421875, 0.0409088134765625, 0.04278564453125, 0.0446624755859375, 0.046539306640625, 0.0484161376953125, 0.05029296875, 0.0521697998046875, 0.054046630859375, 0.0559234619140625, 0.05780029296875, 0.0596771240234375, 0.061553955078125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 9.0, 7.0, 6.0, 4.0, 13.0, 21.0, 18.0, 16.0, 40.0, 65.0, 87.0, 98.0, 186.0, 118.0, 91.0, 77.0, 44.0, 35.0, 20.0, 14.0, 8.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04608154296875, -0.04462718963623047, -0.04317283630371094, -0.041718482971191406, -0.040264129638671875, -0.038809776306152344, -0.03735542297363281, -0.03590106964111328, -0.03444671630859375, -0.03299236297607422, -0.03153800964355469, -0.030083656311035156, -0.028629302978515625, -0.027174949645996094, -0.025720596313476562, -0.02426624298095703, -0.0228118896484375, -0.02135753631591797, -0.019903182983398438, -0.018448829650878906, -0.016994476318359375, -0.015540122985839844, -0.014085769653320312, -0.012631416320800781, -0.01117706298828125, -0.009722709655761719, -0.008268356323242188, -0.006814002990722656, -0.005359649658203125, -0.0039052963256835938, -0.0024509429931640625, -0.0009965896606445312, 0.000457763671875, 0.0019121170043945312, 0.0033664703369140625, 0.004820823669433594, 0.006275177001953125, 0.007729530334472656, 0.009183883666992188, 0.010638236999511719, 0.01209259033203125, 0.013546943664550781, 0.015001296997070312, 0.016455650329589844, 0.017910003662109375, 0.019364356994628906, 0.020818710327148438, 0.02227306365966797, 0.0237274169921875, 0.02518177032470703, 0.026636123657226562, 0.028090476989746094, 0.029544830322265625, 0.030999183654785156, 0.03245353698730469, 0.03390789031982422, 0.03536224365234375, 0.03681659698486328, 0.03827095031738281, 0.039725303649902344, 0.041179656982421875, 0.042634010314941406, 0.04408836364746094, 0.04554271697998047, 0.0469970703125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 10.0, 5.0, 18.0, 30.0, 44.0, 76.0, 147.0, 185.0, 146.0, 118.0, 82.0, 49.0, 38.0, 25.0, 8.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8316740989685059, -0.8072460889816284, -0.7828181385993958, -0.7583901286125183, -0.7339621782302856, -0.7095341682434082, -0.6851061582565308, -0.6606782078742981, -0.6362502574920654, -0.611822247505188, -0.5873942971229553, -0.5629662871360779, -0.5385383367538452, -0.5141103267669678, -0.4896823465824127, -0.46525436639785767, -0.4408263564109802, -0.41639837622642517, -0.3919703960418701, -0.3675423860549927, -0.34311443567276, -0.31868642568588257, -0.2942584455013275, -0.26983046531677246, -0.2454024851322174, -0.22097450494766235, -0.1965465247631073, -0.17211852967739105, -0.147690549492836, -0.12326256930828094, -0.0988345742225647, -0.07440659403800964, -0.049978673458099365, -0.025550689548254013, -0.0011227056384086609, 0.02330528199672699, 0.04773326218128204, 0.0721612423658371, 0.09658923745155334, 0.1210172176361084, 0.14544519782066345, 0.1698731780052185, 0.19430115818977356, 0.2187291532754898, 0.24315713346004486, 0.2675850987434387, 0.29201310873031616, 0.3164410889148712, 0.34086906909942627, 0.3652970492839813, 0.3897250294685364, 0.4141530394554138, 0.4385809898376465, 0.4630089998245239, 0.487436980009079, 0.511864960193634, 0.5362929105758667, 0.5607209205627441, 0.5851488709449768, 0.6095768809318542, 0.6340048313140869, 0.6584328413009644, 0.6828608512878418, 0.7072888016700745, 0.7317168116569519]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 6.0, 7.0, 9.0, 10.0, 19.0, 15.0, 21.0, 13.0, 27.0, 35.0, 34.0, 33.0, 34.0, 48.0, 26.0, 37.0, 30.0, 38.0, 46.0, 35.0, 45.0, 33.0, 35.0, 52.0, 34.0, 37.0, 29.0, 35.0, 27.0, 23.0, 21.0, 16.0, 19.0, 13.0, 15.0, 8.0, 10.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.5037117600440979, -0.4893195927143097, -0.4749274253845215, -0.4605352282524109, -0.4461430609226227, -0.4317508935928345, -0.4173586964607239, -0.40296652913093567, -0.38857436180114746, -0.37418219447135925, -0.35979002714157104, -0.34539783000946045, -0.33100566267967224, -0.31661349534988403, -0.30222129821777344, -0.28782913088798523, -0.273436963558197, -0.2590447962284088, -0.2446526139974594, -0.23026043176651, -0.2158682644367218, -0.2014760971069336, -0.1870839148759842, -0.1726917326450348, -0.15829956531524658, -0.14390739798545837, -0.12951521575450897, -0.11512304097414017, -0.10073086619377136, -0.08633869141340256, -0.07194651663303375, -0.05755434185266495, -0.043162137269973755, -0.02876996248960495, -0.014377787709236145, 1.4387071132659912e-05, 0.014406561851501465, 0.02879873663187027, 0.043190911412239075, 0.05758308619260788, 0.07197526097297668, 0.08636743575334549, 0.1007596105337143, 0.1151517853140831, 0.1295439600944519, 0.1439361274242401, 0.15832830965518951, 0.17272049188613892, 0.18711265921592712, 0.20150482654571533, 0.21589700877666473, 0.23028919100761414, 0.24468135833740234, 0.25907352566719055, 0.27346569299697876, 0.28785789012908936, 0.30225005745887756, 0.31664222478866577, 0.33103442192077637, 0.3454265892505646, 0.3598187565803528, 0.374210923910141, 0.3886030912399292, 0.4029952883720398, 0.417387455701828]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 6.0, 3.0, 5.0, 9.0, 4.0, 9.0, 5.0, 15.0, 7.0, 17.0, 20.0, 40.0, 39.0, 59.0, 77.0, 118.0, 200.0, 285.0, 493.0, 818.0, 1713.0, 3983.0, 1035941.0, 3355.0, 1388.0, 705.0, 449.0, 257.0, 155.0, 115.0, 72.0, 59.0, 31.0, 32.0, 22.0, 16.0, 15.0, 8.0, 11.0, 11.0, 8.0, 7.0, 5.0, 1.0, 4.0, 7.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7920936942100525, -0.7683619856834412, -0.7446303367614746, -0.7208986282348633, -0.6971669793128967, -0.6734352707862854, -0.6497036218643188, -0.6259719133377075, -0.6022402048110962, -0.5785084962844849, -0.5547768473625183, -0.531045138835907, -0.5073134899139404, -0.4835817813873291, -0.45985010266304016, -0.4361184239387512, -0.41238677501678467, -0.3886550962924957, -0.3649234175682068, -0.34119170904159546, -0.3174600601196289, -0.2937283515930176, -0.26999667286872864, -0.2462649941444397, -0.22253331542015076, -0.19880163669586182, -0.17506995797157288, -0.15133826434612274, -0.1276065856218338, -0.10387490689754486, -0.08014321327209473, -0.056411534547805786, -0.032679855823516846, -0.008948173373937607, 0.014783509075641632, 0.03851519525051117, 0.06224687397480011, 0.08597855269908905, 0.10971024632453918, 0.13344192504882812, 0.15717360377311707, 0.180905282497406, 0.20463696122169495, 0.22836865484714508, 0.2521003484725952, 0.27583199739456177, 0.2995637059211731, 0.32329538464546204, 0.347027063369751, 0.3707587420940399, 0.39449042081832886, 0.4182221293449402, 0.44195377826690674, 0.46568548679351807, 0.489417165517807, 0.513148844242096, 0.5368804931640625, 0.5606122016906738, 0.5843438506126404, 0.6080755591392517, 0.6318072080612183, 0.6555389165878296, 0.6792706251144409, 0.7030022740364075, 0.7267339825630188]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 9.0, 3.0, 6.0, 19.0, 20.0, 31.0, 38.0, 56.0, 93.0, 117.0, 178.0, 259.0, 468.0, 1034.0, 3502.0, 51455756.0, 5920.0, 1232.0, 577.0, 328.0, 216.0, 135.0, 101.0, 62.0, 50.0, 32.0, 28.0, 23.0, 12.0, 5.0, 8.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7265625, -10.387202262878418, -10.047842025756836, -9.70848274230957, -9.369122505187988, -9.029762268066406, -8.69040298461914, -8.351042747497559, -8.011682510375977, -7.6723222732543945, -7.332962512969971, -6.993602752685547, -6.654242515563965, -6.314882278442383, -5.975522518157959, -5.636162757873535, -5.296802520751953, -4.957442283630371, -4.618082523345947, -4.278722763061523, -3.9393625259399414, -3.6000025272369385, -3.2606425285339355, -2.9212825298309326, -2.5819225311279297, -2.2425625324249268, -1.9032025337219238, -1.563842535018921, -1.224482536315918, -0.885122537612915, -0.5457625389099121, -0.20640254020690918, 0.13295841217041016, 0.4723184108734131, 0.811678409576416, 1.151038408279419, 1.4903984069824219, 1.8297584056854248, 2.1691184043884277, 2.5084784030914307, 2.8478384017944336, 3.1871984004974365, 3.5265583992004395, 3.8659183979034424, 4.205278396606445, 4.544638633728027, 4.883998394012451, 5.223358154296875, 5.562718391418457, 5.902078628540039, 6.241438388824463, 6.580798149108887, 6.920158386230469, 7.259518623352051, 7.598878383636475, 7.938238143920898, 8.27759838104248, 8.616958618164062, 8.956317901611328, 9.29567813873291, 9.635038375854492, 9.974398612976074, 10.313758850097656, 10.653118133544922, 10.992478370666504]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 10.0, 16.0, 18.0, 28.0, 42.0, 72.0, 64.0, 115.0, 163.0, 307.0, 431.0, 645.0, 1056.0, 1752.0, 2719.0, 4801.0, 7860.0, 13485.0, 24120.0, 43756.0, 79521.0, 146907.0, 264780.0, 444811.0, 2621232.0, 1655880.0, 421060.0, 248093.0, 137278.0, 74274.0, 40961.0, 22810.0, 12994.0, 7433.0, 4491.0, 2764.0, 1676.0, 1115.0, 692.0, 387.0, 288.0, 184.0, 129.0, 73.0, 54.0, 27.0, 19.0, 18.0, 15.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.77099609375, -0.7482833862304688, -0.7255706787109375, -0.7028579711914062, -0.680145263671875, -0.6574325561523438, -0.6347198486328125, -0.6120071411132812, -0.58929443359375, -0.5665817260742188, -0.5438690185546875, -0.5211563110351562, -0.498443603515625, -0.47573089599609375, -0.4530181884765625, -0.43030548095703125, -0.4075927734375, -0.38488006591796875, -0.3621673583984375, -0.33945465087890625, -0.316741943359375, -0.29402923583984375, -0.2713165283203125, -0.24860382080078125, -0.22589111328125, -0.20317840576171875, -0.1804656982421875, -0.15775299072265625, -0.135040283203125, -0.11232757568359375, -0.0896148681640625, -0.06690216064453125, -0.044189453125, -0.02147674560546875, 0.0012359619140625, 0.02394866943359375, 0.046661376953125, 0.06937408447265625, 0.0920867919921875, 0.11479949951171875, 0.13751220703125, 0.16022491455078125, 0.1829376220703125, 0.20565032958984375, 0.228363037109375, 0.25107574462890625, 0.2737884521484375, 0.29650115966796875, 0.3192138671875, 0.34192657470703125, 0.3646392822265625, 0.38735198974609375, 0.410064697265625, 0.43277740478515625, 0.4554901123046875, 0.47820281982421875, 0.50091552734375, 0.5236282348632812, 0.5463409423828125, 0.5690536499023438, 0.591766357421875, 0.6144790649414062, 0.6371917724609375, 0.6599044799804688, 0.6826171875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 5.0, 8.0, 12.0, 11.0, 20.0, 14.0, 23.0, 20.0, 15.0, 27.0, 37.0, 49.0, 45.0, 45.0, 50.0, 65.0, 240.0, 805.0, 115.0, 55.0, 46.0, 52.0, 42.0, 36.0, 33.0, 24.0, 22.0, 20.0, 22.0, 14.0, 14.0, 11.0, 5.0, 10.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.4049072265625, -5.247314453125, -5.0897216796875, -4.93212890625, -4.7745361328125, -4.616943359375, -4.4593505859375, -4.3017578125, -4.1441650390625, -3.986572265625, -3.8289794921875, -3.67138671875, -3.5137939453125, -3.356201171875, -3.1986083984375, -3.041015625, -2.8834228515625, -2.725830078125, -2.5682373046875, -2.41064453125, -2.2530517578125, -2.095458984375, -1.9378662109375, -1.7802734375, -1.6226806640625, -1.465087890625, -1.3074951171875, -1.14990234375, -0.9923095703125, -0.834716796875, -0.6771240234375, -0.51953125, -0.3619384765625, -0.204345703125, -0.0467529296875, 0.11083984375, 0.2684326171875, 0.426025390625, 0.5836181640625, 0.7412109375, 0.8988037109375, 1.056396484375, 1.2139892578125, 1.37158203125, 1.5291748046875, 1.686767578125, 1.8443603515625, 2.001953125, 2.1595458984375, 2.317138671875, 2.4747314453125, 2.63232421875, 2.7899169921875, 2.947509765625, 3.1051025390625, 3.2626953125, 3.4202880859375, 3.577880859375, 3.7354736328125, 3.89306640625, 4.0506591796875, 4.208251953125, 4.3658447265625, 4.5234375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 5.0, 2.0, 8.0, 14.0, 21.0, 41.0, 86.0, 91.0, 174.0, 285.0, 427.0, 683.0, 1020.0, 1738.0, 2672.0, 4442.0, 7084.0, 11442.0, 18563.0, 29475.0, 47676.0, 74988.0, 116299.0, 173113.0, 245073.0, 323822.0, 595413.0, 3293874.0, 398791.0, 297153.0, 220176.0, 152391.0, 100788.0, 64954.0, 41074.0, 25781.0, 15952.0, 9668.0, 6165.0, 3815.0, 2423.0, 1390.0, 916.0, 560.0, 354.0, 225.0, 112.0, 86.0, 47.0, 32.0, 16.0, 12.0, 10.0, 12.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.405517578125, -0.392578125, -0.379638671875, -0.36669921875, -0.353759765625, -0.3408203125, -0.327880859375, -0.31494140625, -0.302001953125, -0.2890625, -0.276123046875, -0.26318359375, -0.250244140625, -0.2373046875, -0.224365234375, -0.21142578125, -0.198486328125, -0.185546875, -0.172607421875, -0.15966796875, -0.146728515625, -0.1337890625, -0.120849609375, -0.10791015625, -0.094970703125, -0.08203125, -0.069091796875, -0.05615234375, -0.043212890625, -0.0302734375, -0.017333984375, -0.00439453125, 0.008544921875, 0.021484375, 0.034423828125, 0.04736328125, 0.060302734375, 0.0732421875, 0.086181640625, 0.09912109375, 0.112060546875, 0.125, 0.137939453125, 0.15087890625, 0.163818359375, 0.1767578125, 0.189697265625, 0.20263671875, 0.215576171875, 0.228515625, 0.241455078125, 0.25439453125, 0.267333984375, 0.2802734375, 0.293212890625, 0.30615234375, 0.319091796875, 0.33203125, 0.344970703125, 0.35791015625, 0.370849609375, 0.3837890625, 0.396728515625, 0.40966796875, 0.422607421875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 13.0, 5.0, 14.0, 18.0, 13.0, 17.0, 20.0, 17.0, 20.0, 30.0, 30.0, 29.0, 37.0, 34.0, 41.0, 28.0, 40.0, 75.0, 438.0, 592.0, 73.0, 41.0, 28.0, 26.0, 33.0, 42.0, 20.0, 29.0, 26.0, 14.0, 17.0, 16.0, 23.0, 14.0, 10.0, 12.0, 14.0, 8.0, 4.0, 9.0, 9.0, 7.0, 4.0, 5.0, 7.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.076171875, -2.977264404296875, -2.87835693359375, -2.779449462890625, -2.6805419921875, -2.581634521484375, -2.48272705078125, -2.383819580078125, -2.284912109375, -2.186004638671875, -2.08709716796875, -1.988189697265625, -1.8892822265625, -1.790374755859375, -1.69146728515625, -1.592559814453125, -1.49365234375, -1.394744873046875, -1.29583740234375, -1.196929931640625, -1.0980224609375, -0.999114990234375, -0.90020751953125, -0.801300048828125, -0.702392578125, -0.603485107421875, -0.50457763671875, -0.405670166015625, -0.3067626953125, -0.207855224609375, -0.10894775390625, -0.010040283203125, 0.0888671875, 0.187774658203125, 0.28668212890625, 0.385589599609375, 0.4844970703125, 0.583404541015625, 0.68231201171875, 0.781219482421875, 0.880126953125, 0.979034423828125, 1.07794189453125, 1.176849365234375, 1.2757568359375, 1.374664306640625, 1.47357177734375, 1.572479248046875, 1.67138671875, 1.770294189453125, 1.86920166015625, 1.968109130859375, 2.0670166015625, 2.165924072265625, 2.26483154296875, 2.363739013671875, 2.462646484375, 2.561553955078125, 2.66046142578125, 2.759368896484375, 2.8582763671875, 2.957183837890625, 3.05609130859375, 3.154998779296875, 3.25390625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 18.0, 20.0, 25.0, 26.0, 34.0, 47.0, 71.0, 94.0, 113.0, 148.0, 213.0, 319.0, 486.0, 684.0, 931.0, 1494.0, 2473.0, 4143.0, 7615.0, 15149.0, 31358.0, 64539.0, 132790.0, 5544323.0, 298825.0, 93221.0, 45443.0, 21798.0, 10582.0, 5507.0, 3203.0, 1763.0, 1149.0, 774.0, 564.0, 422.0, 287.0, 251.0, 162.0, 114.0, 77.0, 50.0, 42.0, 22.0, 16.0, 12.0, 14.0, 4.0, 6.0, 6.0, 5.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.5313720703125, -1.484619140625, -1.4378662109375, -1.39111328125, -1.3443603515625, -1.297607421875, -1.2508544921875, -1.2041015625, -1.1573486328125, -1.110595703125, -1.0638427734375, -1.01708984375, -0.9703369140625, -0.923583984375, -0.8768310546875, -0.830078125, -0.7833251953125, -0.736572265625, -0.6898193359375, -0.64306640625, -0.5963134765625, -0.549560546875, -0.5028076171875, -0.4560546875, -0.4093017578125, -0.362548828125, -0.3157958984375, -0.26904296875, -0.2222900390625, -0.175537109375, -0.1287841796875, -0.08203125, -0.0352783203125, 0.011474609375, 0.0582275390625, 0.10498046875, 0.1517333984375, 0.198486328125, 0.2452392578125, 0.2919921875, 0.3387451171875, 0.385498046875, 0.4322509765625, 0.47900390625, 0.5257568359375, 0.572509765625, 0.6192626953125, 0.666015625, 0.7127685546875, 0.759521484375, 0.8062744140625, 0.85302734375, 0.8997802734375, 0.946533203125, 0.9932861328125, 1.0400390625, 1.0867919921875, 1.133544921875, 1.1802978515625, 1.22705078125, 1.2738037109375, 1.320556640625, 1.3673095703125, 1.4140625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 8.0, 16.0, 6.0, 8.0, 11.0, 26.0, 13.0, 36.0, 28.0, 25.0, 25.0, 30.0, 29.0, 49.0, 45.0, 49.0, 44.0, 340.0, 750.0, 69.0, 38.0, 40.0, 33.0, 47.0, 36.0, 31.0, 27.0, 24.0, 27.0, 18.0, 13.0, 15.0, 18.0, 9.0, 6.0, 6.0, 6.0, 4.0, 8.0, 5.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.06884765625, -3.9462890625, -3.82373046875, -3.701171875, -3.57861328125, -3.4560546875, -3.33349609375, -3.2109375, -3.08837890625, -2.9658203125, -2.84326171875, -2.720703125, -2.59814453125, -2.4755859375, -2.35302734375, -2.23046875, -2.10791015625, -1.9853515625, -1.86279296875, -1.740234375, -1.61767578125, -1.4951171875, -1.37255859375, -1.25, -1.12744140625, -1.0048828125, -0.88232421875, -0.759765625, -0.63720703125, -0.5146484375, -0.39208984375, -0.26953125, -0.14697265625, -0.0244140625, 0.09814453125, 0.220703125, 0.34326171875, 0.4658203125, 0.58837890625, 0.7109375, 0.83349609375, 0.9560546875, 1.07861328125, 1.201171875, 1.32373046875, 1.4462890625, 1.56884765625, 1.69140625, 1.81396484375, 1.9365234375, 2.05908203125, 2.181640625, 2.30419921875, 2.4267578125, 2.54931640625, 2.671875, 2.79443359375, 2.9169921875, 3.03955078125, 3.162109375, 3.28466796875, 3.4072265625, 3.52978515625, 3.65234375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 4.0, 7.0, 11.0, 25.0, 35.0, 75.0, 162.0, 245.0, 216.0, 105.0, 47.0, 22.0, 21.0, 9.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.026805877685547, -18.461204528808594, -17.89560317993164, -17.330001831054688, -16.764400482177734, -16.198801040649414, -15.633199691772461, -15.067598342895508, -14.501996994018555, -13.936395645141602, -13.370794296264648, -12.805193901062012, -12.239592552185059, -11.673991203308105, -11.108390808105469, -10.542789459228516, -9.977188110351562, -9.41158676147461, -8.845985412597656, -8.28038501739502, -7.714783668518066, -7.149182319641113, -6.583581447601318, -6.017980575561523, -5.45237922668457, -4.886777877807617, -4.321177005767822, -3.7555758953094482, -3.189974784851074, -2.6243736743927, -2.058772563934326, -1.4931714534759521, -0.9275722503662109, -0.3619711399078369, 0.2036299705505371, 0.7692310810089111, 1.3348321914672852, 1.9004333019256592, 2.466034412384033, 3.0316355228424072, 3.5972366333007812, 4.162837982177734, 4.728438854217529, 5.294039726257324, 5.859641075134277, 6.4252424240112305, 6.990843296051025, 7.55644416809082, 8.122045516967773, 8.687646865844727, 9.25324821472168, 9.818848609924316, 10.38444995880127, 10.950051307678223, 11.51565170288086, 12.081253051757812, 12.646854400634766, 13.212455749511719, 13.778057098388672, 14.343657493591309, 14.909258842468262, 15.474860191345215, 16.04046058654785, 16.606061935424805, 17.171663284301758]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 6.0, 5.0, 9.0, 10.0, 13.0, 9.0, 16.0, 17.0, 18.0, 33.0, 28.0, 29.0, 53.0, 51.0, 44.0, 55.0, 62.0, 67.0, 53.0, 53.0, 45.0, 44.0, 39.0, 42.0, 21.0, 37.0, 26.0, 18.0, 9.0, 14.0, 8.0, 9.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-12.745399475097656, -12.375323295593262, -12.005248069763184, -11.635171890258789, -11.265096664428711, -10.895020484924316, -10.524944305419922, -10.154869079589844, -9.784793853759766, -9.414717674255371, -9.044642448425293, -8.674566268920898, -8.30449104309082, -7.934414863586426, -7.5643391609191895, -7.194263458251953, -6.824187278747559, -6.454111576080322, -6.084035873413086, -5.713959693908691, -5.343884468078613, -4.973808288574219, -4.603732585906982, -4.233656883239746, -3.8635811805725098, -3.4935054779052734, -3.123429775238037, -2.7533538341522217, -2.3832781314849854, -2.013202428817749, -1.6431264877319336, -1.2730507850646973, -0.9029760360717773, -0.5329002737998962, -0.16282451152801514, 0.20725131034851074, 0.5773270130157471, 0.9474027156829834, 1.3174786567687988, 1.6875543594360352, 2.0576300621032715, 2.427705764770508, 2.797781467437744, 3.1678574085235596, 3.537933111190796, 3.9080088138580322, 4.278084754943848, 4.648160457611084, 5.01823616027832, 5.388311862945557, 5.758387565612793, 6.1284637451171875, 6.498538970947266, 6.86861515045166, 7.2386908531188965, 7.608766555786133, 7.978842258453369, 8.348917961120605, 8.718994140625, 9.089069366455078, 9.459145545959473, 9.82922077178955, 10.199296951293945, 10.569372177124023, 10.939448356628418]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 9.0, 6.0, 8.0, 10.0, 8.0, 14.0, 37.0, 35.0, 52.0, 80.0, 90.0, 108.0, 193.0, 299.0, 434.0, 817.0, 1475.0, 2877.0, 6527.0, 16773.0, 73269.0, 3966963.0, 90873.0, 18738.0, 6967.0, 3383.0, 1743.0, 950.0, 543.0, 333.0, 199.0, 137.0, 94.0, 60.0, 43.0, 34.0, 23.0, 18.0, 12.0, 11.0, 9.0, 3.0, 9.0, 6.0, 7.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.1640625, -0.15917396545410156, -0.15428543090820312, -0.1493968963623047, -0.14450836181640625, -0.1396198272705078, -0.13473129272460938, -0.12984275817871094, -0.1249542236328125, -0.12006568908691406, -0.11517715454101562, -0.11028861999511719, -0.10540008544921875, -0.10051155090332031, -0.09562301635742188, -0.09073448181152344, -0.085845947265625, -0.08095741271972656, -0.07606887817382812, -0.07118034362792969, -0.06629180908203125, -0.06140327453613281, -0.056514739990234375, -0.05162620544433594, -0.0467376708984375, -0.04184913635253906, -0.036960601806640625, -0.03207206726074219, -0.02718353271484375, -0.022294998168945312, -0.017406463623046875, -0.012517929077148438, -0.00762939453125, -0.0027408599853515625, 0.002147674560546875, 0.0070362091064453125, 0.01192474365234375, 0.016813278198242188, 0.021701812744140625, 0.026590347290039062, 0.0314788818359375, 0.03636741638183594, 0.041255950927734375, 0.04614448547363281, 0.05103302001953125, 0.05592155456542969, 0.060810089111328125, 0.06569862365722656, 0.070587158203125, 0.07547569274902344, 0.08036422729492188, 0.08525276184082031, 0.09014129638671875, 0.09502983093261719, 0.09991836547851562, 0.10480690002441406, 0.1096954345703125, 0.11458396911621094, 0.11947250366210938, 0.12436103820800781, 0.12924957275390625, 0.1341381072998047, 0.13902664184570312, 0.14391517639160156, 0.1488037109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 8.0, 11.0, 6.0, 5.0, 8.0, 10.0, 14.0, 14.0, 31.0, 51.0, 182.0, 465.0, 56.0, 28.0, 14.0, 13.0, 10.0, 14.0, 10.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.047943115234375, -0.046575069427490234, -0.04520702362060547, -0.0438389778137207, -0.04247093200683594, -0.04110288619995117, -0.039734840393066406, -0.03836679458618164, -0.036998748779296875, -0.03563070297241211, -0.034262657165527344, -0.03289461135864258, -0.03152656555175781, -0.030158519744873047, -0.02879047393798828, -0.027422428131103516, -0.02605438232421875, -0.024686336517333984, -0.02331829071044922, -0.021950244903564453, -0.020582199096679688, -0.019214153289794922, -0.017846107482910156, -0.01647806167602539, -0.015110015869140625, -0.01374197006225586, -0.012373924255371094, -0.011005878448486328, -0.009637832641601562, -0.008269786834716797, -0.006901741027832031, -0.005533695220947266, -0.0041656494140625, -0.0027976036071777344, -0.0014295578002929688, -6.151199340820312e-05, 0.0013065338134765625, 0.002674579620361328, 0.004042625427246094, 0.005410671234130859, 0.006778717041015625, 0.00814676284790039, 0.009514808654785156, 0.010882854461669922, 0.012250900268554688, 0.013618946075439453, 0.014986991882324219, 0.016355037689208984, 0.01772308349609375, 0.019091129302978516, 0.02045917510986328, 0.021827220916748047, 0.023195266723632812, 0.024563312530517578, 0.025931358337402344, 0.02729940414428711, 0.028667449951171875, 0.03003549575805664, 0.031403541564941406, 0.03277158737182617, 0.03413963317871094, 0.0355076789855957, 0.03687572479248047, 0.038243770599365234, 0.03961181640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 7.0, 3.0, 12.0, 14.0, 20.0, 34.0, 40.0, 54.0, 96.0, 156.0, 345.0, 787.0, 1811.0, 4880.0, 14697.0, 54042.0, 287101.0, 3206417.0, 514418.0, 78126.0, 20336.0, 6503.0, 2361.0, 973.0, 435.0, 228.0, 136.0, 65.0, 51.0, 31.0, 29.0, 16.0, 12.0, 8.0, 10.0, 6.0, 0.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09490966796875, -0.09147453308105469, -0.08803939819335938, -0.08460426330566406, -0.08116912841796875, -0.07773399353027344, -0.07429885864257812, -0.07086372375488281, -0.0674285888671875, -0.06399345397949219, -0.060558319091796875, -0.05712318420410156, -0.05368804931640625, -0.05025291442871094, -0.046817779541015625, -0.04338264465332031, -0.039947509765625, -0.03651237487792969, -0.033077239990234375, -0.029642105102539062, -0.02620697021484375, -0.022771835327148438, -0.019336700439453125, -0.015901565551757812, -0.0124664306640625, -0.009031295776367188, -0.005596160888671875, -0.0021610260009765625, 0.00127410888671875, 0.0047092437744140625, 0.008144378662109375, 0.011579513549804688, 0.0150146484375, 0.018449783325195312, 0.021884918212890625, 0.025320053100585938, 0.02875518798828125, 0.03219032287597656, 0.035625457763671875, 0.03906059265136719, 0.0424957275390625, 0.04593086242675781, 0.049365997314453125, 0.05280113220214844, 0.05623626708984375, 0.05967140197753906, 0.06310653686523438, 0.06654167175292969, 0.069976806640625, 0.07341194152832031, 0.07684707641601562, 0.08028221130371094, 0.08371734619140625, 0.08715248107910156, 0.09058761596679688, 0.09402275085449219, 0.0974578857421875, 0.10089302062988281, 0.10432815551757812, 0.10776329040527344, 0.11119842529296875, 0.11463356018066406, 0.11806869506835938, 0.12150382995605469, 0.12493896484375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 2.0, 13.0, 13.0, 11.0, 17.0, 16.0, 23.0, 34.0, 43.0, 50.0, 65.0, 81.0, 110.0, 183.0, 265.0, 599.0, 1066.0, 551.0, 281.0, 174.0, 111.0, 80.0, 55.0, 48.0, 36.0, 20.0, 25.0, 24.0, 14.0, 10.0, 10.0, 6.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.031280517578125, -0.030140399932861328, -0.029000282287597656, -0.027860164642333984, -0.026720046997070312, -0.02557992935180664, -0.02443981170654297, -0.023299694061279297, -0.022159576416015625, -0.021019458770751953, -0.01987934112548828, -0.01873922348022461, -0.017599105834960938, -0.016458988189697266, -0.015318870544433594, -0.014178752899169922, -0.01303863525390625, -0.011898517608642578, -0.010758399963378906, -0.009618282318115234, -0.008478164672851562, -0.007338047027587891, -0.006197929382324219, -0.005057811737060547, -0.003917694091796875, -0.002777576446533203, -0.0016374588012695312, -0.0004973411560058594, 0.0006427764892578125, 0.0017828941345214844, 0.0029230117797851562, 0.004063129425048828, 0.0052032470703125, 0.006343364715576172, 0.007483482360839844, 0.008623600006103516, 0.009763717651367188, 0.01090383529663086, 0.012043952941894531, 0.013184070587158203, 0.014324188232421875, 0.015464305877685547, 0.01660442352294922, 0.01774454116821289, 0.018884658813476562, 0.020024776458740234, 0.021164894104003906, 0.022305011749267578, 0.02344512939453125, 0.024585247039794922, 0.025725364685058594, 0.026865482330322266, 0.028005599975585938, 0.02914571762084961, 0.03028583526611328, 0.03142595291137695, 0.032566070556640625, 0.0337061882019043, 0.03484630584716797, 0.03598642349243164, 0.03712654113769531, 0.038266658782958984, 0.039406776428222656, 0.04054689407348633, 0.04168701171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 12.0, 28.0, 64.0, 149.0, 243.0, 254.0, 140.0, 60.0, 23.0, 10.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22374887764453888, -0.21200014650821686, -0.20025141537189484, -0.18850268423557281, -0.1767539530992508, -0.16500522196292877, -0.15325647592544556, -0.14150774478912354, -0.1297590136528015, -0.11801028251647949, -0.10626155138015747, -0.09451282024383545, -0.08276408910751343, -0.0710153579711914, -0.05926661938428879, -0.047517888247966766, -0.03576916456222534, -0.02402043342590332, -0.01227170042693615, -0.0005229674279689789, 0.011225763708353043, 0.022974494844675064, 0.034723229706287384, 0.046471960842609406, 0.05822069197893143, 0.06996942311525345, 0.08171815425157547, 0.09346689283847809, 0.10521562397480011, 0.11696435511112213, 0.12871308624744415, 0.14046181738376617, 0.1522105634212494, 0.1639592945575714, 0.17570802569389343, 0.18745675683021545, 0.19920548796653748, 0.2109542191028595, 0.22270295023918152, 0.23445168137550354, 0.24620041251182556, 0.2579491436481476, 0.2696978747844696, 0.2814466059207916, 0.29319533705711365, 0.30494406819343567, 0.3166927993297577, 0.3284415304660797, 0.3401902914047241, 0.35193902254104614, 0.36368775367736816, 0.3754364848136902, 0.3871852159500122, 0.39893394708633423, 0.41068267822265625, 0.42243140935897827, 0.4341801404953003, 0.4459288716316223, 0.45767760276794434, 0.46942633390426636, 0.4811750650405884, 0.4929237961769104, 0.5046725273132324, 0.5164212584495544, 0.5281699895858765]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 8.0, 5.0, 6.0, 3.0, 9.0, 12.0, 14.0, 15.0, 20.0, 25.0, 35.0, 44.0, 39.0, 51.0, 51.0, 74.0, 64.0, 71.0, 71.0, 71.0, 56.0, 62.0, 32.0, 32.0, 22.0, 29.0, 19.0, 24.0, 9.0, 8.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17424196004867554, -0.16807514429092407, -0.1619083285331726, -0.15574151277542114, -0.14957469701766968, -0.14340786635875702, -0.13724105060100555, -0.1310742348432541, -0.12490741908550262, -0.11874060332775116, -0.1125737875699997, -0.10640696436166763, -0.10024014860391617, -0.0940733328461647, -0.08790650963783264, -0.08173969388008118, -0.07557287812232971, -0.06940606236457825, -0.06323924660682678, -0.05707242339849472, -0.050905607640743256, -0.04473879188299179, -0.03857197239995003, -0.032405152916908264, -0.0262383371591568, -0.020071519538760185, -0.013904701918363571, -0.007737884297966957, -0.001571066677570343, 0.004595750942826271, 0.010762568563222885, 0.01692938804626465, 0.023096203804016113, 0.029263021424412727, 0.03542983904480934, 0.041596658527851105, 0.04776347428560257, 0.053930290043354034, 0.0600971095263958, 0.06626392900943756, 0.07243074476718903, 0.07859756052494049, 0.08476437628269196, 0.09093119949102402, 0.09709801524877548, 0.10326483100652695, 0.10943165421485901, 0.11559846997261047, 0.12176528573036194, 0.1279321014881134, 0.13409891724586487, 0.14026573300361633, 0.1464325487613678, 0.15259937942028046, 0.15876619517803192, 0.1649330109357834, 0.17109982669353485, 0.17726664245128632, 0.18343345820903778, 0.18960027396678925, 0.1957671046257019, 0.20193392038345337, 0.20810073614120483, 0.2142675518989563, 0.22043436765670776]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 1.0, 6.0, 6.0, 13.0, 19.0, 34.0, 39.0, 54.0, 84.0, 128.0, 168.0, 206.0, 307.0, 426.0, 551.0, 837.0, 1209.0, 1629.0, 2324.0, 3583.0, 5382.0, 8550.0, 14316.0, 26646.0, 71387.0, 762478.0, 79506.0, 28038.0, 14664.0, 8820.0, 5510.0, 3593.0, 2429.0, 1660.0, 1107.0, 795.0, 551.0, 393.0, 308.0, 244.0, 167.0, 118.0, 90.0, 66.0, 28.0, 30.0, 24.0, 11.0, 9.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1036376953125, -0.10035037994384766, -0.09706306457519531, -0.09377574920654297, -0.09048843383789062, -0.08720111846923828, -0.08391380310058594, -0.0806264877319336, -0.07733917236328125, -0.0740518569946289, -0.07076454162597656, -0.06747722625732422, -0.06418991088867188, -0.06090259552001953, -0.05761528015136719, -0.054327964782714844, -0.0510406494140625, -0.047753334045410156, -0.04446601867675781, -0.04117870330810547, -0.037891387939453125, -0.03460407257080078, -0.03131675720214844, -0.028029441833496094, -0.02474212646484375, -0.021454811096191406, -0.018167495727539062, -0.014880180358886719, -0.011592864990234375, -0.008305549621582031, -0.0050182342529296875, -0.0017309188842773438, 0.001556396484375, 0.004843711853027344, 0.008131027221679688, 0.011418342590332031, 0.014705657958984375, 0.01799297332763672, 0.021280288696289062, 0.024567604064941406, 0.02785491943359375, 0.031142234802246094, 0.03442955017089844, 0.03771686553955078, 0.041004180908203125, 0.04429149627685547, 0.04757881164550781, 0.050866127014160156, 0.0541534423828125, 0.057440757751464844, 0.06072807312011719, 0.06401538848876953, 0.06730270385742188, 0.07059001922607422, 0.07387733459472656, 0.0771646499633789, 0.08045196533203125, 0.0837392807006836, 0.08702659606933594, 0.09031391143798828, 0.09360122680664062, 0.09688854217529297, 0.10017585754394531, 0.10346317291259766, 0.10675048828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 5.0, 9.0, 9.0, 6.0, 6.0, 6.0, 7.0, 17.0, 24.0, 27.0, 80.0, 361.0, 249.0, 52.0, 32.0, 15.0, 14.0, 11.0, 7.0, 8.0, 9.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.044189453125, -0.04288339614868164, -0.04157733917236328, -0.04027128219604492, -0.03896522521972656, -0.0376591682434082, -0.036353111267089844, -0.035047054290771484, -0.033740997314453125, -0.032434940338134766, -0.031128883361816406, -0.029822826385498047, -0.028516769409179688, -0.027210712432861328, -0.02590465545654297, -0.02459859848022461, -0.02329254150390625, -0.02198648452758789, -0.02068042755126953, -0.019374370574951172, -0.018068313598632812, -0.016762256622314453, -0.015456199645996094, -0.014150142669677734, -0.012844085693359375, -0.011538028717041016, -0.010231971740722656, -0.008925914764404297, -0.0076198577880859375, -0.006313800811767578, -0.005007743835449219, -0.0037016868591308594, -0.0023956298828125, -0.0010895729064941406, 0.00021648406982421875, 0.0015225410461425781, 0.0028285980224609375, 0.004134654998779297, 0.005440711975097656, 0.006746768951416016, 0.008052825927734375, 0.009358882904052734, 0.010664939880371094, 0.011970996856689453, 0.013277053833007812, 0.014583110809326172, 0.01588916778564453, 0.01719522476196289, 0.01850128173828125, 0.01980733871459961, 0.02111339569091797, 0.022419452667236328, 0.023725509643554688, 0.025031566619873047, 0.026337623596191406, 0.027643680572509766, 0.028949737548828125, 0.030255794525146484, 0.031561851501464844, 0.0328679084777832, 0.03417396545410156, 0.03548002243041992, 0.03678607940673828, 0.03809213638305664, 0.039398193359375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 12.0, 10.0, 13.0, 12.0, 19.0, 13.0, 30.0, 49.0, 70.0, 80.0, 127.0, 196.0, 349.0, 654.0, 1382.0, 3186.0, 8582.0, 26079.0, 99762.0, 436684.0, 356226.0, 79939.0, 22210.0, 7318.0, 2765.0, 1207.0, 621.0, 330.0, 175.0, 130.0, 83.0, 49.0, 41.0, 38.0, 18.0, 16.0, 24.0, 17.0, 7.0, 6.0, 4.0, 6.0, 4.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10247802734375, -0.09916400909423828, -0.09584999084472656, -0.09253597259521484, -0.08922195434570312, -0.0859079360961914, -0.08259391784667969, -0.07927989959716797, -0.07596588134765625, -0.07265186309814453, -0.06933784484863281, -0.0660238265991211, -0.06270980834960938, -0.059395790100097656, -0.05608177185058594, -0.05276775360107422, -0.0494537353515625, -0.04613971710205078, -0.04282569885253906, -0.039511680603027344, -0.036197662353515625, -0.032883644104003906, -0.029569625854492188, -0.02625560760498047, -0.02294158935546875, -0.01962757110595703, -0.016313552856445312, -0.012999534606933594, -0.009685516357421875, -0.006371498107910156, -0.0030574798583984375, 0.00025653839111328125, 0.003570556640625, 0.006884574890136719, 0.010198593139648438, 0.013512611389160156, 0.016826629638671875, 0.020140647888183594, 0.023454666137695312, 0.02676868438720703, 0.03008270263671875, 0.03339672088623047, 0.03671073913574219, 0.040024757385253906, 0.043338775634765625, 0.046652793884277344, 0.04996681213378906, 0.05328083038330078, 0.0565948486328125, 0.05990886688232422, 0.06322288513183594, 0.06653690338134766, 0.06985092163085938, 0.0731649398803711, 0.07647895812988281, 0.07979297637939453, 0.08310699462890625, 0.08642101287841797, 0.08973503112792969, 0.0930490493774414, 0.09636306762695312, 0.09967708587646484, 0.10299110412597656, 0.10630512237548828, 0.109619140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 10.0, 12.0, 9.0, 6.0, 9.0, 16.0, 16.0, 18.0, 24.0, 23.0, 26.0, 38.0, 36.0, 33.0, 39.0, 33.0, 31.0, 28.0, 56.0, 42.0, 38.0, 42.0, 35.0, 42.0, 32.0, 36.0, 40.0, 31.0, 25.0, 24.0, 32.0, 19.0, 13.0, 7.0, 9.0, 16.0, 17.0, 10.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.123260498046875, -0.11920166015625, -0.115142822265625, -0.111083984375, -0.107025146484375, -0.10296630859375, -0.098907470703125, -0.0948486328125, -0.090789794921875, -0.08673095703125, -0.082672119140625, -0.07861328125, -0.074554443359375, -0.07049560546875, -0.066436767578125, -0.0623779296875, -0.058319091796875, -0.05426025390625, -0.050201416015625, -0.046142578125, -0.042083740234375, -0.03802490234375, -0.033966064453125, -0.0299072265625, -0.025848388671875, -0.02178955078125, -0.017730712890625, -0.013671875, -0.009613037109375, -0.00555419921875, -0.001495361328125, 0.0025634765625, 0.006622314453125, 0.01068115234375, 0.014739990234375, 0.018798828125, 0.022857666015625, 0.02691650390625, 0.030975341796875, 0.0350341796875, 0.039093017578125, 0.04315185546875, 0.047210693359375, 0.05126953125, 0.055328369140625, 0.05938720703125, 0.063446044921875, 0.0675048828125, 0.071563720703125, 0.07562255859375, 0.079681396484375, 0.083740234375, 0.087799072265625, 0.09185791015625, 0.095916748046875, 0.0999755859375, 0.104034423828125, 0.10809326171875, 0.112152099609375, 0.1162109375, 0.120269775390625, 0.12432861328125, 0.128387451171875, 0.1324462890625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 11.0, 15.0, 15.0, 31.0, 65.0, 98.0, 127.0, 259.0, 562.0, 1232.0, 3442.0, 12675.0, 82478.0, 732303.0, 185716.0, 21056.0, 5267.0, 1663.0, 717.0, 350.0, 187.0, 97.0, 62.0, 41.0, 22.0, 19.0, 7.0, 12.0, 5.0, 8.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09393310546875, -0.09105682373046875, -0.0881805419921875, -0.08530426025390625, -0.082427978515625, -0.07955169677734375, -0.0766754150390625, -0.07379913330078125, -0.0709228515625, -0.06804656982421875, -0.0651702880859375, -0.06229400634765625, -0.059417724609375, -0.05654144287109375, -0.0536651611328125, -0.05078887939453125, -0.04791259765625, -0.04503631591796875, -0.0421600341796875, -0.03928375244140625, -0.036407470703125, -0.03353118896484375, -0.0306549072265625, -0.02777862548828125, -0.02490234375, -0.02202606201171875, -0.0191497802734375, -0.01627349853515625, -0.013397216796875, -0.01052093505859375, -0.0076446533203125, -0.00476837158203125, -0.00189208984375, 0.00098419189453125, 0.0038604736328125, 0.00673675537109375, 0.009613037109375, 0.01248931884765625, 0.0153656005859375, 0.01824188232421875, 0.0211181640625, 0.02399444580078125, 0.0268707275390625, 0.02974700927734375, 0.032623291015625, 0.03549957275390625, 0.0383758544921875, 0.04125213623046875, 0.04412841796875, 0.04700469970703125, 0.0498809814453125, 0.05275726318359375, 0.055633544921875, 0.05850982666015625, 0.0613861083984375, 0.06426239013671875, 0.067138671875, 0.07001495361328125, 0.0728912353515625, 0.07576751708984375, 0.078643798828125, 0.08152008056640625, 0.0843963623046875, 0.08727264404296875, 0.09014892578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 5.0, 5.0, 5.0, 7.0, 10.0, 12.0, 16.0, 20.0, 34.0, 30.0, 28.0, 42.0, 59.0, 57.0, 83.0, 74.0, 58.0, 57.0, 49.0, 66.0, 38.0, 36.0, 41.0, 23.0, 38.0, 30.0, 15.0, 12.0, 9.0, 21.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2278556823730469e-05, -1.176539808511734e-05, -1.1252239346504211e-05, -1.0739080607891083e-05, -1.0225921869277954e-05, -9.712763130664825e-06, -9.199604392051697e-06, -8.686445653438568e-06, -8.17328691482544e-06, -7.66012817621231e-06, -7.146969437599182e-06, -6.6338106989860535e-06, -6.120651960372925e-06, -5.607493221759796e-06, -5.0943344831466675e-06, -4.581175744533539e-06, -4.06801700592041e-06, -3.5548582673072815e-06, -3.041699528694153e-06, -2.528540790081024e-06, -2.0153820514678955e-06, -1.5022233128547668e-06, -9.890645742416382e-07, -4.759058356285095e-07, 3.725290298461914e-08, 5.504116415977478e-07, 1.0635703802108765e-06, 1.5767291188240051e-06, 2.089887857437134e-06, 2.6030465960502625e-06, 3.116205334663391e-06, 3.6293640732765198e-06, 4.1425228118896484e-06, 4.655681550502777e-06, 5.168840289115906e-06, 5.6819990277290344e-06, 6.195157766342163e-06, 6.708316504955292e-06, 7.22147524356842e-06, 7.734633982181549e-06, 8.247792720794678e-06, 8.760951459407806e-06, 9.274110198020935e-06, 9.787268936634064e-06, 1.0300427675247192e-05, 1.0813586413860321e-05, 1.132674515247345e-05, 1.1839903891086578e-05, 1.2353062629699707e-05, 1.2866221368312836e-05, 1.3379380106925964e-05, 1.3892538845539093e-05, 1.4405697584152222e-05, 1.491885632276535e-05, 1.543201506137848e-05, 1.5945173799991608e-05, 1.6458332538604736e-05, 1.6971491277217865e-05, 1.7484650015830994e-05, 1.7997808754444122e-05, 1.851096749305725e-05, 1.902412623167038e-05, 1.9537284970283508e-05, 2.0050443708896637e-05, 2.0563602447509766e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 9.0, 25.0, 30.0, 54.0, 107.0, 199.0, 473.0, 1163.0, 3959.0, 18313.0, 170356.0, 750991.0, 86571.0, 11769.0, 2834.0, 902.0, 377.0, 177.0, 90.0, 51.0, 23.0, 24.0, 10.0, 17.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0916748046875, -0.08832550048828125, -0.0849761962890625, -0.08162689208984375, -0.078277587890625, -0.07492828369140625, -0.0715789794921875, -0.06822967529296875, -0.06488037109375, -0.06153106689453125, -0.0581817626953125, -0.05483245849609375, -0.051483154296875, -0.04813385009765625, -0.0447845458984375, -0.04143524169921875, -0.0380859375, -0.03473663330078125, -0.0313873291015625, -0.02803802490234375, -0.024688720703125, -0.02133941650390625, -0.0179901123046875, -0.01464080810546875, -0.01129150390625, -0.00794219970703125, -0.0045928955078125, -0.00124359130859375, 0.002105712890625, 0.00545501708984375, 0.0088043212890625, 0.01215362548828125, 0.0155029296875, 0.01885223388671875, 0.0222015380859375, 0.02555084228515625, 0.028900146484375, 0.03224945068359375, 0.0355987548828125, 0.03894805908203125, 0.04229736328125, 0.04564666748046875, 0.0489959716796875, 0.05234527587890625, 0.055694580078125, 0.05904388427734375, 0.0623931884765625, 0.06574249267578125, 0.069091796875, 0.07244110107421875, 0.0757904052734375, 0.07913970947265625, 0.082489013671875, 0.08583831787109375, 0.0891876220703125, 0.09253692626953125, 0.09588623046875, 0.09923553466796875, 0.1025848388671875, 0.10593414306640625, 0.109283447265625, 0.11263275146484375, 0.1159820556640625, 0.11933135986328125, 0.1226806640625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 8.0, 12.0, 19.0, 23.0, 35.0, 42.0, 75.0, 85.0, 130.0, 101.0, 127.0, 97.0, 75.0, 51.0, 34.0, 30.0, 20.0, 12.0, 7.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07171630859375, -0.0688161849975586, -0.06591606140136719, -0.06301593780517578, -0.060115814208984375, -0.05721569061279297, -0.05431556701660156, -0.051415443420410156, -0.04851531982421875, -0.045615196228027344, -0.04271507263183594, -0.03981494903564453, -0.036914825439453125, -0.03401470184326172, -0.031114578247070312, -0.028214454650878906, -0.0253143310546875, -0.022414207458496094, -0.019514083862304688, -0.01661396026611328, -0.013713836669921875, -0.010813713073730469, -0.007913589477539062, -0.005013465881347656, -0.00211334228515625, 0.0007867813110351562, 0.0036869049072265625, 0.006587028503417969, 0.009487152099609375, 0.012387275695800781, 0.015287399291992188, 0.018187522888183594, 0.021087646484375, 0.023987770080566406, 0.026887893676757812, 0.02978801727294922, 0.032688140869140625, 0.03558826446533203, 0.03848838806152344, 0.041388511657714844, 0.04428863525390625, 0.047188758850097656, 0.05008888244628906, 0.05298900604248047, 0.055889129638671875, 0.05878925323486328, 0.06168937683105469, 0.0645895004272461, 0.0674896240234375, 0.0703897476196289, 0.07328987121582031, 0.07618999481201172, 0.07909011840820312, 0.08199024200439453, 0.08489036560058594, 0.08779048919677734, 0.09069061279296875, 0.09359073638916016, 0.09649085998535156, 0.09939098358154297, 0.10229110717773438, 0.10519123077392578, 0.10809135437011719, 0.1109914779663086, 0.1138916015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 25.0, 47.0, 133.0, 276.0, 282.0, 119.0, 50.0, 29.0, 12.0, 6.0, 10.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1231088638305664, -1.076072335243225, -1.0290359258651733, -0.981999397277832, -0.9349629878997803, -0.887926459312439, -0.8408899903297424, -0.7938535213470459, -0.7468170523643494, -0.6997805833816528, -0.6527441143989563, -0.6057076454162598, -0.5586711168289185, -0.5116347074508667, -0.4645981788635254, -0.41756170988082886, -0.3705252408981323, -0.3234887719154358, -0.27645230293273926, -0.22941580414772034, -0.1823793351650238, -0.13534286618232727, -0.08830636739730835, -0.041269898414611816, 0.005766570568084717, 0.05280304700136185, 0.09983952343463898, 0.1468760073184967, 0.19391247630119324, 0.24094894528388977, 0.2879854440689087, 0.3350219130516052, 0.3820585012435913, 0.42909497022628784, 0.4761314392089844, 0.5231679677963257, 0.5702043771743774, 0.6172409057617188, 0.6642773747444153, 0.7113138437271118, 0.7583503127098083, 0.8053867816925049, 0.8524232506752014, 0.899459719657898, 0.9464962482452393, 0.993532657623291, 1.0405691862106323, 1.0876057147979736, 1.1346421241760254, 1.1816786527633667, 1.2287150621414185, 1.2757515907287598, 1.3227880001068115, 1.3698245286941528, 1.4168610572814941, 1.463897466659546, 1.5109338760375977, 1.557970404624939, 1.6050068140029907, 1.652043342590332, 1.6990797519683838, 1.746116280555725, 1.7931528091430664, 1.8401892185211182, 1.8872257471084595]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 8.0, 6.0, 8.0, 15.0, 19.0, 40.0, 53.0, 90.0, 138.0, 170.0, 134.0, 92.0, 71.0, 39.0, 30.0, 10.0, 13.0, 8.0, 5.0, 10.0, 6.0, 8.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0380027294158936, -2.9527106285095215, -2.8674187660217285, -2.7821266651153564, -2.6968345642089844, -2.6115427017211914, -2.5262506008148193, -2.4409584999084473, -2.3556666374206543, -2.2703745365142822, -2.1850826740264893, -2.099790573120117, -2.014498472213745, -1.9292064905166626, -1.84391450881958, -1.758622407913208, -1.673330307006836, -1.5880383253097534, -1.5027462244033813, -1.4174542427062988, -1.3321621417999268, -1.2468701601028442, -1.1615781784057617, -1.0762860774993896, -0.9909940958023071, -0.9057020545005798, -0.8204100131988525, -0.73511803150177, -0.6498259902000427, -0.5645339488983154, -0.4792419672012329, -0.3939499258995056, -0.3086576461791992, -0.22336561977863312, -0.13807359337806702, -0.05278158187866211, 0.032510459423065186, 0.11780250072479248, 0.203094482421875, 0.2883865237236023, 0.3736785650253296, 0.4589706063270569, 0.5442626476287842, 0.6295546293258667, 0.714846670627594, 0.8001387119293213, 0.8854306936264038, 0.9707227349281311, 1.0560147762298584, 1.141306757926941, 1.226598858833313, 1.3118908405303955, 1.3971829414367676, 1.48247492313385, 1.5677669048309326, 1.6530590057373047, 1.7383509874343872, 1.8236429691314697, 1.9089350700378418, 1.9942270517349243, 2.079519033432007, 2.164811134338379, 2.250102996826172, 2.335395097732544, 2.420687198638916]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 11.0, 13.0, 15.0, 31.0, 47.0, 72.0, 99.0, 149.0, 236.0, 320.0, 562.0, 861.0, 1440.0, 2470.0, 4775.0, 10208.0, 26285.0, 122434.0, 3879397.0, 101224.0, 23233.0, 9252.0, 4484.0, 2476.0, 1462.0, 889.0, 587.0, 380.0, 248.0, 178.0, 118.0, 99.0, 63.0, 43.0, 26.0, 27.0, 23.0, 11.0, 8.0, 12.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.322265625, -0.31317901611328125, -0.3040924072265625, -0.29500579833984375, -0.285919189453125, -0.27683258056640625, -0.2677459716796875, -0.25865936279296875, -0.24957275390625, -0.24048614501953125, -0.2313995361328125, -0.22231292724609375, -0.213226318359375, -0.20413970947265625, -0.1950531005859375, -0.18596649169921875, -0.1768798828125, -0.16779327392578125, -0.1587066650390625, -0.14962005615234375, -0.140533447265625, -0.13144683837890625, -0.1223602294921875, -0.11327362060546875, -0.10418701171875, -0.09510040283203125, -0.0860137939453125, -0.07692718505859375, -0.067840576171875, -0.05875396728515625, -0.0496673583984375, -0.04058074951171875, -0.031494140625, -0.02240753173828125, -0.0133209228515625, -0.00423431396484375, 0.004852294921875, 0.01393890380859375, 0.0230255126953125, 0.03211212158203125, 0.04119873046875, 0.05028533935546875, 0.0593719482421875, 0.06845855712890625, 0.077545166015625, 0.08663177490234375, 0.0957183837890625, 0.10480499267578125, 0.1138916015625, 0.12297821044921875, 0.1320648193359375, 0.14115142822265625, 0.150238037109375, 0.15932464599609375, 0.1684112548828125, 0.17749786376953125, 0.18658447265625, 0.19567108154296875, 0.2047576904296875, 0.21384429931640625, 0.222930908203125, 0.23201751708984375, 0.2411041259765625, 0.25019073486328125, 0.25927734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 7.0, 6.0, 5.0, 2.0, 11.0, 8.0, 11.0, 13.0, 16.0, 27.0, 54.0, 101.0, 209.0, 242.0, 112.0, 55.0, 20.0, 15.0, 8.0, 13.0, 8.0, 5.0, 14.0, 5.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03717041015625, -0.036008358001708984, -0.03484630584716797, -0.03368425369262695, -0.03252220153808594, -0.03136014938354492, -0.030198097229003906, -0.02903604507446289, -0.027873992919921875, -0.02671194076538086, -0.025549888610839844, -0.024387836456298828, -0.023225784301757812, -0.022063732147216797, -0.02090167999267578, -0.019739627838134766, -0.01857757568359375, -0.017415523529052734, -0.01625347137451172, -0.015091419219970703, -0.013929367065429688, -0.012767314910888672, -0.011605262756347656, -0.01044321060180664, -0.009281158447265625, -0.00811910629272461, -0.006957054138183594, -0.005795001983642578, -0.0046329498291015625, -0.003470897674560547, -0.0023088455200195312, -0.0011467933654785156, 1.52587890625e-05, 0.0011773109436035156, 0.0023393630981445312, 0.003501415252685547, 0.0046634674072265625, 0.005825519561767578, 0.006987571716308594, 0.00814962387084961, 0.009311676025390625, 0.01047372817993164, 0.011635780334472656, 0.012797832489013672, 0.013959884643554688, 0.015121936798095703, 0.01628398895263672, 0.017446041107177734, 0.01860809326171875, 0.019770145416259766, 0.02093219757080078, 0.022094249725341797, 0.023256301879882812, 0.024418354034423828, 0.025580406188964844, 0.02674245834350586, 0.027904510498046875, 0.02906656265258789, 0.030228614807128906, 0.03139066696166992, 0.03255271911621094, 0.03371477127075195, 0.03487682342529297, 0.036038875579833984, 0.037200927734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 5.0, 14.0, 23.0, 41.0, 50.0, 72.0, 148.0, 271.0, 591.0, 1369.0, 3744.0, 12517.0, 55023.0, 572250.0, 3386271.0, 128856.0, 22979.0, 6105.0, 2153.0, 908.0, 402.0, 190.0, 105.0, 68.0, 39.0, 28.0, 15.0, 8.0, 10.0, 5.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263427734375, -0.2549896240234375, -0.246551513671875, -0.2381134033203125, -0.22967529296875, -0.2212371826171875, -0.212799072265625, -0.2043609619140625, -0.1959228515625, -0.1874847412109375, -0.179046630859375, -0.1706085205078125, -0.16217041015625, -0.1537322998046875, -0.145294189453125, -0.1368560791015625, -0.12841796875, -0.1199798583984375, -0.111541748046875, -0.1031036376953125, -0.09466552734375, -0.0862274169921875, -0.077789306640625, -0.0693511962890625, -0.0609130859375, -0.0524749755859375, -0.044036865234375, -0.0355987548828125, -0.02716064453125, -0.0187225341796875, -0.010284423828125, -0.0018463134765625, 0.006591796875, 0.0150299072265625, 0.023468017578125, 0.0319061279296875, 0.04034423828125, 0.0487823486328125, 0.057220458984375, 0.0656585693359375, 0.0740966796875, 0.0825347900390625, 0.090972900390625, 0.0994110107421875, 0.10784912109375, 0.1162872314453125, 0.124725341796875, 0.1331634521484375, 0.1416015625, 0.1500396728515625, 0.158477783203125, 0.1669158935546875, 0.17535400390625, 0.1837921142578125, 0.192230224609375, 0.2006683349609375, 0.2091064453125, 0.2175445556640625, 0.225982666015625, 0.2344207763671875, 0.24285888671875, 0.2512969970703125, 0.259735107421875, 0.2681732177734375, 0.276611328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 8.0, 9.0, 7.0, 13.0, 11.0, 15.0, 16.0, 24.0, 39.0, 67.0, 106.0, 138.0, 251.0, 541.0, 1639.0, 468.0, 231.0, 146.0, 97.0, 64.0, 46.0, 34.0, 17.0, 12.0, 11.0, 14.0, 7.0, 9.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.039337158203125, -0.038083553314208984, -0.03682994842529297, -0.03557634353637695, -0.03432273864746094, -0.03306913375854492, -0.031815528869628906, -0.03056192398071289, -0.029308319091796875, -0.02805471420288086, -0.026801109313964844, -0.025547504425048828, -0.024293899536132812, -0.023040294647216797, -0.02178668975830078, -0.020533084869384766, -0.01927947998046875, -0.018025875091552734, -0.01677227020263672, -0.015518665313720703, -0.014265060424804688, -0.013011455535888672, -0.011757850646972656, -0.01050424575805664, -0.009250640869140625, -0.00799703598022461, -0.006743431091308594, -0.005489826202392578, -0.0042362213134765625, -0.002982616424560547, -0.0017290115356445312, -0.0004754066467285156, 0.0007781982421875, 0.0020318031311035156, 0.0032854080200195312, 0.004539012908935547, 0.0057926177978515625, 0.007046222686767578, 0.008299827575683594, 0.00955343246459961, 0.010807037353515625, 0.01206064224243164, 0.013314247131347656, 0.014567852020263672, 0.015821456909179688, 0.017075061798095703, 0.01832866668701172, 0.019582271575927734, 0.02083587646484375, 0.022089481353759766, 0.02334308624267578, 0.024596691131591797, 0.025850296020507812, 0.027103900909423828, 0.028357505798339844, 0.02961111068725586, 0.030864715576171875, 0.03211832046508789, 0.033371925354003906, 0.03462553024291992, 0.03587913513183594, 0.03713274002075195, 0.03838634490966797, 0.039639949798583984, 0.0408935546875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 10.0, 92.0, 442.0, 353.0, 74.0, 15.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2886160910129547, -0.2639516294002533, -0.23928715288639069, -0.21462269127368927, -0.18995821475982666, -0.16529375314712524, -0.14062929153442383, -0.11596481502056122, -0.0913003534078598, -0.06663588434457779, -0.041971419006586075, -0.01730695366859436, 0.007357515394687653, 0.032021984457969666, 0.05668644607067108, 0.08135092258453369, 0.10601538419723511, 0.13067984580993652, 0.15534432232379913, 0.18000878393650055, 0.20467326045036316, 0.22933772206306458, 0.254002183675766, 0.2786666750907898, 0.3033311367034912, 0.3279955983161926, 0.35266005992889404, 0.37732452154159546, 0.40198901295661926, 0.4266534745693207, 0.4513179361820221, 0.4759824275970459, 0.5006468892097473, 0.5253113508224487, 0.5499758124351501, 0.5746402740478516, 0.599304735660553, 0.6239691972732544, 0.6486337184906006, 0.673298180103302, 0.6979626417160034, 0.7226271033287048, 0.7472915649414062, 0.7719560265541077, 0.7966204881668091, 0.8212850093841553, 0.8459494113922119, 0.8706139326095581, 0.8952783346176147, 0.9199427962303162, 0.9446072578430176, 0.969271719455719, 0.9939361810684204, 1.0186007022857666, 1.0432651042938232, 1.0679296255111694, 1.0925941467285156, 1.1172586679458618, 1.1419230699539185, 1.1665875911712646, 1.1912519931793213, 1.2159165143966675, 1.2405809164047241, 1.2652454376220703, 1.289909839630127]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 6.0, 4.0, 6.0, 6.0, 9.0, 7.0, 16.0, 16.0, 19.0, 21.0, 35.0, 38.0, 49.0, 47.0, 46.0, 57.0, 60.0, 68.0, 56.0, 57.0, 59.0, 63.0, 45.0, 37.0, 30.0, 36.0, 18.0, 17.0, 10.0, 13.0, 13.0, 8.0, 5.0, 5.0, 10.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.23094552755355835, -0.22420775890350342, -0.21747000515460968, -0.21073223650455475, -0.203994482755661, -0.19725671410560608, -0.19051894545555115, -0.1837811917066574, -0.17704343795776367, -0.17030566930770874, -0.163567915558815, -0.15683014690876007, -0.15009239315986633, -0.1433546245098114, -0.13661685585975647, -0.12987910211086273, -0.1231413334608078, -0.11640357226133347, -0.10966581106185913, -0.1029280424118042, -0.09619028866291046, -0.08945252001285553, -0.0827147588133812, -0.07597699761390686, -0.06923923641443253, -0.06250147521495819, -0.055763714015483856, -0.04902594909071922, -0.04228818789124489, -0.035550426691770554, -0.02881266176700592, -0.022074900567531586, -0.015337139368057251, -0.008599377237260342, -0.0018616151064634323, 0.004876147955656052, 0.011613909155130386, 0.01835167035460472, 0.025089435279369354, 0.03182719647884369, 0.038564957678318024, 0.04530271887779236, 0.05204048007726669, 0.058778245002031326, 0.06551600992679596, 0.0722537636756897, 0.07899153232574463, 0.08572929352521896, 0.0924670547246933, 0.09920481592416763, 0.10594257712364197, 0.1126803457736969, 0.11941809952259064, 0.12615586817264557, 0.1328936219215393, 0.13963139057159424, 0.14636915922164917, 0.1531069278717041, 0.15984468162059784, 0.16658245027065277, 0.1733202040195465, 0.18005797266960144, 0.18679574131965637, 0.1935334950685501, 0.20027124881744385]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 6.0, 12.0, 26.0, 20.0, 40.0, 53.0, 83.0, 101.0, 149.0, 222.0, 357.0, 505.0, 864.0, 1349.0, 2219.0, 3747.0, 7230.0, 15584.0, 39957.0, 244889.0, 621690.0, 66505.0, 21328.0, 9589.0, 4915.0, 2768.0, 1570.0, 933.0, 588.0, 396.0, 258.0, 170.0, 136.0, 85.0, 55.0, 45.0, 28.0, 15.0, 16.0, 17.0, 8.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0], "bins": [-0.222412109375, -0.21626663208007812, -0.21012115478515625, -0.20397567749023438, -0.1978302001953125, -0.19168472290039062, -0.18553924560546875, -0.17939376831054688, -0.173248291015625, -0.16710281372070312, -0.16095733642578125, -0.15481185913085938, -0.1486663818359375, -0.14252090454101562, -0.13637542724609375, -0.13022994995117188, -0.12408447265625, -0.11793899536132812, -0.11179351806640625, -0.10564804077148438, -0.0995025634765625, -0.09335708618164062, -0.08721160888671875, -0.08106613159179688, -0.074920654296875, -0.06877517700195312, -0.06262969970703125, -0.056484222412109375, -0.0503387451171875, -0.044193267822265625, -0.03804779052734375, -0.031902313232421875, -0.0257568359375, -0.019611358642578125, -0.01346588134765625, -0.007320404052734375, -0.0011749267578125, 0.004970550537109375, 0.01111602783203125, 0.017261505126953125, 0.023406982421875, 0.029552459716796875, 0.03569793701171875, 0.041843414306640625, 0.0479888916015625, 0.054134368896484375, 0.06027984619140625, 0.06642532348632812, 0.07257080078125, 0.07871627807617188, 0.08486175537109375, 0.09100723266601562, 0.0971527099609375, 0.10329818725585938, 0.10944366455078125, 0.11558914184570312, 0.121734619140625, 0.12788009643554688, 0.13402557373046875, 0.14017105102539062, 0.1463165283203125, 0.15246200561523438, 0.15860748291015625, 0.16475296020507812, 0.1708984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 7.0, 3.0, 14.0, 12.0, 10.0, 19.0, 25.0, 44.0, 85.0, 152.0, 216.0, 152.0, 92.0, 51.0, 26.0, 18.0, 13.0, 11.0, 9.0, 7.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03662109375, -0.03542137145996094, -0.034221649169921875, -0.03302192687988281, -0.03182220458984375, -0.030622482299804688, -0.029422760009765625, -0.028223037719726562, -0.0270233154296875, -0.025823593139648438, -0.024623870849609375, -0.023424148559570312, -0.02222442626953125, -0.021024703979492188, -0.019824981689453125, -0.018625259399414062, -0.017425537109375, -0.016225814819335938, -0.015026092529296875, -0.013826370239257812, -0.01262664794921875, -0.011426925659179688, -0.010227203369140625, -0.009027481079101562, -0.0078277587890625, -0.0066280364990234375, -0.005428314208984375, -0.0042285919189453125, -0.00302886962890625, -0.0018291473388671875, -0.000629425048828125, 0.0005702972412109375, 0.00177001953125, 0.0029697418212890625, 0.004169464111328125, 0.0053691864013671875, 0.00656890869140625, 0.0077686309814453125, 0.008968353271484375, 0.010168075561523438, 0.0113677978515625, 0.012567520141601562, 0.013767242431640625, 0.014966964721679688, 0.01616668701171875, 0.017366409301757812, 0.018566131591796875, 0.019765853881835938, 0.020965576171875, 0.022165298461914062, 0.023365020751953125, 0.024564743041992188, 0.02576446533203125, 0.026964187622070312, 0.028163909912109375, 0.029363632202148438, 0.0305633544921875, 0.03176307678222656, 0.032962799072265625, 0.03416252136230469, 0.03536224365234375, 0.03656196594238281, 0.037761688232421875, 0.03896141052246094, 0.0401611328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 4.0, 6.0, 6.0, 7.0, 13.0, 8.0, 8.0, 19.0, 25.0, 48.0, 52.0, 87.0, 138.0, 244.0, 357.0, 637.0, 1200.0, 2476.0, 5943.0, 15279.0, 46885.0, 185956.0, 521220.0, 194403.0, 47503.0, 15079.0, 5696.0, 2447.0, 1198.0, 655.0, 317.0, 215.0, 152.0, 78.0, 55.0, 42.0, 36.0, 22.0, 11.0, 11.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12445068359375, -0.12062358856201172, -0.11679649353027344, -0.11296939849853516, -0.10914230346679688, -0.1053152084350586, -0.10148811340332031, -0.09766101837158203, -0.09383392333984375, -0.09000682830810547, -0.08617973327636719, -0.0823526382446289, -0.07852554321289062, -0.07469844818115234, -0.07087135314941406, -0.06704425811767578, -0.0632171630859375, -0.05939006805419922, -0.05556297302246094, -0.051735877990722656, -0.047908782958984375, -0.044081687927246094, -0.04025459289550781, -0.03642749786376953, -0.03260040283203125, -0.02877330780029297, -0.024946212768554688, -0.021119117736816406, -0.017292022705078125, -0.013464927673339844, -0.009637832641601562, -0.005810737609863281, -0.001983642578125, 0.0018434524536132812, 0.0056705474853515625, 0.009497642517089844, 0.013324737548828125, 0.017151832580566406, 0.020978927612304688, 0.02480602264404297, 0.02863311767578125, 0.03246021270751953, 0.03628730773925781, 0.040114402770996094, 0.043941497802734375, 0.047768592834472656, 0.05159568786621094, 0.05542278289794922, 0.0592498779296875, 0.06307697296142578, 0.06690406799316406, 0.07073116302490234, 0.07455825805664062, 0.0783853530883789, 0.08221244812011719, 0.08603954315185547, 0.08986663818359375, 0.09369373321533203, 0.09752082824707031, 0.1013479232788086, 0.10517501831054688, 0.10900211334228516, 0.11282920837402344, 0.11665630340576172, 0.1204833984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 7.0, 2.0, 6.0, 4.0, 7.0, 12.0, 12.0, 13.0, 26.0, 20.0, 29.0, 27.0, 21.0, 31.0, 43.0, 25.0, 52.0, 48.0, 49.0, 38.0, 43.0, 44.0, 56.0, 49.0, 41.0, 27.0, 42.0, 31.0, 29.0, 26.0, 25.0, 24.0, 18.0, 10.0, 8.0, 11.0, 10.0, 10.0, 7.0, 7.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0965576171875, -0.09331607818603516, -0.09007453918457031, -0.08683300018310547, -0.08359146118164062, -0.08034992218017578, -0.07710838317871094, -0.0738668441772461, -0.07062530517578125, -0.0673837661743164, -0.06414222717285156, -0.06090068817138672, -0.057659149169921875, -0.05441761016845703, -0.05117607116699219, -0.047934532165527344, -0.0446929931640625, -0.041451454162597656, -0.03820991516113281, -0.03496837615966797, -0.031726837158203125, -0.02848529815673828, -0.025243759155273438, -0.022002220153808594, -0.01876068115234375, -0.015519142150878906, -0.012277603149414062, -0.009036064147949219, -0.005794525146484375, -0.0025529861450195312, 0.0006885528564453125, 0.003930091857910156, 0.007171630859375, 0.010413169860839844, 0.013654708862304688, 0.01689624786376953, 0.020137786865234375, 0.02337932586669922, 0.026620864868164062, 0.029862403869628906, 0.03310394287109375, 0.036345481872558594, 0.03958702087402344, 0.04282855987548828, 0.046070098876953125, 0.04931163787841797, 0.05255317687988281, 0.055794715881347656, 0.0590362548828125, 0.062277793884277344, 0.06551933288574219, 0.06876087188720703, 0.07200241088867188, 0.07524394989013672, 0.07848548889160156, 0.0817270278930664, 0.08496856689453125, 0.0882101058959961, 0.09145164489746094, 0.09469318389892578, 0.09793472290039062, 0.10117626190185547, 0.10441780090332031, 0.10765933990478516, 0.11090087890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 8.0, 16.0, 15.0, 26.0, 41.0, 59.0, 95.0, 117.0, 184.0, 333.0, 660.0, 1173.0, 2511.0, 6280.0, 20072.0, 97445.0, 564946.0, 290576.0, 44609.0, 11459.0, 3992.0, 1817.0, 861.0, 477.0, 277.0, 176.0, 101.0, 70.0, 47.0, 31.0, 21.0, 15.0, 10.0, 7.0, 4.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.1287059783935547, -0.12423324584960938, -0.11976051330566406, -0.11528778076171875, -0.11081504821777344, -0.10634231567382812, -0.10186958312988281, -0.0973968505859375, -0.09292411804199219, -0.08845138549804688, -0.08397865295410156, -0.07950592041015625, -0.07503318786621094, -0.07056045532226562, -0.06608772277832031, -0.061614990234375, -0.05714225769042969, -0.052669525146484375, -0.04819679260253906, -0.04372406005859375, -0.03925132751464844, -0.034778594970703125, -0.030305862426757812, -0.0258331298828125, -0.021360397338867188, -0.016887664794921875, -0.012414932250976562, -0.00794219970703125, -0.0034694671630859375, 0.001003265380859375, 0.0054759979248046875, 0.00994873046875, 0.014421463012695312, 0.018894195556640625, 0.023366928100585938, 0.02783966064453125, 0.03231239318847656, 0.036785125732421875, 0.04125785827636719, 0.0457305908203125, 0.05020332336425781, 0.054676055908203125, 0.05914878845214844, 0.06362152099609375, 0.06809425354003906, 0.07256698608398438, 0.07703971862792969, 0.081512451171875, 0.08598518371582031, 0.09045791625976562, 0.09493064880371094, 0.09940338134765625, 0.10387611389160156, 0.10834884643554688, 0.11282157897949219, 0.1172943115234375, 0.12176704406738281, 0.12623977661132812, 0.13071250915527344, 0.13518524169921875, 0.13965797424316406, 0.14413070678710938, 0.1486034393310547, 0.153076171875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 3.0, 11.0, 25.0, 23.0, 32.0, 40.0, 47.0, 67.0, 84.0, 88.0, 107.0, 107.0, 92.0, 59.0, 60.0, 54.0, 23.0, 28.0, 22.0, 10.0, 9.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8715858459472656e-05, -1.7663463950157166e-05, -1.6611069440841675e-05, -1.5558674931526184e-05, -1.4506280422210693e-05, -1.3453885912895203e-05, -1.2401491403579712e-05, -1.1349096894264221e-05, -1.029670238494873e-05, -9.24430787563324e-06, -8.191913366317749e-06, -7.139518857002258e-06, -6.087124347686768e-06, -5.034729838371277e-06, -3.982335329055786e-06, -2.9299408197402954e-06, -1.8775463104248047e-06, -8.25151801109314e-07, 2.2724270820617676e-07, 1.2796372175216675e-06, 2.332031726837158e-06, 3.384426236152649e-06, 4.43682074546814e-06, 5.48921525478363e-06, 6.541609764099121e-06, 7.594004273414612e-06, 8.646398782730103e-06, 9.698793292045593e-06, 1.0751187801361084e-05, 1.1803582310676575e-05, 1.2855976819992065e-05, 1.3908371329307556e-05, 1.4960765838623047e-05, 1.6013160347938538e-05, 1.706555485725403e-05, 1.811794936656952e-05, 1.917034387588501e-05, 2.02227383852005e-05, 2.127513289451599e-05, 2.2327527403831482e-05, 2.3379921913146973e-05, 2.4432316422462463e-05, 2.5484710931777954e-05, 2.6537105441093445e-05, 2.7589499950408936e-05, 2.8641894459724426e-05, 2.9694288969039917e-05, 3.074668347835541e-05, 3.17990779876709e-05, 3.285147249698639e-05, 3.390386700630188e-05, 3.495626151561737e-05, 3.600865602493286e-05, 3.706105053424835e-05, 3.811344504356384e-05, 3.9165839552879333e-05, 4.0218234062194824e-05, 4.1270628571510315e-05, 4.2323023080825806e-05, 4.3375417590141296e-05, 4.442781209945679e-05, 4.548020660877228e-05, 4.653260111808777e-05, 4.758499562740326e-05, 4.863739013671875e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 8.0, 10.0, 16.0, 19.0, 32.0, 46.0, 61.0, 78.0, 142.0, 230.0, 353.0, 630.0, 1141.0, 2224.0, 4822.0, 11893.0, 36418.0, 153478.0, 509231.0, 245839.0, 54062.0, 16008.0, 5989.0, 2661.0, 1324.0, 704.0, 399.0, 256.0, 135.0, 93.0, 69.0, 48.0, 31.0, 25.0, 10.0, 21.0, 12.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.1171875, -0.11380577087402344, -0.11042404174804688, -0.10704231262207031, -0.10366058349609375, -0.10027885437011719, -0.09689712524414062, -0.09351539611816406, -0.0901336669921875, -0.08675193786621094, -0.08337020874023438, -0.07998847961425781, -0.07660675048828125, -0.07322502136230469, -0.06984329223632812, -0.06646156311035156, -0.063079833984375, -0.05969810485839844, -0.056316375732421875, -0.05293464660644531, -0.04955291748046875, -0.04617118835449219, -0.042789459228515625, -0.03940773010253906, -0.0360260009765625, -0.03264427185058594, -0.029262542724609375, -0.025880813598632812, -0.02249908447265625, -0.019117355346679688, -0.015735626220703125, -0.012353897094726562, -0.00897216796875, -0.0055904388427734375, -0.002208709716796875, 0.0011730194091796875, 0.00455474853515625, 0.007936477661132812, 0.011318206787109375, 0.014699935913085938, 0.0180816650390625, 0.021463394165039062, 0.024845123291015625, 0.028226852416992188, 0.03160858154296875, 0.03499031066894531, 0.038372039794921875, 0.04175376892089844, 0.045135498046875, 0.04851722717285156, 0.051898956298828125, 0.05528068542480469, 0.05866241455078125, 0.06204414367675781, 0.06542587280273438, 0.06880760192871094, 0.0721893310546875, 0.07557106018066406, 0.07895278930664062, 0.08233451843261719, 0.08571624755859375, 0.08909797668457031, 0.09247970581054688, 0.09586143493652344, 0.0992431640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 7.0, 10.0, 15.0, 22.0, 16.0, 23.0, 28.0, 30.0, 48.0, 58.0, 73.0, 74.0, 80.0, 67.0, 79.0, 55.0, 65.0, 68.0, 43.0, 27.0, 21.0, 14.0, 13.0, 10.0, 12.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08795166015625, -0.08558177947998047, -0.08321189880371094, -0.0808420181274414, -0.07847213745117188, -0.07610225677490234, -0.07373237609863281, -0.07136249542236328, -0.06899261474609375, -0.06662273406982422, -0.06425285339355469, -0.061882972717285156, -0.059513092041015625, -0.057143211364746094, -0.05477333068847656, -0.05240345001220703, -0.0500335693359375, -0.04766368865966797, -0.04529380798339844, -0.042923927307128906, -0.040554046630859375, -0.038184165954589844, -0.03581428527832031, -0.03344440460205078, -0.03107452392578125, -0.02870464324951172, -0.026334762573242188, -0.023964881896972656, -0.021595001220703125, -0.019225120544433594, -0.016855239868164062, -0.014485359191894531, -0.012115478515625, -0.009745597839355469, -0.0073757171630859375, -0.005005836486816406, -0.002635955810546875, -0.00026607513427734375, 0.0021038055419921875, 0.004473686218261719, 0.00684356689453125, 0.009213447570800781, 0.011583328247070312, 0.013953208923339844, 0.016323089599609375, 0.018692970275878906, 0.021062850952148438, 0.02343273162841797, 0.0258026123046875, 0.02817249298095703, 0.030542373657226562, 0.032912254333496094, 0.035282135009765625, 0.037652015686035156, 0.04002189636230469, 0.04239177703857422, 0.04476165771484375, 0.04713153839111328, 0.04950141906738281, 0.051871299743652344, 0.054241180419921875, 0.056611061096191406, 0.05898094177246094, 0.06135082244873047, 0.063720703125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 11.0, 92.0, 785.0, 112.0, 13.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.077866554260254, -0.9116312861442566, -0.7453960180282593, -0.579160749912262, -0.41292548179626465, -0.24669021368026733, -0.08045494556427002, 0.08578038215637207, 0.2520155906677246, 0.4182508587837219, 0.5844861268997192, 0.7507213950157166, 0.9169566631317139, 1.0831918716430664, 1.2494271993637085, 1.4156625270843506, 1.5818977355957031, 1.7481329441070557, 1.9143682718276978, 2.08060359954834, 2.2468388080596924, 2.413074016571045, 2.5793094635009766, 2.745544672012329, 2.9117798805236816, 3.078015089035034, 3.2442502975463867, 3.4104857444763184, 3.576720952987671, 3.7429561614990234, 3.909191608428955, 4.075427055358887, 4.24166202545166, 4.407897472381592, 4.574132442474365, 4.740367889404297, 4.90660285949707, 5.072838306427002, 5.239073753356934, 5.405308723449707, 5.571544170379639, 5.73777961730957, 5.904014587402344, 6.070250034332275, 6.236485481262207, 6.4027204513549805, 6.568955898284912, 6.735191345214844, 6.901426315307617, 7.067661762237549, 7.233896732330322, 7.400132179260254, 7.566367149353027, 7.732602596282959, 7.898838043212891, 8.065073013305664, 8.231307983398438, 8.397542953491211, 8.5637788772583, 8.730013847351074, 8.896248817443848, 9.062484741210938, 9.228719711303711, 9.394954681396484, 9.561190605163574]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 10.0, 4.0, 6.0, 8.0, 16.0, 12.0, 19.0, 23.0, 37.0, 69.0, 52.0, 65.0, 75.0, 71.0, 83.0, 83.0, 71.0, 63.0, 48.0, 49.0, 20.0, 15.0, 17.0, 10.0, 17.0, 9.0, 8.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1898272037506104, -1.1554876565933228, -1.1211482286453247, -1.086808681488037, -1.052469253540039, -1.0181297063827515, -0.9837902188301086, -0.9494507312774658, -0.915111243724823, -0.8807717561721802, -0.8464322686195374, -0.8120927810668945, -0.7777532339096069, -0.7434138059616089, -0.7090742588043213, -0.6747347712516785, -0.6403952836990356, -0.6060557961463928, -0.57171630859375, -0.5373768210411072, -0.5030373334884644, -0.46869781613349915, -0.43435829877853394, -0.4000188112258911, -0.3656793236732483, -0.33133983612060547, -0.29700034856796265, -0.26266083121299744, -0.22832134366035461, -0.1939818561077118, -0.15964235365390778, -0.12530285120010376, -0.09096336364746094, -0.05662386864423752, -0.0222843736410141, 0.01205512136220932, 0.04639461636543274, 0.08073410391807556, 0.11507360637187958, 0.1494131088256836, 0.18375259637832642, 0.21809208393096924, 0.25243157148361206, 0.28677108883857727, 0.3211105763912201, 0.3554500639438629, 0.3897895812988281, 0.42412906885147095, 0.45846855640411377, 0.4928080439567566, 0.5271475315093994, 0.5614870190620422, 0.5958265066146851, 0.6301660537719727, 0.6645055413246155, 0.6988450288772583, 0.7331845164299011, 0.767524003982544, 0.8018634915351868, 0.8362029790878296, 0.8705425262451172, 0.9048819541931152, 0.9392215013504028, 0.9735609889030457, 1.0079004764556885]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 16.0, 11.0, 18.0, 28.0, 30.0, 27.0, 65.0, 79.0, 106.0, 139.0, 200.0, 333.0, 436.0, 660.0, 1059.0, 1706.0, 3092.0, 6029.0, 13899.0, 46188.0, 878554.0, 3159404.0, 52098.0, 14899.0, 6340.0, 3187.0, 1788.0, 1147.0, 737.0, 512.0, 357.0, 246.0, 205.0, 150.0, 112.0, 78.0, 69.0, 47.0, 52.0, 40.0, 28.0, 28.0, 23.0, 15.0, 14.0, 4.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.3525390625, -0.3408050537109375, -0.329071044921875, -0.3173370361328125, -0.30560302734375, -0.2938690185546875, -0.282135009765625, -0.2704010009765625, -0.2586669921875, -0.2469329833984375, -0.235198974609375, -0.2234649658203125, -0.21173095703125, -0.1999969482421875, -0.188262939453125, -0.1765289306640625, -0.164794921875, -0.1530609130859375, -0.141326904296875, -0.1295928955078125, -0.11785888671875, -0.1061248779296875, -0.094390869140625, -0.0826568603515625, -0.0709228515625, -0.0591888427734375, -0.047454833984375, -0.0357208251953125, -0.02398681640625, -0.0122528076171875, -0.000518798828125, 0.0112152099609375, 0.02294921875, 0.0346832275390625, 0.046417236328125, 0.0581512451171875, 0.06988525390625, 0.0816192626953125, 0.093353271484375, 0.1050872802734375, 0.1168212890625, 0.1285552978515625, 0.140289306640625, 0.1520233154296875, 0.16375732421875, 0.1754913330078125, 0.187225341796875, 0.1989593505859375, 0.210693359375, 0.2224273681640625, 0.234161376953125, 0.2458953857421875, 0.25762939453125, 0.2693634033203125, 0.281097412109375, 0.2928314208984375, 0.3045654296875, 0.3162994384765625, 0.328033447265625, 0.3397674560546875, 0.35150146484375, 0.3632354736328125, 0.374969482421875, 0.3867034912109375, 0.3984375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 8.0, 5.0, 3.0, 6.0, 2.0, 6.0, 14.0, 12.0, 22.0, 31.0, 44.0, 65.0, 110.0, 161.0, 133.0, 117.0, 94.0, 47.0, 38.0, 27.0, 13.0, 11.0, 7.0, 3.0, 2.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.034088134765625, -0.032959938049316406, -0.03183174133300781, -0.03070354461669922, -0.029575347900390625, -0.02844715118408203, -0.027318954467773438, -0.026190757751464844, -0.02506256103515625, -0.023934364318847656, -0.022806167602539062, -0.02167797088623047, -0.020549774169921875, -0.01942157745361328, -0.018293380737304688, -0.017165184020996094, -0.0160369873046875, -0.014908790588378906, -0.013780593872070312, -0.012652397155761719, -0.011524200439453125, -0.010396003723144531, -0.009267807006835938, -0.008139610290527344, -0.00701141357421875, -0.005883216857910156, -0.0047550201416015625, -0.0036268234252929688, -0.002498626708984375, -0.0013704299926757812, -0.0002422332763671875, 0.0008859634399414062, 0.00201416015625, 0.0031423568725585938, 0.0042705535888671875, 0.005398750305175781, 0.006526947021484375, 0.007655143737792969, 0.008783340454101562, 0.009911537170410156, 0.01103973388671875, 0.012167930603027344, 0.013296127319335938, 0.014424324035644531, 0.015552520751953125, 0.01668071746826172, 0.017808914184570312, 0.018937110900878906, 0.0200653076171875, 0.021193504333496094, 0.022321701049804688, 0.02344989776611328, 0.024578094482421875, 0.02570629119873047, 0.026834487915039062, 0.027962684631347656, 0.02909088134765625, 0.030219078063964844, 0.03134727478027344, 0.03247547149658203, 0.033603668212890625, 0.03473186492919922, 0.03586006164550781, 0.036988258361816406, 0.038116455078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 8.0, 16.0, 12.0, 27.0, 66.0, 133.0, 344.0, 1361.0, 10417.0, 321676.0, 3829569.0, 26984.0, 2699.0, 571.0, 181.0, 87.0, 39.0, 25.0, 20.0, 12.0, 8.0, 1.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.8121795654296875, -0.788421630859375, -0.7646636962890625, -0.74090576171875, -0.7171478271484375, -0.693389892578125, -0.6696319580078125, -0.6458740234375, -0.6221160888671875, -0.598358154296875, -0.5746002197265625, -0.55084228515625, -0.5270843505859375, -0.503326416015625, -0.4795684814453125, -0.455810546875, -0.4320526123046875, -0.408294677734375, -0.3845367431640625, -0.36077880859375, -0.3370208740234375, -0.313262939453125, -0.2895050048828125, -0.2657470703125, -0.2419891357421875, -0.218231201171875, -0.1944732666015625, -0.17071533203125, -0.1469573974609375, -0.123199462890625, -0.0994415283203125, -0.07568359375, -0.0519256591796875, -0.028167724609375, -0.0044097900390625, 0.01934814453125, 0.0431060791015625, 0.066864013671875, 0.0906219482421875, 0.1143798828125, 0.1381378173828125, 0.161895751953125, 0.1856536865234375, 0.20941162109375, 0.2331695556640625, 0.256927490234375, 0.2806854248046875, 0.304443359375, 0.3282012939453125, 0.351959228515625, 0.3757171630859375, 0.39947509765625, 0.4232330322265625, 0.446990966796875, 0.4707489013671875, 0.4945068359375, 0.5182647705078125, 0.542022705078125, 0.5657806396484375, 0.58953857421875, 0.6132965087890625, 0.637054443359375, 0.6608123779296875, 0.6845703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 6.0, 11.0, 10.0, 22.0, 28.0, 49.0, 69.0, 113.0, 276.0, 683.0, 1950.0, 410.0, 193.0, 89.0, 50.0, 37.0, 20.0, 16.0, 12.0, 5.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0684814453125, -0.06629371643066406, -0.06410598754882812, -0.06191825866699219, -0.05973052978515625, -0.05754280090332031, -0.055355072021484375, -0.05316734313964844, -0.0509796142578125, -0.04879188537597656, -0.046604156494140625, -0.04441642761230469, -0.04222869873046875, -0.04004096984863281, -0.037853240966796875, -0.03566551208496094, -0.033477783203125, -0.03129005432128906, -0.029102325439453125, -0.026914596557617188, -0.02472686767578125, -0.022539138793945312, -0.020351409912109375, -0.018163681030273438, -0.0159759521484375, -0.013788223266601562, -0.011600494384765625, -0.009412765502929688, -0.00722503662109375, -0.0050373077392578125, -0.002849578857421875, -0.0006618499755859375, 0.00152587890625, 0.0037136077880859375, 0.005901336669921875, 0.008089065551757812, 0.01027679443359375, 0.012464523315429688, 0.014652252197265625, 0.016839981079101562, 0.0190277099609375, 0.021215438842773438, 0.023403167724609375, 0.025590896606445312, 0.02777862548828125, 0.029966354370117188, 0.032154083251953125, 0.03434181213378906, 0.036529541015625, 0.03871726989746094, 0.040904998779296875, 0.04309272766113281, 0.04528045654296875, 0.04746818542480469, 0.049655914306640625, 0.05184364318847656, 0.0540313720703125, 0.05621910095214844, 0.058406829833984375, 0.06059455871582031, 0.06278228759765625, 0.06497001647949219, 0.06715774536132812, 0.06934547424316406, 0.071533203125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 16.0, 19.0, 26.0, 75.0, 120.0, 136.0, 190.0, 147.0, 107.0, 67.0, 32.0, 23.0, 11.0, 4.0, 7.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3303999900817871, -0.32059523463249207, -0.31079044938087463, -0.3009856939315796, -0.29118093848228455, -0.2813761830329895, -0.27157139778137207, -0.261766642332077, -0.251961886882782, -0.24215711653232574, -0.2323523610830307, -0.22254759073257446, -0.21274283528327942, -0.20293806493282318, -0.19313329458236694, -0.1833285391330719, -0.17352375388145447, -0.16371898353099823, -0.15391422808170319, -0.14410945773124695, -0.1343047022819519, -0.12449993193149567, -0.11469516158103943, -0.10489039868116379, -0.09508563578128815, -0.0852808728814125, -0.07547610998153687, -0.06567133963108063, -0.05586657673120499, -0.046061813831329346, -0.036257047206163406, -0.026452280580997467, -0.016647517681121826, -0.006842752918601036, 0.002962011843919754, 0.012766776606440544, 0.022571541368961334, 0.032376304268836975, 0.042181070894002914, 0.051985837519168854, 0.061790600419044495, 0.07159536331892014, 0.08140012621879578, 0.09120489656925201, 0.10100965946912766, 0.1108144223690033, 0.12061919271945953, 0.13042396306991577, 0.14022871851921082, 0.15003348886966705, 0.1598382443189621, 0.16964301466941833, 0.17944777011871338, 0.18925254046916962, 0.19905731081962585, 0.2088620662689209, 0.21866683661937714, 0.22847160696983337, 0.23827636241912842, 0.24808113276958466, 0.2578859031200409, 0.26769065856933594, 0.277495414018631, 0.2873001992702484, 0.29710495471954346]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 4.0, 8.0, 10.0, 7.0, 15.0, 22.0, 21.0, 32.0, 39.0, 36.0, 43.0, 58.0, 63.0, 62.0, 70.0, 69.0, 57.0, 59.0, 57.0, 41.0, 59.0, 34.0, 28.0, 25.0, 20.0, 16.0, 7.0, 7.0, 7.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23356515169143677, -0.22616197168827057, -0.21875879168510437, -0.21135561168193817, -0.20395243167877197, -0.19654925167560577, -0.18914607167243958, -0.18174290657043457, -0.17433971166610718, -0.16693653166294098, -0.15953335165977478, -0.15213017165660858, -0.14472699165344238, -0.13732381165027618, -0.12992063164710999, -0.12251745909452438, -0.11511428654193878, -0.10771110653877258, -0.10030792653560638, -0.09290474653244019, -0.08550156652927399, -0.07809838652610779, -0.07069521397352219, -0.06329203397035599, -0.05588885396718979, -0.04848567396402359, -0.04108249396085739, -0.03367931768298149, -0.026276137679815292, -0.018872957676649094, -0.011469781398773193, -0.004066601395606995, 0.003336578607559204, 0.010739757679402828, 0.018142936751246452, 0.025546114891767502, 0.0329492948949337, 0.0403524748980999, 0.0477556511759758, 0.055158831179142, 0.0625620111823082, 0.0699651911854744, 0.0773683711886406, 0.0847715437412262, 0.0921747237443924, 0.0995779037475586, 0.10698108375072479, 0.11438426375389099, 0.12178744375705719, 0.1291906237602234, 0.1365938037633896, 0.1439969837665558, 0.15140016376972198, 0.15880334377288818, 0.1662065088748932, 0.17360970377922058, 0.18101286888122559, 0.18841604888439178, 0.19581922888755798, 0.20322240889072418, 0.21062558889389038, 0.21802876889705658, 0.22543194890022278, 0.23283511400222778, 0.24023830890655518]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 15.0, 18.0, 25.0, 31.0, 42.0, 68.0, 79.0, 138.0, 211.0, 291.0, 461.0, 811.0, 1392.0, 2460.0, 4779.0, 10877.0, 32468.0, 167038.0, 647489.0, 132026.0, 28150.0, 9604.0, 4405.0, 2279.0, 1228.0, 726.0, 454.0, 305.0, 193.0, 150.0, 96.0, 65.0, 48.0, 38.0, 26.0, 23.0, 8.0, 7.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.231201171875, -0.22307205200195312, -0.21494293212890625, -0.20681381225585938, -0.1986846923828125, -0.19055557250976562, -0.18242645263671875, -0.17429733276367188, -0.166168212890625, -0.15803909301757812, -0.14990997314453125, -0.14178085327148438, -0.1336517333984375, -0.12552261352539062, -0.11739349365234375, -0.10926437377929688, -0.10113525390625, -0.09300613403320312, -0.08487701416015625, -0.07674789428710938, -0.0686187744140625, -0.060489654541015625, -0.05236053466796875, -0.044231414794921875, -0.036102294921875, -0.027973175048828125, -0.01984405517578125, -0.011714935302734375, -0.0035858154296875, 0.004543304443359375, 0.01267242431640625, 0.020801544189453125, 0.0289306640625, 0.037059783935546875, 0.04518890380859375, 0.053318023681640625, 0.0614471435546875, 0.06957626342773438, 0.07770538330078125, 0.08583450317382812, 0.093963623046875, 0.10209274291992188, 0.11022186279296875, 0.11835098266601562, 0.1264801025390625, 0.13460922241210938, 0.14273834228515625, 0.15086746215820312, 0.15899658203125, 0.16712570190429688, 0.17525482177734375, 0.18338394165039062, 0.1915130615234375, 0.19964218139648438, 0.20777130126953125, 0.21590042114257812, 0.224029541015625, 0.23215866088867188, 0.24028778076171875, 0.24841690063476562, 0.2565460205078125, 0.2646751403808594, 0.27280426025390625, 0.2809333801269531, 0.2890625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 5.0, 11.0, 13.0, 23.0, 31.0, 55.0, 78.0, 122.0, 159.0, 166.0, 115.0, 79.0, 41.0, 32.0, 19.0, 10.0, 9.0, 2.0, 2.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.038909912109375, -0.03768587112426758, -0.036461830139160156, -0.035237789154052734, -0.03401374816894531, -0.03278970718383789, -0.03156566619873047, -0.030341625213623047, -0.029117584228515625, -0.027893543243408203, -0.02666950225830078, -0.02544546127319336, -0.024221420288085938, -0.022997379302978516, -0.021773338317871094, -0.020549297332763672, -0.01932525634765625, -0.018101215362548828, -0.016877174377441406, -0.015653133392333984, -0.014429092407226562, -0.01320505142211914, -0.011981010437011719, -0.010756969451904297, -0.009532928466796875, -0.008308887481689453, -0.007084846496582031, -0.005860805511474609, -0.0046367645263671875, -0.0034127235412597656, -0.0021886825561523438, -0.0009646415710449219, 0.0002593994140625, 0.0014834403991699219, 0.0027074813842773438, 0.003931522369384766, 0.0051555633544921875, 0.006379604339599609, 0.007603645324707031, 0.008827686309814453, 0.010051727294921875, 0.011275768280029297, 0.012499809265136719, 0.01372385025024414, 0.014947891235351562, 0.016171932220458984, 0.017395973205566406, 0.018620014190673828, 0.01984405517578125, 0.021068096160888672, 0.022292137145996094, 0.023516178131103516, 0.024740219116210938, 0.02596426010131836, 0.02718830108642578, 0.028412342071533203, 0.029636383056640625, 0.030860424041748047, 0.03208446502685547, 0.03330850601196289, 0.03453254699707031, 0.035756587982177734, 0.036980628967285156, 0.03820466995239258, 0.0394287109375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 10.0, 13.0, 9.0, 16.0, 21.0, 46.0, 53.0, 79.0, 113.0, 160.0, 303.0, 529.0, 1075.0, 2992.0, 10795.0, 56439.0, 374243.0, 499517.0, 80594.0, 14917.0, 3821.0, 1325.0, 562.0, 333.0, 224.0, 107.0, 58.0, 49.0, 33.0, 29.0, 19.0, 15.0, 8.0, 11.0, 9.0, 3.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23313331604003906, -0.22420120239257812, -0.2152690887451172, -0.20633697509765625, -0.1974048614501953, -0.18847274780273438, -0.17954063415527344, -0.1706085205078125, -0.16167640686035156, -0.15274429321289062, -0.1438121795654297, -0.13488006591796875, -0.1259479522705078, -0.11701583862304688, -0.10808372497558594, -0.099151611328125, -0.09021949768066406, -0.08128738403320312, -0.07235527038574219, -0.06342315673828125, -0.05449104309082031, -0.045558929443359375, -0.03662681579589844, -0.0276947021484375, -0.018762588500976562, -0.009830474853515625, -0.0008983612060546875, 0.00803375244140625, 0.016965866088867188, 0.025897979736328125, 0.03483009338378906, 0.04376220703125, 0.05269432067871094, 0.061626434326171875, 0.07055854797363281, 0.07949066162109375, 0.08842277526855469, 0.09735488891601562, 0.10628700256347656, 0.1152191162109375, 0.12415122985839844, 0.13308334350585938, 0.1420154571533203, 0.15094757080078125, 0.1598796844482422, 0.16881179809570312, 0.17774391174316406, 0.186676025390625, 0.19560813903808594, 0.20454025268554688, 0.2134723663330078, 0.22240447998046875, 0.2313365936279297, 0.24026870727539062, 0.24920082092285156, 0.2581329345703125, 0.26706504821777344, 0.2759971618652344, 0.2849292755126953, 0.29386138916015625, 0.3027935028076172, 0.3117256164550781, 0.32065773010253906, 0.32958984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 8.0, 2.0, 10.0, 7.0, 11.0, 6.0, 12.0, 14.0, 20.0, 16.0, 28.0, 24.0, 29.0, 29.0, 35.0, 36.0, 37.0, 54.0, 52.0, 54.0, 40.0, 44.0, 48.0, 54.0, 46.0, 42.0, 39.0, 32.0, 35.0, 29.0, 19.0, 13.0, 14.0, 12.0, 9.0, 17.0, 9.0, 4.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10009765625, -0.09634971618652344, -0.09260177612304688, -0.08885383605957031, -0.08510589599609375, -0.08135795593261719, -0.07761001586914062, -0.07386207580566406, -0.0701141357421875, -0.06636619567871094, -0.06261825561523438, -0.05887031555175781, -0.05512237548828125, -0.05137443542480469, -0.047626495361328125, -0.04387855529785156, -0.040130615234375, -0.03638267517089844, -0.032634735107421875, -0.028886795043945312, -0.02513885498046875, -0.021390914916992188, -0.017642974853515625, -0.013895034790039062, -0.0101470947265625, -0.0063991546630859375, -0.002651214599609375, 0.0010967254638671875, 0.00484466552734375, 0.008592605590820312, 0.012340545654296875, 0.016088485717773438, 0.01983642578125, 0.023584365844726562, 0.027332305908203125, 0.031080245971679688, 0.03482818603515625, 0.03857612609863281, 0.042324066162109375, 0.04607200622558594, 0.0498199462890625, 0.05356788635253906, 0.057315826416015625, 0.06106376647949219, 0.06481170654296875, 0.06855964660644531, 0.07230758666992188, 0.07605552673339844, 0.079803466796875, 0.08355140686035156, 0.08729934692382812, 0.09104728698730469, 0.09479522705078125, 0.09854316711425781, 0.10229110717773438, 0.10603904724121094, 0.1097869873046875, 0.11353492736816406, 0.11728286743164062, 0.12103080749511719, 0.12477874755859375, 0.1285266876220703, 0.13227462768554688, 0.13602256774902344, 0.1397705078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 8.0, 8.0, 13.0, 12.0, 20.0, 19.0, 53.0, 67.0, 66.0, 133.0, 166.0, 222.0, 319.0, 551.0, 922.0, 1682.0, 3171.0, 6682.0, 15176.0, 37878.0, 104135.0, 296515.0, 357164.0, 138945.0, 48746.0, 19120.0, 7989.0, 3872.0, 2043.0, 1096.0, 559.0, 397.0, 239.0, 151.0, 113.0, 80.0, 52.0, 51.0, 31.0, 25.0, 16.0, 14.0, 5.0, 9.0, 7.0, 5.0, 3.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08282470703125, -0.0802469253540039, -0.07766914367675781, -0.07509136199951172, -0.07251358032226562, -0.06993579864501953, -0.06735801696777344, -0.06478023529052734, -0.06220245361328125, -0.059624671936035156, -0.05704689025878906, -0.05446910858154297, -0.051891326904296875, -0.04931354522705078, -0.04673576354980469, -0.044157981872558594, -0.0415802001953125, -0.039002418518066406, -0.03642463684082031, -0.03384685516357422, -0.031269073486328125, -0.02869129180908203, -0.026113510131835938, -0.023535728454589844, -0.02095794677734375, -0.018380165100097656, -0.015802383422851562, -0.013224601745605469, -0.010646820068359375, -0.008069038391113281, -0.0054912567138671875, -0.0029134750366210938, -0.000335693359375, 0.0022420883178710938, 0.0048198699951171875, 0.007397651672363281, 0.009975433349609375, 0.012553215026855469, 0.015130996704101562, 0.017708778381347656, 0.02028656005859375, 0.022864341735839844, 0.025442123413085938, 0.02801990509033203, 0.030597686767578125, 0.03317546844482422, 0.03575325012207031, 0.038331031799316406, 0.0409088134765625, 0.043486595153808594, 0.04606437683105469, 0.04864215850830078, 0.051219940185546875, 0.05379772186279297, 0.05637550354003906, 0.058953285217285156, 0.06153106689453125, 0.06410884857177734, 0.06668663024902344, 0.06926441192626953, 0.07184219360351562, 0.07441997528076172, 0.07699775695800781, 0.0795755386352539, 0.0821533203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 14.0, 14.0, 14.0, 24.0, 23.0, 34.0, 39.0, 37.0, 45.0, 58.0, 79.0, 73.0, 84.0, 65.0, 68.0, 52.0, 48.0, 52.0, 33.0, 29.0, 23.0, 21.0, 15.0, 15.0, 8.0, 7.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.647804260253906e-05, -3.535579890012741e-05, -3.423355519771576e-05, -3.311131149530411e-05, -3.1989067792892456e-05, -3.0866824090480804e-05, -2.9744580388069153e-05, -2.86223366856575e-05, -2.750009298324585e-05, -2.6377849280834198e-05, -2.5255605578422546e-05, -2.4133361876010895e-05, -2.3011118173599243e-05, -2.188887447118759e-05, -2.076663076877594e-05, -1.964438706636429e-05, -1.8522143363952637e-05, -1.7399899661540985e-05, -1.6277655959129333e-05, -1.5155412256717682e-05, -1.403316855430603e-05, -1.2910924851894379e-05, -1.1788681149482727e-05, -1.0666437447071075e-05, -9.544193744659424e-06, -8.421950042247772e-06, -7.299706339836121e-06, -6.177462637424469e-06, -5.055218935012817e-06, -3.932975232601166e-06, -2.810731530189514e-06, -1.6884878277778625e-06, -5.662441253662109e-07, 5.559995770454407e-07, 1.6782432794570923e-06, 2.800486981868744e-06, 3.9227306842803955e-06, 5.044974386692047e-06, 6.167218089103699e-06, 7.28946179151535e-06, 8.411705493927002e-06, 9.533949196338654e-06, 1.0656192898750305e-05, 1.1778436601161957e-05, 1.2900680303573608e-05, 1.402292400598526e-05, 1.5145167708396912e-05, 1.6267411410808563e-05, 1.7389655113220215e-05, 1.8511898815631866e-05, 1.9634142518043518e-05, 2.075638622045517e-05, 2.187862992286682e-05, 2.3000873625278473e-05, 2.4123117327690125e-05, 2.5245361030101776e-05, 2.6367604732513428e-05, 2.748984843492508e-05, 2.861209213733673e-05, 2.9734335839748383e-05, 3.0856579542160034e-05, 3.1978823244571686e-05, 3.310106694698334e-05, 3.422331064939499e-05, 3.534555435180664e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 10.0, 9.0, 11.0, 15.0, 25.0, 40.0, 46.0, 87.0, 112.0, 228.0, 416.0, 786.0, 1908.0, 5688.0, 20903.0, 105175.0, 549593.0, 296652.0, 49323.0, 11330.0, 3462.0, 1330.0, 577.0, 327.0, 176.0, 93.0, 73.0, 37.0, 27.0, 18.0, 13.0, 19.0, 12.0, 9.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.138916015625, -0.13454437255859375, -0.1301727294921875, -0.12580108642578125, -0.121429443359375, -0.11705780029296875, -0.1126861572265625, -0.10831451416015625, -0.10394287109375, -0.09957122802734375, -0.0951995849609375, -0.09082794189453125, -0.086456298828125, -0.08208465576171875, -0.0777130126953125, -0.07334136962890625, -0.0689697265625, -0.06459808349609375, -0.0602264404296875, -0.05585479736328125, -0.051483154296875, -0.04711151123046875, -0.0427398681640625, -0.03836822509765625, -0.03399658203125, -0.02962493896484375, -0.0252532958984375, -0.02088165283203125, -0.016510009765625, -0.01213836669921875, -0.0077667236328125, -0.00339508056640625, 0.0009765625, 0.00534820556640625, 0.0097198486328125, 0.01409149169921875, 0.018463134765625, 0.02283477783203125, 0.0272064208984375, 0.03157806396484375, 0.03594970703125, 0.04032135009765625, 0.0446929931640625, 0.04906463623046875, 0.053436279296875, 0.05780792236328125, 0.0621795654296875, 0.06655120849609375, 0.0709228515625, 0.07529449462890625, 0.0796661376953125, 0.08403778076171875, 0.088409423828125, 0.09278106689453125, 0.0971527099609375, 0.10152435302734375, 0.10589599609375, 0.11026763916015625, 0.1146392822265625, 0.11901092529296875, 0.123382568359375, 0.12775421142578125, 0.1321258544921875, 0.13649749755859375, 0.140869140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 6.0, 4.0, 8.0, 7.0, 10.0, 14.0, 16.0, 27.0, 28.0, 29.0, 43.0, 49.0, 55.0, 62.0, 71.0, 69.0, 66.0, 76.0, 59.0, 57.0, 48.0, 35.0, 24.0, 22.0, 18.0, 14.0, 14.0, 7.0, 13.0, 8.0, 6.0, 4.0, 6.0, 5.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.060272216796875, -0.058428287506103516, -0.05658435821533203, -0.05474042892456055, -0.05289649963378906, -0.05105257034301758, -0.049208641052246094, -0.04736471176147461, -0.045520782470703125, -0.04367685317993164, -0.041832923889160156, -0.03998899459838867, -0.03814506530761719, -0.0363011360168457, -0.03445720672607422, -0.032613277435302734, -0.03076934814453125, -0.028925418853759766, -0.02708148956298828, -0.025237560272216797, -0.023393630981445312, -0.021549701690673828, -0.019705772399902344, -0.01786184310913086, -0.016017913818359375, -0.01417398452758789, -0.012330055236816406, -0.010486125946044922, -0.008642196655273438, -0.006798267364501953, -0.004954338073730469, -0.0031104087829589844, -0.0012664794921875, 0.0005774497985839844, 0.0024213790893554688, 0.004265308380126953, 0.0061092376708984375, 0.007953166961669922, 0.009797096252441406, 0.01164102554321289, 0.013484954833984375, 0.01532888412475586, 0.017172813415527344, 0.019016742706298828, 0.020860671997070312, 0.022704601287841797, 0.02454853057861328, 0.026392459869384766, 0.02823638916015625, 0.030080318450927734, 0.03192424774169922, 0.0337681770324707, 0.03561210632324219, 0.03745603561401367, 0.039299964904785156, 0.04114389419555664, 0.042987823486328125, 0.04483175277709961, 0.046675682067871094, 0.04851961135864258, 0.05036354064941406, 0.05220746994018555, 0.05405139923095703, 0.055895328521728516, 0.0577392578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 9.0, 13.0, 27.0, 53.0, 118.0, 233.0, 238.0, 146.0, 94.0, 35.0, 14.0, 13.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8776824474334717, -1.8176438808441162, -1.7576054334640503, -1.6975668668746948, -1.6375283002853394, -1.5774898529052734, -1.517451286315918, -1.4574127197265625, -1.397374153137207, -1.3373355865478516, -1.2772971391677856, -1.2172585725784302, -1.1572200059890747, -1.0971815586090088, -1.0371429920196533, -0.9771044254302979, -0.9170659780502319, -0.8570274710655212, -0.7969889044761658, -0.7369503974914551, -0.6769118309020996, -0.6168733239173889, -0.5568348169326782, -0.49679628014564514, -0.43675774335861206, -0.376719206571579, -0.3166806697845459, -0.2566421627998352, -0.19660362601280212, -0.13656508922576904, -0.07652658224105835, -0.01648804545402527, 0.04355049133300781, 0.1035890206694603, 0.16362755000591278, 0.22366607189178467, 0.28370460867881775, 0.34374314546585083, 0.4037816524505615, 0.4638201892375946, 0.5238587260246277, 0.5838972330093384, 0.6439357995986938, 0.7039743065834045, 0.7640128135681152, 0.8240513801574707, 0.8840898871421814, 0.9441283941268921, 1.0041669607162476, 1.064205527305603, 1.124243974685669, 1.1842825412750244, 1.2443211078643799, 1.3043596744537354, 1.3643981218338013, 1.4244366884231567, 1.4844751358032227, 1.5445137023925781, 1.604552149772644, 1.6645907163619995, 1.724629282951355, 1.784667730331421, 1.8447062969207764, 1.9047448635101318, 1.9647834300994873]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 9.0, 9.0, 17.0, 17.0, 21.0, 29.0, 25.0, 45.0, 39.0, 50.0, 64.0, 75.0, 72.0, 60.0, 67.0, 58.0, 45.0, 46.0, 45.0, 39.0, 32.0, 19.0, 20.0, 19.0, 18.0, 14.0, 8.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9781767725944519, -0.9423176050186157, -0.9064583778381348, -0.8705992102622986, -0.8347400426864624, -0.7988808751106262, -0.76302170753479, -0.7271624803543091, -0.6913033127784729, -0.6554441452026367, -0.6195849180221558, -0.5837257504463196, -0.5478665828704834, -0.5120074152946472, -0.47614821791648865, -0.4402890205383301, -0.4044298529624939, -0.3685706853866577, -0.33271148800849915, -0.2968522906303406, -0.2609931230545044, -0.22513394057750702, -0.18927475810050964, -0.15341556072235107, -0.11755639314651489, -0.08169721066951752, -0.04583802819252014, -0.009978845715522766, 0.02588033676147461, 0.061739519238471985, 0.09759870171546936, 0.13345789909362793, 0.1693171262741089, 0.20517630875110626, 0.24103549122810364, 0.2768946886062622, 0.3127538561820984, 0.34861302375793457, 0.38447222113609314, 0.4203314185142517, 0.4561905860900879, 0.4920497536659241, 0.5279089212417603, 0.5637681484222412, 0.5996273159980774, 0.6354864835739136, 0.6713457107543945, 0.7072048783302307, 0.7430640459060669, 0.7789232134819031, 0.8147823810577393, 0.8506416082382202, 0.8865007758140564, 0.9223599433898926, 0.9582191705703735, 0.9940783381462097, 1.029937505722046, 1.0657967329025269, 1.1016558408737183, 1.1375150680541992, 1.1733741760253906, 1.2092334032058716, 1.2450926303863525, 1.280951738357544, 1.316810965538025]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 2.0, 1.0, 1.0, 10.0, 17.0, 11.0, 40.0, 100.0, 197.0, 571.0, 2373.0, 19596.0, 4051129.0, 112363.0, 5714.0, 1266.0, 462.0, 194.0, 111.0, 42.0, 29.0, 17.0, 14.0, 11.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.005859375, -0.9731292724609375, -0.940399169921875, -0.9076690673828125, -0.87493896484375, -0.8422088623046875, -0.809478759765625, -0.7767486572265625, -0.7440185546875, -0.7112884521484375, -0.678558349609375, -0.6458282470703125, -0.61309814453125, -0.5803680419921875, -0.547637939453125, -0.5149078369140625, -0.482177734375, -0.4494476318359375, -0.416717529296875, -0.3839874267578125, -0.35125732421875, -0.3185272216796875, -0.285797119140625, -0.2530670166015625, -0.2203369140625, -0.1876068115234375, -0.154876708984375, -0.1221466064453125, -0.08941650390625, -0.0566864013671875, -0.023956298828125, 0.0087738037109375, 0.04150390625, 0.0742340087890625, 0.106964111328125, 0.1396942138671875, 0.17242431640625, 0.2051544189453125, 0.237884521484375, 0.2706146240234375, 0.3033447265625, 0.3360748291015625, 0.368804931640625, 0.4015350341796875, 0.43426513671875, 0.4669952392578125, 0.499725341796875, 0.5324554443359375, 0.565185546875, 0.5979156494140625, 0.630645751953125, 0.6633758544921875, 0.69610595703125, 0.7288360595703125, 0.761566162109375, 0.7942962646484375, 0.8270263671875, 0.8597564697265625, 0.892486572265625, 0.9252166748046875, 0.95794677734375, 0.9906768798828125, 1.023406982421875, 1.0561370849609375, 1.0888671875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 6.0, 7.0, 18.0, 21.0, 29.0, 43.0, 67.0, 107.0, 146.0, 131.0, 130.0, 100.0, 61.0, 46.0, 31.0, 25.0, 9.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043304443359375, -0.04178476333618164, -0.04026508331298828, -0.03874540328979492, -0.03722572326660156, -0.0357060432434082, -0.034186363220214844, -0.032666683197021484, -0.031147003173828125, -0.029627323150634766, -0.028107643127441406, -0.026587963104248047, -0.025068283081054688, -0.023548603057861328, -0.02202892303466797, -0.02050924301147461, -0.01898956298828125, -0.01746988296508789, -0.01595020294189453, -0.014430522918701172, -0.012910842895507812, -0.011391162872314453, -0.009871482849121094, -0.008351802825927734, -0.006832122802734375, -0.005312442779541016, -0.0037927627563476562, -0.002273082733154297, -0.0007534027099609375, 0.0007662773132324219, 0.0022859573364257812, 0.0038056373596191406, 0.0053253173828125, 0.006844997406005859, 0.008364677429199219, 0.009884357452392578, 0.011404037475585938, 0.012923717498779297, 0.014443397521972656, 0.015963077545166016, 0.017482757568359375, 0.019002437591552734, 0.020522117614746094, 0.022041797637939453, 0.023561477661132812, 0.025081157684326172, 0.02660083770751953, 0.02812051773071289, 0.02964019775390625, 0.03115987777709961, 0.03267955780029297, 0.03419923782348633, 0.03571891784667969, 0.03723859786987305, 0.038758277893066406, 0.040277957916259766, 0.041797637939453125, 0.043317317962646484, 0.044836997985839844, 0.0463566780090332, 0.04787635803222656, 0.04939603805541992, 0.05091571807861328, 0.05243539810180664, 0.053955078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 2.0, 11.0, 6.0, 11.0, 25.0, 28.0, 30.0, 50.0, 79.0, 91.0, 149.0, 222.0, 449.0, 792.0, 1542.0, 3383.0, 8209.0, 22235.0, 75676.0, 472385.0, 3292128.0, 240010.0, 49947.0, 15710.0, 5909.0, 2569.0, 1174.0, 575.0, 328.0, 175.0, 112.0, 79.0, 56.0, 32.0, 31.0, 23.0, 13.0, 8.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2191162109375, -0.21164894104003906, -0.20418167114257812, -0.1967144012451172, -0.18924713134765625, -0.1817798614501953, -0.17431259155273438, -0.16684532165527344, -0.1593780517578125, -0.15191078186035156, -0.14444351196289062, -0.1369762420654297, -0.12950897216796875, -0.12204170227050781, -0.11457443237304688, -0.10710716247558594, -0.099639892578125, -0.09217262268066406, -0.08470535278320312, -0.07723808288574219, -0.06977081298828125, -0.06230354309082031, -0.054836273193359375, -0.04736900329589844, -0.0399017333984375, -0.03243446350097656, -0.024967193603515625, -0.017499923706054688, -0.01003265380859375, -0.0025653839111328125, 0.004901885986328125, 0.012369155883789062, 0.01983642578125, 0.027303695678710938, 0.034770965576171875, 0.04223823547363281, 0.04970550537109375, 0.05717277526855469, 0.06464004516601562, 0.07210731506347656, 0.0795745849609375, 0.08704185485839844, 0.09450912475585938, 0.10197639465332031, 0.10944366455078125, 0.11691093444824219, 0.12437820434570312, 0.13184547424316406, 0.139312744140625, 0.14678001403808594, 0.15424728393554688, 0.1617145538330078, 0.16918182373046875, 0.1766490936279297, 0.18411636352539062, 0.19158363342285156, 0.1990509033203125, 0.20651817321777344, 0.21398544311523438, 0.2214527130126953, 0.22891998291015625, 0.2363872528076172, 0.24385452270507812, 0.25132179260253906, 0.2587890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 8.0, 6.0, 9.0, 14.0, 24.0, 20.0, 20.0, 36.0, 44.0, 65.0, 106.0, 183.0, 405.0, 1612.0, 686.0, 292.0, 168.0, 124.0, 68.0, 52.0, 41.0, 23.0, 13.0, 10.0, 6.0, 11.0, 10.0, 1.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05889892578125, -0.056987762451171875, -0.05507659912109375, -0.053165435791015625, -0.0512542724609375, -0.049343109130859375, -0.04743194580078125, -0.045520782470703125, -0.043609619140625, -0.041698455810546875, -0.03978729248046875, -0.037876129150390625, -0.0359649658203125, -0.034053802490234375, -0.03214263916015625, -0.030231475830078125, -0.0283203125, -0.026409149169921875, -0.02449798583984375, -0.022586822509765625, -0.0206756591796875, -0.018764495849609375, -0.01685333251953125, -0.014942169189453125, -0.013031005859375, -0.011119842529296875, -0.00920867919921875, -0.007297515869140625, -0.0053863525390625, -0.003475189208984375, -0.00156402587890625, 0.000347137451171875, 0.00225830078125, 0.004169464111328125, 0.00608062744140625, 0.007991790771484375, 0.0099029541015625, 0.011814117431640625, 0.01372528076171875, 0.015636444091796875, 0.017547607421875, 0.019458770751953125, 0.02136993408203125, 0.023281097412109375, 0.0251922607421875, 0.027103424072265625, 0.02901458740234375, 0.030925750732421875, 0.0328369140625, 0.034748077392578125, 0.03665924072265625, 0.038570404052734375, 0.0404815673828125, 0.042392730712890625, 0.04430389404296875, 0.046215057373046875, 0.048126220703125, 0.050037384033203125, 0.05194854736328125, 0.053859710693359375, 0.0557708740234375, 0.057682037353515625, 0.05959320068359375, 0.061504364013671875, 0.06341552734375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 28.0, 110.0, 240.0, 350.0, 191.0, 52.0, 12.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3059757947921753, -1.2800270318984985, -1.2540782690048218, -1.228129506111145, -1.2021806240081787, -1.176231861114502, -1.1502830982208252, -1.1243343353271484, -1.0983855724334717, -1.072436809539795, -1.0464880466461182, -1.0205392837524414, -0.9945904612541199, -0.9686416387557983, -0.9426928758621216, -0.9167441129684448, -0.8907953500747681, -0.8648465871810913, -0.8388977646827698, -0.812949001789093, -0.7870002388954163, -0.7610514163970947, -0.735102653503418, -0.7091538906097412, -0.6832050681114197, -0.6572563052177429, -0.6313074827194214, -0.6053587198257446, -0.5794099569320679, -0.5534611940383911, -0.5275123715400696, -0.5015636086463928, -0.47561487555503845, -0.4496660828590393, -0.42371731996536255, -0.3977685272693634, -0.37181976437568665, -0.3458709716796875, -0.31992220878601074, -0.2939734160900116, -0.26802462339401245, -0.2420758455991745, -0.21612706780433655, -0.1901782751083374, -0.16422951221466064, -0.1382807195186615, -0.11233194172382355, -0.0863831639289856, -0.06043440103530884, -0.034485623240470886, -0.008536841720342636, 0.017411939799785614, 0.043360717594623566, 0.06930950284004211, 0.09525828063488007, 0.12120705842971802, 0.14715583622455597, 0.17310461401939392, 0.19905339181423187, 0.22500216960906982, 0.25095096230506897, 0.2768997550010681, 0.3028485178947449, 0.32879728078842163, 0.3547460734844208]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 5.0, 6.0, 14.0, 13.0, 12.0, 8.0, 10.0, 14.0, 14.0, 23.0, 22.0, 27.0, 34.0, 43.0, 40.0, 37.0, 40.0, 34.0, 49.0, 41.0, 41.0, 38.0, 47.0, 43.0, 39.0, 41.0, 32.0, 27.0, 24.0, 27.0, 26.0, 22.0, 13.0, 12.0, 16.0, 9.0, 10.0, 12.0, 7.0, 3.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.21332383155822754, -0.2074023187160492, -0.20148082077503204, -0.1955593079328537, -0.18963779509067535, -0.1837162971496582, -0.17779478430747986, -0.1718732714653015, -0.16595175862312317, -0.16003024578094482, -0.15410874783992767, -0.14818723499774933, -0.14226572215557098, -0.13634422421455383, -0.1304227113723755, -0.12450119853019714, -0.11857970058917999, -0.11265819519758224, -0.1067366823554039, -0.10081517696380615, -0.09489366412162781, -0.08897215873003006, -0.08305065333843231, -0.07712914049625397, -0.07120763510465622, -0.06528612971305847, -0.05936461687088013, -0.05344311147928238, -0.04752160236239433, -0.04160009324550629, -0.03567858785390854, -0.029757078737020493, -0.023835569620132446, -0.0179140605032444, -0.011992553249001503, -0.006071045994758606, -0.0001495368778705597, 0.005771972239017487, 0.011693477630615234, 0.01761498674750328, 0.023536495864391327, 0.029458004981279373, 0.03537951409816742, 0.04130101948976517, 0.047222528606653214, 0.05314403772354126, 0.05906554311513901, 0.06498704850673676, 0.0709085613489151, 0.07683006674051285, 0.08275157958269119, 0.08867308497428894, 0.09459459781646729, 0.10051610320806503, 0.10643760859966278, 0.11235912144184113, 0.11828062683343887, 0.12420213222503662, 0.13012364506721497, 0.1360451579093933, 0.14196665585041046, 0.1478881686925888, 0.15380966663360596, 0.1597311794757843, 0.16565269231796265]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 6.0, 7.0, 14.0, 9.0, 18.0, 33.0, 56.0, 72.0, 90.0, 194.0, 331.0, 538.0, 1023.0, 2051.0, 5323.0, 20280.0, 130314.0, 668951.0, 182309.0, 25615.0, 6500.0, 2320.0, 1033.0, 595.0, 336.0, 202.0, 120.0, 78.0, 47.0, 30.0, 21.0, 10.0, 10.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.30810546875, -0.29834747314453125, -0.2885894775390625, -0.27883148193359375, -0.269073486328125, -0.25931549072265625, -0.2495574951171875, -0.23979949951171875, -0.23004150390625, -0.22028350830078125, -0.2105255126953125, -0.20076751708984375, -0.191009521484375, -0.18125152587890625, -0.1714935302734375, -0.16173553466796875, -0.1519775390625, -0.14221954345703125, -0.1324615478515625, -0.12270355224609375, -0.112945556640625, -0.10318756103515625, -0.0934295654296875, -0.08367156982421875, -0.07391357421875, -0.06415557861328125, -0.0543975830078125, -0.04463958740234375, -0.034881591796875, -0.02512359619140625, -0.0153656005859375, -0.00560760498046875, 0.004150390625, 0.01390838623046875, 0.0236663818359375, 0.03342437744140625, 0.043182373046875, 0.05294036865234375, 0.0626983642578125, 0.07245635986328125, 0.08221435546875, 0.09197235107421875, 0.1017303466796875, 0.11148834228515625, 0.121246337890625, 0.13100433349609375, 0.1407623291015625, 0.15052032470703125, 0.1602783203125, 0.17003631591796875, 0.1797943115234375, 0.18955230712890625, 0.199310302734375, 0.20906829833984375, 0.2188262939453125, 0.22858428955078125, 0.23834228515625, 0.24810028076171875, 0.2578582763671875, 0.26761627197265625, 0.277374267578125, 0.28713226318359375, 0.2968902587890625, 0.30664825439453125, 0.31640625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 13.0, 12.0, 16.0, 29.0, 41.0, 76.0, 77.0, 124.0, 142.0, 131.0, 111.0, 77.0, 55.0, 33.0, 21.0, 16.0, 15.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046661376953125, -0.04509735107421875, -0.0435333251953125, -0.04196929931640625, -0.0404052734375, -0.03884124755859375, -0.0372772216796875, -0.03571319580078125, -0.034149169921875, -0.03258514404296875, -0.0310211181640625, -0.02945709228515625, -0.02789306640625, -0.02632904052734375, -0.0247650146484375, -0.02320098876953125, -0.021636962890625, -0.02007293701171875, -0.0185089111328125, -0.01694488525390625, -0.015380859375, -0.01381683349609375, -0.0122528076171875, -0.01068878173828125, -0.009124755859375, -0.00756072998046875, -0.0059967041015625, -0.00443267822265625, -0.00286865234375, -0.00130462646484375, 0.0002593994140625, 0.00182342529296875, 0.003387451171875, 0.00495147705078125, 0.0065155029296875, 0.00807952880859375, 0.0096435546875, 0.01120758056640625, 0.0127716064453125, 0.01433563232421875, 0.015899658203125, 0.01746368408203125, 0.0190277099609375, 0.02059173583984375, 0.02215576171875, 0.02371978759765625, 0.0252838134765625, 0.02684783935546875, 0.028411865234375, 0.02997589111328125, 0.0315399169921875, 0.03310394287109375, 0.03466796875, 0.03623199462890625, 0.0377960205078125, 0.03936004638671875, 0.040924072265625, 0.04248809814453125, 0.0440521240234375, 0.04561614990234375, 0.04718017578125, 0.04874420166015625, 0.0503082275390625, 0.05187225341796875, 0.053436279296875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 6.0, 11.0, 15.0, 28.0, 31.0, 51.0, 65.0, 106.0, 160.0, 243.0, 395.0, 762.0, 1477.0, 3788.0, 11812.0, 48578.0, 243873.0, 544025.0, 148607.0, 30664.0, 8222.0, 2896.0, 1174.0, 589.0, 332.0, 205.0, 138.0, 99.0, 55.0, 42.0, 31.0, 21.0, 8.0, 9.0, 7.0, 8.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.26239585876464844, -0.2542839050292969, -0.2461719512939453, -0.23805999755859375, -0.2299480438232422, -0.22183609008789062, -0.21372413635253906, -0.2056121826171875, -0.19750022888183594, -0.18938827514648438, -0.1812763214111328, -0.17316436767578125, -0.1650524139404297, -0.15694046020507812, -0.14882850646972656, -0.140716552734375, -0.13260459899902344, -0.12449264526367188, -0.11638069152832031, -0.10826873779296875, -0.10015678405761719, -0.09204483032226562, -0.08393287658691406, -0.0758209228515625, -0.06770896911621094, -0.059597015380859375, -0.05148506164550781, -0.04337310791015625, -0.03526115417480469, -0.027149200439453125, -0.019037246704101562, -0.01092529296875, -0.0028133392333984375, 0.005298614501953125, 0.013410568237304688, 0.02152252197265625, 0.029634475708007812, 0.037746429443359375, 0.04585838317871094, 0.0539703369140625, 0.06208229064941406, 0.07019424438476562, 0.07830619812011719, 0.08641815185546875, 0.09453010559082031, 0.10264205932617188, 0.11075401306152344, 0.118865966796875, 0.12697792053222656, 0.13508987426757812, 0.1432018280029297, 0.15131378173828125, 0.1594257354736328, 0.16753768920898438, 0.17564964294433594, 0.1837615966796875, 0.19187355041503906, 0.19998550415039062, 0.2080974578857422, 0.21620941162109375, 0.2243213653564453, 0.23243331909179688, 0.24054527282714844, 0.2486572265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 6.0, 9.0, 10.0, 14.0, 11.0, 15.0, 25.0, 32.0, 44.0, 37.0, 41.0, 44.0, 43.0, 40.0, 53.0, 49.0, 47.0, 52.0, 57.0, 65.0, 62.0, 34.0, 34.0, 30.0, 34.0, 23.0, 21.0, 15.0, 7.0, 6.0, 6.0, 5.0, 6.0, 4.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1922607421875, -0.18689727783203125, -0.1815338134765625, -0.17617034912109375, -0.170806884765625, -0.16544342041015625, -0.1600799560546875, -0.15471649169921875, -0.14935302734375, -0.14398956298828125, -0.1386260986328125, -0.13326263427734375, -0.127899169921875, -0.12253570556640625, -0.1171722412109375, -0.11180877685546875, -0.1064453125, -0.10108184814453125, -0.0957183837890625, -0.09035491943359375, -0.084991455078125, -0.07962799072265625, -0.0742645263671875, -0.06890106201171875, -0.06353759765625, -0.05817413330078125, -0.0528106689453125, -0.04744720458984375, -0.042083740234375, -0.03672027587890625, -0.0313568115234375, -0.02599334716796875, -0.0206298828125, -0.01526641845703125, -0.0099029541015625, -0.00453948974609375, 0.000823974609375, 0.00618743896484375, 0.0115509033203125, 0.01691436767578125, 0.02227783203125, 0.02764129638671875, 0.0330047607421875, 0.03836822509765625, 0.043731689453125, 0.04909515380859375, 0.0544586181640625, 0.05982208251953125, 0.065185546875, 0.07054901123046875, 0.0759124755859375, 0.08127593994140625, 0.086639404296875, 0.09200286865234375, 0.0973663330078125, 0.10272979736328125, 0.10809326171875, 0.11345672607421875, 0.1188201904296875, 0.12418365478515625, 0.129547119140625, 0.13491058349609375, 0.1402740478515625, 0.14563751220703125, 0.1510009765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 6.0, 5.0, 7.0, 10.0, 17.0, 26.0, 19.0, 37.0, 64.0, 62.0, 105.0, 191.0, 284.0, 449.0, 764.0, 1272.0, 2338.0, 4503.0, 9137.0, 20748.0, 53760.0, 166049.0, 426245.0, 238070.0, 73182.0, 27402.0, 11625.0, 5471.0, 2789.0, 1558.0, 877.0, 534.0, 314.0, 211.0, 124.0, 81.0, 66.0, 44.0, 24.0, 20.0, 18.0, 18.0, 8.0, 9.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.09466552734375, -0.09185218811035156, -0.08903884887695312, -0.08622550964355469, -0.08341217041015625, -0.08059883117675781, -0.07778549194335938, -0.07497215270996094, -0.0721588134765625, -0.06934547424316406, -0.06653213500976562, -0.06371879577636719, -0.06090545654296875, -0.05809211730957031, -0.055278778076171875, -0.05246543884277344, -0.049652099609375, -0.04683876037597656, -0.044025421142578125, -0.04121208190917969, -0.03839874267578125, -0.03558540344238281, -0.032772064208984375, -0.029958724975585938, -0.0271453857421875, -0.024332046508789062, -0.021518707275390625, -0.018705368041992188, -0.01589202880859375, -0.013078689575195312, -0.010265350341796875, -0.0074520111083984375, -0.004638671875, -0.0018253326416015625, 0.000988006591796875, 0.0038013458251953125, 0.00661468505859375, 0.009428024291992188, 0.012241363525390625, 0.015054702758789062, 0.0178680419921875, 0.020681381225585938, 0.023494720458984375, 0.026308059692382812, 0.02912139892578125, 0.03193473815917969, 0.034748077392578125, 0.03756141662597656, 0.040374755859375, 0.04318809509277344, 0.046001434326171875, 0.04881477355957031, 0.05162811279296875, 0.05444145202636719, 0.057254791259765625, 0.06006813049316406, 0.0628814697265625, 0.06569480895996094, 0.06850814819335938, 0.07132148742675781, 0.07413482666015625, 0.07694816589355469, 0.07976150512695312, 0.08257484436035156, 0.08538818359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 14.0, 11.0, 18.0, 25.0, 36.0, 48.0, 46.0, 60.0, 61.0, 62.0, 84.0, 76.0, 65.0, 84.0, 53.0, 60.0, 38.0, 29.0, 17.0, 17.0, 22.0, 18.0, 10.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.55839729309082e-05, -3.456976264715195e-05, -3.355555236339569e-05, -3.2541342079639435e-05, -3.152713179588318e-05, -3.0512921512126923e-05, -2.9498711228370667e-05, -2.848450094461441e-05, -2.7470290660858154e-05, -2.6456080377101898e-05, -2.5441870093345642e-05, -2.4427659809589386e-05, -2.341344952583313e-05, -2.2399239242076874e-05, -2.1385028958320618e-05, -2.037081867456436e-05, -1.9356608390808105e-05, -1.834239810705185e-05, -1.7328187823295593e-05, -1.6313977539539337e-05, -1.529976725578308e-05, -1.4285556972026825e-05, -1.3271346688270569e-05, -1.2257136404514313e-05, -1.1242926120758057e-05, -1.02287158370018e-05, -9.214505553245544e-06, -8.200295269489288e-06, -7.186084985733032e-06, -6.171874701976776e-06, -5.15766441822052e-06, -4.143454134464264e-06, -3.129243850708008e-06, -2.1150335669517517e-06, -1.1008232831954956e-06, -8.66129994392395e-08, 9.275972843170166e-07, 1.9418075680732727e-06, 2.956017851829529e-06, 3.970228135585785e-06, 4.984438419342041e-06, 5.998648703098297e-06, 7.012858986854553e-06, 8.02706927061081e-06, 9.041279554367065e-06, 1.0055489838123322e-05, 1.1069700121879578e-05, 1.2083910405635834e-05, 1.309812068939209e-05, 1.4112330973148346e-05, 1.5126541256904602e-05, 1.6140751540660858e-05, 1.7154961824417114e-05, 1.816917210817337e-05, 1.9183382391929626e-05, 2.0197592675685883e-05, 2.121180295944214e-05, 2.2226013243198395e-05, 2.324022352695465e-05, 2.4254433810710907e-05, 2.5268644094467163e-05, 2.628285437822342e-05, 2.7297064661979675e-05, 2.831127494573593e-05, 2.9325485229492188e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 6.0, 16.0, 16.0, 31.0, 37.0, 54.0, 78.0, 140.0, 207.0, 390.0, 778.0, 1969.0, 6028.0, 25693.0, 166710.0, 703500.0, 114610.0, 19888.0, 5031.0, 1802.0, 726.0, 354.0, 167.0, 105.0, 74.0, 41.0, 21.0, 23.0, 13.0, 8.0, 7.0, 6.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1744384765625, -0.1687030792236328, -0.16296768188476562, -0.15723228454589844, -0.15149688720703125, -0.14576148986816406, -0.14002609252929688, -0.1342906951904297, -0.1285552978515625, -0.12281990051269531, -0.11708450317382812, -0.11134910583496094, -0.10561370849609375, -0.09987831115722656, -0.09414291381835938, -0.08840751647949219, -0.082672119140625, -0.07693672180175781, -0.07120132446289062, -0.06546592712402344, -0.05973052978515625, -0.05399513244628906, -0.048259735107421875, -0.04252433776855469, -0.0367889404296875, -0.031053543090820312, -0.025318145751953125, -0.019582748413085938, -0.01384735107421875, -0.008111953735351562, -0.002376556396484375, 0.0033588409423828125, 0.00909423828125, 0.014829635620117188, 0.020565032958984375, 0.026300430297851562, 0.03203582763671875, 0.03777122497558594, 0.043506622314453125, 0.04924201965332031, 0.0549774169921875, 0.06071281433105469, 0.06644821166992188, 0.07218360900878906, 0.07791900634765625, 0.08365440368652344, 0.08938980102539062, 0.09512519836425781, 0.100860595703125, 0.10659599304199219, 0.11233139038085938, 0.11806678771972656, 0.12380218505859375, 0.12953758239746094, 0.13527297973632812, 0.1410083770751953, 0.1467437744140625, 0.1524791717529297, 0.15821456909179688, 0.16394996643066406, 0.16968536376953125, 0.17542076110839844, 0.18115615844726562, 0.1868915557861328, 0.192626953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 3.0, 7.0, 9.0, 9.0, 7.0, 20.0, 12.0, 28.0, 29.0, 53.0, 63.0, 82.0, 92.0, 94.0, 97.0, 77.0, 49.0, 39.0, 58.0, 30.0, 34.0, 25.0, 14.0, 9.0, 8.0, 15.0, 3.0, 5.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.09930419921875, -0.0966024398803711, -0.09390068054199219, -0.09119892120361328, -0.08849716186523438, -0.08579540252685547, -0.08309364318847656, -0.08039188385009766, -0.07769012451171875, -0.07498836517333984, -0.07228660583496094, -0.06958484649658203, -0.06688308715820312, -0.06418132781982422, -0.06147956848144531, -0.058777809143066406, -0.0560760498046875, -0.053374290466308594, -0.05067253112792969, -0.04797077178955078, -0.045269012451171875, -0.04256725311279297, -0.03986549377441406, -0.037163734436035156, -0.03446197509765625, -0.031760215759277344, -0.029058456420898438, -0.02635669708251953, -0.023654937744140625, -0.02095317840576172, -0.018251419067382812, -0.015549659729003906, -0.012847900390625, -0.010146141052246094, -0.0074443817138671875, -0.004742622375488281, -0.002040863037109375, 0.0006608963012695312, 0.0033626556396484375, 0.006064414978027344, 0.00876617431640625, 0.011467933654785156, 0.014169692993164062, 0.01687145233154297, 0.019573211669921875, 0.02227497100830078, 0.024976730346679688, 0.027678489685058594, 0.0303802490234375, 0.033082008361816406, 0.03578376770019531, 0.03848552703857422, 0.041187286376953125, 0.04388904571533203, 0.04659080505371094, 0.049292564392089844, 0.05199432373046875, 0.054696083068847656, 0.05739784240722656, 0.06009960174560547, 0.06280136108398438, 0.06550312042236328, 0.06820487976074219, 0.0709066390991211, 0.0736083984375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 10.0, 10.0, 14.0, 39.0, 60.0, 121.0, 176.0, 209.0, 156.0, 95.0, 52.0, 30.0, 13.0, 11.0, 10.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4192583560943604, -1.360929012298584, -1.3025997877120972, -1.2442704439163208, -1.1859411001205444, -1.1276118755340576, -1.0692825317382812, -1.0109531879425049, -0.9526238441467285, -0.8942945599555969, -0.8359652161598206, -0.777635931968689, -0.7193065881729126, -0.660977303981781, -0.6026480197906494, -0.544318675994873, -0.48598939180374146, -0.4276600778102875, -0.3693307638168335, -0.3110014796257019, -0.25267213582992554, -0.19434285163879395, -0.13601353764533997, -0.07768422365188599, -0.019354909658432007, 0.038974400609731674, 0.09730371087789536, 0.15563301742076874, 0.21396233141422272, 0.2722916305065155, 0.3306209444999695, 0.38895025849342346, 0.44727957248687744, 0.505608856678009, 0.5639382004737854, 0.622267484664917, 0.6805968284606934, 0.738926112651825, 0.7972553968429565, 0.8555847406387329, 0.9139140844345093, 0.9722433686256409, 1.0305726528167725, 1.0889019966125488, 1.1472313404083252, 1.2055606842041016, 1.2638899087905884, 1.3222192525863647, 1.3805484771728516, 1.438877820968628, 1.4972070455551147, 1.5555363893508911, 1.6138657331466675, 1.6721949577331543, 1.7305243015289307, 1.788853645324707, 1.8471829891204834, 1.9055123329162598, 1.9638415575027466, 2.0221710205078125, 2.0805001258850098, 2.138829469680786, 2.1971588134765625, 2.255488157272339, 2.3138175010681152]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 2.0, 3.0, 8.0, 13.0, 10.0, 14.0, 10.0, 17.0, 21.0, 17.0, 26.0, 31.0, 39.0, 41.0, 43.0, 40.0, 45.0, 37.0, 44.0, 48.0, 42.0, 44.0, 45.0, 48.0, 37.0, 40.0, 36.0, 28.0, 35.0, 20.0, 21.0, 20.0, 19.0, 10.0, 13.0, 5.0, 10.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0357482433319092, -1.0045775175094604, -0.9734067916870117, -0.9422361254692078, -0.911065399646759, -0.8798946738243103, -0.8487240076065063, -0.8175532817840576, -0.7863825559616089, -0.7552118301391602, -0.7240411043167114, -0.6928704380989075, -0.6616997122764587, -0.63052898645401, -0.599358320236206, -0.5681875944137573, -0.5370168685913086, -0.5058461427688599, -0.4746754467487335, -0.4435047507286072, -0.41233402490615845, -0.3811632990837097, -0.3499926030635834, -0.31882190704345703, -0.2876511812210083, -0.25648045539855957, -0.22530975937843323, -0.1941390484571457, -0.16296833753585815, -0.13179762661457062, -0.10062691569328308, -0.06945620477199554, -0.03828549385070801, -0.007114782929420471, 0.024055927991867065, 0.0552266389131546, 0.08639734983444214, 0.11756806075572968, 0.1487387716770172, 0.17990948259830475, 0.21108019351959229, 0.24225090444087982, 0.27342161536216736, 0.3045923113822937, 0.33576303720474243, 0.36693376302719116, 0.3981044590473175, 0.42927515506744385, 0.4604458808898926, 0.4916166067123413, 0.52278733253479, 0.553957998752594, 0.5851287245750427, 0.6162994503974915, 0.6474701166152954, 0.6786408424377441, 0.7098115682601929, 0.7409822940826416, 0.7721530199050903, 0.8033236861228943, 0.834494411945343, 0.8656651377677917, 0.8968358039855957, 0.9280065298080444, 0.9591772556304932]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 9.0, 11.0, 15.0, 26.0, 38.0, 86.0, 147.0, 252.0, 597.0, 1308.0, 3464.0, 12346.0, 76736.0, 3840703.0, 226596.0, 22331.0, 5549.0, 2008.0, 893.0, 479.0, 245.0, 150.0, 84.0, 48.0, 42.0, 31.0, 13.0, 20.0, 12.0, 5.0, 7.0, 10.0, 10.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.3680267333984375, -0.356414794921875, -0.3448028564453125, -0.33319091796875, -0.3215789794921875, -0.309967041015625, -0.2983551025390625, -0.2867431640625, -0.2751312255859375, -0.263519287109375, -0.2519073486328125, -0.24029541015625, -0.2286834716796875, -0.217071533203125, -0.2054595947265625, -0.19384765625, -0.1822357177734375, -0.170623779296875, -0.1590118408203125, -0.14739990234375, -0.1357879638671875, -0.124176025390625, -0.1125640869140625, -0.1009521484375, -0.0893402099609375, -0.077728271484375, -0.0661163330078125, -0.05450439453125, -0.0428924560546875, -0.031280517578125, -0.0196685791015625, -0.008056640625, 0.0035552978515625, 0.015167236328125, 0.0267791748046875, 0.03839111328125, 0.0500030517578125, 0.061614990234375, 0.0732269287109375, 0.0848388671875, 0.0964508056640625, 0.108062744140625, 0.1196746826171875, 0.13128662109375, 0.1428985595703125, 0.154510498046875, 0.1661224365234375, 0.177734375, 0.1893463134765625, 0.200958251953125, 0.2125701904296875, 0.22418212890625, 0.2357940673828125, 0.247406005859375, 0.2590179443359375, 0.2706298828125, 0.2822418212890625, 0.293853759765625, 0.3054656982421875, 0.31707763671875, 0.3286895751953125, 0.340301513671875, 0.3519134521484375, 0.363525390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 6.0, 9.0, 13.0, 29.0, 29.0, 57.0, 50.0, 82.0, 104.0, 98.0, 93.0, 95.0, 81.0, 68.0, 43.0, 38.0, 30.0, 24.0, 17.0, 13.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04620361328125, -0.044681549072265625, -0.04315948486328125, -0.041637420654296875, -0.0401153564453125, -0.038593292236328125, -0.03707122802734375, -0.035549163818359375, -0.034027099609375, -0.032505035400390625, -0.03098297119140625, -0.029460906982421875, -0.0279388427734375, -0.026416778564453125, -0.02489471435546875, -0.023372650146484375, -0.0218505859375, -0.020328521728515625, -0.01880645751953125, -0.017284393310546875, -0.0157623291015625, -0.014240264892578125, -0.01271820068359375, -0.011196136474609375, -0.009674072265625, -0.008152008056640625, -0.00662994384765625, -0.005107879638671875, -0.0035858154296875, -0.002063751220703125, -0.00054168701171875, 0.000980377197265625, 0.00250244140625, 0.004024505615234375, 0.00554656982421875, 0.007068634033203125, 0.0085906982421875, 0.010112762451171875, 0.01163482666015625, 0.013156890869140625, 0.014678955078125, 0.016201019287109375, 0.01772308349609375, 0.019245147705078125, 0.0207672119140625, 0.022289276123046875, 0.02381134033203125, 0.025333404541015625, 0.02685546875, 0.028377532958984375, 0.02989959716796875, 0.031421661376953125, 0.0329437255859375, 0.034465789794921875, 0.03598785400390625, 0.037509918212890625, 0.039031982421875, 0.040554046630859375, 0.04207611083984375, 0.043598175048828125, 0.0451202392578125, 0.046642303466796875, 0.04816436767578125, 0.049686431884765625, 0.05120849609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 5.0, 5.0, 19.0, 17.0, 41.0, 49.0, 78.0, 150.0, 265.0, 535.0, 1420.0, 4663.0, 21308.0, 195002.0, 3803706.0, 143041.0, 17632.0, 4052.0, 1246.0, 499.0, 234.0, 134.0, 73.0, 40.0, 22.0, 11.0, 17.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.3013496398925781, -0.28995513916015625, -0.2785606384277344, -0.2671661376953125, -0.2557716369628906, -0.24437713623046875, -0.23298263549804688, -0.221588134765625, -0.21019363403320312, -0.19879913330078125, -0.18740463256835938, -0.1760101318359375, -0.16461563110351562, -0.15322113037109375, -0.14182662963867188, -0.13043212890625, -0.11903762817382812, -0.10764312744140625, -0.09624862670898438, -0.0848541259765625, -0.07345962524414062, -0.06206512451171875, -0.050670623779296875, -0.039276123046875, -0.027881622314453125, -0.01648712158203125, -0.005092620849609375, 0.0063018798828125, 0.017696380615234375, 0.02909088134765625, 0.040485382080078125, 0.0518798828125, 0.06327438354492188, 0.07466888427734375, 0.08606338500976562, 0.0974578857421875, 0.10885238647460938, 0.12024688720703125, 0.13164138793945312, 0.143035888671875, 0.15443038940429688, 0.16582489013671875, 0.17721939086914062, 0.1886138916015625, 0.20000839233398438, 0.21140289306640625, 0.22279739379882812, 0.23419189453125, 0.24558639526367188, 0.25698089599609375, 0.2683753967285156, 0.2797698974609375, 0.2911643981933594, 0.30255889892578125, 0.3139533996582031, 0.325347900390625, 0.3367424011230469, 0.34813690185546875, 0.3595314025878906, 0.3709259033203125, 0.3823204040527344, 0.39371490478515625, 0.4051094055175781, 0.41650390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 10.0, 7.0, 8.0, 24.0, 21.0, 33.0, 83.0, 168.0, 386.0, 2200.0, 672.0, 200.0, 104.0, 59.0, 44.0, 26.0, 9.0, 13.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11712646484375, -0.11410140991210938, -0.11107635498046875, -0.10805130004882812, -0.1050262451171875, -0.10200119018554688, -0.09897613525390625, -0.09595108032226562, -0.092926025390625, -0.08990097045898438, -0.08687591552734375, -0.08385086059570312, -0.0808258056640625, -0.07780075073242188, -0.07477569580078125, -0.07175064086914062, -0.0687255859375, -0.06570053100585938, -0.06267547607421875, -0.059650421142578125, -0.0566253662109375, -0.053600311279296875, -0.05057525634765625, -0.047550201416015625, -0.044525146484375, -0.041500091552734375, -0.03847503662109375, -0.035449981689453125, -0.0324249267578125, -0.029399871826171875, -0.02637481689453125, -0.023349761962890625, -0.02032470703125, -0.017299652099609375, -0.01427459716796875, -0.011249542236328125, -0.0082244873046875, -0.005199432373046875, -0.00217437744140625, 0.000850677490234375, 0.003875732421875, 0.006900787353515625, 0.00992584228515625, 0.012950897216796875, 0.0159759521484375, 0.019001007080078125, 0.02202606201171875, 0.025051116943359375, 0.028076171875, 0.031101226806640625, 0.03412628173828125, 0.037151336669921875, 0.0401763916015625, 0.043201446533203125, 0.04622650146484375, 0.049251556396484375, 0.052276611328125, 0.055301666259765625, 0.05832672119140625, 0.061351776123046875, 0.0643768310546875, 0.06740188598632812, 0.07042694091796875, 0.07345199584960938, 0.07647705078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 16.0, 27.0, 72.0, 125.0, 200.0, 224.0, 166.0, 88.0, 41.0, 22.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7236816883087158, -0.705675482749939, -0.6876692175865173, -0.6696630120277405, -0.6516567468643188, -0.633650541305542, -0.6156443357467651, -0.5976380705833435, -0.5796318650245667, -0.5616256594657898, -0.5436193943023682, -0.5256131887435913, -0.5076069235801697, -0.4896007180213928, -0.4715944826602936, -0.45358824729919434, -0.4355820119380951, -0.41757577657699585, -0.3995695412158966, -0.38156330585479736, -0.3635571002960205, -0.34555086493492126, -0.327544629573822, -0.30953842401504517, -0.29153215885162354, -0.2735259234905243, -0.25551968812942505, -0.237513467669487, -0.21950724720954895, -0.2015010118484497, -0.18349477648735046, -0.16548855602741241, -0.14748233556747437, -0.12947610020637512, -0.11146987974643707, -0.09346364438533783, -0.07545741647481918, -0.05745118856430054, -0.039444953203201294, -0.021438732743263245, -0.0034324973821640015, 0.014573732390999794, 0.03257996216416359, 0.050586193799972534, 0.06859242171049118, 0.08659864962100983, 0.10460488498210907, 0.12261110544204712, 0.14061734080314636, 0.1586235761642456, 0.17662979662418365, 0.1946360319852829, 0.21264225244522095, 0.2306484878063202, 0.24865472316741943, 0.2666609287261963, 0.2846671938896179, 0.30267342925071716, 0.3206796646118164, 0.33868587017059326, 0.3566921055316925, 0.37469834089279175, 0.392704576253891, 0.41071081161499023, 0.4287170171737671]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 5.0, 10.0, 6.0, 13.0, 11.0, 14.0, 25.0, 29.0, 26.0, 28.0, 24.0, 30.0, 32.0, 35.0, 40.0, 46.0, 38.0, 45.0, 46.0, 45.0, 46.0, 53.0, 34.0, 44.0, 59.0, 35.0, 34.0, 18.0, 25.0, 18.0, 14.0, 19.0, 11.0, 7.0, 5.0, 7.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19146603345870972, -0.18510855734348297, -0.17875108122825623, -0.17239362001419067, -0.16603614389896393, -0.15967866778373718, -0.15332119166851044, -0.1469637155532837, -0.14060625433921814, -0.1342487782239914, -0.12789130210876465, -0.1215338334441185, -0.11517636477947235, -0.1088188886642456, -0.10246141254901886, -0.09610393643379211, -0.08974646031856537, -0.08338898420333862, -0.07703151553869247, -0.07067403942346573, -0.06431657075881958, -0.057959094643592834, -0.05160161852836609, -0.04524414613842964, -0.038886673748493195, -0.03252920135855675, -0.02617172710597515, -0.019814252853393555, -0.013456780463457108, -0.00709930807352066, -0.0007418319582939148, 0.005615640431642532, 0.01197311282157898, 0.018330585211515427, 0.024688059464097023, 0.03104553371667862, 0.037403006106615067, 0.043760478496551514, 0.05011795461177826, 0.056475427001714706, 0.06283289939165115, 0.0691903755068779, 0.07554784417152405, 0.0819053202867508, 0.08826279640197754, 0.09462026506662369, 0.10097774118185043, 0.10733520984649658, 0.11369268596172333, 0.12005016207695007, 0.12640763819217682, 0.13276511430740356, 0.13912257552146912, 0.14548005163669586, 0.1518375277519226, 0.15819500386714935, 0.1645524799823761, 0.17090995609760284, 0.1772674322128296, 0.18362489342689514, 0.1899823695421219, 0.19633984565734863, 0.20269732177257538, 0.20905479788780212, 0.21541225910186768]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 0.0, 4.0, 9.0, 9.0, 5.0, 14.0, 19.0, 16.0, 34.0, 34.0, 38.0, 56.0, 82.0, 114.0, 125.0, 244.0, 294.0, 454.0, 783.0, 1346.0, 2417.0, 5163.0, 11257.0, 27857.0, 76779.0, 217311.0, 398357.0, 192265.0, 67634.0, 25146.0, 10259.0, 4724.0, 2306.0, 1236.0, 711.0, 463.0, 272.0, 189.0, 135.0, 120.0, 75.0, 50.0, 32.0, 24.0, 20.0, 18.0, 20.0, 15.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.1541748046875, -0.14969825744628906, -0.14522171020507812, -0.1407451629638672, -0.13626861572265625, -0.1317920684814453, -0.12731552124023438, -0.12283897399902344, -0.1183624267578125, -0.11388587951660156, -0.10940933227539062, -0.10493278503417969, -0.10045623779296875, -0.09597969055175781, -0.09150314331054688, -0.08702659606933594, -0.082550048828125, -0.07807350158691406, -0.07359695434570312, -0.06912040710449219, -0.06464385986328125, -0.06016731262207031, -0.055690765380859375, -0.05121421813964844, -0.0467376708984375, -0.04226112365722656, -0.037784576416015625, -0.03330802917480469, -0.02883148193359375, -0.024354934692382812, -0.019878387451171875, -0.015401840209960938, -0.01092529296875, -0.0064487457275390625, -0.001972198486328125, 0.0025043487548828125, 0.00698089599609375, 0.011457443237304688, 0.015933990478515625, 0.020410537719726562, 0.0248870849609375, 0.029363632202148438, 0.033840179443359375, 0.03831672668457031, 0.04279327392578125, 0.04726982116699219, 0.051746368408203125, 0.05622291564941406, 0.060699462890625, 0.06517601013183594, 0.06965255737304688, 0.07412910461425781, 0.07860565185546875, 0.08308219909667969, 0.08755874633789062, 0.09203529357910156, 0.0965118408203125, 0.10098838806152344, 0.10546493530273438, 0.10994148254394531, 0.11441802978515625, 0.11889457702636719, 0.12337112426757812, 0.12784767150878906, 0.13232421875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 14.0, 17.0, 25.0, 32.0, 49.0, 62.0, 81.0, 71.0, 98.0, 94.0, 106.0, 79.0, 63.0, 46.0, 35.0, 40.0, 21.0, 16.0, 14.0, 9.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.040679931640625, -0.03924703598022461, -0.03781414031982422, -0.03638124465942383, -0.03494834899902344, -0.03351545333862305, -0.032082557678222656, -0.030649662017822266, -0.029216766357421875, -0.027783870697021484, -0.026350975036621094, -0.024918079376220703, -0.023485183715820312, -0.022052288055419922, -0.02061939239501953, -0.01918649673461914, -0.01775360107421875, -0.01632070541381836, -0.014887809753417969, -0.013454914093017578, -0.012022018432617188, -0.010589122772216797, -0.009156227111816406, -0.007723331451416016, -0.006290435791015625, -0.004857540130615234, -0.0034246444702148438, -0.001991748809814453, -0.0005588531494140625, 0.0008740425109863281, 0.0023069381713867188, 0.0037398338317871094, 0.0051727294921875, 0.006605625152587891, 0.008038520812988281, 0.009471416473388672, 0.010904312133789062, 0.012337207794189453, 0.013770103454589844, 0.015202999114990234, 0.016635894775390625, 0.018068790435791016, 0.019501686096191406, 0.020934581756591797, 0.022367477416992188, 0.023800373077392578, 0.02523326873779297, 0.02666616439819336, 0.02809906005859375, 0.02953195571899414, 0.03096485137939453, 0.03239774703979492, 0.03383064270019531, 0.0352635383605957, 0.036696434020996094, 0.038129329681396484, 0.039562225341796875, 0.040995121002197266, 0.042428016662597656, 0.04386091232299805, 0.04529380798339844, 0.04672670364379883, 0.04815959930419922, 0.04959249496459961, 0.051025390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 8.0, 5.0, 7.0, 15.0, 18.0, 26.0, 28.0, 38.0, 83.0, 122.0, 176.0, 252.0, 451.0, 769.0, 1533.0, 3762.0, 10068.0, 31500.0, 118679.0, 414501.0, 337663.0, 89792.0, 24733.0, 7981.0, 3069.0, 1422.0, 726.0, 402.0, 254.0, 157.0, 95.0, 81.0, 45.0, 30.0, 31.0, 7.0, 8.0, 11.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.16034507751464844, -0.15479660034179688, -0.1492481231689453, -0.14369964599609375, -0.1381511688232422, -0.13260269165039062, -0.12705421447753906, -0.1215057373046875, -0.11595726013183594, -0.11040878295898438, -0.10486030578613281, -0.09931182861328125, -0.09376335144042969, -0.08821487426757812, -0.08266639709472656, -0.077117919921875, -0.07156944274902344, -0.06602096557617188, -0.06047248840332031, -0.05492401123046875, -0.04937553405761719, -0.043827056884765625, -0.03827857971191406, -0.0327301025390625, -0.027181625366210938, -0.021633148193359375, -0.016084671020507812, -0.01053619384765625, -0.0049877166748046875, 0.000560760498046875, 0.0061092376708984375, 0.01165771484375, 0.017206192016601562, 0.022754669189453125, 0.028303146362304688, 0.03385162353515625, 0.03940010070800781, 0.044948577880859375, 0.05049705505371094, 0.0560455322265625, 0.06159400939941406, 0.06714248657226562, 0.07269096374511719, 0.07823944091796875, 0.08378791809082031, 0.08933639526367188, 0.09488487243652344, 0.100433349609375, 0.10598182678222656, 0.11153030395507812, 0.11707878112792969, 0.12262725830078125, 0.1281757354736328, 0.13372421264648438, 0.13927268981933594, 0.1448211669921875, 0.15036964416503906, 0.15591812133789062, 0.1614665985107422, 0.16701507568359375, 0.1725635528564453, 0.17811203002929688, 0.18366050720214844, 0.189208984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 6.0, 6.0, 11.0, 15.0, 22.0, 27.0, 21.0, 32.0, 26.0, 37.0, 34.0, 38.0, 55.0, 48.0, 54.0, 61.0, 44.0, 55.0, 51.0, 41.0, 49.0, 31.0, 41.0, 44.0, 29.0, 19.0, 25.0, 13.0, 10.0, 7.0, 6.0, 12.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.15947532653808594, -0.15427780151367188, -0.1490802764892578, -0.14388275146484375, -0.1386852264404297, -0.13348770141601562, -0.12829017639160156, -0.1230926513671875, -0.11789512634277344, -0.11269760131835938, -0.10750007629394531, -0.10230255126953125, -0.09710502624511719, -0.09190750122070312, -0.08670997619628906, -0.081512451171875, -0.07631492614746094, -0.07111740112304688, -0.06591987609863281, -0.06072235107421875, -0.05552482604980469, -0.050327301025390625, -0.04512977600097656, -0.0399322509765625, -0.03473472595214844, -0.029537200927734375, -0.024339675903320312, -0.01914215087890625, -0.013944625854492188, -0.008747100830078125, -0.0035495758056640625, 0.00164794921875, 0.0068454742431640625, 0.012042999267578125, 0.017240524291992188, 0.02243804931640625, 0.027635574340820312, 0.032833099365234375, 0.03803062438964844, 0.0432281494140625, 0.04842567443847656, 0.053623199462890625, 0.05882072448730469, 0.06401824951171875, 0.06921577453613281, 0.07441329956054688, 0.07961082458496094, 0.084808349609375, 0.09000587463378906, 0.09520339965820312, 0.10040092468261719, 0.10559844970703125, 0.11079597473144531, 0.11599349975585938, 0.12119102478027344, 0.1263885498046875, 0.13158607482910156, 0.13678359985351562, 0.1419811248779297, 0.14717864990234375, 0.1523761749267578, 0.15757369995117188, 0.16277122497558594, 0.16796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 10.0, 8.0, 17.0, 25.0, 35.0, 51.0, 64.0, 115.0, 162.0, 266.0, 489.0, 864.0, 1586.0, 3258.0, 6968.0, 16751.0, 47565.0, 183508.0, 502037.0, 201019.0, 51647.0, 17702.0, 7168.0, 3392.0, 1661.0, 894.0, 502.0, 290.0, 182.0, 103.0, 67.0, 47.0, 32.0, 19.0, 14.0, 11.0, 4.0, 4.0, 5.0, 7.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07781982421875, -0.07535171508789062, -0.07288360595703125, -0.07041549682617188, -0.0679473876953125, -0.06547927856445312, -0.06301116943359375, -0.060543060302734375, -0.058074951171875, -0.055606842041015625, -0.05313873291015625, -0.050670623779296875, -0.0482025146484375, -0.045734405517578125, -0.04326629638671875, -0.040798187255859375, -0.038330078125, -0.035861968994140625, -0.03339385986328125, -0.030925750732421875, -0.0284576416015625, -0.025989532470703125, -0.02352142333984375, -0.021053314208984375, -0.018585205078125, -0.016117095947265625, -0.01364898681640625, -0.011180877685546875, -0.0087127685546875, -0.006244659423828125, -0.00377655029296875, -0.001308441162109375, 0.00115966796875, 0.003627777099609375, 0.00609588623046875, 0.008563995361328125, 0.0110321044921875, 0.013500213623046875, 0.01596832275390625, 0.018436431884765625, 0.020904541015625, 0.023372650146484375, 0.02584075927734375, 0.028308868408203125, 0.0307769775390625, 0.033245086669921875, 0.03571319580078125, 0.038181304931640625, 0.0406494140625, 0.043117523193359375, 0.04558563232421875, 0.048053741455078125, 0.0505218505859375, 0.052989959716796875, 0.05545806884765625, 0.057926177978515625, 0.060394287109375, 0.06286239624023438, 0.06533050537109375, 0.06779861450195312, 0.0702667236328125, 0.07273483276367188, 0.07520294189453125, 0.07767105102539062, 0.08013916015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 7.0, 11.0, 18.0, 13.0, 22.0, 16.0, 22.0, 24.0, 29.0, 34.0, 27.0, 45.0, 52.0, 61.0, 65.0, 65.0, 67.0, 55.0, 70.0, 53.0, 40.0, 37.0, 37.0, 32.0, 13.0, 17.0, 16.0, 14.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1636486053466797e-05, -2.0889565348625183e-05, -2.014264464378357e-05, -1.9395723938941956e-05, -1.8648803234100342e-05, -1.7901882529258728e-05, -1.7154961824417114e-05, -1.64080411195755e-05, -1.5661120414733887e-05, -1.4914199709892273e-05, -1.416727900505066e-05, -1.3420358300209045e-05, -1.2673437595367432e-05, -1.1926516890525818e-05, -1.1179596185684204e-05, -1.043267548084259e-05, -9.685754776000977e-06, -8.938834071159363e-06, -8.191913366317749e-06, -7.444992661476135e-06, -6.6980719566345215e-06, -5.951151251792908e-06, -5.204230546951294e-06, -4.45730984210968e-06, -3.7103891372680664e-06, -2.9634684324264526e-06, -2.216547727584839e-06, -1.469627022743225e-06, -7.227063179016113e-07, 2.421438694000244e-08, 7.711350917816162e-07, 1.51805579662323e-06, 2.2649765014648438e-06, 3.0118972063064575e-06, 3.7588179111480713e-06, 4.505738615989685e-06, 5.252659320831299e-06, 5.999580025672913e-06, 6.746500730514526e-06, 7.49342143535614e-06, 8.240342140197754e-06, 8.987262845039368e-06, 9.734183549880981e-06, 1.0481104254722595e-05, 1.1228024959564209e-05, 1.1974945664405823e-05, 1.2721866369247437e-05, 1.346878707408905e-05, 1.4215707778930664e-05, 1.4962628483772278e-05, 1.570954918861389e-05, 1.6456469893455505e-05, 1.720339059829712e-05, 1.7950311303138733e-05, 1.8697232007980347e-05, 1.944415271282196e-05, 2.0191073417663574e-05, 2.0937994122505188e-05, 2.1684914827346802e-05, 2.2431835532188416e-05, 2.317875623703003e-05, 2.3925676941871643e-05, 2.4672597646713257e-05, 2.541951835155487e-05, 2.6166439056396484e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 7.0, 2.0, 4.0, 5.0, 6.0, 1.0, 9.0, 12.0, 16.0, 21.0, 33.0, 64.0, 86.0, 138.0, 250.0, 474.0, 924.0, 1936.0, 4957.0, 14525.0, 60555.0, 472016.0, 416408.0, 54288.0, 13481.0, 4526.0, 1889.0, 850.0, 444.0, 232.0, 141.0, 94.0, 55.0, 38.0, 23.0, 19.0, 8.0, 10.0, 8.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1162109375, -0.11257553100585938, -0.10894012451171875, -0.10530471801757812, -0.1016693115234375, -0.09803390502929688, -0.09439849853515625, -0.09076309204101562, -0.087127685546875, -0.08349227905273438, -0.07985687255859375, -0.07622146606445312, -0.0725860595703125, -0.06895065307617188, -0.06531524658203125, -0.061679840087890625, -0.05804443359375, -0.054409027099609375, -0.05077362060546875, -0.047138214111328125, -0.0435028076171875, -0.039867401123046875, -0.03623199462890625, -0.032596588134765625, -0.028961181640625, -0.025325775146484375, -0.02169036865234375, -0.018054962158203125, -0.0144195556640625, -0.010784149169921875, -0.00714874267578125, -0.003513336181640625, 0.0001220703125, 0.003757476806640625, 0.00739288330078125, 0.011028289794921875, 0.0146636962890625, 0.018299102783203125, 0.02193450927734375, 0.025569915771484375, 0.029205322265625, 0.032840728759765625, 0.03647613525390625, 0.040111541748046875, 0.0437469482421875, 0.047382354736328125, 0.05101776123046875, 0.054653167724609375, 0.05828857421875, 0.061923980712890625, 0.06555938720703125, 0.06919479370117188, 0.0728302001953125, 0.07646560668945312, 0.08010101318359375, 0.08373641967773438, 0.087371826171875, 0.09100723266601562, 0.09464263916015625, 0.09827804565429688, 0.1019134521484375, 0.10554885864257812, 0.10918426513671875, 0.11281967163085938, 0.116455078125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 5.0, 8.0, 5.0, 9.0, 14.0, 22.0, 23.0, 31.0, 48.0, 81.0, 88.0, 97.0, 120.0, 113.0, 80.0, 80.0, 40.0, 34.0, 19.0, 9.0, 15.0, 14.0, 11.0, 11.0, 3.0, 1.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08917236328125, -0.08665657043457031, -0.08414077758789062, -0.08162498474121094, -0.07910919189453125, -0.07659339904785156, -0.07407760620117188, -0.07156181335449219, -0.0690460205078125, -0.06653022766113281, -0.06401443481445312, -0.06149864196777344, -0.05898284912109375, -0.05646705627441406, -0.053951263427734375, -0.05143547058105469, -0.048919677734375, -0.04640388488769531, -0.043888092041015625, -0.04137229919433594, -0.03885650634765625, -0.03634071350097656, -0.033824920654296875, -0.03130912780761719, -0.0287933349609375, -0.026277542114257812, -0.023761749267578125, -0.021245956420898438, -0.01873016357421875, -0.016214370727539062, -0.013698577880859375, -0.011182785034179688, -0.0086669921875, -0.0061511993408203125, -0.003635406494140625, -0.0011196136474609375, 0.00139617919921875, 0.0039119720458984375, 0.006427764892578125, 0.008943557739257812, 0.0114593505859375, 0.013975143432617188, 0.016490936279296875, 0.019006729125976562, 0.02152252197265625, 0.024038314819335938, 0.026554107666015625, 0.029069900512695312, 0.031585693359375, 0.03410148620605469, 0.036617279052734375, 0.03913307189941406, 0.04164886474609375, 0.04416465759277344, 0.046680450439453125, 0.04919624328613281, 0.0517120361328125, 0.05422782897949219, 0.056743621826171875, 0.05925941467285156, 0.06177520751953125, 0.06429100036621094, 0.06680679321289062, 0.06932258605957031, 0.07183837890625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 19.0, 32.0, 57.0, 108.0, 170.0, 187.0, 178.0, 122.0, 54.0, 32.0, 19.0, 13.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1748592853546143, -1.1267269849777222, -1.07859468460083, -1.030462384223938, -0.9823301434516907, -0.9341978430747986, -0.8860656023025513, -0.8379333019256592, -0.7898010015487671, -0.741668701171875, -0.6935364007949829, -0.6454041600227356, -0.5972718596458435, -0.5491395592689514, -0.5010073184967041, -0.452875018119812, -0.4047427177429199, -0.35661041736602783, -0.30847814679145813, -0.2603458762168884, -0.21221357583999634, -0.16408129036426544, -0.11594900488853455, -0.06781673431396484, -0.019684433937072754, 0.028447851538658142, 0.07658013701438904, 0.12471242249011993, 0.17284470796585083, 0.22097699344158173, 0.2691092789173126, 0.3172415494918823, 0.3653738498687744, 0.4135061502456665, 0.4616384208202362, 0.5097706913948059, 0.557902991771698, 0.6060352921485901, 0.6541675329208374, 0.7022998332977295, 0.7504321336746216, 0.7985644340515137, 0.8466967344284058, 0.8948289752006531, 0.9429612755775452, 0.9910935759544373, 1.0392258167266846, 1.0873581171035767, 1.1354904174804688, 1.1836227178573608, 1.231755018234253, 1.279887318611145, 1.328019618988037, 1.3761518001556396, 1.4242841005325317, 1.4724164009094238, 1.520548701286316, 1.568681001663208, 1.6168133020401, 1.6649456024169922, 1.7130777835845947, 1.7612100839614868, 1.809342384338379, 1.857474684715271, 1.905606985092163]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 9.0, 7.0, 3.0, 15.0, 9.0, 8.0, 18.0, 20.0, 26.0, 35.0, 39.0, 39.0, 48.0, 36.0, 49.0, 43.0, 65.0, 58.0, 46.0, 54.0, 54.0, 38.0, 44.0, 27.0, 38.0, 32.0, 29.0, 23.0, 11.0, 17.0, 12.0, 12.0, 9.0, 6.0, 7.0, 9.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8695246577262878, -0.8401280641555786, -0.8107314109802246, -0.7813347578048706, -0.7519381642341614, -0.7225415706634521, -0.6931449174880981, -0.6637482643127441, -0.6343516707420349, -0.6049550771713257, -0.5755584239959717, -0.5461617708206177, -0.5167651772499084, -0.48736855387687683, -0.4579719305038452, -0.4285753071308136, -0.399178683757782, -0.36978206038475037, -0.34038543701171875, -0.31098881363868713, -0.2815921902656555, -0.2521955668926239, -0.22279894351959229, -0.19340232014656067, -0.16400569677352905, -0.13460907340049744, -0.10521245002746582, -0.0758158266544342, -0.04641920328140259, -0.01702257990837097, 0.012374043464660645, 0.04177066683769226, 0.0711672306060791, 0.10056385397911072, 0.12996047735214233, 0.15935710072517395, 0.18875372409820557, 0.21815034747123718, 0.2475469708442688, 0.2769435942173004, 0.30634021759033203, 0.33573684096336365, 0.36513346433639526, 0.3945300877094269, 0.4239267110824585, 0.4533233344554901, 0.48271995782852173, 0.512116551399231, 0.541513204574585, 0.570909857749939, 0.6003064513206482, 0.6297030448913574, 0.6590996980667114, 0.6884963512420654, 0.7178929448127747, 0.7472895383834839, 0.7766861915588379, 0.8060828447341919, 0.8354794383049011, 0.8648760318756104, 0.8942726850509644, 0.9236693382263184, 0.9530659317970276, 0.9824625253677368, 1.0118591785430908]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 6.0, 7.0, 11.0, 18.0, 25.0, 59.0, 116.0, 251.0, 652.0, 1838.0, 6783.0, 35274.0, 3599826.0, 515807.0, 25189.0, 5415.0, 1684.0, 627.0, 309.0, 145.0, 99.0, 55.0, 32.0, 16.0, 15.0, 9.0, 8.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41162109375, -0.4004707336425781, -0.38932037353515625, -0.3781700134277344, -0.3670196533203125, -0.3558692932128906, -0.34471893310546875, -0.3335685729980469, -0.322418212890625, -0.3112678527832031, -0.30011749267578125, -0.2889671325683594, -0.2778167724609375, -0.2666664123535156, -0.25551605224609375, -0.24436569213867188, -0.23321533203125, -0.22206497192382812, -0.21091461181640625, -0.19976425170898438, -0.1886138916015625, -0.17746353149414062, -0.16631317138671875, -0.15516281127929688, -0.144012451171875, -0.13286209106445312, -0.12171173095703125, -0.11056137084960938, -0.0994110107421875, -0.08826065063476562, -0.07711029052734375, -0.06595993041992188, -0.0548095703125, -0.043659210205078125, -0.03250885009765625, -0.021358489990234375, -0.0102081298828125, 0.000942230224609375, 0.01209259033203125, 0.023242950439453125, 0.034393310546875, 0.045543670654296875, 0.05669403076171875, 0.06784439086914062, 0.0789947509765625, 0.09014511108398438, 0.10129547119140625, 0.11244583129882812, 0.12359619140625, 0.13474655151367188, 0.14589691162109375, 0.15704727172851562, 0.1681976318359375, 0.17934799194335938, 0.19049835205078125, 0.20164871215820312, 0.212799072265625, 0.22394943237304688, 0.23509979248046875, 0.24625015258789062, 0.2574005126953125, 0.2685508728027344, 0.27970123291015625, 0.2908515930175781, 0.302001953125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 5.0, 7.0, 14.0, 15.0, 24.0, 21.0, 42.0, 62.0, 81.0, 79.0, 72.0, 90.0, 94.0, 100.0, 74.0, 52.0, 48.0, 34.0, 29.0, 17.0, 10.0, 11.0, 13.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047088623046875, -0.04561185836791992, -0.044135093688964844, -0.042658329010009766, -0.04118156433105469, -0.03970479965209961, -0.03822803497314453, -0.03675127029418945, -0.035274505615234375, -0.0337977409362793, -0.03232097625732422, -0.03084421157836914, -0.029367446899414062, -0.027890682220458984, -0.026413917541503906, -0.024937152862548828, -0.02346038818359375, -0.021983623504638672, -0.020506858825683594, -0.019030094146728516, -0.017553329467773438, -0.01607656478881836, -0.014599800109863281, -0.013123035430908203, -0.011646270751953125, -0.010169506072998047, -0.008692741394042969, -0.007215976715087891, -0.0057392120361328125, -0.004262447357177734, -0.0027856826782226562, -0.0013089179992675781, 0.0001678466796875, 0.0016446113586425781, 0.0031213760375976562, 0.004598140716552734, 0.0060749053955078125, 0.007551670074462891, 0.009028434753417969, 0.010505199432373047, 0.011981964111328125, 0.013458728790283203, 0.014935493469238281, 0.01641225814819336, 0.017889022827148438, 0.019365787506103516, 0.020842552185058594, 0.022319316864013672, 0.02379608154296875, 0.025272846221923828, 0.026749610900878906, 0.028226375579833984, 0.029703140258789062, 0.03117990493774414, 0.03265666961669922, 0.0341334342956543, 0.035610198974609375, 0.03708696365356445, 0.03856372833251953, 0.04004049301147461, 0.04151725769042969, 0.042994022369384766, 0.044470787048339844, 0.04594755172729492, 0.04742431640625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 10.0, 9.0, 23.0, 24.0, 57.0, 77.0, 125.0, 248.0, 553.0, 1233.0, 3239.0, 10296.0, 47230.0, 634711.0, 3395821.0, 78785.0, 14724.0, 4217.0, 1513.0, 682.0, 290.0, 167.0, 109.0, 53.0, 39.0, 13.0, 19.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.29577064514160156, -0.2875862121582031, -0.2794017791748047, -0.27121734619140625, -0.2630329132080078, -0.2548484802246094, -0.24666404724121094, -0.2384796142578125, -0.23029518127441406, -0.22211074829101562, -0.2139263153076172, -0.20574188232421875, -0.1975574493408203, -0.18937301635742188, -0.18118858337402344, -0.173004150390625, -0.16481971740722656, -0.15663528442382812, -0.1484508514404297, -0.14026641845703125, -0.1320819854736328, -0.12389755249023438, -0.11571311950683594, -0.1075286865234375, -0.09934425354003906, -0.09115982055664062, -0.08297538757324219, -0.07479095458984375, -0.06660652160644531, -0.058422088623046875, -0.05023765563964844, -0.04205322265625, -0.03386878967285156, -0.025684356689453125, -0.017499923706054688, -0.00931549072265625, -0.0011310577392578125, 0.007053375244140625, 0.015237808227539062, 0.0234222412109375, 0.03160667419433594, 0.039791107177734375, 0.04797554016113281, 0.05615997314453125, 0.06434440612792969, 0.07252883911132812, 0.08071327209472656, 0.088897705078125, 0.09708213806152344, 0.10526657104492188, 0.11345100402832031, 0.12163543701171875, 0.1298198699951172, 0.13800430297851562, 0.14618873596191406, 0.1543731689453125, 0.16255760192871094, 0.17074203491210938, 0.1789264678955078, 0.18711090087890625, 0.1952953338623047, 0.20347976684570312, 0.21166419982910156, 0.2198486328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 8.0, 11.0, 8.0, 8.0, 13.0, 19.0, 17.0, 25.0, 43.0, 41.0, 73.0, 100.0, 177.0, 337.0, 1547.0, 881.0, 295.0, 138.0, 98.0, 52.0, 46.0, 22.0, 25.0, 19.0, 13.0, 15.0, 9.0, 6.0, 2.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04449462890625, -0.04309892654418945, -0.041703224182128906, -0.04030752182006836, -0.03891181945800781, -0.037516117095947266, -0.03612041473388672, -0.03472471237182617, -0.033329010009765625, -0.03193330764770508, -0.03053760528564453, -0.029141902923583984, -0.027746200561523438, -0.02635049819946289, -0.024954795837402344, -0.023559093475341797, -0.02216339111328125, -0.020767688751220703, -0.019371986389160156, -0.01797628402709961, -0.016580581665039062, -0.015184879302978516, -0.013789176940917969, -0.012393474578857422, -0.010997772216796875, -0.009602069854736328, -0.008206367492675781, -0.006810665130615234, -0.0054149627685546875, -0.004019260406494141, -0.0026235580444335938, -0.0012278556823730469, 0.0001678466796875, 0.0015635490417480469, 0.0029592514038085938, 0.004354953765869141, 0.0057506561279296875, 0.007146358489990234, 0.008542060852050781, 0.009937763214111328, 0.011333465576171875, 0.012729167938232422, 0.014124870300292969, 0.015520572662353516, 0.016916275024414062, 0.01831197738647461, 0.019707679748535156, 0.021103382110595703, 0.02249908447265625, 0.023894786834716797, 0.025290489196777344, 0.02668619155883789, 0.028081893920898438, 0.029477596282958984, 0.03087329864501953, 0.03226900100708008, 0.033664703369140625, 0.03506040573120117, 0.03645610809326172, 0.037851810455322266, 0.03924751281738281, 0.04064321517944336, 0.042038917541503906, 0.04343461990356445, 0.044830322265625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 11.0, 25.0, 21.0, 42.0, 76.0, 101.0, 118.0, 109.0, 128.0, 110.0, 75.0, 65.0, 36.0, 24.0, 19.0, 8.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2542146146297455, -0.24508729577064514, -0.2359599769115448, -0.22683264315128326, -0.21770532429218292, -0.20857800543308258, -0.19945067167282104, -0.1903233528137207, -0.18119603395462036, -0.17206871509552002, -0.16294139623641968, -0.15381406247615814, -0.1446867436170578, -0.13555942475795746, -0.12643209099769592, -0.11730477213859558, -0.10817745327949524, -0.0990501344203949, -0.08992280811071396, -0.08079548180103302, -0.07166816294193268, -0.06254084408283234, -0.0534135177731514, -0.04428619146347046, -0.03515887260437012, -0.026031550019979477, -0.016904227435588837, -0.007776904851198196, 0.0013504177331924438, 0.010477740317583084, 0.019605062901973724, 0.028732389211654663, 0.03785967826843262, 0.04698700085282326, 0.0561143234372139, 0.06524164974689484, 0.07436896860599518, 0.08349628746509552, 0.09262361377477646, 0.1017509400844574, 0.11087825894355774, 0.12000557780265808, 0.12913289666175842, 0.13826023042201996, 0.1473875492811203, 0.15651486814022064, 0.16564220190048218, 0.17476952075958252, 0.18389683961868286, 0.1930241584777832, 0.20215147733688354, 0.21127881109714508, 0.22040612995624542, 0.22953344881534576, 0.2386607825756073, 0.24778810143470764, 0.256915420293808, 0.2660427391529083, 0.27517005801200867, 0.284297376871109, 0.29342472553253174, 0.3025520443916321, 0.3116793632507324, 0.32080668210983276, 0.3299340009689331]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 1.0, 6.0, 7.0, 8.0, 11.0, 17.0, 18.0, 28.0, 19.0, 18.0, 30.0, 31.0, 31.0, 32.0, 32.0, 42.0, 41.0, 43.0, 34.0, 36.0, 51.0, 38.0, 53.0, 40.0, 25.0, 32.0, 29.0, 27.0, 32.0, 23.0, 24.0, 24.0, 15.0, 16.0, 12.0, 19.0, 14.0, 5.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.14361059665679932, -0.13893955945968628, -0.13426853716373444, -0.1295975148677826, -0.12492647767066956, -0.12025544792413712, -0.11558441817760468, -0.11091338843107224, -0.1062423586845398, -0.10157132893800735, -0.09690029919147491, -0.09222926944494247, -0.08755823969841003, -0.0828872099518776, -0.07821618020534515, -0.07354515045881271, -0.06887412071228027, -0.06420309096574783, -0.05953206121921539, -0.05486103147268295, -0.05019000172615051, -0.04551897197961807, -0.04084794223308563, -0.03617691248655319, -0.03150588274002075, -0.026834852993488312, -0.02216382324695587, -0.01749279350042343, -0.012821763753890991, -0.008150734007358551, -0.003479704260826111, 0.0011913254857063293, 0.0058623552322387695, 0.01053338497877121, 0.01520441472530365, 0.01987544447183609, 0.02454647421836853, 0.02921750396490097, 0.03388853371143341, 0.03855956345796585, 0.04323059320449829, 0.04790162295103073, 0.05257265269756317, 0.05724368244409561, 0.06191471219062805, 0.06658574193716049, 0.07125677168369293, 0.07592780143022537, 0.08059883117675781, 0.08526986092329025, 0.08994089066982269, 0.09461192041635513, 0.09928295016288757, 0.10395397990942001, 0.10862500965595245, 0.1132960394024849, 0.11796706914901733, 0.12263809889554977, 0.12730912864208221, 0.13198015093803406, 0.1366511881351471, 0.14132222533226013, 0.14599324762821198, 0.15066426992416382, 0.15533530712127686]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 8.0, 9.0, 15.0, 11.0, 35.0, 49.0, 52.0, 108.0, 174.0, 300.0, 498.0, 865.0, 1681.0, 3649.0, 8800.0, 24380.0, 77122.0, 256678.0, 432966.0, 163272.0, 49835.0, 16294.0, 6100.0, 2656.0, 1284.0, 677.0, 386.0, 242.0, 125.0, 74.0, 72.0, 39.0, 26.0, 18.0, 13.0, 15.0, 11.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1630859375, -0.15833282470703125, -0.1535797119140625, -0.14882659912109375, -0.144073486328125, -0.13932037353515625, -0.1345672607421875, -0.12981414794921875, -0.12506103515625, -0.12030792236328125, -0.1155548095703125, -0.11080169677734375, -0.106048583984375, -0.10129547119140625, -0.0965423583984375, -0.09178924560546875, -0.0870361328125, -0.08228302001953125, -0.0775299072265625, -0.07277679443359375, -0.068023681640625, -0.06327056884765625, -0.0585174560546875, -0.05376434326171875, -0.04901123046875, -0.04425811767578125, -0.0395050048828125, -0.03475189208984375, -0.029998779296875, -0.02524566650390625, -0.0204925537109375, -0.01573944091796875, -0.010986328125, -0.00623321533203125, -0.0014801025390625, 0.00327301025390625, 0.008026123046875, 0.01277923583984375, 0.0175323486328125, 0.02228546142578125, 0.02703857421875, 0.03179168701171875, 0.0365447998046875, 0.04129791259765625, 0.046051025390625, 0.05080413818359375, 0.0555572509765625, 0.06031036376953125, 0.0650634765625, 0.06981658935546875, 0.0745697021484375, 0.07932281494140625, 0.084075927734375, 0.08882904052734375, 0.0935821533203125, 0.09833526611328125, 0.10308837890625, 0.10784149169921875, 0.1125946044921875, 0.11734771728515625, 0.122100830078125, 0.12685394287109375, 0.1316070556640625, 0.13636016845703125, 0.14111328125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 12.0, 6.0, 13.0, 23.0, 29.0, 38.0, 45.0, 56.0, 71.0, 73.0, 75.0, 89.0, 89.0, 76.0, 62.0, 59.0, 46.0, 37.0, 32.0, 20.0, 12.0, 9.0, 9.0, 8.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04254150390625, -0.04115629196166992, -0.039771080017089844, -0.038385868072509766, -0.03700065612792969, -0.03561544418334961, -0.03423023223876953, -0.03284502029418945, -0.031459808349609375, -0.030074596405029297, -0.02868938446044922, -0.02730417251586914, -0.025918960571289062, -0.024533748626708984, -0.023148536682128906, -0.021763324737548828, -0.02037811279296875, -0.018992900848388672, -0.017607688903808594, -0.016222476959228516, -0.014837265014648438, -0.01345205307006836, -0.012066841125488281, -0.010681629180908203, -0.009296417236328125, -0.007911205291748047, -0.006525993347167969, -0.005140781402587891, -0.0037555694580078125, -0.0023703575134277344, -0.0009851455688476562, 0.0004000663757324219, 0.0017852783203125, 0.003170490264892578, 0.004555702209472656, 0.005940914154052734, 0.0073261260986328125, 0.00871133804321289, 0.010096549987792969, 0.011481761932373047, 0.012866973876953125, 0.014252185821533203, 0.01563739776611328, 0.01702260971069336, 0.018407821655273438, 0.019793033599853516, 0.021178245544433594, 0.022563457489013672, 0.02394866943359375, 0.025333881378173828, 0.026719093322753906, 0.028104305267333984, 0.029489517211914062, 0.03087472915649414, 0.03225994110107422, 0.0336451530456543, 0.035030364990234375, 0.03641557693481445, 0.03780078887939453, 0.03918600082397461, 0.04057121276855469, 0.041956424713134766, 0.043341636657714844, 0.04472684860229492, 0.046112060546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 16.0, 19.0, 28.0, 41.0, 49.0, 85.0, 152.0, 243.0, 447.0, 879.0, 1870.0, 5242.0, 19394.0, 90482.0, 428159.0, 393802.0, 81557.0, 17528.0, 4867.0, 1843.0, 784.0, 451.0, 263.0, 136.0, 70.0, 52.0, 38.0, 19.0, 10.0, 6.0, 2.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12103271484375, -0.11526012420654297, -0.10948753356933594, -0.1037149429321289, -0.09794235229492188, -0.09216976165771484, -0.08639717102050781, -0.08062458038330078, -0.07485198974609375, -0.06907939910888672, -0.06330680847167969, -0.057534217834472656, -0.051761627197265625, -0.045989036560058594, -0.04021644592285156, -0.03444385528564453, -0.0286712646484375, -0.02289867401123047, -0.017126083374023438, -0.011353492736816406, -0.005580902099609375, 0.00019168853759765625, 0.0059642791748046875, 0.011736869812011719, 0.01750946044921875, 0.02328205108642578, 0.029054641723632812, 0.034827232360839844, 0.040599822998046875, 0.046372413635253906, 0.05214500427246094, 0.05791759490966797, 0.063690185546875, 0.06946277618408203, 0.07523536682128906, 0.0810079574584961, 0.08678054809570312, 0.09255313873291016, 0.09832572937011719, 0.10409832000732422, 0.10987091064453125, 0.11564350128173828, 0.12141609191894531, 0.12718868255615234, 0.13296127319335938, 0.1387338638305664, 0.14450645446777344, 0.15027904510498047, 0.1560516357421875, 0.16182422637939453, 0.16759681701660156, 0.1733694076538086, 0.17914199829101562, 0.18491458892822266, 0.1906871795654297, 0.19645977020263672, 0.20223236083984375, 0.20800495147705078, 0.2137775421142578, 0.21955013275146484, 0.22532272338867188, 0.2310953140258789, 0.23686790466308594, 0.24264049530029297, 0.2484130859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 8.0, 8.0, 10.0, 22.0, 15.0, 15.0, 25.0, 24.0, 38.0, 35.0, 36.0, 46.0, 50.0, 52.0, 52.0, 43.0, 57.0, 41.0, 63.0, 52.0, 43.0, 35.0, 36.0, 33.0, 29.0, 29.0, 24.0, 22.0, 12.0, 9.0, 5.0, 12.0, 3.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11395263671875, -0.1092233657836914, -0.10449409484863281, -0.09976482391357422, -0.09503555297851562, -0.09030628204345703, -0.08557701110839844, -0.08084774017333984, -0.07611846923828125, -0.07138919830322266, -0.06665992736816406, -0.06193065643310547, -0.057201385498046875, -0.05247211456298828, -0.04774284362792969, -0.043013572692871094, -0.0382843017578125, -0.033555030822753906, -0.028825759887695312, -0.02409648895263672, -0.019367218017578125, -0.014637947082519531, -0.009908676147460938, -0.005179405212402344, -0.00045013427734375, 0.004279136657714844, 0.009008407592773438, 0.013737678527832031, 0.018466949462890625, 0.02319622039794922, 0.027925491333007812, 0.032654762268066406, 0.037384033203125, 0.042113304138183594, 0.04684257507324219, 0.05157184600830078, 0.056301116943359375, 0.06103038787841797, 0.06575965881347656, 0.07048892974853516, 0.07521820068359375, 0.07994747161865234, 0.08467674255371094, 0.08940601348876953, 0.09413528442382812, 0.09886455535888672, 0.10359382629394531, 0.1083230972290039, 0.1130523681640625, 0.1177816390991211, 0.12251091003417969, 0.12724018096923828, 0.13196945190429688, 0.13669872283935547, 0.14142799377441406, 0.14615726470947266, 0.15088653564453125, 0.15561580657958984, 0.16034507751464844, 0.16507434844970703, 0.16980361938476562, 0.17453289031982422, 0.1792621612548828, 0.1839914321899414, 0.188720703125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 5.0, 6.0, 21.0, 28.0, 37.0, 54.0, 92.0, 142.0, 221.0, 324.0, 590.0, 1064.0, 1897.0, 3868.0, 8177.0, 20205.0, 62332.0, 258846.0, 478556.0, 146678.0, 38714.0, 14047.0, 6157.0, 2944.0, 1480.0, 820.0, 472.0, 274.0, 174.0, 117.0, 64.0, 44.0, 31.0, 23.0, 12.0, 14.0, 9.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.059539794921875, -0.057436466217041016, -0.05533313751220703, -0.05322980880737305, -0.05112648010253906, -0.04902315139770508, -0.046919822692871094, -0.04481649398803711, -0.042713165283203125, -0.04060983657836914, -0.038506507873535156, -0.03640317916870117, -0.03429985046386719, -0.0321965217590332, -0.03009319305419922, -0.027989864349365234, -0.02588653564453125, -0.023783206939697266, -0.02167987823486328, -0.019576549530029297, -0.017473220825195312, -0.015369892120361328, -0.013266563415527344, -0.01116323471069336, -0.009059906005859375, -0.006956577301025391, -0.004853248596191406, -0.002749919891357422, -0.0006465911865234375, 0.0014567375183105469, 0.0035600662231445312, 0.005663394927978516, 0.0077667236328125, 0.009870052337646484, 0.011973381042480469, 0.014076709747314453, 0.016180038452148438, 0.018283367156982422, 0.020386695861816406, 0.02249002456665039, 0.024593353271484375, 0.02669668197631836, 0.028800010681152344, 0.030903339385986328, 0.03300666809082031, 0.0351099967956543, 0.03721332550048828, 0.039316654205322266, 0.04141998291015625, 0.043523311614990234, 0.04562664031982422, 0.0477299690246582, 0.04983329772949219, 0.05193662643432617, 0.054039955139160156, 0.05614328384399414, 0.058246612548828125, 0.06034994125366211, 0.062453269958496094, 0.06455659866333008, 0.06665992736816406, 0.06876325607299805, 0.07086658477783203, 0.07296991348266602, 0.0750732421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 5.0, 8.0, 6.0, 11.0, 13.0, 29.0, 39.0, 38.0, 66.0, 70.0, 81.0, 86.0, 99.0, 102.0, 87.0, 76.0, 58.0, 27.0, 32.0, 19.0, 16.0, 11.0, 8.0, 9.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.218650817871094e-05, -3.080815076828003e-05, -2.942979335784912e-05, -2.8051435947418213e-05, -2.6673078536987305e-05, -2.5294721126556396e-05, -2.3916363716125488e-05, -2.253800630569458e-05, -2.1159648895263672e-05, -1.9781291484832764e-05, -1.8402934074401855e-05, -1.7024576663970947e-05, -1.564621925354004e-05, -1.4267861843109131e-05, -1.2889504432678223e-05, -1.1511147022247314e-05, -1.0132789611816406e-05, -8.754432201385498e-06, -7.37607479095459e-06, -5.997717380523682e-06, -4.6193599700927734e-06, -3.2410025596618652e-06, -1.862645149230957e-06, -4.842877388000488e-07, 8.940696716308594e-07, 2.2724270820617676e-06, 3.6507844924926758e-06, 5.029141902923584e-06, 6.407499313354492e-06, 7.7858567237854e-06, 9.164214134216309e-06, 1.0542571544647217e-05, 1.1920928955078125e-05, 1.3299286365509033e-05, 1.4677643775939941e-05, 1.605600118637085e-05, 1.7434358596801758e-05, 1.8812716007232666e-05, 2.0191073417663574e-05, 2.1569430828094482e-05, 2.294778823852539e-05, 2.43261456489563e-05, 2.5704503059387207e-05, 2.7082860469818115e-05, 2.8461217880249023e-05, 2.983957529067993e-05, 3.121793270111084e-05, 3.259629011154175e-05, 3.3974647521972656e-05, 3.5353004932403564e-05, 3.673136234283447e-05, 3.810971975326538e-05, 3.948807716369629e-05, 4.08664345741272e-05, 4.2244791984558105e-05, 4.3623149394989014e-05, 4.500150680541992e-05, 4.637986421585083e-05, 4.775822162628174e-05, 4.9136579036712646e-05, 5.0514936447143555e-05, 5.189329385757446e-05, 5.327165126800537e-05, 5.465000867843628e-05, 5.602836608886719e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 10.0, 7.0, 9.0, 12.0, 12.0, 30.0, 55.0, 73.0, 127.0, 239.0, 346.0, 739.0, 1440.0, 3248.0, 8354.0, 25193.0, 112008.0, 573650.0, 256185.0, 44735.0, 12963.0, 4837.0, 2065.0, 998.0, 494.0, 281.0, 158.0, 90.0, 63.0, 35.0, 30.0, 16.0, 16.0, 10.0, 9.0, 0.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080322265625, -0.07752513885498047, -0.07472801208496094, -0.0719308853149414, -0.06913375854492188, -0.06633663177490234, -0.06353950500488281, -0.06074237823486328, -0.05794525146484375, -0.05514812469482422, -0.05235099792480469, -0.049553871154785156, -0.046756744384765625, -0.043959617614746094, -0.04116249084472656, -0.03836536407470703, -0.0355682373046875, -0.03277111053466797, -0.029973983764648438, -0.027176856994628906, -0.024379730224609375, -0.021582603454589844, -0.018785476684570312, -0.01598834991455078, -0.01319122314453125, -0.010394096374511719, -0.0075969696044921875, -0.004799842834472656, -0.002002716064453125, 0.0007944107055664062, 0.0035915374755859375, 0.006388664245605469, 0.009185791015625, 0.011982917785644531, 0.014780044555664062, 0.017577171325683594, 0.020374298095703125, 0.023171424865722656, 0.025968551635742188, 0.02876567840576172, 0.03156280517578125, 0.03435993194580078, 0.03715705871582031, 0.039954185485839844, 0.042751312255859375, 0.045548439025878906, 0.04834556579589844, 0.05114269256591797, 0.0539398193359375, 0.05673694610595703, 0.05953407287597656, 0.062331199645996094, 0.06512832641601562, 0.06792545318603516, 0.07072257995605469, 0.07351970672607422, 0.07631683349609375, 0.07911396026611328, 0.08191108703613281, 0.08470821380615234, 0.08750534057617188, 0.0903024673461914, 0.09309959411621094, 0.09589672088623047, 0.09869384765625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 10.0, 7.0, 13.0, 12.0, 24.0, 29.0, 51.0, 59.0, 77.0, 93.0, 88.0, 109.0, 87.0, 66.0, 77.0, 61.0, 29.0, 24.0, 26.0, 13.0, 9.0, 10.0, 6.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056732177734375, -0.05472898483276367, -0.052725791931152344, -0.050722599029541016, -0.04871940612792969, -0.04671621322631836, -0.04471302032470703, -0.0427098274230957, -0.040706634521484375, -0.03870344161987305, -0.03670024871826172, -0.03469705581665039, -0.03269386291503906, -0.030690670013427734, -0.028687477111816406, -0.026684284210205078, -0.02468109130859375, -0.022677898406982422, -0.020674705505371094, -0.018671512603759766, -0.016668319702148438, -0.01466512680053711, -0.012661933898925781, -0.010658740997314453, -0.008655548095703125, -0.006652355194091797, -0.004649162292480469, -0.0026459693908691406, -0.0006427764892578125, 0.0013604164123535156, 0.0033636093139648438, 0.005366802215576172, 0.0073699951171875, 0.009373188018798828, 0.011376380920410156, 0.013379573822021484, 0.015382766723632812, 0.01738595962524414, 0.01938915252685547, 0.021392345428466797, 0.023395538330078125, 0.025398731231689453, 0.02740192413330078, 0.02940511703491211, 0.03140830993652344, 0.033411502838134766, 0.035414695739746094, 0.03741788864135742, 0.03942108154296875, 0.04142427444458008, 0.043427467346191406, 0.045430660247802734, 0.04743385314941406, 0.04943704605102539, 0.05144023895263672, 0.05344343185424805, 0.055446624755859375, 0.0574498176574707, 0.05945301055908203, 0.06145620346069336, 0.06345939636230469, 0.06546258926391602, 0.06746578216552734, 0.06946897506713867, 0.07147216796875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 8.0, 16.0, 26.0, 51.0, 48.0, 68.0, 118.0, 113.0, 126.0, 104.0, 96.0, 73.0, 42.0, 34.0, 27.0, 16.0, 6.0, 4.0, 5.0, 4.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.873810887336731, -0.844957172870636, -0.816103458404541, -0.787249743938446, -0.7583960294723511, -0.7295423746109009, -0.7006886601448059, -0.6718349456787109, -0.642981231212616, -0.614127516746521, -0.585273802280426, -0.556420087814331, -0.5275664329528809, -0.4987126886844635, -0.4698590040206909, -0.44100528955459595, -0.412151575088501, -0.383297860622406, -0.35444414615631104, -0.32559046149253845, -0.2967367470264435, -0.2678830325603485, -0.23902933299541473, -0.21017563343048096, -0.181321918964386, -0.15246820449829102, -0.12361450493335724, -0.09476079791784286, -0.06590709090232849, -0.03705337643623352, -0.008199676871299744, 0.020654022693634033, 0.049507737159729004, 0.07836144417524338, 0.10721515119075775, 0.13606885075569153, 0.1649225652217865, 0.19377627968788147, 0.22262997925281525, 0.251483678817749, 0.280337393283844, 0.30919110774993896, 0.33804482221603394, 0.3668985068798065, 0.3957522213459015, 0.42460593581199646, 0.45345962047576904, 0.482313334941864, 0.511167049407959, 0.540020763874054, 0.5688744783401489, 0.5977281928062439, 0.6265819072723389, 0.6554355621337891, 0.684289276599884, 0.713142991065979, 0.741996705532074, 0.770850419998169, 0.7997041344642639, 0.8285578489303589, 0.8574115037918091, 0.8862652778625488, 0.915118932723999, 0.943972647190094, 0.972826361656189]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 4.0, 12.0, 19.0, 7.0, 17.0, 20.0, 14.0, 37.0, 33.0, 41.0, 45.0, 52.0, 68.0, 60.0, 62.0, 58.0, 64.0, 65.0, 46.0, 44.0, 48.0, 42.0, 36.0, 30.0, 21.0, 10.0, 13.0, 8.0, 4.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9815332889556885, -0.9500988721847534, -0.9186645150184631, -0.8872301578521729, -0.8557957410812378, -0.8243613243103027, -0.7929269671440125, -0.7614926099777222, -0.7300581932067871, -0.698623776435852, -0.6671894192695618, -0.6357550621032715, -0.6043206453323364, -0.5728862285614014, -0.5414518713951111, -0.5100175142288208, -0.47858309745788574, -0.44714871048927307, -0.4157143235206604, -0.38427993655204773, -0.35284554958343506, -0.3214111626148224, -0.2899767756462097, -0.25854238867759705, -0.22710800170898438, -0.1956736147403717, -0.16423922777175903, -0.13280484080314636, -0.10137045383453369, -0.06993606686592102, -0.03850167989730835, -0.007067292928695679, 0.024367094039916992, 0.05580148100852966, 0.08723586797714233, 0.118670254945755, 0.15010464191436768, 0.18153902888298035, 0.21297341585159302, 0.2444078028202057, 0.27584218978881836, 0.30727657675743103, 0.3387109637260437, 0.37014535069465637, 0.40157973766326904, 0.4330141246318817, 0.4644485116004944, 0.49588289856910706, 0.5273172855377197, 0.5587517023086548, 0.5901860594749451, 0.6216204166412354, 0.6530548334121704, 0.6844892501831055, 0.7159236073493958, 0.747357964515686, 0.7787923812866211, 0.8102267980575562, 0.8416611552238464, 0.8730955123901367, 0.9045299291610718, 0.9359643459320068, 0.9673987030982971, 0.9988330602645874, 1.0302674770355225]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 11.0, 17.0, 28.0, 61.0, 70.0, 129.0, 233.0, 396.0, 770.0, 1397.0, 3074.0, 7296.0, 20248.0, 80001.0, 2480232.0, 1493597.0, 73408.0, 19405.0, 6990.0, 3150.0, 1539.0, 815.0, 482.0, 284.0, 203.0, 129.0, 76.0, 50.0, 32.0, 36.0, 24.0, 22.0, 15.0, 14.0, 7.0, 7.0, 4.0, 6.0, 1.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2025146484375, -0.1961822509765625, -0.189849853515625, -0.1835174560546875, -0.17718505859375, -0.1708526611328125, -0.164520263671875, -0.1581878662109375, -0.15185546875, -0.1455230712890625, -0.139190673828125, -0.1328582763671875, -0.12652587890625, -0.1201934814453125, -0.113861083984375, -0.1075286865234375, -0.1011962890625, -0.0948638916015625, -0.088531494140625, -0.0821990966796875, -0.07586669921875, -0.0695343017578125, -0.063201904296875, -0.0568695068359375, -0.050537109375, -0.0442047119140625, -0.037872314453125, -0.0315399169921875, -0.02520751953125, -0.0188751220703125, -0.012542724609375, -0.0062103271484375, 0.0001220703125, 0.0064544677734375, 0.012786865234375, 0.0191192626953125, 0.02545166015625, 0.0317840576171875, 0.038116455078125, 0.0444488525390625, 0.05078125, 0.0571136474609375, 0.063446044921875, 0.0697784423828125, 0.07611083984375, 0.0824432373046875, 0.088775634765625, 0.0951080322265625, 0.1014404296875, 0.1077728271484375, 0.114105224609375, 0.1204376220703125, 0.12677001953125, 0.1331024169921875, 0.139434814453125, 0.1457672119140625, 0.152099609375, 0.1584320068359375, 0.164764404296875, 0.1710968017578125, 0.17742919921875, 0.1837615966796875, 0.190093994140625, 0.1964263916015625, 0.2027587890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 9.0, 8.0, 11.0, 13.0, 28.0, 34.0, 51.0, 70.0, 70.0, 77.0, 86.0, 75.0, 95.0, 78.0, 81.0, 65.0, 34.0, 42.0, 15.0, 12.0, 11.0, 11.0, 10.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04193115234375, -0.04046344757080078, -0.03899574279785156, -0.037528038024902344, -0.036060333251953125, -0.034592628479003906, -0.03312492370605469, -0.03165721893310547, -0.03018951416015625, -0.02872180938720703, -0.027254104614257812, -0.025786399841308594, -0.024318695068359375, -0.022850990295410156, -0.021383285522460938, -0.01991558074951172, -0.0184478759765625, -0.01698017120361328, -0.015512466430664062, -0.014044761657714844, -0.012577056884765625, -0.011109352111816406, -0.009641647338867188, -0.008173942565917969, -0.00670623779296875, -0.005238533020019531, -0.0037708282470703125, -0.0023031234741210938, -0.000835418701171875, 0.0006322860717773438, 0.0020999908447265625, 0.0035676956176757812, 0.005035400390625, 0.006503105163574219, 0.007970809936523438, 0.009438514709472656, 0.010906219482421875, 0.012373924255371094, 0.013841629028320312, 0.015309333801269531, 0.01677703857421875, 0.01824474334716797, 0.019712448120117188, 0.021180152893066406, 0.022647857666015625, 0.024115562438964844, 0.025583267211914062, 0.02705097198486328, 0.0285186767578125, 0.02998638153076172, 0.03145408630371094, 0.032921791076660156, 0.034389495849609375, 0.035857200622558594, 0.03732490539550781, 0.03879261016845703, 0.04026031494140625, 0.04172801971435547, 0.04319572448730469, 0.044663429260253906, 0.046131134033203125, 0.047598838806152344, 0.04906654357910156, 0.05053424835205078, 0.052001953125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 11.0, 9.0, 17.0, 27.0, 33.0, 61.0, 89.0, 132.0, 218.0, 414.0, 701.0, 1310.0, 2748.0, 6122.0, 15746.0, 48169.0, 217607.0, 3215349.0, 562354.0, 83119.0, 23553.0, 8711.0, 3842.0, 1754.0, 904.0, 475.0, 282.0, 176.0, 99.0, 73.0, 45.0, 29.0, 31.0, 12.0, 6.0, 11.0, 5.0, 5.0, 2.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15880966186523438, -0.15380096435546875, -0.14879226684570312, -0.1437835693359375, -0.13877487182617188, -0.13376617431640625, -0.12875747680664062, -0.123748779296875, -0.11874008178710938, -0.11373138427734375, -0.10872268676757812, -0.1037139892578125, -0.09870529174804688, -0.09369659423828125, -0.08868789672851562, -0.08367919921875, -0.07867050170898438, -0.07366180419921875, -0.06865310668945312, -0.0636444091796875, -0.058635711669921875, -0.05362701416015625, -0.048618316650390625, -0.043609619140625, -0.038600921630859375, -0.03359222412109375, -0.028583526611328125, -0.0235748291015625, -0.018566131591796875, -0.01355743408203125, -0.008548736572265625, -0.0035400390625, 0.001468658447265625, 0.00647735595703125, 0.011486053466796875, 0.0164947509765625, 0.021503448486328125, 0.02651214599609375, 0.031520843505859375, 0.036529541015625, 0.041538238525390625, 0.04654693603515625, 0.051555633544921875, 0.0565643310546875, 0.061573028564453125, 0.06658172607421875, 0.07159042358398438, 0.07659912109375, 0.08160781860351562, 0.08661651611328125, 0.09162521362304688, 0.0966339111328125, 0.10164260864257812, 0.10665130615234375, 0.11166000366210938, 0.116668701171875, 0.12167739868164062, 0.12668609619140625, 0.13169479370117188, 0.1367034912109375, 0.14171218872070312, 0.14672088623046875, 0.15172958374023438, 0.15673828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 0.0, 6.0, 6.0, 5.0, 8.0, 13.0, 13.0, 17.0, 32.0, 34.0, 30.0, 38.0, 63.0, 103.0, 147.0, 267.0, 609.0, 1355.0, 563.0, 281.0, 130.0, 91.0, 56.0, 52.0, 30.0, 28.0, 25.0, 16.0, 12.0, 13.0, 7.0, 8.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046417236328125, -0.04452180862426758, -0.042626380920410156, -0.040730953216552734, -0.03883552551269531, -0.03694009780883789, -0.03504467010498047, -0.03314924240112305, -0.031253814697265625, -0.029358386993408203, -0.02746295928955078, -0.02556753158569336, -0.023672103881835938, -0.021776676177978516, -0.019881248474121094, -0.017985820770263672, -0.01609039306640625, -0.014194965362548828, -0.012299537658691406, -0.010404109954833984, -0.008508682250976562, -0.006613254547119141, -0.004717826843261719, -0.002822399139404297, -0.000926971435546875, 0.0009684562683105469, 0.0028638839721679688, 0.004759311676025391, 0.0066547393798828125, 0.008550167083740234, 0.010445594787597656, 0.012341022491455078, 0.0142364501953125, 0.016131877899169922, 0.018027305603027344, 0.019922733306884766, 0.021818161010742188, 0.02371358871459961, 0.02560901641845703, 0.027504444122314453, 0.029399871826171875, 0.0312952995300293, 0.03319072723388672, 0.03508615493774414, 0.03698158264160156, 0.038877010345458984, 0.040772438049316406, 0.04266786575317383, 0.04456329345703125, 0.04645872116088867, 0.048354148864746094, 0.050249576568603516, 0.05214500427246094, 0.05404043197631836, 0.05593585968017578, 0.0578312873840332, 0.059726715087890625, 0.06162214279174805, 0.06351757049560547, 0.06541299819946289, 0.06730842590332031, 0.06920385360717773, 0.07109928131103516, 0.07299470901489258, 0.07489013671875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 3.0, 6.0, 8.0, 9.0, 22.0, 52.0, 73.0, 118.0, 153.0, 161.0, 135.0, 103.0, 72.0, 44.0, 21.0, 7.0, 9.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5998169183731079, -0.5819693803787231, -0.5641219019889832, -0.5462743639945984, -0.5284268856048584, -0.5105793476104736, -0.49273183941841125, -0.4748843312263489, -0.4570368230342865, -0.4391893148422241, -0.42134180665016174, -0.40349429845809937, -0.3856467604637146, -0.3677992820739746, -0.34995174407958984, -0.33210423588752747, -0.3142567276954651, -0.2964092195034027, -0.27856171131134033, -0.26071420311927795, -0.24286668002605438, -0.225019171833992, -0.20717164874076843, -0.18932414054870605, -0.17147663235664368, -0.1536291241645813, -0.13578161597251892, -0.11793409287929535, -0.10008658468723297, -0.0822390764951706, -0.06439156085252762, -0.046544045209884644, -0.028696537017822266, -0.01084902510046959, 0.006998486816883087, 0.024845998734235764, 0.04269351065158844, 0.06054101884365082, 0.07838853448629379, 0.09623605012893677, 0.11408355832099915, 0.13193106651306152, 0.1497785747051239, 0.16762609779834747, 0.18547360599040985, 0.20332111418247223, 0.2211686372756958, 0.23901614546775818, 0.25686365365982056, 0.27471116185188293, 0.2925586700439453, 0.3104061782360077, 0.32825368642807007, 0.34610122442245483, 0.3639487326145172, 0.3817962408065796, 0.39964374899864197, 0.41749125719070435, 0.4353387653827667, 0.4531862735748291, 0.47103381156921387, 0.48888128995895386, 0.5067288279533386, 0.5245763063430786, 0.5424238443374634]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 6.0, 8.0, 12.0, 8.0, 19.0, 12.0, 18.0, 25.0, 35.0, 37.0, 36.0, 55.0, 52.0, 47.0, 46.0, 53.0, 62.0, 45.0, 53.0, 44.0, 42.0, 33.0, 35.0, 40.0, 30.0, 25.0, 33.0, 26.0, 10.0, 10.0, 12.0, 7.0, 7.0, 3.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29416346549987793, -0.28543680906295776, -0.2767101526260376, -0.26798349618911743, -0.25925686955451965, -0.2505302131175995, -0.24180355668067932, -0.23307690024375916, -0.224350243806839, -0.21562358736991882, -0.20689694583415985, -0.19817028939723969, -0.18944363296031952, -0.18071699142456055, -0.17199033498764038, -0.16326367855072021, -0.15453703701496124, -0.14581038057804108, -0.1370837390422821, -0.12835708260536194, -0.11963042616844177, -0.1109037771821022, -0.10217712819576263, -0.09345047175884247, -0.0847238227725029, -0.07599717378616333, -0.06727051734924316, -0.058543868362903595, -0.04981721565127373, -0.04109056293964386, -0.03236391395330429, -0.023637261241674423, -0.014910608530044556, -0.006183956749737263, 0.00254269503057003, 0.011269345879554749, 0.019995998591184616, 0.028722651302814484, 0.03744930028915405, 0.04617595300078392, 0.05490260571241379, 0.06362925469875336, 0.07235591113567352, 0.08108256012201309, 0.08980920910835266, 0.09853586554527283, 0.1072625145316124, 0.11598916351795197, 0.12471581995487213, 0.1334424763917923, 0.14216911792755127, 0.15089577436447144, 0.1596224308013916, 0.16834908723831177, 0.17707572877407074, 0.1858023852109909, 0.19452902674674988, 0.20325568318367004, 0.21198232471942902, 0.22070898115634918, 0.22943563759326935, 0.23816227912902832, 0.2468889355659485, 0.25561559200286865, 0.2643422484397888]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 9.0, 16.0, 10.0, 27.0, 35.0, 51.0, 68.0, 127.0, 148.0, 272.0, 471.0, 871.0, 1823.0, 4366.0, 11561.0, 34540.0, 127757.0, 531695.0, 246043.0, 58908.0, 17974.0, 6456.0, 2602.0, 1182.0, 590.0, 318.0, 207.0, 125.0, 84.0, 58.0, 43.0, 23.0, 19.0, 17.0, 14.0, 5.0, 5.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.233154296875, -0.22623825073242188, -0.21932220458984375, -0.21240615844726562, -0.2054901123046875, -0.19857406616210938, -0.19165802001953125, -0.18474197387695312, -0.177825927734375, -0.17090988159179688, -0.16399383544921875, -0.15707778930664062, -0.1501617431640625, -0.14324569702148438, -0.13632965087890625, -0.12941360473632812, -0.12249755859375, -0.11558151245117188, -0.10866546630859375, -0.10174942016601562, -0.0948333740234375, -0.08791732788085938, -0.08100128173828125, -0.07408523559570312, -0.067169189453125, -0.060253143310546875, -0.05333709716796875, -0.046421051025390625, -0.0395050048828125, -0.032588958740234375, -0.02567291259765625, -0.018756866455078125, -0.0118408203125, -0.004924774169921875, 0.00199127197265625, 0.008907318115234375, 0.0158233642578125, 0.022739410400390625, 0.02965545654296875, 0.036571502685546875, 0.043487548828125, 0.050403594970703125, 0.05731964111328125, 0.06423568725585938, 0.0711517333984375, 0.07806777954101562, 0.08498382568359375, 0.09189987182617188, 0.09881591796875, 0.10573196411132812, 0.11264801025390625, 0.11956405639648438, 0.1264801025390625, 0.13339614868164062, 0.14031219482421875, 0.14722824096679688, 0.154144287109375, 0.16106033325195312, 0.16797637939453125, 0.17489242553710938, 0.1818084716796875, 0.18872451782226562, 0.19564056396484375, 0.20255661010742188, 0.20947265625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 12.0, 11.0, 13.0, 12.0, 25.0, 59.0, 53.0, 71.0, 81.0, 94.0, 89.0, 105.0, 83.0, 93.0, 57.0, 53.0, 26.0, 26.0, 8.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.053558349609375, -0.05197334289550781, -0.050388336181640625, -0.04880332946777344, -0.04721832275390625, -0.04563331604003906, -0.044048309326171875, -0.04246330261230469, -0.0408782958984375, -0.03929328918457031, -0.037708282470703125, -0.03612327575683594, -0.03453826904296875, -0.03295326232910156, -0.031368255615234375, -0.029783248901367188, -0.0281982421875, -0.026613235473632812, -0.025028228759765625, -0.023443222045898438, -0.02185821533203125, -0.020273208618164062, -0.018688201904296875, -0.017103195190429688, -0.0155181884765625, -0.013933181762695312, -0.012348175048828125, -0.010763168334960938, -0.00917816162109375, -0.0075931549072265625, -0.006008148193359375, -0.0044231414794921875, -0.002838134765625, -0.0012531280517578125, 0.000331878662109375, 0.0019168853759765625, 0.00350189208984375, 0.0050868988037109375, 0.006671905517578125, 0.008256912231445312, 0.0098419189453125, 0.011426925659179688, 0.013011932373046875, 0.014596939086914062, 0.01618194580078125, 0.017766952514648438, 0.019351959228515625, 0.020936965942382812, 0.02252197265625, 0.024106979370117188, 0.025691986083984375, 0.027276992797851562, 0.02886199951171875, 0.030447006225585938, 0.032032012939453125, 0.03361701965332031, 0.0352020263671875, 0.03678703308105469, 0.038372039794921875, 0.03995704650878906, 0.04154205322265625, 0.04312705993652344, 0.044712066650390625, 0.04629707336425781, 0.047882080078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 4.0, 11.0, 15.0, 21.0, 32.0, 51.0, 57.0, 86.0, 126.0, 158.0, 250.0, 409.0, 634.0, 999.0, 1620.0, 3030.0, 5454.0, 10959.0, 25133.0, 60753.0, 160726.0, 392742.0, 234775.0, 85844.0, 34184.0, 14697.0, 6975.0, 3489.0, 1961.0, 1157.0, 746.0, 449.0, 301.0, 207.0, 149.0, 82.0, 85.0, 55.0, 41.0, 24.0, 11.0, 12.0, 11.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11004638671875, -0.10620975494384766, -0.10237312316894531, -0.09853649139404297, -0.09469985961914062, -0.09086322784423828, -0.08702659606933594, -0.0831899642944336, -0.07935333251953125, -0.0755167007446289, -0.07168006896972656, -0.06784343719482422, -0.06400680541992188, -0.06017017364501953, -0.05633354187011719, -0.052496910095214844, -0.0486602783203125, -0.044823646545410156, -0.04098701477050781, -0.03715038299560547, -0.033313751220703125, -0.02947711944580078, -0.025640487670898438, -0.021803855895996094, -0.01796722412109375, -0.014130592346191406, -0.010293960571289062, -0.006457328796386719, -0.002620697021484375, 0.0012159347534179688, 0.0050525665283203125, 0.008889198303222656, 0.012725830078125, 0.016562461853027344, 0.020399093627929688, 0.02423572540283203, 0.028072357177734375, 0.03190898895263672, 0.03574562072753906, 0.039582252502441406, 0.04341888427734375, 0.047255516052246094, 0.05109214782714844, 0.05492877960205078, 0.058765411376953125, 0.06260204315185547, 0.06643867492675781, 0.07027530670166016, 0.0741119384765625, 0.07794857025146484, 0.08178520202636719, 0.08562183380126953, 0.08945846557617188, 0.09329509735107422, 0.09713172912597656, 0.1009683609008789, 0.10480499267578125, 0.1086416244506836, 0.11247825622558594, 0.11631488800048828, 0.12015151977539062, 0.12398815155029297, 0.1278247833251953, 0.13166141510009766, 0.135498046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 12.0, 14.0, 6.0, 12.0, 12.0, 25.0, 17.0, 22.0, 20.0, 26.0, 38.0, 36.0, 38.0, 36.0, 49.0, 54.0, 48.0, 54.0, 52.0, 41.0, 40.0, 48.0, 39.0, 37.0, 40.0, 37.0, 27.0, 32.0, 21.0, 11.0, 13.0, 14.0, 11.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1583251953125, -0.15381431579589844, -0.14930343627929688, -0.1447925567626953, -0.14028167724609375, -0.1357707977294922, -0.13125991821289062, -0.12674903869628906, -0.1222381591796875, -0.11772727966308594, -0.11321640014648438, -0.10870552062988281, -0.10419464111328125, -0.09968376159667969, -0.09517288208007812, -0.09066200256347656, -0.086151123046875, -0.08164024353027344, -0.07712936401367188, -0.07261848449707031, -0.06810760498046875, -0.06359672546386719, -0.059085845947265625, -0.05457496643066406, -0.0500640869140625, -0.04555320739746094, -0.041042327880859375, -0.03653144836425781, -0.03202056884765625, -0.027509689331054688, -0.022998809814453125, -0.018487930297851562, -0.01397705078125, -0.009466171264648438, -0.004955291748046875, -0.0004444122314453125, 0.00406646728515625, 0.008577346801757812, 0.013088226318359375, 0.017599105834960938, 0.0221099853515625, 0.026620864868164062, 0.031131744384765625, 0.03564262390136719, 0.04015350341796875, 0.04466438293457031, 0.049175262451171875, 0.05368614196777344, 0.058197021484375, 0.06270790100097656, 0.06721878051757812, 0.07172966003417969, 0.07624053955078125, 0.08075141906738281, 0.08526229858398438, 0.08977317810058594, 0.0942840576171875, 0.09879493713378906, 0.10330581665039062, 0.10781669616699219, 0.11232757568359375, 0.11683845520019531, 0.12134933471679688, 0.12586021423339844, 0.13037109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 10.0, 8.0, 19.0, 16.0, 21.0, 42.0, 77.0, 140.0, 269.0, 456.0, 863.0, 1595.0, 3412.0, 7972.0, 22199.0, 95983.0, 586159.0, 263334.0, 43231.0, 12686.0, 5011.0, 2356.0, 1237.0, 634.0, 320.0, 174.0, 117.0, 76.0, 47.0, 33.0, 14.0, 7.0, 13.0, 12.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1363525390625, -0.13231277465820312, -0.12827301025390625, -0.12423324584960938, -0.1201934814453125, -0.11615371704101562, -0.11211395263671875, -0.10807418823242188, -0.104034423828125, -0.09999465942382812, -0.09595489501953125, -0.09191513061523438, -0.0878753662109375, -0.08383560180664062, -0.07979583740234375, -0.07575607299804688, -0.07171630859375, -0.06767654418945312, -0.06363677978515625, -0.059597015380859375, -0.0555572509765625, -0.051517486572265625, -0.04747772216796875, -0.043437957763671875, -0.039398193359375, -0.035358428955078125, -0.03131866455078125, -0.027278900146484375, -0.0232391357421875, -0.019199371337890625, -0.01515960693359375, -0.011119842529296875, -0.007080078125, -0.003040313720703125, 0.00099945068359375, 0.005039215087890625, 0.0090789794921875, 0.013118743896484375, 0.01715850830078125, 0.021198272705078125, 0.025238037109375, 0.029277801513671875, 0.03331756591796875, 0.037357330322265625, 0.0413970947265625, 0.045436859130859375, 0.04947662353515625, 0.053516387939453125, 0.05755615234375, 0.061595916748046875, 0.06563568115234375, 0.06967544555664062, 0.0737152099609375, 0.07775497436523438, 0.08179473876953125, 0.08583450317382812, 0.089874267578125, 0.09391403198242188, 0.09795379638671875, 0.10199356079101562, 0.1060333251953125, 0.11007308959960938, 0.11411285400390625, 0.11815261840820312, 0.1221923828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 8.0, 8.0, 2.0, 7.0, 7.0, 15.0, 25.0, 32.0, 46.0, 45.0, 73.0, 94.0, 88.0, 87.0, 87.0, 84.0, 60.0, 51.0, 54.0, 48.0, 22.0, 15.0, 20.0, 12.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.64320182800293e-05, -4.516635090112686e-05, -4.3900683522224426e-05, -4.263501614332199e-05, -4.1369348764419556e-05, -4.010368138551712e-05, -3.8838014006614685e-05, -3.757234662771225e-05, -3.6306679248809814e-05, -3.504101186990738e-05, -3.3775344491004944e-05, -3.250967711210251e-05, -3.124400973320007e-05, -2.9978342354297638e-05, -2.8712674975395203e-05, -2.7447007596492767e-05, -2.6181340217590332e-05, -2.4915672838687897e-05, -2.365000545978546e-05, -2.2384338080883026e-05, -2.111867070198059e-05, -1.9853003323078156e-05, -1.858733594417572e-05, -1.7321668565273285e-05, -1.605600118637085e-05, -1.4790333807468414e-05, -1.3524666428565979e-05, -1.2258999049663544e-05, -1.0993331670761108e-05, -9.727664291858673e-06, -8.461996912956238e-06, -7.1963295340538025e-06, -5.930662155151367e-06, -4.664994776248932e-06, -3.3993273973464966e-06, -2.1336600184440613e-06, -8.67992639541626e-07, 3.976747393608093e-07, 1.6633421182632446e-06, 2.92900949716568e-06, 4.194676876068115e-06, 5.4603442549705505e-06, 6.726011633872986e-06, 7.991679012775421e-06, 9.257346391677856e-06, 1.0523013770580292e-05, 1.1788681149482727e-05, 1.3054348528385162e-05, 1.4320015907287598e-05, 1.5585683286190033e-05, 1.6851350665092468e-05, 1.8117018043994904e-05, 1.938268542289734e-05, 2.0648352801799774e-05, 2.191402018070221e-05, 2.3179687559604645e-05, 2.444535493850708e-05, 2.5711022317409515e-05, 2.697668969631195e-05, 2.8242357075214386e-05, 2.950802445411682e-05, 3.0773691833019257e-05, 3.203935921192169e-05, 3.330502659082413e-05, 3.457069396972656e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 13.0, 13.0, 20.0, 29.0, 46.0, 45.0, 80.0, 118.0, 199.0, 347.0, 602.0, 1313.0, 2903.0, 7025.0, 21087.0, 87356.0, 557240.0, 298482.0, 48954.0, 13447.0, 4935.0, 2085.0, 961.0, 519.0, 267.0, 175.0, 92.0, 67.0, 38.0, 30.0, 15.0, 20.0, 10.0, 6.0, 8.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1343994140625, -0.13074874877929688, -0.12709808349609375, -0.12344741821289062, -0.1197967529296875, -0.11614608764648438, -0.11249542236328125, -0.10884475708007812, -0.105194091796875, -0.10154342651367188, -0.09789276123046875, -0.09424209594726562, -0.0905914306640625, -0.08694076538085938, -0.08329010009765625, -0.07963943481445312, -0.07598876953125, -0.07233810424804688, -0.06868743896484375, -0.06503677368164062, -0.0613861083984375, -0.057735443115234375, -0.05408477783203125, -0.050434112548828125, -0.046783447265625, -0.043132781982421875, -0.03948211669921875, -0.035831451416015625, -0.0321807861328125, -0.028530120849609375, -0.02487945556640625, -0.021228790283203125, -0.017578125, -0.013927459716796875, -0.01027679443359375, -0.006626129150390625, -0.0029754638671875, 0.000675201416015625, 0.00432586669921875, 0.007976531982421875, 0.011627197265625, 0.015277862548828125, 0.01892852783203125, 0.022579193115234375, 0.0262298583984375, 0.029880523681640625, 0.03353118896484375, 0.037181854248046875, 0.04083251953125, 0.044483184814453125, 0.04813385009765625, 0.051784515380859375, 0.0554351806640625, 0.059085845947265625, 0.06273651123046875, 0.06638717651367188, 0.070037841796875, 0.07368850708007812, 0.07733917236328125, 0.08098983764648438, 0.0846405029296875, 0.08829116821289062, 0.09194183349609375, 0.09559249877929688, 0.0992431640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 7.0, 8.0, 12.0, 12.0, 12.0, 23.0, 27.0, 39.0, 65.0, 103.0, 141.0, 148.0, 125.0, 76.0, 53.0, 31.0, 21.0, 20.0, 15.0, 11.0, 13.0, 6.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09014892578125, -0.08706188201904297, -0.08397483825683594, -0.0808877944946289, -0.07780075073242188, -0.07471370697021484, -0.07162666320800781, -0.06853961944580078, -0.06545257568359375, -0.06236553192138672, -0.05927848815917969, -0.056191444396972656, -0.053104400634765625, -0.050017356872558594, -0.04693031311035156, -0.04384326934814453, -0.0407562255859375, -0.03766918182373047, -0.03458213806152344, -0.031495094299316406, -0.028408050537109375, -0.025321006774902344, -0.022233963012695312, -0.01914691925048828, -0.01605987548828125, -0.012972831726074219, -0.009885787963867188, -0.006798744201660156, -0.003711700439453125, -0.0006246566772460938, 0.0024623870849609375, 0.005549430847167969, 0.008636474609375, 0.011723518371582031, 0.014810562133789062, 0.017897605895996094, 0.020984649658203125, 0.024071693420410156, 0.027158737182617188, 0.03024578094482422, 0.03333282470703125, 0.03641986846923828, 0.03950691223144531, 0.042593955993652344, 0.045680999755859375, 0.048768043518066406, 0.05185508728027344, 0.05494213104248047, 0.0580291748046875, 0.06111621856689453, 0.06420326232910156, 0.0672903060913086, 0.07037734985351562, 0.07346439361572266, 0.07655143737792969, 0.07963848114013672, 0.08272552490234375, 0.08581256866455078, 0.08889961242675781, 0.09198665618896484, 0.09507369995117188, 0.0981607437133789, 0.10124778747558594, 0.10433483123779297, 0.107421875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 8.0, 17.0, 17.0, 42.0, 49.0, 73.0, 111.0, 155.0, 161.0, 135.0, 82.0, 59.0, 26.0, 23.0, 17.0, 13.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6204460859298706, -1.5788004398345947, -1.5371546745300293, -1.4955090284347534, -1.4538633823394775, -1.4122177362442017, -1.3705719709396362, -1.3289263248443604, -1.2872806787490845, -1.2456350326538086, -1.2039892673492432, -1.1623436212539673, -1.1206979751586914, -1.0790523290634155, -1.03740656375885, -0.9957609176635742, -0.9541152119636536, -0.9124695062637329, -0.870823860168457, -0.8291781544685364, -0.7875325083732605, -0.7458868026733398, -0.704241156578064, -0.6625954508781433, -0.6209497451782227, -0.579304039478302, -0.5376583933830261, -0.49601268768310547, -0.4543670415878296, -0.41272133588790894, -0.37107565999031067, -0.3294299840927124, -0.2877843379974365, -0.24613866209983826, -0.20449298620224, -0.16284729540348053, -0.12120161950588226, -0.079555943608284, -0.037910252809524536, 0.0037354230880737305, 0.045381098985672, 0.08702677488327026, 0.12867245078086853, 0.170318141579628, 0.21196381747722626, 0.25360947847366333, 0.295255184173584, 0.33690086007118225, 0.3785465359687805, 0.4201922118663788, 0.46183788776397705, 0.5034835934638977, 0.5451292395591736, 0.5867749452590942, 0.6284205913543701, 0.6700662970542908, 0.7117120027542114, 0.7533577084541321, 0.795003354549408, 0.8366490602493286, 0.8782947063446045, 0.9199404120445251, 0.9615861177444458, 1.0032317638397217, 1.0448774099349976]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 5.0, 4.0, 2.0, 5.0, 10.0, 7.0, 16.0, 17.0, 17.0, 19.0, 21.0, 25.0, 20.0, 37.0, 31.0, 35.0, 43.0, 53.0, 43.0, 44.0, 49.0, 50.0, 51.0, 58.0, 47.0, 29.0, 33.0, 20.0, 28.0, 23.0, 26.0, 15.0, 23.0, 10.0, 13.0, 12.0, 11.0, 14.0, 8.0, 6.0, 7.0, 8.0, 3.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0], "bins": [-0.834596574306488, -0.8115134835243225, -0.788430392742157, -0.7653473019599915, -0.7422642111778259, -0.7191811203956604, -0.6960979700088501, -0.6730148792266846, -0.649931788444519, -0.6268486976623535, -0.603765606880188, -0.5806825160980225, -0.5575994253158569, -0.5345163345336914, -0.5114332437515259, -0.48835012316703796, -0.4652670621871948, -0.4421839714050293, -0.41910088062286377, -0.39601778984069824, -0.3729346990585327, -0.3498516082763672, -0.3267684876918793, -0.30368539690971375, -0.2806023061275482, -0.2575192153453827, -0.23443612456321716, -0.21135301887989044, -0.18826992809772491, -0.1651868373155594, -0.14210373163223267, -0.11902064085006714, -0.09593760967254639, -0.07285451889038086, -0.049771420657634735, -0.02668832242488861, -0.0036052316427230835, 0.019477859139442444, 0.042560964822769165, 0.06564405560493469, 0.08872714638710022, 0.11181023716926575, 0.13489332795143127, 0.157976433634758, 0.18105952441692352, 0.20414261519908905, 0.22722572088241577, 0.2503088116645813, 0.2733919024467468, 0.29647499322891235, 0.3195580840110779, 0.3426411747932434, 0.36572426557540894, 0.38880735635757446, 0.4118904769420624, 0.4349735677242279, 0.45805665850639343, 0.48113974928855896, 0.5042228698730469, 0.5273059606552124, 0.5503890514373779, 0.5734721422195435, 0.596555233001709, 0.6196383237838745, 0.64272141456604]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 24.0, 27.0, 36.0, 89.0, 142.0, 224.0, 392.0, 735.0, 1417.0, 3398.0, 10741.0, 49887.0, 2565261.0, 1497441.0, 46888.0, 10646.0, 3518.0, 1538.0, 790.0, 416.0, 243.0, 143.0, 96.0, 58.0, 31.0, 26.0, 19.0, 8.0, 9.0, 6.0, 3.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.286865234375, -0.27889442443847656, -0.2709236145019531, -0.2629528045654297, -0.25498199462890625, -0.2470111846923828, -0.23904037475585938, -0.23106956481933594, -0.2230987548828125, -0.21512794494628906, -0.20715713500976562, -0.1991863250732422, -0.19121551513671875, -0.1832447052001953, -0.17527389526367188, -0.16730308532714844, -0.159332275390625, -0.15136146545410156, -0.14339065551757812, -0.1354198455810547, -0.12744903564453125, -0.11947822570800781, -0.11150741577148438, -0.10353660583496094, -0.0955657958984375, -0.08759498596191406, -0.07962417602539062, -0.07165336608886719, -0.06368255615234375, -0.05571174621582031, -0.047740936279296875, -0.03977012634277344, -0.03179931640625, -0.023828506469726562, -0.015857696533203125, -0.007886886596679688, 8.392333984375e-05, 0.008054733276367188, 0.016025543212890625, 0.023996353149414062, 0.0319671630859375, 0.03993797302246094, 0.047908782958984375, 0.05587959289550781, 0.06385040283203125, 0.07182121276855469, 0.07979202270507812, 0.08776283264160156, 0.095733642578125, 0.10370445251464844, 0.11167526245117188, 0.11964607238769531, 0.12761688232421875, 0.1355876922607422, 0.14355850219726562, 0.15152931213378906, 0.1595001220703125, 0.16747093200683594, 0.17544174194335938, 0.1834125518798828, 0.19138336181640625, 0.1993541717529297, 0.20732498168945312, 0.21529579162597656, 0.2232666015625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 18.0, 23.0, 24.0, 30.0, 47.0, 79.0, 68.0, 87.0, 86.0, 82.0, 75.0, 81.0, 75.0, 57.0, 34.0, 30.0, 31.0, 13.0, 15.0, 12.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.050140380859375, -0.048645973205566406, -0.04715156555175781, -0.04565715789794922, -0.044162750244140625, -0.04266834259033203, -0.04117393493652344, -0.039679527282714844, -0.03818511962890625, -0.036690711975097656, -0.03519630432128906, -0.03370189666748047, -0.032207489013671875, -0.03071308135986328, -0.029218673706054688, -0.027724266052246094, -0.0262298583984375, -0.024735450744628906, -0.023241043090820312, -0.02174663543701172, -0.020252227783203125, -0.01875782012939453, -0.017263412475585938, -0.015769004821777344, -0.01427459716796875, -0.012780189514160156, -0.011285781860351562, -0.009791374206542969, -0.008296966552734375, -0.006802558898925781, -0.0053081512451171875, -0.0038137435913085938, -0.0023193359375, -0.0008249282836914062, 0.0006694793701171875, 0.0021638870239257812, 0.003658294677734375, 0.005152702331542969, 0.0066471099853515625, 0.008141517639160156, 0.00963592529296875, 0.011130332946777344, 0.012624740600585938, 0.014119148254394531, 0.015613555908203125, 0.01710796356201172, 0.018602371215820312, 0.020096778869628906, 0.0215911865234375, 0.023085594177246094, 0.024580001831054688, 0.02607440948486328, 0.027568817138671875, 0.02906322479248047, 0.030557632446289062, 0.032052040100097656, 0.03354644775390625, 0.035040855407714844, 0.03653526306152344, 0.03802967071533203, 0.039524078369140625, 0.04101848602294922, 0.04251289367675781, 0.044007301330566406, 0.045501708984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 8.0, 4.0, 9.0, 9.0, 11.0, 21.0, 17.0, 37.0, 53.0, 67.0, 109.0, 152.0, 296.0, 514.0, 1062.0, 2448.0, 7246.0, 31867.0, 283341.0, 3710269.0, 128691.0, 19264.0, 5036.0, 1842.0, 800.0, 421.0, 264.0, 133.0, 86.0, 64.0, 36.0, 32.0, 29.0, 18.0, 10.0, 6.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24853515625, -0.23976898193359375, -0.2310028076171875, -0.22223663330078125, -0.213470458984375, -0.20470428466796875, -0.1959381103515625, -0.18717193603515625, -0.17840576171875, -0.16963958740234375, -0.1608734130859375, -0.15210723876953125, -0.143341064453125, -0.13457489013671875, -0.1258087158203125, -0.11704254150390625, -0.1082763671875, -0.09951019287109375, -0.0907440185546875, -0.08197784423828125, -0.073211669921875, -0.06444549560546875, -0.0556793212890625, -0.04691314697265625, -0.03814697265625, -0.02938079833984375, -0.0206146240234375, -0.01184844970703125, -0.003082275390625, 0.00568389892578125, 0.0144500732421875, 0.02321624755859375, 0.031982421875, 0.04074859619140625, 0.0495147705078125, 0.05828094482421875, 0.067047119140625, 0.07581329345703125, 0.0845794677734375, 0.09334564208984375, 0.10211181640625, 0.11087799072265625, 0.1196441650390625, 0.12841033935546875, 0.137176513671875, 0.14594268798828125, 0.1547088623046875, 0.16347503662109375, 0.1722412109375, 0.18100738525390625, 0.1897735595703125, 0.19853973388671875, 0.207305908203125, 0.21607208251953125, 0.2248382568359375, 0.23360443115234375, 0.24237060546875, 0.25113677978515625, 0.2599029541015625, 0.26866912841796875, 0.277435302734375, 0.28620147705078125, 0.2949676513671875, 0.30373382568359375, 0.3125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 8.0, 8.0, 10.0, 35.0, 44.0, 74.0, 156.0, 383.0, 2331.0, 609.0, 178.0, 107.0, 68.0, 25.0, 16.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.13791370391845703, -0.13434791564941406, -0.1307821273803711, -0.12721633911132812, -0.12365055084228516, -0.12008476257324219, -0.11651897430419922, -0.11295318603515625, -0.10938739776611328, -0.10582160949707031, -0.10225582122802734, -0.09869003295898438, -0.0951242446899414, -0.09155845642089844, -0.08799266815185547, -0.0844268798828125, -0.08086109161376953, -0.07729530334472656, -0.0737295150756836, -0.07016372680664062, -0.06659793853759766, -0.06303215026855469, -0.05946636199951172, -0.05590057373046875, -0.05233478546142578, -0.04876899719238281, -0.045203208923339844, -0.041637420654296875, -0.038071632385253906, -0.03450584411621094, -0.03094005584716797, -0.027374267578125, -0.02380847930908203, -0.020242691040039062, -0.016676902770996094, -0.013111114501953125, -0.009545326232910156, -0.0059795379638671875, -0.0024137496948242188, 0.00115203857421875, 0.004717826843261719, 0.008283615112304688, 0.011849403381347656, 0.015415191650390625, 0.018980979919433594, 0.022546768188476562, 0.02611255645751953, 0.0296783447265625, 0.03324413299560547, 0.03680992126464844, 0.040375709533691406, 0.043941497802734375, 0.047507286071777344, 0.05107307434082031, 0.05463886260986328, 0.05820465087890625, 0.06177043914794922, 0.06533622741699219, 0.06890201568603516, 0.07246780395507812, 0.0760335922241211, 0.07959938049316406, 0.08316516876220703, 0.08673095703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 17.0, 15.0, 40.0, 60.0, 89.0, 117.0, 162.0, 144.0, 111.0, 98.0, 68.0, 28.0, 11.0, 15.0, 10.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5916775465011597, -0.5743805766105652, -0.5570836663246155, -0.539786696434021, -0.5224897861480713, -0.5051928162574768, -0.4878958463668823, -0.47059890627861023, -0.45330196619033813, -0.43600502610206604, -0.41870808601379395, -0.40141111612319946, -0.38411417603492737, -0.3668172359466553, -0.3495202660560608, -0.3322233259677887, -0.3149263858795166, -0.2976294457912445, -0.2803325057029724, -0.26303553581237793, -0.24573859572410583, -0.22844165563583374, -0.21114470064640045, -0.19384774565696716, -0.17655080556869507, -0.15925386548042297, -0.14195691049098969, -0.124659962952137, -0.1073630154132843, -0.09006606787443161, -0.07276912033557892, -0.05547217279672623, -0.03817516565322876, -0.020878218114376068, -0.0035812705755233765, 0.013715676963329315, 0.031012624502182007, 0.0483095720410347, 0.06560651957988739, 0.08290346711874008, 0.10020041465759277, 0.11749736219644547, 0.13479430973529816, 0.15209126472473145, 0.16938820481300354, 0.18668514490127563, 0.20398209989070892, 0.2212790548801422, 0.2385759949684143, 0.2558729350566864, 0.2731698751449585, 0.290466845035553, 0.3077637851238251, 0.32506072521209717, 0.34235769510269165, 0.35965463519096375, 0.37695157527923584, 0.39424851536750793, 0.41154545545578003, 0.4288424253463745, 0.4461393654346466, 0.4634363055229187, 0.4807332754135132, 0.4980302155017853, 0.5153271555900574]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 6.0, 5.0, 9.0, 10.0, 9.0, 11.0, 13.0, 12.0, 22.0, 38.0, 31.0, 26.0, 27.0, 31.0, 36.0, 43.0, 43.0, 45.0, 26.0, 47.0, 35.0, 49.0, 41.0, 42.0, 46.0, 32.0, 40.0, 37.0, 41.0, 23.0, 22.0, 13.0, 17.0, 11.0, 13.0, 10.0, 8.0, 7.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.25157982110977173, -0.24420452117919922, -0.2368292212486267, -0.2294539213180542, -0.2220786213874817, -0.21470332145690918, -0.20732800662517548, -0.19995270669460297, -0.19257740676403046, -0.18520210683345795, -0.17782680690288544, -0.17045150697231293, -0.16307619214057922, -0.1557008922100067, -0.1483255922794342, -0.1409502923488617, -0.13357499241828918, -0.12619969248771667, -0.11882439255714417, -0.11144908517599106, -0.10407378524541855, -0.09669848531484604, -0.08932317793369293, -0.08194787800312042, -0.07457257807254791, -0.0671972781419754, -0.059821974486112595, -0.052446670830249786, -0.04507137089967728, -0.03769607096910477, -0.03032076731324196, -0.02294546365737915, -0.01557016372680664, -0.008194861933588982, -0.0008195601403713226, 0.006555741652846336, 0.013931043446063995, 0.021306343376636505, 0.028681647032499313, 0.03605695068836212, 0.04343225061893463, 0.05080755054950714, 0.05818285420536995, 0.06555815786123276, 0.07293345779180527, 0.08030875772237778, 0.08768406510353088, 0.0950593650341034, 0.1024346649646759, 0.10980996489524841, 0.11718526482582092, 0.12456057220697403, 0.13193586468696594, 0.13931116461753845, 0.14668647944927216, 0.15406177937984467, 0.16143707931041718, 0.16881237924098969, 0.1761876791715622, 0.1835629791021347, 0.1909382939338684, 0.19831359386444092, 0.20568889379501343, 0.21306419372558594, 0.22043949365615845]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 8.0, 7.0, 8.0, 15.0, 20.0, 20.0, 34.0, 52.0, 68.0, 106.0, 175.0, 289.0, 433.0, 764.0, 1373.0, 2550.0, 5088.0, 10433.0, 23842.0, 59217.0, 156533.0, 389954.0, 244034.0, 89509.0, 34881.0, 14815.0, 6811.0, 3336.0, 1723.0, 1022.0, 551.0, 285.0, 199.0, 145.0, 81.0, 49.0, 38.0, 27.0, 13.0, 18.0, 11.0, 3.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1456298828125, -0.14055824279785156, -0.13548660278320312, -0.1304149627685547, -0.12534332275390625, -0.12027168273925781, -0.11520004272460938, -0.11012840270996094, -0.1050567626953125, -0.09998512268066406, -0.09491348266601562, -0.08984184265136719, -0.08477020263671875, -0.07969856262207031, -0.07462692260742188, -0.06955528259277344, -0.064483642578125, -0.05941200256347656, -0.054340362548828125, -0.04926872253417969, -0.04419708251953125, -0.03912544250488281, -0.034053802490234375, -0.028982162475585938, -0.0239105224609375, -0.018838882446289062, -0.013767242431640625, -0.008695602416992188, -0.00362396240234375, 0.0014476776123046875, 0.006519317626953125, 0.011590957641601562, 0.01666259765625, 0.021734237670898438, 0.026805877685546875, 0.03187751770019531, 0.03694915771484375, 0.04202079772949219, 0.047092437744140625, 0.05216407775878906, 0.0572357177734375, 0.06230735778808594, 0.06737899780273438, 0.07245063781738281, 0.07752227783203125, 0.08259391784667969, 0.08766555786132812, 0.09273719787597656, 0.097808837890625, 0.10288047790527344, 0.10795211791992188, 0.11302375793457031, 0.11809539794921875, 0.12316703796386719, 0.12823867797851562, 0.13331031799316406, 0.1383819580078125, 0.14345359802246094, 0.14852523803710938, 0.1535968780517578, 0.15866851806640625, 0.1637401580810547, 0.16881179809570312, 0.17388343811035156, 0.178955078125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 8.0, 21.0, 31.0, 34.0, 37.0, 55.0, 67.0, 58.0, 78.0, 84.0, 73.0, 71.0, 73.0, 53.0, 53.0, 48.0, 37.0, 28.0, 24.0, 16.0, 11.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04705810546875, -0.045607566833496094, -0.04415702819824219, -0.04270648956298828, -0.041255950927734375, -0.03980541229248047, -0.03835487365722656, -0.036904335021972656, -0.03545379638671875, -0.034003257751464844, -0.03255271911621094, -0.03110218048095703, -0.029651641845703125, -0.02820110321044922, -0.026750564575195312, -0.025300025939941406, -0.0238494873046875, -0.022398948669433594, -0.020948410034179688, -0.01949787139892578, -0.018047332763671875, -0.01659679412841797, -0.015146255493164062, -0.013695716857910156, -0.01224517822265625, -0.010794639587402344, -0.009344100952148438, -0.007893562316894531, -0.006443023681640625, -0.004992485046386719, -0.0035419464111328125, -0.0020914077758789062, -0.000640869140625, 0.0008096694946289062, 0.0022602081298828125, 0.0037107467651367188, 0.005161285400390625, 0.006611824035644531, 0.008062362670898438, 0.009512901306152344, 0.01096343994140625, 0.012413978576660156, 0.013864517211914062, 0.015315055847167969, 0.016765594482421875, 0.01821613311767578, 0.019666671752929688, 0.021117210388183594, 0.0225677490234375, 0.024018287658691406, 0.025468826293945312, 0.02691936492919922, 0.028369903564453125, 0.02982044219970703, 0.03127098083496094, 0.032721519470214844, 0.03417205810546875, 0.035622596740722656, 0.03707313537597656, 0.03852367401123047, 0.039974212646484375, 0.04142475128173828, 0.04287528991699219, 0.044325828552246094, 0.0457763671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 10.0, 4.0, 11.0, 13.0, 13.0, 17.0, 25.0, 41.0, 71.0, 79.0, 128.0, 146.0, 246.0, 344.0, 589.0, 1089.0, 2063.0, 4242.0, 9920.0, 25412.0, 71432.0, 212906.0, 424781.0, 190478.0, 63769.0, 23199.0, 9085.0, 3919.0, 1767.0, 989.0, 612.0, 372.0, 226.0, 156.0, 117.0, 81.0, 60.0, 44.0, 24.0, 21.0, 20.0, 15.0, 9.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1341552734375, -0.12974929809570312, -0.12534332275390625, -0.12093734741210938, -0.1165313720703125, -0.11212539672851562, -0.10771942138671875, -0.10331344604492188, -0.098907470703125, -0.09450149536132812, -0.09009552001953125, -0.08568954467773438, -0.0812835693359375, -0.07687759399414062, -0.07247161865234375, -0.06806564331054688, -0.06365966796875, -0.059253692626953125, -0.05484771728515625, -0.050441741943359375, -0.0460357666015625, -0.041629791259765625, -0.03722381591796875, -0.032817840576171875, -0.028411865234375, -0.024005889892578125, -0.01959991455078125, -0.015193939208984375, -0.0107879638671875, -0.006381988525390625, -0.00197601318359375, 0.002429962158203125, 0.0068359375, 0.011241912841796875, 0.01564788818359375, 0.020053863525390625, 0.0244598388671875, 0.028865814208984375, 0.03327178955078125, 0.037677764892578125, 0.042083740234375, 0.046489715576171875, 0.05089569091796875, 0.055301666259765625, 0.0597076416015625, 0.06411361694335938, 0.06851959228515625, 0.07292556762695312, 0.07733154296875, 0.08173751831054688, 0.08614349365234375, 0.09054946899414062, 0.0949554443359375, 0.09936141967773438, 0.10376739501953125, 0.10817337036132812, 0.112579345703125, 0.11698532104492188, 0.12139129638671875, 0.12579727172851562, 0.1302032470703125, 0.13460922241210938, 0.13901519775390625, 0.14342117309570312, 0.1478271484375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 4.0, 9.0, 9.0, 9.0, 10.0, 14.0, 15.0, 29.0, 18.0, 22.0, 25.0, 27.0, 37.0, 32.0, 20.0, 31.0, 37.0, 44.0, 40.0, 48.0, 47.0, 39.0, 36.0, 39.0, 27.0, 39.0, 36.0, 24.0, 22.0, 20.0, 23.0, 28.0, 21.0, 22.0, 12.0, 13.0, 9.0, 14.0, 10.0, 6.0, 4.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 4.0], "bins": [-0.1370849609375, -0.13332366943359375, -0.1295623779296875, -0.12580108642578125, -0.122039794921875, -0.11827850341796875, -0.1145172119140625, -0.11075592041015625, -0.10699462890625, -0.10323333740234375, -0.0994720458984375, -0.09571075439453125, -0.091949462890625, -0.08818817138671875, -0.0844268798828125, -0.08066558837890625, -0.076904296875, -0.07314300537109375, -0.0693817138671875, -0.06562042236328125, -0.061859130859375, -0.05809783935546875, -0.0543365478515625, -0.05057525634765625, -0.04681396484375, -0.04305267333984375, -0.0392913818359375, -0.03553009033203125, -0.031768798828125, -0.02800750732421875, -0.0242462158203125, -0.02048492431640625, -0.0167236328125, -0.01296234130859375, -0.0092010498046875, -0.00543975830078125, -0.001678466796875, 0.00208282470703125, 0.0058441162109375, 0.00960540771484375, 0.01336669921875, 0.01712799072265625, 0.0208892822265625, 0.02465057373046875, 0.028411865234375, 0.03217315673828125, 0.0359344482421875, 0.03969573974609375, 0.04345703125, 0.04721832275390625, 0.0509796142578125, 0.05474090576171875, 0.058502197265625, 0.06226348876953125, 0.0660247802734375, 0.06978607177734375, 0.07354736328125, 0.07730865478515625, 0.0810699462890625, 0.08483123779296875, 0.088592529296875, 0.09235382080078125, 0.0961151123046875, 0.09987640380859375, 0.1036376953125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 3.0, 5.0, 6.0, 17.0, 14.0, 25.0, 38.0, 65.0, 94.0, 151.0, 267.0, 512.0, 1005.0, 2017.0, 4531.0, 10589.0, 28232.0, 88856.0, 331504.0, 408122.0, 114465.0, 34774.0, 12975.0, 5323.0, 2386.0, 1205.0, 601.0, 320.0, 191.0, 87.0, 66.0, 39.0, 30.0, 14.0, 10.0, 4.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09466552734375, -0.09196853637695312, -0.08927154541015625, -0.08657455444335938, -0.0838775634765625, -0.08118057250976562, -0.07848358154296875, -0.07578659057617188, -0.073089599609375, -0.07039260864257812, -0.06769561767578125, -0.06499862670898438, -0.0623016357421875, -0.059604644775390625, -0.05690765380859375, -0.054210662841796875, -0.051513671875, -0.048816680908203125, -0.04611968994140625, -0.043422698974609375, -0.0407257080078125, -0.038028717041015625, -0.03533172607421875, -0.032634735107421875, -0.029937744140625, -0.027240753173828125, -0.02454376220703125, -0.021846771240234375, -0.0191497802734375, -0.016452789306640625, -0.01375579833984375, -0.011058807373046875, -0.00836181640625, -0.005664825439453125, -0.00296783447265625, -0.000270843505859375, 0.0024261474609375, 0.005123138427734375, 0.00782012939453125, 0.010517120361328125, 0.013214111328125, 0.015911102294921875, 0.01860809326171875, 0.021305084228515625, 0.0240020751953125, 0.026699066162109375, 0.02939605712890625, 0.032093048095703125, 0.0347900390625, 0.037487030029296875, 0.04018402099609375, 0.042881011962890625, 0.0455780029296875, 0.048274993896484375, 0.05097198486328125, 0.053668975830078125, 0.056365966796875, 0.059062957763671875, 0.06175994873046875, 0.06445693969726562, 0.0671539306640625, 0.06985092163085938, 0.07254791259765625, 0.07524490356445312, 0.07794189453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 7.0, 12.0, 22.0, 24.0, 28.0, 25.0, 30.0, 47.0, 49.0, 58.0, 61.0, 74.0, 53.0, 58.0, 66.0, 69.0, 50.0, 29.0, 28.0, 26.0, 27.0, 22.0, 25.0, 13.0, 11.0, 8.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3245811462402344e-05, -2.2427178919315338e-05, -2.1608546376228333e-05, -2.0789913833141327e-05, -1.997128129005432e-05, -1.9152648746967316e-05, -1.833401620388031e-05, -1.7515383660793304e-05, -1.66967511177063e-05, -1.5878118574619293e-05, -1.5059486031532288e-05, -1.4240853488445282e-05, -1.3422220945358276e-05, -1.260358840227127e-05, -1.1784955859184265e-05, -1.096632331609726e-05, -1.0147690773010254e-05, -9.329058229923248e-06, -8.510425686836243e-06, -7.691793143749237e-06, -6.8731606006622314e-06, -6.054528057575226e-06, -5.23589551448822e-06, -4.417262971401215e-06, -3.598630428314209e-06, -2.7799978852272034e-06, -1.9613653421401978e-06, -1.1427327990531921e-06, -3.241002559661865e-07, 4.945322871208191e-07, 1.3131648302078247e-06, 2.1317973732948303e-06, 2.950429916381836e-06, 3.7690624594688416e-06, 4.587695002555847e-06, 5.406327545642853e-06, 6.224960088729858e-06, 7.043592631816864e-06, 7.86222517490387e-06, 8.680857717990875e-06, 9.499490261077881e-06, 1.0318122804164886e-05, 1.1136755347251892e-05, 1.1955387890338898e-05, 1.2774020433425903e-05, 1.3592652976512909e-05, 1.4411285519599915e-05, 1.522991806268692e-05, 1.6048550605773926e-05, 1.686718314886093e-05, 1.7685815691947937e-05, 1.8504448235034943e-05, 1.9323080778121948e-05, 2.0141713321208954e-05, 2.096034586429596e-05, 2.1778978407382965e-05, 2.259761095046997e-05, 2.3416243493556976e-05, 2.4234876036643982e-05, 2.5053508579730988e-05, 2.5872141122817993e-05, 2.6690773665905e-05, 2.7509406208992004e-05, 2.832803875207901e-05, 2.9146671295166016e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 5.0, 6.0, 8.0, 16.0, 27.0, 29.0, 51.0, 60.0, 106.0, 178.0, 298.0, 527.0, 958.0, 1897.0, 4298.0, 10687.0, 30707.0, 111962.0, 443395.0, 328322.0, 77061.0, 22753.0, 8177.0, 3413.0, 1654.0, 808.0, 424.0, 238.0, 162.0, 109.0, 70.0, 50.0, 25.0, 20.0, 21.0, 8.0, 3.0, 9.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07940673828125, -0.07655715942382812, -0.07370758056640625, -0.07085800170898438, -0.0680084228515625, -0.06515884399414062, -0.06230926513671875, -0.059459686279296875, -0.056610107421875, -0.053760528564453125, -0.05091094970703125, -0.048061370849609375, -0.0452117919921875, -0.042362213134765625, -0.03951263427734375, -0.036663055419921875, -0.0338134765625, -0.030963897705078125, -0.02811431884765625, -0.025264739990234375, -0.0224151611328125, -0.019565582275390625, -0.01671600341796875, -0.013866424560546875, -0.011016845703125, -0.008167266845703125, -0.00531768798828125, -0.002468109130859375, 0.0003814697265625, 0.003231048583984375, 0.00608062744140625, 0.008930206298828125, 0.01177978515625, 0.014629364013671875, 0.01747894287109375, 0.020328521728515625, 0.0231781005859375, 0.026027679443359375, 0.02887725830078125, 0.031726837158203125, 0.034576416015625, 0.037425994873046875, 0.04027557373046875, 0.043125152587890625, 0.0459747314453125, 0.048824310302734375, 0.05167388916015625, 0.054523468017578125, 0.057373046875, 0.060222625732421875, 0.06307220458984375, 0.06592178344726562, 0.0687713623046875, 0.07162094116210938, 0.07447052001953125, 0.07732009887695312, 0.080169677734375, 0.08301925659179688, 0.08586883544921875, 0.08871841430664062, 0.0915679931640625, 0.09441757202148438, 0.09726715087890625, 0.10011672973632812, 0.10296630859375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 9.0, 8.0, 12.0, 17.0, 18.0, 20.0, 23.0, 45.0, 40.0, 62.0, 53.0, 49.0, 58.0, 63.0, 77.0, 59.0, 61.0, 54.0, 46.0, 41.0, 32.0, 33.0, 24.0, 17.0, 11.0, 9.0, 7.0, 8.0, 4.0, 10.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.06341552734375, -0.06151771545410156, -0.059619903564453125, -0.05772209167480469, -0.05582427978515625, -0.05392646789550781, -0.052028656005859375, -0.05013084411621094, -0.0482330322265625, -0.04633522033691406, -0.044437408447265625, -0.04253959655761719, -0.04064178466796875, -0.03874397277832031, -0.036846160888671875, -0.03494834899902344, -0.033050537109375, -0.031152725219726562, -0.029254913330078125, -0.027357101440429688, -0.02545928955078125, -0.023561477661132812, -0.021663665771484375, -0.019765853881835938, -0.0178680419921875, -0.015970230102539062, -0.014072418212890625, -0.012174606323242188, -0.01027679443359375, -0.008378982543945312, -0.006481170654296875, -0.0045833587646484375, -0.002685546875, -0.0007877349853515625, 0.001110076904296875, 0.0030078887939453125, 0.00490570068359375, 0.0068035125732421875, 0.008701324462890625, 0.010599136352539062, 0.0124969482421875, 0.014394760131835938, 0.016292572021484375, 0.018190383911132812, 0.02008819580078125, 0.021986007690429688, 0.023883819580078125, 0.025781631469726562, 0.027679443359375, 0.029577255249023438, 0.031475067138671875, 0.03337287902832031, 0.03527069091796875, 0.03716850280761719, 0.039066314697265625, 0.04096412658691406, 0.0428619384765625, 0.04475975036621094, 0.046657562255859375, 0.04855537414550781, 0.05045318603515625, 0.05235099792480469, 0.054248809814453125, 0.05614662170410156, 0.05804443359375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 10.0, 20.0, 32.0, 60.0, 94.0, 111.0, 162.0, 147.0, 127.0, 91.0, 70.0, 33.0, 20.0, 9.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5653105974197388, -1.519366979598999, -1.4734232425689697, -1.4274795055389404, -1.3815358877182007, -1.335592269897461, -1.2896485328674316, -1.2437047958374023, -1.1977611780166626, -1.1518175601959229, -1.1058738231658936, -1.0599300861358643, -1.0139864683151245, -0.96804279088974, -0.9220991134643555, -0.876155436038971, -0.8302117586135864, -0.7842680811882019, -0.7383244037628174, -0.6923807263374329, -0.6464370489120483, -0.6004933714866638, -0.5545496940612793, -0.5086060166358948, -0.46266233921051025, -0.41671866178512573, -0.3707749843597412, -0.3248313069343567, -0.27888762950897217, -0.23294395208358765, -0.18700027465820312, -0.1410565972328186, -0.09511303901672363, -0.04916936159133911, -0.00322568416595459, 0.04271799325942993, 0.08866167068481445, 0.13460534811019897, 0.1805490255355835, 0.22649270296096802, 0.27243638038635254, 0.31838005781173706, 0.3643237352371216, 0.4102674126625061, 0.4562110900878906, 0.5021547675132751, 0.5480984449386597, 0.5940421223640442, 0.6399857997894287, 0.6859294772148132, 0.7318731546401978, 0.7778168320655823, 0.8237605094909668, 0.8697041869163513, 0.9156478643417358, 0.9615915417671204, 1.0075352191925049, 1.0534789562225342, 1.099422574043274, 1.1453661918640137, 1.191309928894043, 1.2372536659240723, 1.283197283744812, 1.3291409015655518, 1.375084638595581]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 2.0, 3.0, 8.0, 9.0, 8.0, 10.0, 17.0, 20.0, 14.0, 23.0, 24.0, 35.0, 35.0, 36.0, 36.0, 36.0, 48.0, 49.0, 51.0, 47.0, 48.0, 41.0, 46.0, 47.0, 34.0, 34.0, 34.0, 34.0, 32.0, 29.0, 23.0, 20.0, 13.0, 14.0, 9.0, 7.0, 9.0, 6.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8134320974349976, -0.7879867553710938, -0.7625414133071899, -0.7370960712432861, -0.7116507291793823, -0.6862053871154785, -0.6607600450515747, -0.6353147029876709, -0.6098693609237671, -0.5844240188598633, -0.5589786767959595, -0.5335333347320557, -0.5080879926681519, -0.48264265060424805, -0.4571973383426666, -0.4317519962787628, -0.4063066840171814, -0.3808613419532776, -0.3554159998893738, -0.32997065782546997, -0.30452531576156616, -0.27907997369766235, -0.25363466143608093, -0.22818931937217712, -0.20274397730827332, -0.1772986352443695, -0.1518532931804657, -0.12640796601772308, -0.10096262395381927, -0.07551728188991547, -0.05007195472717285, -0.024626612663269043, 0.000818789005279541, 0.02626412734389305, 0.05170946568250656, 0.07715480029582977, 0.10260014235973358, 0.1280454844236374, 0.15349081158638, 0.1789361536502838, 0.20438149571418762, 0.22982683777809143, 0.25527217984199524, 0.28071749210357666, 0.30616283416748047, 0.3316081762313843, 0.3570535182952881, 0.3824988603591919, 0.4079442024230957, 0.4333895444869995, 0.4588348865509033, 0.48428022861480713, 0.5097255706787109, 0.5351709127426147, 0.5606162548065186, 0.5860615968704224, 0.6115069389343262, 0.63695228099823, 0.6623976230621338, 0.6878429651260376, 0.7132883071899414, 0.7387336492538452, 0.764178991317749, 0.7896243333816528, 0.8150696158409119]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 6.0, 9.0, 18.0, 16.0, 27.0, 36.0, 55.0, 85.0, 142.0, 237.0, 389.0, 664.0, 1113.0, 2017.0, 3946.0, 8124.0, 18769.0, 53958.0, 266129.0, 3533598.0, 222291.0, 48472.0, 17263.0, 7733.0, 3820.0, 2037.0, 1126.0, 746.0, 474.0, 294.0, 208.0, 130.0, 77.0, 78.0, 60.0, 33.0, 21.0, 23.0, 18.0, 8.0, 9.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.1678466796875, -0.16283035278320312, -0.15781402587890625, -0.15279769897460938, -0.1477813720703125, -0.14276504516601562, -0.13774871826171875, -0.13273239135742188, -0.127716064453125, -0.12269973754882812, -0.11768341064453125, -0.11266708374023438, -0.1076507568359375, -0.10263442993164062, -0.09761810302734375, -0.09260177612304688, -0.08758544921875, -0.08256912231445312, -0.07755279541015625, -0.07253646850585938, -0.0675201416015625, -0.06250381469726562, -0.05748748779296875, -0.052471160888671875, -0.047454833984375, -0.042438507080078125, -0.03742218017578125, -0.032405853271484375, -0.0273895263671875, -0.022373199462890625, -0.01735687255859375, -0.012340545654296875, -0.00732421875, -0.002307891845703125, 0.00270843505859375, 0.007724761962890625, 0.0127410888671875, 0.017757415771484375, 0.02277374267578125, 0.027790069580078125, 0.032806396484375, 0.037822723388671875, 0.04283905029296875, 0.047855377197265625, 0.0528717041015625, 0.057888031005859375, 0.06290435791015625, 0.06792068481445312, 0.07293701171875, 0.07795333862304688, 0.08296966552734375, 0.08798599243164062, 0.0930023193359375, 0.09801864624023438, 0.10303497314453125, 0.10805130004882812, 0.113067626953125, 0.11808395385742188, 0.12310028076171875, 0.12811660766601562, 0.1331329345703125, 0.13814926147460938, 0.14316558837890625, 0.14818191528320312, 0.1531982421875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 11.0, 8.0, 15.0, 25.0, 37.0, 33.0, 68.0, 59.0, 67.0, 67.0, 91.0, 69.0, 67.0, 61.0, 71.0, 41.0, 55.0, 39.0, 25.0, 21.0, 15.0, 8.0, 8.0, 6.0, 4.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043609619140625, -0.04212760925292969, -0.040645599365234375, -0.03916358947753906, -0.03768157958984375, -0.03619956970214844, -0.034717559814453125, -0.03323554992675781, -0.0317535400390625, -0.030271530151367188, -0.028789520263671875, -0.027307510375976562, -0.02582550048828125, -0.024343490600585938, -0.022861480712890625, -0.021379470825195312, -0.0198974609375, -0.018415451049804688, -0.016933441162109375, -0.015451431274414062, -0.01396942138671875, -0.012487411499023438, -0.011005401611328125, -0.009523391723632812, -0.0080413818359375, -0.0065593719482421875, -0.005077362060546875, -0.0035953521728515625, -0.00211334228515625, -0.0006313323974609375, 0.000850677490234375, 0.0023326873779296875, 0.003814697265625, 0.0052967071533203125, 0.006778717041015625, 0.008260726928710938, 0.00974273681640625, 0.011224746704101562, 0.012706756591796875, 0.014188766479492188, 0.0156707763671875, 0.017152786254882812, 0.018634796142578125, 0.020116806030273438, 0.02159881591796875, 0.023080825805664062, 0.024562835693359375, 0.026044845581054688, 0.02752685546875, 0.029008865356445312, 0.030490875244140625, 0.03197288513183594, 0.03345489501953125, 0.03493690490722656, 0.036418914794921875, 0.03790092468261719, 0.0393829345703125, 0.04086494445800781, 0.042346954345703125, 0.04382896423339844, 0.04531097412109375, 0.04679298400878906, 0.048274993896484375, 0.04975700378417969, 0.051239013671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 8.0, 9.0, 17.0, 23.0, 36.0, 49.0, 89.0, 128.0, 199.0, 334.0, 559.0, 958.0, 1670.0, 3036.0, 6347.0, 14384.0, 36850.0, 119816.0, 1028056.0, 2739306.0, 163639.0, 45781.0, 17267.0, 7518.0, 3621.0, 1919.0, 1029.0, 620.0, 369.0, 235.0, 153.0, 78.0, 61.0, 24.0, 32.0, 12.0, 13.0, 16.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.177734375, -0.17281150817871094, -0.16788864135742188, -0.1629657745361328, -0.15804290771484375, -0.1531200408935547, -0.14819717407226562, -0.14327430725097656, -0.1383514404296875, -0.13342857360839844, -0.12850570678710938, -0.12358283996582031, -0.11865997314453125, -0.11373710632324219, -0.10881423950195312, -0.10389137268066406, -0.098968505859375, -0.09404563903808594, -0.08912277221679688, -0.08419990539550781, -0.07927703857421875, -0.07435417175292969, -0.06943130493164062, -0.06450843811035156, -0.0595855712890625, -0.05466270446777344, -0.049739837646484375, -0.04481697082519531, -0.03989410400390625, -0.03497123718261719, -0.030048370361328125, -0.025125503540039062, -0.02020263671875, -0.015279769897460938, -0.010356903076171875, -0.0054340362548828125, -0.00051116943359375, 0.0044116973876953125, 0.009334564208984375, 0.014257431030273438, 0.0191802978515625, 0.024103164672851562, 0.029026031494140625, 0.03394889831542969, 0.03887176513671875, 0.04379463195800781, 0.048717498779296875, 0.05364036560058594, 0.058563232421875, 0.06348609924316406, 0.06840896606445312, 0.07333183288574219, 0.07825469970703125, 0.08317756652832031, 0.08810043334960938, 0.09302330017089844, 0.0979461669921875, 0.10286903381347656, 0.10779190063476562, 0.11271476745605469, 0.11763763427734375, 0.12256050109863281, 0.12748336791992188, 0.13240623474121094, 0.1373291015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 5.0, 0.0, 8.0, 9.0, 14.0, 9.0, 22.0, 28.0, 41.0, 56.0, 71.0, 145.0, 244.0, 674.0, 1650.0, 475.0, 206.0, 139.0, 64.0, 56.0, 41.0, 22.0, 24.0, 15.0, 12.0, 9.0, 5.0, 10.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.09368896484375, -0.09118175506591797, -0.08867454528808594, -0.0861673355102539, -0.08366012573242188, -0.08115291595458984, -0.07864570617675781, -0.07613849639892578, -0.07363128662109375, -0.07112407684326172, -0.06861686706542969, -0.06610965728759766, -0.06360244750976562, -0.061095237731933594, -0.05858802795410156, -0.05608081817626953, -0.0535736083984375, -0.05106639862060547, -0.04855918884277344, -0.046051979064941406, -0.043544769287109375, -0.041037559509277344, -0.03853034973144531, -0.03602313995361328, -0.03351593017578125, -0.03100872039794922, -0.028501510620117188, -0.025994300842285156, -0.023487091064453125, -0.020979881286621094, -0.018472671508789062, -0.01596546173095703, -0.013458251953125, -0.010951042175292969, -0.008443832397460938, -0.005936622619628906, -0.003429412841796875, -0.0009222030639648438, 0.0015850067138671875, 0.004092216491699219, 0.00659942626953125, 0.009106636047363281, 0.011613845825195312, 0.014121055603027344, 0.016628265380859375, 0.019135475158691406, 0.021642684936523438, 0.02414989471435547, 0.0266571044921875, 0.02916431427001953, 0.03167152404785156, 0.034178733825683594, 0.036685943603515625, 0.039193153381347656, 0.04170036315917969, 0.04420757293701172, 0.04671478271484375, 0.04922199249267578, 0.05172920227050781, 0.054236412048339844, 0.056743621826171875, 0.059250831604003906, 0.06175804138183594, 0.06426525115966797, 0.0667724609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 9.0, 19.0, 11.0, 21.0, 39.0, 39.0, 78.0, 87.0, 94.0, 119.0, 114.0, 111.0, 83.0, 55.0, 38.0, 30.0, 20.0, 14.0, 9.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5666863918304443, -0.5516281723976135, -0.5365700125694275, -0.5215117931365967, -0.5064535737037659, -0.49139538407325745, -0.476337194442749, -0.4612789750099182, -0.4462207853794098, -0.43116259574890137, -0.41610437631607056, -0.40104618668556213, -0.3859879970550537, -0.3709297776222229, -0.3558715879917145, -0.34081339836120605, -0.32575517892837524, -0.3106969892978668, -0.295638769865036, -0.2805805802345276, -0.2655223608016968, -0.25046417117118835, -0.23540598154067993, -0.22034777700901031, -0.2052895724773407, -0.19023136794567108, -0.17517316341400146, -0.16011497378349304, -0.14505676925182343, -0.1299985647201538, -0.11494036763906479, -0.09988217055797577, -0.08482396602630615, -0.06976576149463654, -0.054707564413547516, -0.0396493636071682, -0.02459116280078888, -0.009532958269119263, 0.005525238811969757, 0.020583435893058777, 0.035641640424728394, 0.05069984123110771, 0.06575804203748703, 0.08081623911857605, 0.09587444365024567, 0.11093264818191528, 0.1259908378124237, 0.14104904234409332, 0.15610724687576294, 0.17116545140743256, 0.18622365593910217, 0.2012818455696106, 0.2163400501012802, 0.23139825463294983, 0.24645644426345825, 0.26151466369628906, 0.2765728533267975, 0.2916310429573059, 0.3066892623901367, 0.32174745202064514, 0.33680564165115356, 0.3518638610839844, 0.3669220507144928, 0.3819802403450012, 0.39703845977783203]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 10.0, 10.0, 14.0, 10.0, 9.0, 13.0, 19.0, 30.0, 33.0, 21.0, 34.0, 42.0, 45.0, 34.0, 40.0, 37.0, 48.0, 40.0, 40.0, 50.0, 44.0, 34.0, 44.0, 33.0, 54.0, 32.0, 21.0, 25.0, 24.0, 13.0, 20.0, 11.0, 12.0, 9.0, 6.0, 6.0, 11.0, 6.0, 3.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2719373106956482, -0.26371222734451294, -0.2554871439933777, -0.24726206064224243, -0.23903697729110718, -0.23081189393997192, -0.22258679568767548, -0.21436171233654022, -0.20613662898540497, -0.19791154563426971, -0.18968646228313446, -0.1814613789319992, -0.17323628067970276, -0.1650111973285675, -0.15678611397743225, -0.148561030626297, -0.14033594727516174, -0.1321108639240265, -0.12388578057289124, -0.11566068977117538, -0.10743560642004013, -0.09921052306890488, -0.09098543226718903, -0.08276034891605377, -0.07453526556491852, -0.06631018221378326, -0.05808509513735771, -0.04986000806093216, -0.041634924709796906, -0.03340984135866165, -0.0251847542822361, -0.016959667205810547, -0.008734583854675293, -0.0005094986408948898, 0.007715586572885513, 0.015940671786665916, 0.02416575700044632, 0.032390840351581573, 0.040615927428007126, 0.04884101450443268, 0.05706609785556793, 0.06529118120670319, 0.07351626455783844, 0.08174135535955429, 0.08996643871068954, 0.0981915220618248, 0.10641661286354065, 0.1146416962146759, 0.12286677956581116, 0.1310918629169464, 0.13931694626808167, 0.14754202961921692, 0.15576711297035217, 0.16399219632148743, 0.17221729457378387, 0.18044237792491913, 0.18866746127605438, 0.19689254462718964, 0.2051176279783249, 0.21334271132946014, 0.2215678095817566, 0.22979289293289185, 0.2380179762840271, 0.24624305963516235, 0.2544681429862976]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 13.0, 14.0, 21.0, 36.0, 65.0, 132.0, 220.0, 356.0, 761.0, 1626.0, 3701.0, 9836.0, 28742.0, 103420.0, 655218.0, 180032.0, 41640.0, 13604.0, 5064.0, 2061.0, 945.0, 491.0, 224.0, 113.0, 86.0, 42.0, 34.0, 22.0, 13.0, 4.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.25537109375, -0.24778366088867188, -0.24019622802734375, -0.23260879516601562, -0.2250213623046875, -0.21743392944335938, -0.20984649658203125, -0.20225906372070312, -0.194671630859375, -0.18708419799804688, -0.17949676513671875, -0.17190933227539062, -0.1643218994140625, -0.15673446655273438, -0.14914703369140625, -0.14155960083007812, -0.13397216796875, -0.12638473510742188, -0.11879730224609375, -0.11120986938476562, -0.1036224365234375, -0.09603500366210938, -0.08844757080078125, -0.08086013793945312, -0.073272705078125, -0.06568527221679688, -0.05809783935546875, -0.050510406494140625, -0.0429229736328125, -0.035335540771484375, -0.02774810791015625, -0.020160675048828125, -0.0125732421875, -0.004985809326171875, 0.00260162353515625, 0.010189056396484375, 0.0177764892578125, 0.025363922119140625, 0.03295135498046875, 0.040538787841796875, 0.048126220703125, 0.055713653564453125, 0.06330108642578125, 0.07088851928710938, 0.0784759521484375, 0.08606338500976562, 0.09365081787109375, 0.10123825073242188, 0.10882568359375, 0.11641311645507812, 0.12400054931640625, 0.13158798217773438, 0.1391754150390625, 0.14676284790039062, 0.15435028076171875, 0.16193771362304688, 0.169525146484375, 0.17711257934570312, 0.18470001220703125, 0.19228744506835938, 0.1998748779296875, 0.20746231079101562, 0.21504974365234375, 0.22263717651367188, 0.230224609375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 11.0, 9.0, 25.0, 22.0, 30.0, 54.0, 57.0, 86.0, 79.0, 87.0, 79.0, 85.0, 70.0, 71.0, 54.0, 47.0, 32.0, 28.0, 21.0, 10.0, 9.0, 9.0, 4.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0537109375, -0.0520625114440918, -0.050414085388183594, -0.04876565933227539, -0.04711723327636719, -0.045468807220458984, -0.04382038116455078, -0.04217195510864258, -0.040523529052734375, -0.03887510299682617, -0.03722667694091797, -0.035578250885009766, -0.03392982482910156, -0.03228139877319336, -0.030632972717285156, -0.028984546661376953, -0.02733612060546875, -0.025687694549560547, -0.024039268493652344, -0.02239084243774414, -0.020742416381835938, -0.019093990325927734, -0.01744556427001953, -0.015797138214111328, -0.014148712158203125, -0.012500286102294922, -0.010851860046386719, -0.009203433990478516, -0.0075550079345703125, -0.005906581878662109, -0.004258155822753906, -0.002609729766845703, -0.0009613037109375, 0.0006871223449707031, 0.0023355484008789062, 0.003983974456787109, 0.0056324005126953125, 0.007280826568603516, 0.008929252624511719, 0.010577678680419922, 0.012226104736328125, 0.013874530792236328, 0.015522956848144531, 0.017171382904052734, 0.018819808959960938, 0.02046823501586914, 0.022116661071777344, 0.023765087127685547, 0.02541351318359375, 0.027061939239501953, 0.028710365295410156, 0.03035879135131836, 0.03200721740722656, 0.033655643463134766, 0.03530406951904297, 0.03695249557495117, 0.038600921630859375, 0.04024934768676758, 0.04189777374267578, 0.043546199798583984, 0.04519462585449219, 0.04684305191040039, 0.048491477966308594, 0.0501399040222168, 0.051788330078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 9.0, 5.0, 9.0, 8.0, 11.0, 14.0, 26.0, 16.0, 36.0, 64.0, 105.0, 134.0, 196.0, 309.0, 564.0, 937.0, 1689.0, 3060.0, 6924.0, 18865.0, 68212.0, 492802.0, 368684.0, 56488.0, 16322.0, 6233.0, 3060.0, 1501.0, 877.0, 483.0, 307.0, 197.0, 120.0, 79.0, 55.0, 40.0, 39.0, 19.0, 13.0, 13.0, 7.0, 12.0, 1.0, 6.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.2152099609375, -0.20922088623046875, -0.2032318115234375, -0.19724273681640625, -0.191253662109375, -0.18526458740234375, -0.1792755126953125, -0.17328643798828125, -0.16729736328125, -0.16130828857421875, -0.1553192138671875, -0.14933013916015625, -0.143341064453125, -0.13735198974609375, -0.1313629150390625, -0.12537384033203125, -0.119384765625, -0.11339569091796875, -0.1074066162109375, -0.10141754150390625, -0.095428466796875, -0.08943939208984375, -0.0834503173828125, -0.07746124267578125, -0.07147216796875, -0.06548309326171875, -0.0594940185546875, -0.05350494384765625, -0.047515869140625, -0.04152679443359375, -0.0355377197265625, -0.02954864501953125, -0.0235595703125, -0.01757049560546875, -0.0115814208984375, -0.00559234619140625, 0.000396728515625, 0.00638580322265625, 0.0123748779296875, 0.01836395263671875, 0.02435302734375, 0.03034210205078125, 0.0363311767578125, 0.04232025146484375, 0.048309326171875, 0.05429840087890625, 0.0602874755859375, 0.06627655029296875, 0.072265625, 0.07825469970703125, 0.0842437744140625, 0.09023284912109375, 0.096221923828125, 0.10221099853515625, 0.1082000732421875, 0.11418914794921875, 0.12017822265625, 0.12616729736328125, 0.1321563720703125, 0.13814544677734375, 0.144134521484375, 0.15012359619140625, 0.1561126708984375, 0.16210174560546875, 0.1680908203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 1.0, 7.0, 10.0, 10.0, 20.0, 21.0, 19.0, 24.0, 28.0, 48.0, 44.0, 51.0, 52.0, 64.0, 70.0, 63.0, 66.0, 57.0, 50.0, 44.0, 52.0, 38.0, 35.0, 32.0, 23.0, 21.0, 10.0, 8.0, 4.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.15790748596191406, -0.15211868286132812, -0.1463298797607422, -0.14054107666015625, -0.1347522735595703, -0.12896347045898438, -0.12317466735839844, -0.1173858642578125, -0.11159706115722656, -0.10580825805664062, -0.10001945495605469, -0.09423065185546875, -0.08844184875488281, -0.08265304565429688, -0.07686424255371094, -0.071075439453125, -0.06528663635253906, -0.059497833251953125, -0.05370903015136719, -0.04792022705078125, -0.04213142395019531, -0.036342620849609375, -0.030553817749023438, -0.0247650146484375, -0.018976211547851562, -0.013187408447265625, -0.0073986053466796875, -0.00160980224609375, 0.0041790008544921875, 0.009967803955078125, 0.015756607055664062, 0.02154541015625, 0.027334213256835938, 0.033123016357421875, 0.03891181945800781, 0.04470062255859375, 0.05048942565917969, 0.056278228759765625, 0.06206703186035156, 0.0678558349609375, 0.07364463806152344, 0.07943344116210938, 0.08522224426269531, 0.09101104736328125, 0.09679985046386719, 0.10258865356445312, 0.10837745666503906, 0.114166259765625, 0.11995506286621094, 0.12574386596679688, 0.1315326690673828, 0.13732147216796875, 0.1431102752685547, 0.14889907836914062, 0.15468788146972656, 0.1604766845703125, 0.16626548767089844, 0.17205429077148438, 0.1778430938720703, 0.18363189697265625, 0.1894207000732422, 0.19520950317382812, 0.20099830627441406, 0.206787109375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 10.0, 18.0, 25.0, 33.0, 57.0, 113.0, 198.0, 341.0, 757.0, 1688.0, 4978.0, 17465.0, 84205.0, 786537.0, 120351.0, 22052.0, 5862.0, 2028.0, 881.0, 409.0, 205.0, 138.0, 65.0, 36.0, 27.0, 18.0, 7.0, 10.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.1829833984375, -0.17824077606201172, -0.17349815368652344, -0.16875553131103516, -0.16401290893554688, -0.1592702865600586, -0.1545276641845703, -0.14978504180908203, -0.14504241943359375, -0.14029979705810547, -0.1355571746826172, -0.1308145523071289, -0.12607192993164062, -0.12132930755615234, -0.11658668518066406, -0.11184406280517578, -0.1071014404296875, -0.10235881805419922, -0.09761619567871094, -0.09287357330322266, -0.08813095092773438, -0.0833883285522461, -0.07864570617675781, -0.07390308380126953, -0.06916046142578125, -0.06441783905029297, -0.05967521667480469, -0.054932594299316406, -0.050189971923828125, -0.045447349548339844, -0.04070472717285156, -0.03596210479736328, -0.031219482421875, -0.02647686004638672, -0.021734237670898438, -0.016991615295410156, -0.012248992919921875, -0.007506370544433594, -0.0027637481689453125, 0.0019788742065429688, 0.00672149658203125, 0.011464118957519531, 0.016206741333007812, 0.020949363708496094, 0.025691986083984375, 0.030434608459472656, 0.03517723083496094, 0.03991985321044922, 0.0446624755859375, 0.04940509796142578, 0.05414772033691406, 0.058890342712402344, 0.06363296508789062, 0.0683755874633789, 0.07311820983886719, 0.07786083221435547, 0.08260345458984375, 0.08734607696533203, 0.09208869934082031, 0.0968313217163086, 0.10157394409179688, 0.10631656646728516, 0.11105918884277344, 0.11580181121826172, 0.12054443359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 15.0, 11.0, 17.0, 35.0, 36.0, 66.0, 88.0, 119.0, 135.0, 125.0, 91.0, 69.0, 46.0, 46.0, 30.0, 16.0, 9.0, 14.0, 6.0, 8.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.37905502319336e-05, -7.21421092748642e-05, -7.04936683177948e-05, -6.88452273607254e-05, -6.7196786403656e-05, -6.554834544658661e-05, -6.389990448951721e-05, -6.225146353244781e-05, -6.060302257537842e-05, -5.895458161830902e-05, -5.7306140661239624e-05, -5.565769970417023e-05, -5.400925874710083e-05, -5.236081779003143e-05, -5.0712376832962036e-05, -4.906393587589264e-05, -4.741549491882324e-05, -4.5767053961753845e-05, -4.411861300468445e-05, -4.247017204761505e-05, -4.0821731090545654e-05, -3.917329013347626e-05, -3.752484917640686e-05, -3.587640821933746e-05, -3.4227967262268066e-05, -3.257952630519867e-05, -3.093108534812927e-05, -2.9282644391059875e-05, -2.763420343399048e-05, -2.598576247692108e-05, -2.4337321519851685e-05, -2.2688880562782288e-05, -2.104043960571289e-05, -1.9391998648643494e-05, -1.7743557691574097e-05, -1.60951167345047e-05, -1.4446675777435303e-05, -1.2798234820365906e-05, -1.1149793863296509e-05, -9.501352906227112e-06, -7.852911949157715e-06, -6.204470992088318e-06, -4.556030035018921e-06, -2.907589077949524e-06, -1.259148120880127e-06, 3.8929283618927e-07, 2.037733793258667e-06, 3.686174750328064e-06, 5.334615707397461e-06, 6.983056664466858e-06, 8.631497621536255e-06, 1.0279938578605652e-05, 1.1928379535675049e-05, 1.3576820492744446e-05, 1.5225261449813843e-05, 1.687370240688324e-05, 1.8522143363952637e-05, 2.0170584321022034e-05, 2.181902527809143e-05, 2.3467466235160828e-05, 2.5115907192230225e-05, 2.676434814929962e-05, 2.841278910636902e-05, 3.0061230063438416e-05, 3.170967102050781e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 10.0, 10.0, 7.0, 14.0, 17.0, 21.0, 50.0, 60.0, 75.0, 128.0, 230.0, 378.0, 763.0, 1654.0, 3824.0, 10677.0, 37318.0, 289773.0, 626041.0, 54570.0, 14077.0, 4716.0, 2033.0, 957.0, 466.0, 272.0, 133.0, 83.0, 52.0, 34.0, 24.0, 34.0, 16.0, 13.0, 3.0, 3.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1181640625, -0.11410713195800781, -0.11005020141601562, -0.10599327087402344, -0.10193634033203125, -0.09787940979003906, -0.09382247924804688, -0.08976554870605469, -0.0857086181640625, -0.08165168762207031, -0.07759475708007812, -0.07353782653808594, -0.06948089599609375, -0.06542396545410156, -0.061367034912109375, -0.05731010437011719, -0.053253173828125, -0.04919624328613281, -0.045139312744140625, -0.04108238220214844, -0.03702545166015625, -0.03296852111816406, -0.028911590576171875, -0.024854660034179688, -0.0207977294921875, -0.016740798950195312, -0.012683868408203125, -0.008626937866210938, -0.00457000732421875, -0.0005130767822265625, 0.003543853759765625, 0.0076007843017578125, 0.01165771484375, 0.015714645385742188, 0.019771575927734375, 0.023828506469726562, 0.02788543701171875, 0.03194236755371094, 0.035999298095703125, 0.04005622863769531, 0.0441131591796875, 0.04817008972167969, 0.052227020263671875, 0.05628395080566406, 0.06034088134765625, 0.06439781188964844, 0.06845474243164062, 0.07251167297363281, 0.076568603515625, 0.08062553405761719, 0.08468246459960938, 0.08873939514160156, 0.09279632568359375, 0.09685325622558594, 0.10091018676757812, 0.10496711730957031, 0.1090240478515625, 0.11308097839355469, 0.11713790893554688, 0.12119483947753906, 0.12525177001953125, 0.12930870056152344, 0.13336563110351562, 0.1374225616455078, 0.1414794921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 5.0, 15.0, 17.0, 23.0, 30.0, 60.0, 110.0, 218.0, 203.0, 125.0, 59.0, 47.0, 16.0, 21.0, 10.0, 6.0, 11.0, 5.0, 9.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1138916015625, -0.1105508804321289, -0.10721015930175781, -0.10386943817138672, -0.10052871704101562, -0.09718799591064453, -0.09384727478027344, -0.09050655364990234, -0.08716583251953125, -0.08382511138916016, -0.08048439025878906, -0.07714366912841797, -0.07380294799804688, -0.07046222686767578, -0.06712150573730469, -0.0637807846069336, -0.0604400634765625, -0.057099342346191406, -0.05375862121582031, -0.05041790008544922, -0.047077178955078125, -0.04373645782470703, -0.04039573669433594, -0.037055015563964844, -0.03371429443359375, -0.030373573303222656, -0.027032852172851562, -0.02369213104248047, -0.020351409912109375, -0.01701068878173828, -0.013669967651367188, -0.010329246520996094, -0.006988525390625, -0.0036478042602539062, -0.0003070831298828125, 0.0030336380004882812, 0.006374359130859375, 0.009715080261230469, 0.013055801391601562, 0.016396522521972656, 0.01973724365234375, 0.023077964782714844, 0.026418685913085938, 0.02975940704345703, 0.033100128173828125, 0.03644084930419922, 0.03978157043457031, 0.043122291564941406, 0.0464630126953125, 0.049803733825683594, 0.05314445495605469, 0.05648517608642578, 0.059825897216796875, 0.06316661834716797, 0.06650733947753906, 0.06984806060791016, 0.07318878173828125, 0.07652950286865234, 0.07987022399902344, 0.08321094512939453, 0.08655166625976562, 0.08989238739013672, 0.09323310852050781, 0.0965738296508789, 0.09991455078125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 22.0, 35.0, 118.0, 195.0, 223.0, 219.0, 109.0, 46.0, 23.0, 6.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.665393352508545, -3.5882980823516846, -3.511202573776245, -3.4341073036193848, -3.3570117950439453, -3.279916524887085, -3.2028210163116455, -3.125725746154785, -3.0486302375793457, -2.9715349674224854, -2.894439458847046, -2.8173441886901855, -2.740248680114746, -2.6631534099578857, -2.5860579013824463, -2.508962631225586, -2.4318673610687256, -2.3547720909118652, -2.277676582336426, -2.2005813121795654, -2.123485803604126, -2.0463905334472656, -1.9692951440811157, -1.8921997547149658, -1.815104365348816, -1.738008975982666, -1.6609135866165161, -1.5838181972503662, -1.5067229270935059, -1.4296274185180664, -1.352532148361206, -1.2754367589950562, -1.1983413696289062, -1.1212459802627563, -1.0441505908966064, -0.9670552611351013, -0.8899598717689514, -0.8128644824028015, -0.7357691526412964, -0.6586737632751465, -0.5815783739089966, -0.5044829845428467, -0.42738762497901917, -0.35029226541519165, -0.27319687604904175, -0.19610148668289185, -0.11900612711906433, -0.041910767555236816, 0.035184621810913086, 0.1122799962759018, 0.1893753707408905, 0.266470730304718, 0.3435661196708679, 0.4206615090370178, 0.49775686860084534, 0.5748522281646729, 0.6519476175308228, 0.7290430068969727, 0.8061383962631226, 0.8832337260246277, 0.9603291153907776, 1.0374245643615723, 1.1145198345184326, 1.1916152238845825, 1.2687106132507324]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 6.0, 2.0, 8.0, 7.0, 13.0, 14.0, 11.0, 18.0, 30.0, 18.0, 27.0, 25.0, 26.0, 36.0, 28.0, 46.0, 37.0, 44.0, 38.0, 46.0, 30.0, 33.0, 45.0, 40.0, 33.0, 29.0, 28.0, 34.0, 23.0, 35.0, 19.0, 24.0, 23.0, 21.0, 21.0, 12.0, 14.0, 18.0, 6.0, 9.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.6341946125030518, -0.6144767999649048, -0.5947589874267578, -0.5750411748886108, -0.5553233027458191, -0.5356054902076721, -0.5158876776695251, -0.4961698651313782, -0.4764520525932312, -0.45673424005508423, -0.43701639771461487, -0.4172985851764679, -0.3975807726383209, -0.37786293029785156, -0.3581451177597046, -0.3384273052215576, -0.31870946288108826, -0.2989916503429413, -0.2792738080024719, -0.25955599546432495, -0.23983818292617798, -0.2201203554868698, -0.20040252804756165, -0.18068471550941467, -0.1609668880701065, -0.14124906063079834, -0.12153124809265137, -0.1018134206533432, -0.08209560066461563, -0.06237778067588806, -0.042659953236579895, -0.022942140698432922, -0.003224313259124756, 0.016493508592247963, 0.03621133044362068, 0.05592915415763855, 0.07564697414636612, 0.09536479413509369, 0.11508262157440186, 0.13480043411254883, 0.154518261551857, 0.17423608899116516, 0.19395390152931213, 0.2136717289686203, 0.23338955640792847, 0.25310736894607544, 0.2728251814842224, 0.2925429940223694, 0.31226083636283875, 0.3319786489009857, 0.3516964912414551, 0.37141430377960205, 0.391132116317749, 0.410849928855896, 0.43056777119636536, 0.45028558373451233, 0.4700034260749817, 0.48972123861312866, 0.5094390511512756, 0.5291569232940674, 0.5488747358322144, 0.5685925483703613, 0.5883103609085083, 0.6080281734466553, 0.6277459859848022]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 12.0, 6.0, 8.0, 10.0, 30.0, 32.0, 46.0, 63.0, 119.0, 189.0, 268.0, 515.0, 936.0, 1744.0, 3344.0, 7053.0, 17439.0, 56789.0, 483919.0, 3480138.0, 97432.0, 24990.0, 9582.0, 4376.0, 2267.0, 1163.0, 724.0, 386.0, 224.0, 153.0, 106.0, 65.0, 59.0, 32.0, 14.0, 14.0, 13.0, 9.0, 8.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.17600440979003906, -0.16975784301757812, -0.1635112762451172, -0.15726470947265625, -0.1510181427001953, -0.14477157592773438, -0.13852500915527344, -0.1322784423828125, -0.12603187561035156, -0.11978530883789062, -0.11353874206542969, -0.10729217529296875, -0.10104560852050781, -0.09479904174804688, -0.08855247497558594, -0.082305908203125, -0.07605934143066406, -0.06981277465820312, -0.06356620788574219, -0.05731964111328125, -0.05107307434082031, -0.044826507568359375, -0.03857994079589844, -0.0323333740234375, -0.026086807250976562, -0.019840240478515625, -0.013593673706054688, -0.00734710693359375, -0.0011005401611328125, 0.005146026611328125, 0.011392593383789062, 0.01763916015625, 0.023885726928710938, 0.030132293701171875, 0.03637886047363281, 0.04262542724609375, 0.04887199401855469, 0.055118560791015625, 0.06136512756347656, 0.0676116943359375, 0.07385826110839844, 0.08010482788085938, 0.08635139465332031, 0.09259796142578125, 0.09884452819824219, 0.10509109497070312, 0.11133766174316406, 0.117584228515625, 0.12383079528808594, 0.13007736206054688, 0.1363239288330078, 0.14257049560546875, 0.1488170623779297, 0.15506362915039062, 0.16131019592285156, 0.1675567626953125, 0.17380332946777344, 0.18004989624023438, 0.1862964630126953, 0.19254302978515625, 0.1987895965576172, 0.20503616333007812, 0.21128273010253906, 0.217529296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 7.0, 7.0, 12.0, 24.0, 20.0, 27.0, 57.0, 69.0, 69.0, 67.0, 71.0, 88.0, 64.0, 67.0, 74.0, 69.0, 46.0, 39.0, 43.0, 26.0, 12.0, 13.0, 7.0, 6.0, 5.0, 3.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054901123046875, -0.05318927764892578, -0.05147743225097656, -0.049765586853027344, -0.048053741455078125, -0.046341896057128906, -0.04463005065917969, -0.04291820526123047, -0.04120635986328125, -0.03949451446533203, -0.03778266906738281, -0.036070823669433594, -0.034358978271484375, -0.032647132873535156, -0.030935287475585938, -0.02922344207763672, -0.0275115966796875, -0.02579975128173828, -0.024087905883789062, -0.022376060485839844, -0.020664215087890625, -0.018952369689941406, -0.017240524291992188, -0.015528678894042969, -0.01381683349609375, -0.012104988098144531, -0.010393142700195312, -0.008681297302246094, -0.006969451904296875, -0.005257606506347656, -0.0035457611083984375, -0.0018339157104492188, -0.0001220703125, 0.0015897750854492188, 0.0033016204833984375, 0.005013465881347656, 0.006725311279296875, 0.008437156677246094, 0.010149002075195312, 0.011860847473144531, 0.01357269287109375, 0.015284538269042969, 0.016996383666992188, 0.018708229064941406, 0.020420074462890625, 0.022131919860839844, 0.023843765258789062, 0.02555561065673828, 0.0272674560546875, 0.02897930145263672, 0.030691146850585938, 0.032402992248535156, 0.034114837646484375, 0.035826683044433594, 0.03753852844238281, 0.03925037384033203, 0.04096221923828125, 0.04267406463623047, 0.04438591003417969, 0.046097755432128906, 0.047809600830078125, 0.049521446228027344, 0.05123329162597656, 0.05294513702392578, 0.054656982421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 14.0, 14.0, 17.0, 28.0, 45.0, 51.0, 80.0, 91.0, 131.0, 212.0, 287.0, 455.0, 687.0, 1176.0, 2066.0, 3939.0, 9040.0, 23641.0, 77256.0, 793258.0, 3117565.0, 111864.0, 29770.0, 11495.0, 4957.0, 2401.0, 1371.0, 816.0, 513.0, 310.0, 223.0, 142.0, 102.0, 72.0, 38.0, 40.0, 28.0, 22.0, 15.0, 16.0, 10.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.217041015625, -0.2106800079345703, -0.20431900024414062, -0.19795799255371094, -0.19159698486328125, -0.18523597717285156, -0.17887496948242188, -0.1725139617919922, -0.1661529541015625, -0.1597919464111328, -0.15343093872070312, -0.14706993103027344, -0.14070892333984375, -0.13434791564941406, -0.12798690795898438, -0.12162590026855469, -0.115264892578125, -0.10890388488769531, -0.10254287719726562, -0.09618186950683594, -0.08982086181640625, -0.08345985412597656, -0.07709884643554688, -0.07073783874511719, -0.0643768310546875, -0.05801582336425781, -0.051654815673828125, -0.04529380798339844, -0.03893280029296875, -0.03257179260253906, -0.026210784912109375, -0.019849777221679688, -0.01348876953125, -0.0071277618408203125, -0.000766754150390625, 0.0055942535400390625, 0.01195526123046875, 0.018316268920898438, 0.024677276611328125, 0.031038284301757812, 0.0373992919921875, 0.04376029968261719, 0.050121307373046875, 0.05648231506347656, 0.06284332275390625, 0.06920433044433594, 0.07556533813476562, 0.08192634582519531, 0.088287353515625, 0.09464836120605469, 0.10100936889648438, 0.10737037658691406, 0.11373138427734375, 0.12009239196777344, 0.12645339965820312, 0.1328144073486328, 0.1391754150390625, 0.1455364227294922, 0.15189743041992188, 0.15825843811035156, 0.16461944580078125, 0.17098045349121094, 0.17734146118164062, 0.1837024688720703, 0.1900634765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 11.0, 11.0, 11.0, 26.0, 27.0, 43.0, 62.0, 164.0, 392.0, 2082.0, 747.0, 218.0, 98.0, 49.0, 38.0, 23.0, 16.0, 8.0, 12.0, 9.0, 6.0, 6.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11456298828125, -0.1113576889038086, -0.10815238952636719, -0.10494709014892578, -0.10174179077148438, -0.09853649139404297, -0.09533119201660156, -0.09212589263916016, -0.08892059326171875, -0.08571529388427734, -0.08250999450683594, -0.07930469512939453, -0.07609939575195312, -0.07289409637451172, -0.06968879699707031, -0.0664834976196289, -0.0632781982421875, -0.060072898864746094, -0.05686759948730469, -0.05366230010986328, -0.050457000732421875, -0.04725170135498047, -0.04404640197753906, -0.040841102600097656, -0.03763580322265625, -0.034430503845214844, -0.031225204467773438, -0.02801990509033203, -0.024814605712890625, -0.02160930633544922, -0.018404006958007812, -0.015198707580566406, -0.011993408203125, -0.008788108825683594, -0.0055828094482421875, -0.0023775100708007812, 0.000827789306640625, 0.004033088684082031, 0.0072383880615234375, 0.010443687438964844, 0.01364898681640625, 0.016854286193847656, 0.020059585571289062, 0.02326488494873047, 0.026470184326171875, 0.02967548370361328, 0.03288078308105469, 0.036086082458496094, 0.0392913818359375, 0.042496681213378906, 0.04570198059082031, 0.04890727996826172, 0.052112579345703125, 0.05531787872314453, 0.05852317810058594, 0.061728477478027344, 0.06493377685546875, 0.06813907623291016, 0.07134437561035156, 0.07454967498779297, 0.07775497436523438, 0.08096027374267578, 0.08416557312011719, 0.0873708724975586, 0.090576171875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 13.0, 15.0, 21.0, 45.0, 64.0, 88.0, 112.0, 141.0, 144.0, 118.0, 104.0, 45.0, 31.0, 25.0, 9.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5436254143714905, -0.526502788066864, -0.5093802213668823, -0.49225762486457825, -0.47513502836227417, -0.4580124020576477, -0.44088980555534363, -0.42376720905303955, -0.4066446125507355, -0.3895220160484314, -0.3723994195461273, -0.35527682304382324, -0.3381541967391968, -0.3210316300392151, -0.3039090037345886, -0.28678640723228455, -0.26966381072998047, -0.2525412142276764, -0.23541861772537231, -0.21829600632190704, -0.20117340981960297, -0.1840508133172989, -0.16692820191383362, -0.14980560541152954, -0.13268300890922546, -0.11556041240692139, -0.09843780845403671, -0.08131520450115204, -0.06419260799884796, -0.047070011496543884, -0.02994740754365921, -0.012824803590774536, 0.004297852516174316, 0.021420452743768692, 0.03854305297136307, 0.05566565319895744, 0.07278825342655182, 0.0899108499288559, 0.10703345388174057, 0.12415605783462524, 0.14127865433692932, 0.1584012508392334, 0.17552384734153748, 0.19264645874500275, 0.20976905524730682, 0.2268916517496109, 0.24401426315307617, 0.26113685965538025, 0.2782594561576843, 0.2953820526599884, 0.3125046491622925, 0.32962724566459656, 0.34674984216690063, 0.3638724684715271, 0.3809950649738312, 0.39811766147613525, 0.41524025797843933, 0.4323628544807434, 0.4494854509830475, 0.46660804748535156, 0.483730673789978, 0.5008532404899597, 0.5179758667945862, 0.5350984334945679, 0.5522210597991943]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 5.0, 3.0, 4.0, 2.0, 9.0, 10.0, 16.0, 14.0, 10.0, 18.0, 23.0, 34.0, 26.0, 24.0, 28.0, 36.0, 40.0, 34.0, 28.0, 28.0, 47.0, 32.0, 38.0, 43.0, 46.0, 40.0, 22.0, 39.0, 31.0, 30.0, 41.0, 30.0, 20.0, 28.0, 17.0, 15.0, 18.0, 14.0, 11.0, 8.0, 8.0, 7.0, 2.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.20087182521820068, -0.19409941136837006, -0.18732699751853943, -0.1805545836687088, -0.17378216981887817, -0.16700975596904755, -0.16023734211921692, -0.1534649133682251, -0.14669251441955566, -0.13992010056972504, -0.1331476867198944, -0.12637527287006378, -0.11960285902023315, -0.11283044517040253, -0.1060580238699913, -0.09928561002016068, -0.09251318871974945, -0.08574077486991882, -0.0789683610200882, -0.07219594717025757, -0.06542353332042694, -0.058651115745306015, -0.05187869817018509, -0.04510628432035446, -0.038333870470523834, -0.03156145662069321, -0.02478904090821743, -0.018016625195741653, -0.011244211345911026, -0.0044717974960803986, 0.0023006200790405273, 0.009073033928871155, 0.015845447778701782, 0.02261786162853241, 0.029390277341008186, 0.03616269305348396, 0.04293510690331459, 0.04970752075314522, 0.056479938328266144, 0.06325235217809677, 0.0700247660279274, 0.07679717987775803, 0.08356959372758865, 0.09034201502799988, 0.0971144288778305, 0.10388684272766113, 0.11065925657749176, 0.11743167042732239, 0.12420408427715302, 0.13097649812698364, 0.13774891197681427, 0.1445213258266449, 0.15129373967647552, 0.15806615352630615, 0.16483858227729797, 0.1716109812259674, 0.17838340997695923, 0.18515582382678986, 0.19192823767662048, 0.1987006515264511, 0.20547306537628174, 0.21224547922611237, 0.219017893075943, 0.22579032182693481, 0.23256272077560425]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 6.0, 12.0, 35.0, 53.0, 79.0, 140.0, 315.0, 619.0, 1513.0, 3970.0, 11566.0, 39863.0, 219009.0, 650165.0, 87400.0, 22470.0, 7053.0, 2485.0, 879.0, 426.0, 204.0, 115.0, 64.0, 37.0, 30.0, 15.0, 11.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.2386474609375, -0.23168373107910156, -0.22472000122070312, -0.2177562713623047, -0.21079254150390625, -0.2038288116455078, -0.19686508178710938, -0.18990135192871094, -0.1829376220703125, -0.17597389221191406, -0.16901016235351562, -0.1620464324951172, -0.15508270263671875, -0.1481189727783203, -0.14115524291992188, -0.13419151306152344, -0.127227783203125, -0.12026405334472656, -0.11330032348632812, -0.10633659362792969, -0.09937286376953125, -0.09240913391113281, -0.08544540405273438, -0.07848167419433594, -0.0715179443359375, -0.06455421447753906, -0.057590484619140625, -0.05062675476074219, -0.04366302490234375, -0.03669929504394531, -0.029735565185546875, -0.022771835327148438, -0.01580810546875, -0.008844375610351562, -0.001880645751953125, 0.0050830841064453125, 0.01204681396484375, 0.019010543823242188, 0.025974273681640625, 0.03293800354003906, 0.0399017333984375, 0.04686546325683594, 0.053829193115234375, 0.06079292297363281, 0.06775665283203125, 0.07472038269042969, 0.08168411254882812, 0.08864784240722656, 0.095611572265625, 0.10257530212402344, 0.10953903198242188, 0.11650276184082031, 0.12346649169921875, 0.1304302215576172, 0.13739395141601562, 0.14435768127441406, 0.1513214111328125, 0.15828514099121094, 0.16524887084960938, 0.1722126007080078, 0.17917633056640625, 0.1861400604248047, 0.19310379028320312, 0.20006752014160156, 0.20703125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 13.0, 13.0, 24.0, 19.0, 27.0, 50.0, 54.0, 60.0, 55.0, 88.0, 77.0, 65.0, 82.0, 77.0, 73.0, 46.0, 52.0, 35.0, 23.0, 16.0, 14.0, 13.0, 6.0, 5.0, 7.0, 0.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.060821533203125, -0.059103965759277344, -0.05738639831542969, -0.05566883087158203, -0.053951263427734375, -0.05223369598388672, -0.05051612854003906, -0.048798561096191406, -0.04708099365234375, -0.045363426208496094, -0.04364585876464844, -0.04192829132080078, -0.040210723876953125, -0.03849315643310547, -0.03677558898925781, -0.035058021545410156, -0.0333404541015625, -0.031622886657714844, -0.029905319213867188, -0.02818775177001953, -0.026470184326171875, -0.02475261688232422, -0.023035049438476562, -0.021317481994628906, -0.01959991455078125, -0.017882347106933594, -0.016164779663085938, -0.014447212219238281, -0.012729644775390625, -0.011012077331542969, -0.009294509887695312, -0.007576942443847656, -0.005859375, -0.004141807556152344, -0.0024242401123046875, -0.0007066726684570312, 0.001010894775390625, 0.0027284622192382812, 0.0044460296630859375, 0.006163597106933594, 0.00788116455078125, 0.009598731994628906, 0.011316299438476562, 0.013033866882324219, 0.014751434326171875, 0.01646900177001953, 0.018186569213867188, 0.019904136657714844, 0.0216217041015625, 0.023339271545410156, 0.025056838989257812, 0.02677440643310547, 0.028491973876953125, 0.03020954132080078, 0.03192710876464844, 0.033644676208496094, 0.03536224365234375, 0.037079811096191406, 0.03879737854003906, 0.04051494598388672, 0.042232513427734375, 0.04395008087158203, 0.04566764831542969, 0.047385215759277344, 0.049102783203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 13.0, 13.0, 19.0, 27.0, 50.0, 107.0, 148.0, 324.0, 704.0, 1514.0, 3723.0, 9594.0, 28763.0, 121474.0, 753297.0, 90183.0, 24438.0, 8393.0, 3203.0, 1320.0, 573.0, 283.0, 158.0, 90.0, 59.0, 29.0, 24.0, 8.0, 10.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2276611328125, -0.22017860412597656, -0.21269607543945312, -0.2052135467529297, -0.19773101806640625, -0.1902484893798828, -0.18276596069335938, -0.17528343200683594, -0.1678009033203125, -0.16031837463378906, -0.15283584594726562, -0.1453533172607422, -0.13787078857421875, -0.1303882598876953, -0.12290573120117188, -0.11542320251464844, -0.107940673828125, -0.10045814514160156, -0.09297561645507812, -0.08549308776855469, -0.07801055908203125, -0.07052803039550781, -0.06304550170898438, -0.05556297302246094, -0.0480804443359375, -0.04059791564941406, -0.033115386962890625, -0.025632858276367188, -0.01815032958984375, -0.010667800903320312, -0.003185272216796875, 0.0042972564697265625, 0.01177978515625, 0.019262313842773438, 0.026744842529296875, 0.03422737121582031, 0.04170989990234375, 0.04919242858886719, 0.056674957275390625, 0.06415748596191406, 0.0716400146484375, 0.07912254333496094, 0.08660507202148438, 0.09408760070800781, 0.10157012939453125, 0.10905265808105469, 0.11653518676757812, 0.12401771545410156, 0.131500244140625, 0.13898277282714844, 0.14646530151367188, 0.1539478302001953, 0.16143035888671875, 0.1689128875732422, 0.17639541625976562, 0.18387794494628906, 0.1913604736328125, 0.19884300231933594, 0.20632553100585938, 0.2138080596923828, 0.22129058837890625, 0.2287731170654297, 0.23625564575195312, 0.24373817443847656, 0.251220703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 5.0, 8.0, 11.0, 20.0, 23.0, 37.0, 30.0, 46.0, 42.0, 63.0, 63.0, 78.0, 75.0, 65.0, 67.0, 62.0, 63.0, 41.0, 46.0, 22.0, 27.0, 24.0, 23.0, 12.0, 7.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.277587890625, -0.2702445983886719, -0.26290130615234375, -0.2555580139160156, -0.2482147216796875, -0.24087142944335938, -0.23352813720703125, -0.22618484497070312, -0.218841552734375, -0.21149826049804688, -0.20415496826171875, -0.19681167602539062, -0.1894683837890625, -0.18212509155273438, -0.17478179931640625, -0.16743850708007812, -0.16009521484375, -0.15275192260742188, -0.14540863037109375, -0.13806533813476562, -0.1307220458984375, -0.12337875366210938, -0.11603546142578125, -0.10869216918945312, -0.101348876953125, -0.09400558471679688, -0.08666229248046875, -0.07931900024414062, -0.0719757080078125, -0.06463241577148438, -0.05728912353515625, -0.049945831298828125, -0.0426025390625, -0.035259246826171875, -0.02791595458984375, -0.020572662353515625, -0.0132293701171875, -0.005886077880859375, 0.00145721435546875, 0.008800506591796875, 0.016143798828125, 0.023487091064453125, 0.03083038330078125, 0.038173675537109375, 0.0455169677734375, 0.052860260009765625, 0.06020355224609375, 0.06754684448242188, 0.07489013671875, 0.08223342895507812, 0.08957672119140625, 0.09692001342773438, 0.1042633056640625, 0.11160659790039062, 0.11894989013671875, 0.12629318237304688, 0.133636474609375, 0.14097976684570312, 0.14832305908203125, 0.15566635131835938, 0.1630096435546875, 0.17035293579101562, 0.17769622802734375, 0.18503952026367188, 0.1923828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 10.0, 5.0, 9.0, 17.0, 17.0, 23.0, 31.0, 56.0, 102.0, 122.0, 203.0, 287.0, 505.0, 931.0, 1755.0, 3780.0, 9428.0, 30452.0, 245933.0, 688643.0, 43933.0, 12698.0, 4802.0, 2144.0, 1053.0, 628.0, 341.0, 208.0, 134.0, 99.0, 64.0, 39.0, 32.0, 23.0, 13.0, 19.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14453125, -0.1395702362060547, -0.13460922241210938, -0.12964820861816406, -0.12468719482421875, -0.11972618103027344, -0.11476516723632812, -0.10980415344238281, -0.1048431396484375, -0.09988212585449219, -0.09492111206054688, -0.08996009826660156, -0.08499908447265625, -0.08003807067871094, -0.07507705688476562, -0.07011604309082031, -0.065155029296875, -0.06019401550292969, -0.055233001708984375, -0.05027198791503906, -0.04531097412109375, -0.04034996032714844, -0.035388946533203125, -0.030427932739257812, -0.0254669189453125, -0.020505905151367188, -0.015544891357421875, -0.010583877563476562, -0.00562286376953125, -0.0006618499755859375, 0.004299163818359375, 0.009260177612304688, 0.01422119140625, 0.019182205200195312, 0.024143218994140625, 0.029104232788085938, 0.03406524658203125, 0.03902626037597656, 0.043987274169921875, 0.04894828796386719, 0.0539093017578125, 0.05887031555175781, 0.06383132934570312, 0.06879234313964844, 0.07375335693359375, 0.07871437072753906, 0.08367538452148438, 0.08863639831542969, 0.093597412109375, 0.09855842590332031, 0.10351943969726562, 0.10848045349121094, 0.11344146728515625, 0.11840248107910156, 0.12336349487304688, 0.1283245086669922, 0.1332855224609375, 0.1382465362548828, 0.14320755004882812, 0.14816856384277344, 0.15312957763671875, 0.15809059143066406, 0.16305160522460938, 0.1680126190185547, 0.1729736328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 5.0, 11.0, 6.0, 17.0, 22.0, 37.0, 56.0, 59.0, 81.0, 120.0, 91.0, 103.0, 110.0, 60.0, 52.0, 36.0, 28.0, 25.0, 26.0, 13.0, 8.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86102294921875e-05, -2.7223490178585052e-05, -2.5836750864982605e-05, -2.4450011551380157e-05, -2.306327223777771e-05, -2.1676532924175262e-05, -2.0289793610572815e-05, -1.8903054296970367e-05, -1.751631498336792e-05, -1.6129575669765472e-05, -1.4742836356163025e-05, -1.3356097042560577e-05, -1.196935772895813e-05, -1.0582618415355682e-05, -9.195879101753235e-06, -7.809139788150787e-06, -6.42240047454834e-06, -5.035661160945892e-06, -3.648921847343445e-06, -2.2621825337409973e-06, -8.754432201385498e-07, 5.112960934638977e-07, 1.8980354070663452e-06, 3.2847747206687927e-06, 4.67151403427124e-06, 6.058253347873688e-06, 7.444992661476135e-06, 8.831731975078583e-06, 1.021847128868103e-05, 1.1605210602283478e-05, 1.2991949915885925e-05, 1.4378689229488373e-05, 1.576542854309082e-05, 1.7152167856693268e-05, 1.8538907170295715e-05, 1.9925646483898163e-05, 2.131238579750061e-05, 2.2699125111103058e-05, 2.4085864424705505e-05, 2.5472603738307953e-05, 2.68593430519104e-05, 2.8246082365512848e-05, 2.9632821679115295e-05, 3.101956099271774e-05, 3.240630030632019e-05, 3.379303961992264e-05, 3.5179778933525085e-05, 3.656651824712753e-05, 3.795325756072998e-05, 3.933999687433243e-05, 4.0726736187934875e-05, 4.211347550153732e-05, 4.350021481513977e-05, 4.488695412874222e-05, 4.6273693442344666e-05, 4.766043275594711e-05, 4.904717206954956e-05, 5.043391138315201e-05, 5.1820650696754456e-05, 5.32073900103569e-05, 5.459412932395935e-05, 5.59808686375618e-05, 5.7367607951164246e-05, 5.875434726476669e-05, 6.014108657836914e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 10.0, 18.0, 14.0, 23.0, 42.0, 63.0, 88.0, 174.0, 258.0, 483.0, 1031.0, 2180.0, 5203.0, 14883.0, 53522.0, 780202.0, 149692.0, 26030.0, 8193.0, 3275.0, 1515.0, 678.0, 407.0, 217.0, 130.0, 80.0, 52.0, 26.0, 22.0, 11.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.1596698760986328, -0.15430068969726562, -0.14893150329589844, -0.14356231689453125, -0.13819313049316406, -0.13282394409179688, -0.1274547576904297, -0.1220855712890625, -0.11671638488769531, -0.11134719848632812, -0.10597801208496094, -0.10060882568359375, -0.09523963928222656, -0.08987045288085938, -0.08450126647949219, -0.079132080078125, -0.07376289367675781, -0.06839370727539062, -0.06302452087402344, -0.05765533447265625, -0.05228614807128906, -0.046916961669921875, -0.04154777526855469, -0.0361785888671875, -0.030809402465820312, -0.025440216064453125, -0.020071029663085938, -0.01470184326171875, -0.009332656860351562, -0.003963470458984375, 0.0014057159423828125, 0.00677490234375, 0.012144088745117188, 0.017513275146484375, 0.022882461547851562, 0.02825164794921875, 0.03362083435058594, 0.038990020751953125, 0.04435920715332031, 0.0497283935546875, 0.05509757995605469, 0.060466766357421875, 0.06583595275878906, 0.07120513916015625, 0.07657432556152344, 0.08194351196289062, 0.08731269836425781, 0.092681884765625, 0.09805107116699219, 0.10342025756835938, 0.10878944396972656, 0.11415863037109375, 0.11952781677246094, 0.12489700317382812, 0.1302661895751953, 0.1356353759765625, 0.1410045623779297, 0.14637374877929688, 0.15174293518066406, 0.15711212158203125, 0.16248130798339844, 0.16785049438476562, 0.1732196807861328, 0.1785888671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 6.0, 2.0, 7.0, 10.0, 10.0, 7.0, 12.0, 26.0, 32.0, 53.0, 110.0, 264.0, 219.0, 103.0, 36.0, 18.0, 21.0, 18.0, 14.0, 5.0, 6.0, 6.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09320068359375, -0.08849048614501953, -0.08378028869628906, -0.0790700912475586, -0.07435989379882812, -0.06964969635009766, -0.06493949890136719, -0.06022930145263672, -0.05551910400390625, -0.05080890655517578, -0.04609870910644531, -0.041388511657714844, -0.036678314208984375, -0.031968116760253906, -0.027257919311523438, -0.02254772186279297, -0.0178375244140625, -0.013127326965332031, -0.008417129516601562, -0.0037069320678710938, 0.001003265380859375, 0.005713462829589844, 0.010423660278320312, 0.015133857727050781, 0.01984405517578125, 0.02455425262451172, 0.029264450073242188, 0.033974647521972656, 0.038684844970703125, 0.043395042419433594, 0.04810523986816406, 0.05281543731689453, 0.057525634765625, 0.06223583221435547, 0.06694602966308594, 0.0716562271118164, 0.07636642456054688, 0.08107662200927734, 0.08578681945800781, 0.09049701690673828, 0.09520721435546875, 0.09991741180419922, 0.10462760925292969, 0.10933780670166016, 0.11404800415039062, 0.1187582015991211, 0.12346839904785156, 0.12817859649658203, 0.1328887939453125, 0.13759899139404297, 0.14230918884277344, 0.1470193862915039, 0.15172958374023438, 0.15643978118896484, 0.1611499786376953, 0.16586017608642578, 0.17057037353515625, 0.17528057098388672, 0.1799907684326172, 0.18470096588134766, 0.18941116333007812, 0.1941213607788086, 0.19883155822753906, 0.20354175567626953, 0.208251953125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 5.0, 18.0, 21.0, 26.0, 40.0, 60.0, 98.0, 95.0, 115.0, 109.0, 108.0, 92.0, 69.0, 40.0, 27.0, 26.0, 14.0, 13.0, 4.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2618948221206665, -1.2237956523895264, -1.1856964826583862, -1.1475971937179565, -1.1094980239868164, -1.0713988542556763, -1.0332996845245361, -0.995200514793396, -0.9571012854576111, -0.919002115726471, -0.880902886390686, -0.8428037166595459, -0.8047045469284058, -0.7666053175926208, -0.7285061478614807, -0.6904069185256958, -0.6523077487945557, -0.6142085790634155, -0.5761093497276306, -0.5380101799964905, -0.49991098046302795, -0.46181178092956543, -0.4237126111984253, -0.38561341166496277, -0.34751421213150024, -0.3094150125980377, -0.2713158130645752, -0.23321664333343506, -0.19511744379997253, -0.15701824426651, -0.11891905963420868, -0.08081987500190735, -0.042720675468444824, -0.004621483385562897, 0.03347770869731903, 0.07157690078020096, 0.10967609286308289, 0.1477752923965454, 0.18587447702884674, 0.22397366166114807, 0.2620728611946106, 0.3001720607280731, 0.33827126026153564, 0.3763704299926758, 0.4144696295261383, 0.45256882905960083, 0.49066799879074097, 0.5287672281265259, 0.566866397857666, 0.6049655675888062, 0.6430647969245911, 0.6811639666557312, 0.7192631959915161, 0.7573623657226562, 0.7954615354537964, 0.8335607051849365, 0.8716599345207214, 0.9097591042518616, 0.9478583335876465, 0.9859575033187866, 1.0240566730499268, 1.0621559619903564, 1.1002551317214966, 1.1383543014526367, 1.1764534711837769]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 10.0, 7.0, 8.0, 8.0, 18.0, 25.0, 25.0, 13.0, 25.0, 29.0, 23.0, 29.0, 41.0, 30.0, 40.0, 39.0, 36.0, 43.0, 37.0, 41.0, 38.0, 42.0, 40.0, 35.0, 30.0, 34.0, 27.0, 24.0, 29.0, 20.0, 22.0, 18.0, 14.0, 20.0, 17.0, 8.0, 10.0, 10.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0], "bins": [-0.7505302429199219, -0.727845311164856, -0.7051604390144348, -0.6824755072593689, -0.659790575504303, -0.6371057033538818, -0.6144207715988159, -0.59173583984375, -0.5690509080886841, -0.5463659763336182, -0.523681104183197, -0.5009961724281311, -0.4783112406730652, -0.45562633872032166, -0.4329414367675781, -0.4102565050125122, -0.38757163286209106, -0.36488673090934753, -0.3422017991542816, -0.3195168972015381, -0.29683196544647217, -0.27414706349372864, -0.2514621615409851, -0.22877724468708038, -0.20609232783317566, -0.18340741097927094, -0.1607224941253662, -0.13803759217262268, -0.11535267531871796, -0.09266775846481323, -0.0699828565120697, -0.04729793965816498, -0.024613022804260254, -0.0019281096756458282, 0.020756803452968597, 0.043441712856292725, 0.06612662971019745, 0.08881154656410217, 0.1114964485168457, 0.13418136537075043, 0.15686628222465515, 0.17955119907855988, 0.2022361159324646, 0.22492101788520813, 0.24760593473911285, 0.2702908515930176, 0.2929757535457611, 0.31566065549850464, 0.33834558725357056, 0.3610304892063141, 0.38371542096138, 0.40640032291412354, 0.42908525466918945, 0.451770156621933, 0.4744550585746765, 0.49713999032974243, 0.5198248624801636, 0.5425097942352295, 0.5651946663856506, 0.5878795981407166, 0.6105645298957825, 0.6332494020462036, 0.6559343338012695, 0.6786192655563354, 0.7013041973114014]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 12.0, 18.0, 21.0, 41.0, 52.0, 84.0, 159.0, 239.0, 391.0, 648.0, 1203.0, 2378.0, 5116.0, 11864.0, 31627.0, 123389.0, 3584981.0, 344376.0, 54658.0, 17906.0, 7440.0, 3432.0, 1784.0, 937.0, 558.0, 361.0, 212.0, 140.0, 81.0, 69.0, 33.0, 26.0, 21.0, 7.0, 9.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2828559875488281, -0.27494049072265625, -0.2670249938964844, -0.2591094970703125, -0.2511940002441406, -0.24327850341796875, -0.23536300659179688, -0.227447509765625, -0.21953201293945312, -0.21161651611328125, -0.20370101928710938, -0.1957855224609375, -0.18787002563476562, -0.17995452880859375, -0.17203903198242188, -0.16412353515625, -0.15620803833007812, -0.14829254150390625, -0.14037704467773438, -0.1324615478515625, -0.12454605102539062, -0.11663055419921875, -0.10871505737304688, -0.100799560546875, -0.09288406372070312, -0.08496856689453125, -0.07705307006835938, -0.0691375732421875, -0.061222076416015625, -0.05330657958984375, -0.045391082763671875, -0.0374755859375, -0.029560089111328125, -0.02164459228515625, -0.013729095458984375, -0.0058135986328125, 0.002101898193359375, 0.01001739501953125, 0.017932891845703125, 0.025848388671875, 0.033763885498046875, 0.04167938232421875, 0.049594879150390625, 0.0575103759765625, 0.06542587280273438, 0.07334136962890625, 0.08125686645507812, 0.08917236328125, 0.09708786010742188, 0.10500335693359375, 0.11291885375976562, 0.1208343505859375, 0.12874984741210938, 0.13666534423828125, 0.14458084106445312, 0.152496337890625, 0.16041183471679688, 0.16832733154296875, 0.17624282836914062, 0.1841583251953125, 0.19207382202148438, 0.19998931884765625, 0.20790481567382812, 0.2158203125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 9.0, 19.0, 23.0, 30.0, 35.0, 49.0, 53.0, 61.0, 71.0, 64.0, 69.0, 77.0, 63.0, 57.0, 63.0, 61.0, 45.0, 32.0, 22.0, 21.0, 25.0, 10.0, 8.0, 8.0, 11.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0576171875, -0.05589008331298828, -0.05416297912597656, -0.052435874938964844, -0.050708770751953125, -0.048981666564941406, -0.04725456237792969, -0.04552745819091797, -0.04380035400390625, -0.04207324981689453, -0.04034614562988281, -0.038619041442871094, -0.036891937255859375, -0.035164833068847656, -0.03343772888183594, -0.03171062469482422, -0.0299835205078125, -0.02825641632080078, -0.026529312133789062, -0.024802207946777344, -0.023075103759765625, -0.021347999572753906, -0.019620895385742188, -0.01789379119873047, -0.01616668701171875, -0.014439582824707031, -0.012712478637695312, -0.010985374450683594, -0.009258270263671875, -0.007531166076660156, -0.0058040618896484375, -0.004076957702636719, -0.002349853515625, -0.0006227493286132812, 0.0011043548583984375, 0.0028314590454101562, 0.004558563232421875, 0.006285667419433594, 0.008012771606445312, 0.009739875793457031, 0.01146697998046875, 0.013194084167480469, 0.014921188354492188, 0.016648292541503906, 0.018375396728515625, 0.020102500915527344, 0.021829605102539062, 0.02355670928955078, 0.0252838134765625, 0.02701091766357422, 0.028738021850585938, 0.030465126037597656, 0.032192230224609375, 0.033919334411621094, 0.03564643859863281, 0.03737354278564453, 0.03910064697265625, 0.04082775115966797, 0.04255485534667969, 0.044281959533691406, 0.046009063720703125, 0.047736167907714844, 0.04946327209472656, 0.05119037628173828, 0.05291748046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 4.0, 13.0, 21.0, 33.0, 48.0, 60.0, 69.0, 126.0, 145.0, 217.0, 266.0, 432.0, 621.0, 919.0, 1389.0, 2478.0, 4353.0, 8451.0, 17294.0, 39472.0, 113366.0, 743228.0, 3003607.0, 163094.0, 50243.0, 21279.0, 9958.0, 5121.0, 2954.0, 1634.0, 1085.0, 733.0, 451.0, 323.0, 213.0, 174.0, 115.0, 83.0, 68.0, 41.0, 36.0, 16.0, 17.0, 8.0, 12.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2142333984375, -0.2075672149658203, -0.20090103149414062, -0.19423484802246094, -0.18756866455078125, -0.18090248107910156, -0.17423629760742188, -0.1675701141357422, -0.1609039306640625, -0.1542377471923828, -0.14757156372070312, -0.14090538024902344, -0.13423919677734375, -0.12757301330566406, -0.12090682983398438, -0.11424064636230469, -0.107574462890625, -0.10090827941894531, -0.09424209594726562, -0.08757591247558594, -0.08090972900390625, -0.07424354553222656, -0.06757736206054688, -0.06091117858886719, -0.0542449951171875, -0.04757881164550781, -0.040912628173828125, -0.03424644470214844, -0.02758026123046875, -0.020914077758789062, -0.014247894287109375, -0.0075817108154296875, -0.00091552734375, 0.0057506561279296875, 0.012416839599609375, 0.019083023071289062, 0.02574920654296875, 0.03241539001464844, 0.039081573486328125, 0.04574775695800781, 0.0524139404296875, 0.05908012390136719, 0.06574630737304688, 0.07241249084472656, 0.07907867431640625, 0.08574485778808594, 0.09241104125976562, 0.09907722473144531, 0.105743408203125, 0.11240959167480469, 0.11907577514648438, 0.12574195861816406, 0.13240814208984375, 0.13907432556152344, 0.14574050903320312, 0.1524066925048828, 0.1590728759765625, 0.1657390594482422, 0.17240524291992188, 0.17907142639160156, 0.18573760986328125, 0.19240379333496094, 0.19906997680664062, 0.2057361602783203, 0.21240234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 12.0, 17.0, 10.0, 26.0, 30.0, 34.0, 50.0, 92.0, 142.0, 318.0, 2118.0, 687.0, 215.0, 101.0, 63.0, 43.0, 27.0, 21.0, 21.0, 13.0, 11.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12115478515625, -0.11722278594970703, -0.11329078674316406, -0.1093587875366211, -0.10542678833007812, -0.10149478912353516, -0.09756278991699219, -0.09363079071044922, -0.08969879150390625, -0.08576679229736328, -0.08183479309082031, -0.07790279388427734, -0.07397079467773438, -0.0700387954711914, -0.06610679626464844, -0.06217479705810547, -0.0582427978515625, -0.05431079864501953, -0.05037879943847656, -0.046446800231933594, -0.042514801025390625, -0.038582801818847656, -0.03465080261230469, -0.03071880340576172, -0.02678680419921875, -0.02285480499267578, -0.018922805786132812, -0.014990806579589844, -0.011058807373046875, -0.007126808166503906, -0.0031948089599609375, 0.0007371902465820312, 0.004669189453125, 0.008601188659667969, 0.012533187866210938, 0.016465187072753906, 0.020397186279296875, 0.024329185485839844, 0.028261184692382812, 0.03219318389892578, 0.03612518310546875, 0.04005718231201172, 0.04398918151855469, 0.047921180725097656, 0.051853179931640625, 0.055785179138183594, 0.05971717834472656, 0.06364917755126953, 0.0675811767578125, 0.07151317596435547, 0.07544517517089844, 0.0793771743774414, 0.08330917358398438, 0.08724117279052734, 0.09117317199707031, 0.09510517120361328, 0.09903717041015625, 0.10296916961669922, 0.10690116882324219, 0.11083316802978516, 0.11476516723632812, 0.1186971664428711, 0.12262916564941406, 0.12656116485595703, 0.1304931640625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 12.0, 23.0, 32.0, 58.0, 68.0, 149.0, 152.0, 155.0, 128.0, 93.0, 50.0, 34.0, 20.0, 12.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.161692500114441, -1.1336348056793213, -1.1055772304534912, -1.0775195360183716, -1.0494619607925415, -1.0214042663574219, -0.9933466911315918, -0.9652889966964722, -0.9372313618659973, -0.9091737270355225, -0.8811160922050476, -0.8530584573745728, -0.8250008225440979, -0.796943187713623, -0.7688854932785034, -0.7408278584480286, -0.7127702236175537, -0.6847125887870789, -0.656654953956604, -0.6285973191261292, -0.6005396842956543, -0.5724819898605347, -0.5444244146347046, -0.516366720199585, -0.4883091449737549, -0.46025151014328003, -0.4321938753128052, -0.4041362404823303, -0.3760785758495331, -0.3480209410190582, -0.3199633061885834, -0.29190564155578613, -0.2638480067253113, -0.23579037189483643, -0.20773272216320038, -0.17967508733272552, -0.15161743760108948, -0.12355980277061462, -0.09550216794013977, -0.06744451820850372, -0.03938688337802887, -0.011329242959618568, 0.016728397458791733, 0.044786036014556885, 0.07284367829561234, 0.10090132057666779, 0.12895895540714264, 0.1570166051387787, 0.18507423996925354, 0.2131318747997284, 0.24118952453136444, 0.2692471742630005, 0.29730480909347534, 0.3253624439239502, 0.35342007875442505, 0.3814777135848999, 0.40953534841537476, 0.4375929832458496, 0.46565061807632446, 0.4937082529067993, 0.5217658877372742, 0.549823522567749, 0.5778812170028687, 0.6059388518333435, 0.6339964866638184]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 6.0, 6.0, 16.0, 8.0, 13.0, 13.0, 16.0, 18.0, 28.0, 29.0, 30.0, 36.0, 41.0, 30.0, 30.0, 33.0, 44.0, 39.0, 44.0, 24.0, 43.0, 39.0, 41.0, 46.0, 32.0, 32.0, 34.0, 35.0, 27.0, 12.0, 23.0, 20.0, 17.0, 20.0, 11.0, 13.0, 14.0, 7.0, 3.0, 7.0, 4.0, 3.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31650543212890625, -0.3055785298347473, -0.29465165734291077, -0.28372475504875183, -0.2727978527545929, -0.26187095046043396, -0.2509440779685974, -0.24001717567443848, -0.22909027338027954, -0.2181633859872818, -0.20723648369312286, -0.19630959630012512, -0.1853826940059662, -0.17445580661296844, -0.1635289192199707, -0.15260201692581177, -0.14167512953281403, -0.13074824213981628, -0.11982133984565735, -0.1088944524526596, -0.09796755015850067, -0.08704066276550293, -0.07611376792192459, -0.06518687307834625, -0.054259978234767914, -0.043333083391189575, -0.03240618854761124, -0.021479297429323196, -0.010552402585744858, 0.00037449225783348083, 0.011301383376121521, 0.02222827821969986, 0.0331551730632782, 0.04408206790685654, 0.055008962750434875, 0.06593585014343262, 0.07686275243759155, 0.0877896398305893, 0.09871653467416763, 0.10964342951774597, 0.12057032436132431, 0.13149721920490265, 0.1424241065979004, 0.15335100889205933, 0.16427789628505707, 0.175204798579216, 0.18613168597221375, 0.19705858826637268, 0.20798547565937042, 0.21891236305236816, 0.2298392653465271, 0.24076615273952484, 0.2516930401325226, 0.2626199424266815, 0.27354684472084045, 0.284473717212677, 0.29540061950683594, 0.3063275218009949, 0.3172543942928314, 0.32818129658699036, 0.3391081988811493, 0.3500351011753082, 0.3609619736671448, 0.3718888759613037, 0.38281577825546265]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 11.0, 19.0, 7.0, 20.0, 35.0, 45.0, 83.0, 114.0, 190.0, 340.0, 628.0, 1089.0, 1839.0, 3468.0, 6724.0, 13066.0, 25445.0, 51796.0, 109006.0, 252804.0, 312747.0, 138824.0, 64764.0, 31834.0, 15997.0, 8267.0, 4160.0, 2236.0, 1230.0, 684.0, 407.0, 237.0, 136.0, 119.0, 62.0, 52.0, 25.0, 17.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12616539001464844, -0.12183761596679688, -0.11750984191894531, -0.11318206787109375, -0.10885429382324219, -0.10452651977539062, -0.10019874572753906, -0.0958709716796875, -0.09154319763183594, -0.08721542358398438, -0.08288764953613281, -0.07855987548828125, -0.07423210144042969, -0.06990432739257812, -0.06557655334472656, -0.061248779296875, -0.05692100524902344, -0.052593231201171875, -0.04826545715332031, -0.04393768310546875, -0.03960990905761719, -0.035282135009765625, -0.030954360961914062, -0.0266265869140625, -0.022298812866210938, -0.017971038818359375, -0.013643264770507812, -0.00931549072265625, -0.0049877166748046875, -0.000659942626953125, 0.0036678314208984375, 0.00799560546875, 0.012323379516601562, 0.016651153564453125, 0.020978927612304688, 0.02530670166015625, 0.029634475708007812, 0.033962249755859375, 0.03829002380371094, 0.0426177978515625, 0.04694557189941406, 0.051273345947265625, 0.05560111999511719, 0.05992889404296875, 0.06425666809082031, 0.06858444213867188, 0.07291221618652344, 0.077239990234375, 0.08156776428222656, 0.08589553833007812, 0.09022331237792969, 0.09455108642578125, 0.09887886047363281, 0.10320663452148438, 0.10753440856933594, 0.1118621826171875, 0.11618995666503906, 0.12051773071289062, 0.12484550476074219, 0.12917327880859375, 0.1335010528564453, 0.13782882690429688, 0.14215660095214844, 0.146484375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 2.0, 5.0, 8.0, 8.0, 13.0, 26.0, 28.0, 45.0, 32.0, 45.0, 43.0, 42.0, 45.0, 60.0, 59.0, 57.0, 51.0, 50.0, 55.0, 53.0, 50.0, 43.0, 27.0, 31.0, 22.0, 18.0, 25.0, 12.0, 8.0, 8.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.054351806640625, -0.05274486541748047, -0.05113792419433594, -0.049530982971191406, -0.047924041748046875, -0.046317100524902344, -0.04471015930175781, -0.04310321807861328, -0.04149627685546875, -0.03988933563232422, -0.03828239440917969, -0.036675453186035156, -0.035068511962890625, -0.033461570739746094, -0.03185462951660156, -0.03024768829345703, -0.0286407470703125, -0.02703380584716797, -0.025426864624023438, -0.023819923400878906, -0.022212982177734375, -0.020606040954589844, -0.018999099731445312, -0.01739215850830078, -0.01578521728515625, -0.014178276062011719, -0.012571334838867188, -0.010964393615722656, -0.009357452392578125, -0.007750511169433594, -0.0061435699462890625, -0.004536628723144531, -0.0029296875, -0.0013227462768554688, 0.0002841949462890625, 0.0018911361694335938, 0.003498077392578125, 0.005105018615722656, 0.0067119598388671875, 0.008318901062011719, 0.00992584228515625, 0.011532783508300781, 0.013139724731445312, 0.014746665954589844, 0.016353607177734375, 0.017960548400878906, 0.019567489624023438, 0.02117443084716797, 0.0227813720703125, 0.02438831329345703, 0.025995254516601562, 0.027602195739746094, 0.029209136962890625, 0.030816078186035156, 0.03242301940917969, 0.03402996063232422, 0.03563690185546875, 0.03724384307861328, 0.03885078430175781, 0.040457725524902344, 0.042064666748046875, 0.043671607971191406, 0.04527854919433594, 0.04688549041748047, 0.048492431640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 5.0, 10.0, 14.0, 25.0, 36.0, 53.0, 71.0, 127.0, 210.0, 351.0, 600.0, 1218.0, 2775.0, 7222.0, 24065.0, 91723.0, 486394.0, 334972.0, 69317.0, 18767.0, 5924.0, 2254.0, 970.0, 524.0, 301.0, 214.0, 128.0, 86.0, 50.0, 37.0, 26.0, 22.0, 17.0, 11.0, 5.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.248291015625, -0.24074363708496094, -0.23319625854492188, -0.2256488800048828, -0.21810150146484375, -0.2105541229248047, -0.20300674438476562, -0.19545936584472656, -0.1879119873046875, -0.18036460876464844, -0.17281723022460938, -0.1652698516845703, -0.15772247314453125, -0.1501750946044922, -0.14262771606445312, -0.13508033752441406, -0.127532958984375, -0.11998558044433594, -0.11243820190429688, -0.10489082336425781, -0.09734344482421875, -0.08979606628417969, -0.08224868774414062, -0.07470130920410156, -0.0671539306640625, -0.05960655212402344, -0.052059173583984375, -0.04451179504394531, -0.03696441650390625, -0.029417037963867188, -0.021869659423828125, -0.014322280883789062, -0.00677490234375, 0.0007724761962890625, 0.008319854736328125, 0.015867233276367188, 0.02341461181640625, 0.030961990356445312, 0.038509368896484375, 0.04605674743652344, 0.0536041259765625, 0.06115150451660156, 0.06869888305664062, 0.07624626159667969, 0.08379364013671875, 0.09134101867675781, 0.09888839721679688, 0.10643577575683594, 0.113983154296875, 0.12153053283691406, 0.12907791137695312, 0.1366252899169922, 0.14417266845703125, 0.1517200469970703, 0.15926742553710938, 0.16681480407714844, 0.1743621826171875, 0.18190956115722656, 0.18945693969726562, 0.1970043182373047, 0.20455169677734375, 0.2120990753173828, 0.21964645385742188, 0.22719383239746094, 0.2347412109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 8.0, 12.0, 10.0, 7.0, 19.0, 12.0, 25.0, 23.0, 26.0, 37.0, 57.0, 40.0, 35.0, 52.0, 58.0, 51.0, 47.0, 45.0, 33.0, 45.0, 40.0, 43.0, 31.0, 49.0, 29.0, 29.0, 24.0, 14.0, 20.0, 14.0, 14.0, 10.0, 5.0, 2.0, 8.0, 4.0, 2.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2196044921875, -0.21320533752441406, -0.20680618286132812, -0.2004070281982422, -0.19400787353515625, -0.1876087188720703, -0.18120956420898438, -0.17481040954589844, -0.1684112548828125, -0.16201210021972656, -0.15561294555664062, -0.1492137908935547, -0.14281463623046875, -0.1364154815673828, -0.13001632690429688, -0.12361717224121094, -0.117218017578125, -0.11081886291503906, -0.10441970825195312, -0.09802055358886719, -0.09162139892578125, -0.08522224426269531, -0.07882308959960938, -0.07242393493652344, -0.0660247802734375, -0.05962562561035156, -0.053226470947265625, -0.04682731628417969, -0.04042816162109375, -0.03402900695800781, -0.027629852294921875, -0.021230697631835938, -0.01483154296875, -0.008432388305664062, -0.002033233642578125, 0.0043659210205078125, 0.01076507568359375, 0.017164230346679688, 0.023563385009765625, 0.029962539672851562, 0.0363616943359375, 0.04276084899902344, 0.049160003662109375, 0.05555915832519531, 0.06195831298828125, 0.06835746765136719, 0.07475662231445312, 0.08115577697753906, 0.087554931640625, 0.09395408630371094, 0.10035324096679688, 0.10675239562988281, 0.11315155029296875, 0.11955070495605469, 0.12594985961914062, 0.13234901428222656, 0.1387481689453125, 0.14514732360839844, 0.15154647827148438, 0.1579456329345703, 0.16434478759765625, 0.1707439422607422, 0.17714309692382812, 0.18354225158691406, 0.18994140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 14.0, 9.0, 19.0, 27.0, 40.0, 59.0, 106.0, 152.0, 253.0, 388.0, 727.0, 1181.0, 2038.0, 4223.0, 11128.0, 41627.0, 227062.0, 613252.0, 109024.0, 22895.0, 7258.0, 3009.0, 1662.0, 944.0, 541.0, 349.0, 224.0, 121.0, 69.0, 61.0, 29.0, 20.0, 9.0, 9.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.137451171875, -0.13259315490722656, -0.12773513793945312, -0.12287712097167969, -0.11801910400390625, -0.11316108703613281, -0.10830307006835938, -0.10344505310058594, -0.0985870361328125, -0.09372901916503906, -0.08887100219726562, -0.08401298522949219, -0.07915496826171875, -0.07429695129394531, -0.06943893432617188, -0.06458091735839844, -0.059722900390625, -0.05486488342285156, -0.050006866455078125, -0.04514884948730469, -0.04029083251953125, -0.03543281555175781, -0.030574798583984375, -0.025716781616210938, -0.0208587646484375, -0.016000747680664062, -0.011142730712890625, -0.0062847137451171875, -0.00142669677734375, 0.0034313201904296875, 0.008289337158203125, 0.013147354125976562, 0.01800537109375, 0.022863388061523438, 0.027721405029296875, 0.03257942199707031, 0.03743743896484375, 0.04229545593261719, 0.047153472900390625, 0.05201148986816406, 0.0568695068359375, 0.06172752380371094, 0.06658554077148438, 0.07144355773925781, 0.07630157470703125, 0.08115959167480469, 0.08601760864257812, 0.09087562561035156, 0.095733642578125, 0.10059165954589844, 0.10544967651367188, 0.11030769348144531, 0.11516571044921875, 0.12002372741699219, 0.12488174438476562, 0.12973976135253906, 0.1345977783203125, 0.13945579528808594, 0.14431381225585938, 0.1491718292236328, 0.15402984619140625, 0.1588878631591797, 0.16374588012695312, 0.16860389709472656, 0.1734619140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 4.0, 9.0, 14.0, 15.0, 23.0, 37.0, 51.0, 43.0, 94.0, 97.0, 148.0, 124.0, 106.0, 73.0, 40.0, 37.0, 33.0, 16.0, 13.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.898143768310547e-05, -3.726687282323837e-05, -3.555230796337128e-05, -3.383774310350418e-05, -3.2123178243637085e-05, -3.040861338376999e-05, -2.8694048523902893e-05, -2.6979483664035797e-05, -2.52649188041687e-05, -2.3550353944301605e-05, -2.183578908443451e-05, -2.0121224224567413e-05, -1.8406659364700317e-05, -1.669209450483322e-05, -1.4977529644966125e-05, -1.326296478509903e-05, -1.1548399925231934e-05, -9.833835065364838e-06, -8.119270205497742e-06, -6.404705345630646e-06, -4.69014048576355e-06, -2.975575625896454e-06, -1.261010766029358e-06, 4.5355409383773804e-07, 2.168118953704834e-06, 3.88268381357193e-06, 5.597248673439026e-06, 7.311813533306122e-06, 9.026378393173218e-06, 1.0740943253040314e-05, 1.245550811290741e-05, 1.4170072972774506e-05, 1.58846378326416e-05, 1.7599202692508698e-05, 1.9313767552375793e-05, 2.102833241224289e-05, 2.2742897272109985e-05, 2.445746213197708e-05, 2.6172026991844177e-05, 2.7886591851711273e-05, 2.960115671157837e-05, 3.1315721571445465e-05, 3.303028643131256e-05, 3.474485129117966e-05, 3.645941615104675e-05, 3.817398101091385e-05, 3.9888545870780945e-05, 4.160311073064804e-05, 4.331767559051514e-05, 4.503224045038223e-05, 4.674680531024933e-05, 4.8461370170116425e-05, 5.017593502998352e-05, 5.1890499889850616e-05, 5.360506474971771e-05, 5.531962960958481e-05, 5.7034194469451904e-05, 5.8748759329319e-05, 6.0463324189186096e-05, 6.217788904905319e-05, 6.389245390892029e-05, 6.560701876878738e-05, 6.732158362865448e-05, 6.903614848852158e-05, 7.075071334838867e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 9.0, 9.0, 23.0, 36.0, 36.0, 58.0, 95.0, 149.0, 291.0, 466.0, 890.0, 1909.0, 4732.0, 15789.0, 103154.0, 708570.0, 178361.0, 23384.0, 5978.0, 2238.0, 1040.0, 523.0, 284.0, 163.0, 119.0, 63.0, 51.0, 40.0, 28.0, 17.0, 9.0, 5.0, 4.0, 8.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2120361328125, -0.20532989501953125, -0.1986236572265625, -0.19191741943359375, -0.185211181640625, -0.17850494384765625, -0.1717987060546875, -0.16509246826171875, -0.15838623046875, -0.15167999267578125, -0.1449737548828125, -0.13826751708984375, -0.131561279296875, -0.12485504150390625, -0.1181488037109375, -0.11144256591796875, -0.104736328125, -0.09803009033203125, -0.0913238525390625, -0.08461761474609375, -0.077911376953125, -0.07120513916015625, -0.0644989013671875, -0.05779266357421875, -0.05108642578125, -0.04438018798828125, -0.0376739501953125, -0.03096771240234375, -0.024261474609375, -0.01755523681640625, -0.0108489990234375, -0.00414276123046875, 0.0025634765625, 0.00926971435546875, 0.0159759521484375, 0.02268218994140625, 0.029388427734375, 0.03609466552734375, 0.0428009033203125, 0.04950714111328125, 0.05621337890625, 0.06291961669921875, 0.0696258544921875, 0.07633209228515625, 0.083038330078125, 0.08974456787109375, 0.0964508056640625, 0.10315704345703125, 0.10986328125, 0.11656951904296875, 0.1232757568359375, 0.12998199462890625, 0.136688232421875, 0.14339447021484375, 0.1501007080078125, 0.15680694580078125, 0.16351318359375, 0.17021942138671875, 0.1769256591796875, 0.18363189697265625, 0.190338134765625, 0.19704437255859375, 0.2037506103515625, 0.21045684814453125, 0.2171630859375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 7.0, 9.0, 9.0, 21.0, 32.0, 45.0, 66.0, 111.0, 178.0, 192.0, 117.0, 74.0, 56.0, 20.0, 23.0, 9.0, 10.0, 6.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.27978515625, -0.2729530334472656, -0.26612091064453125, -0.2592887878417969, -0.2524566650390625, -0.24562454223632812, -0.23879241943359375, -0.23196029663085938, -0.225128173828125, -0.21829605102539062, -0.21146392822265625, -0.20463180541992188, -0.1977996826171875, -0.19096755981445312, -0.18413543701171875, -0.17730331420898438, -0.17047119140625, -0.16363906860351562, -0.15680694580078125, -0.14997482299804688, -0.1431427001953125, -0.13631057739257812, -0.12947845458984375, -0.12264633178710938, -0.115814208984375, -0.10898208618164062, -0.10214996337890625, -0.09531784057617188, -0.0884857177734375, -0.08165359497070312, -0.07482147216796875, -0.06798934936523438, -0.0611572265625, -0.054325103759765625, -0.04749298095703125, -0.040660858154296875, -0.0338287353515625, -0.026996612548828125, -0.02016448974609375, -0.013332366943359375, -0.006500244140625, 0.000331878662109375, 0.00716400146484375, 0.013996124267578125, 0.0208282470703125, 0.027660369873046875, 0.03449249267578125, 0.041324615478515625, 0.04815673828125, 0.054988861083984375, 0.06182098388671875, 0.06865310668945312, 0.0754852294921875, 0.08231735229492188, 0.08914947509765625, 0.09598159790039062, 0.102813720703125, 0.10964584350585938, 0.11647796630859375, 0.12331008911132812, 0.1301422119140625, 0.13697433471679688, 0.14380645751953125, 0.15063858032226562, 0.157470703125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 11.0, 4.0, 19.0, 28.0, 68.0, 98.0, 130.0, 153.0, 170.0, 121.0, 97.0, 53.0, 21.0, 17.0, 10.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9270260334014893, -0.8544597625732422, -0.7818934321403503, -0.7093271017074585, -0.6367608308792114, -0.5641945600509644, -0.4916282296180725, -0.41906189918518066, -0.3464956283569336, -0.27392932772636414, -0.20136302709579468, -0.12879672646522522, -0.05623042583465576, 0.016335874795913696, 0.08890217542648315, 0.161468505859375, 0.23403477668762207, 0.30660107731819153, 0.379167377948761, 0.45173367857933044, 0.5242999792098999, 0.596866250038147, 0.6694325804710388, 0.7419989109039307, 0.8145651817321777, 0.8871314525604248, 0.9596977829933167, 1.0322641134262085, 1.1048303842544556, 1.1773966550827026, 1.2499630451202393, 1.3225293159484863, 1.3950955867767334, 1.4676618576049805, 1.5402281284332275, 1.6127945184707642, 1.6853607892990112, 1.7579270601272583, 1.830493450164795, 1.903059720993042, 1.975625991821289, 2.048192262649536, 2.120758533477783, 2.1933248043060303, 2.2658910751342773, 2.3384575843811035, 2.4110238552093506, 2.4835901260375977, 2.5561563968658447, 2.628722667694092, 2.701288938522339, 2.773855209350586, 2.846421718597412, 2.918987989425659, 2.9915542602539062, 3.0641205310821533, 3.1366868019104004, 3.2092530727386475, 3.2818193435668945, 3.3543856143951416, 3.4269518852233887, 3.499518394470215, 3.572084665298462, 3.644650936126709, 3.717217206954956]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 2.0, 5.0, 8.0, 11.0, 10.0, 15.0, 7.0, 18.0, 14.0, 17.0, 26.0, 26.0, 24.0, 34.0, 39.0, 42.0, 42.0, 45.0, 37.0, 45.0, 31.0, 43.0, 37.0, 51.0, 45.0, 39.0, 43.0, 31.0, 37.0, 25.0, 29.0, 19.0, 16.0, 13.0, 14.0, 11.0, 8.0, 10.0, 1.0, 6.0, 3.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9620654582977295, -0.9291619658470154, -0.8962584733963013, -0.8633549213409424, -0.8304514288902283, -0.7975479364395142, -0.7646444439888, -0.7317409515380859, -0.698837399482727, -0.6659339070320129, -0.6330304145812988, -0.6001268625259399, -0.5672233700752258, -0.5343198776245117, -0.5014163851737976, -0.4685128927230835, -0.4356094002723694, -0.4027059078216553, -0.3698023855686188, -0.33689889311790466, -0.30399537086486816, -0.27109187841415405, -0.23818838596343994, -0.20528487861156464, -0.17238137125968933, -0.13947786390781403, -0.10657436400651932, -0.07367086410522461, -0.040767356753349304, -0.007863849401473999, 0.025039643049240112, 0.05794315040111542, 0.09084665775299072, 0.12375016510486603, 0.15665367245674133, 0.18955716490745544, 0.22246067225933075, 0.25536417961120605, 0.28826767206192017, 0.3211711645126343, 0.3540746867656708, 0.3869781792163849, 0.4198817014694214, 0.4527851939201355, 0.4856886863708496, 0.5185922384262085, 0.5514956712722778, 0.5843992233276367, 0.6173027157783508, 0.6502062082290649, 0.683109700679779, 0.7160131931304932, 0.748916745185852, 0.7818202376365662, 0.8147237300872803, 0.8476272225379944, 0.8805307149887085, 0.9134342074394226, 0.9463376998901367, 0.9792412519454956, 1.012144684791565, 1.0450482368469238, 1.0779516696929932, 1.110855221748352, 1.143758773803711]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 16.0, 16.0, 17.0, 28.0, 42.0, 56.0, 107.0, 162.0, 234.0, 376.0, 664.0, 1021.0, 1724.0, 3162.0, 6151.0, 12557.0, 28354.0, 82759.0, 571115.0, 3267357.0, 143995.0, 40657.0, 16332.0, 7868.0, 4061.0, 2180.0, 1252.0, 746.0, 436.0, 292.0, 199.0, 104.0, 81.0, 54.0, 35.0, 16.0, 17.0, 15.0, 8.0, 11.0, 4.0, 3.0, 2.0, 4.0], "bins": [-0.255126953125, -0.24861717224121094, -0.24210739135742188, -0.2355976104736328, -0.22908782958984375, -0.2225780487060547, -0.21606826782226562, -0.20955848693847656, -0.2030487060546875, -0.19653892517089844, -0.19002914428710938, -0.1835193634033203, -0.17700958251953125, -0.1704998016357422, -0.16399002075195312, -0.15748023986816406, -0.150970458984375, -0.14446067810058594, -0.13795089721679688, -0.1314411163330078, -0.12493133544921875, -0.11842155456542969, -0.11191177368164062, -0.10540199279785156, -0.0988922119140625, -0.09238243103027344, -0.08587265014648438, -0.07936286926269531, -0.07285308837890625, -0.06634330749511719, -0.059833526611328125, -0.05332374572753906, -0.04681396484375, -0.04030418395996094, -0.033794403076171875, -0.027284622192382812, -0.02077484130859375, -0.014265060424804688, -0.007755279541015625, -0.0012454986572265625, 0.0052642822265625, 0.011774063110351562, 0.018283843994140625, 0.024793624877929688, 0.03130340576171875, 0.03781318664550781, 0.044322967529296875, 0.05083274841308594, 0.057342529296875, 0.06385231018066406, 0.07036209106445312, 0.07687187194824219, 0.08338165283203125, 0.08989143371582031, 0.09640121459960938, 0.10291099548339844, 0.1094207763671875, 0.11593055725097656, 0.12244033813476562, 0.1289501190185547, 0.13545989990234375, 0.1419696807861328, 0.14847946166992188, 0.15498924255371094, 0.1614990234375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 19.0, 16.0, 25.0, 12.0, 25.0, 40.0, 46.0, 43.0, 63.0, 56.0, 55.0, 49.0, 58.0, 79.0, 64.0, 56.0, 39.0, 42.0, 40.0, 30.0, 36.0, 24.0, 18.0, 11.0, 14.0, 9.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.061676025390625, -0.05984067916870117, -0.058005332946777344, -0.056169986724853516, -0.05433464050292969, -0.05249929428100586, -0.05066394805908203, -0.0488286018371582, -0.046993255615234375, -0.04515790939331055, -0.04332256317138672, -0.04148721694946289, -0.03965187072753906, -0.037816524505615234, -0.035981178283691406, -0.03414583206176758, -0.03231048583984375, -0.030475139617919922, -0.028639793395996094, -0.026804447174072266, -0.024969100952148438, -0.02313375473022461, -0.02129840850830078, -0.019463062286376953, -0.017627716064453125, -0.015792369842529297, -0.013957023620605469, -0.01212167739868164, -0.010286331176757812, -0.008450984954833984, -0.006615638732910156, -0.004780292510986328, -0.0029449462890625, -0.0011096000671386719, 0.0007257461547851562, 0.0025610923767089844, 0.0043964385986328125, 0.006231784820556641, 0.008067131042480469, 0.009902477264404297, 0.011737823486328125, 0.013573169708251953, 0.015408515930175781, 0.01724386215209961, 0.019079208374023438, 0.020914554595947266, 0.022749900817871094, 0.024585247039794922, 0.02642059326171875, 0.028255939483642578, 0.030091285705566406, 0.031926631927490234, 0.03376197814941406, 0.03559732437133789, 0.03743267059326172, 0.03926801681518555, 0.041103363037109375, 0.0429387092590332, 0.04477405548095703, 0.04660940170288086, 0.04844474792480469, 0.050280094146728516, 0.052115440368652344, 0.05395078659057617, 0.0557861328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 12.0, 10.0, 12.0, 8.0, 16.0, 21.0, 25.0, 42.0, 40.0, 69.0, 131.0, 192.0, 305.0, 625.0, 1363.0, 3455.0, 9920.0, 35411.0, 200222.0, 3631619.0, 252758.0, 40050.0, 11123.0, 3675.0, 1568.0, 657.0, 370.0, 192.0, 128.0, 70.0, 46.0, 29.0, 32.0, 20.0, 9.0, 16.0, 9.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.455078125, -0.4422760009765625, -0.429473876953125, -0.4166717529296875, -0.40386962890625, -0.3910675048828125, -0.378265380859375, -0.3654632568359375, -0.3526611328125, -0.3398590087890625, -0.327056884765625, -0.3142547607421875, -0.30145263671875, -0.2886505126953125, -0.275848388671875, -0.2630462646484375, -0.250244140625, -0.2374420166015625, -0.224639892578125, -0.2118377685546875, -0.19903564453125, -0.1862335205078125, -0.173431396484375, -0.1606292724609375, -0.1478271484375, -0.1350250244140625, -0.122222900390625, -0.1094207763671875, -0.09661865234375, -0.0838165283203125, -0.071014404296875, -0.0582122802734375, -0.04541015625, -0.0326080322265625, -0.019805908203125, -0.0070037841796875, 0.00579833984375, 0.0186004638671875, 0.031402587890625, 0.0442047119140625, 0.0570068359375, 0.0698089599609375, 0.082611083984375, 0.0954132080078125, 0.10821533203125, 0.1210174560546875, 0.133819580078125, 0.1466217041015625, 0.159423828125, 0.1722259521484375, 0.185028076171875, 0.1978302001953125, 0.21063232421875, 0.2234344482421875, 0.236236572265625, 0.2490386962890625, 0.2618408203125, 0.2746429443359375, 0.287445068359375, 0.3002471923828125, 0.31304931640625, 0.3258514404296875, 0.338653564453125, 0.3514556884765625, 0.3642578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 10.0, 17.0, 24.0, 28.0, 37.0, 53.0, 93.0, 226.0, 715.0, 2069.0, 362.0, 173.0, 99.0, 53.0, 37.0, 28.0, 15.0, 11.0, 8.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1207275390625, -0.11446571350097656, -0.10820388793945312, -0.10194206237792969, -0.09568023681640625, -0.08941841125488281, -0.08315658569335938, -0.07689476013183594, -0.0706329345703125, -0.06437110900878906, -0.058109283447265625, -0.05184745788574219, -0.04558563232421875, -0.03932380676269531, -0.033061981201171875, -0.026800155639648438, -0.020538330078125, -0.014276504516601562, -0.008014678955078125, -0.0017528533935546875, 0.00450897216796875, 0.010770797729492188, 0.017032623291015625, 0.023294448852539062, 0.0295562744140625, 0.03581809997558594, 0.042079925537109375, 0.04834175109863281, 0.05460357666015625, 0.06086540222167969, 0.06712722778320312, 0.07338905334472656, 0.07965087890625, 0.08591270446777344, 0.09217453002929688, 0.09843635559082031, 0.10469818115234375, 0.11096000671386719, 0.11722183227539062, 0.12348365783691406, 0.1297454833984375, 0.13600730895996094, 0.14226913452148438, 0.1485309600830078, 0.15479278564453125, 0.1610546112060547, 0.16731643676757812, 0.17357826232910156, 0.179840087890625, 0.18610191345214844, 0.19236373901367188, 0.1986255645751953, 0.20488739013671875, 0.2111492156982422, 0.21741104125976562, 0.22367286682128906, 0.2299346923828125, 0.23619651794433594, 0.24245834350585938, 0.2487201690673828, 0.25498199462890625, 0.2612438201904297, 0.2675056457519531, 0.27376747131347656, 0.280029296875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 11.0, 16.0, 24.0, 50.0, 65.0, 96.0, 108.0, 140.0, 148.0, 101.0, 77.0, 41.0, 44.0, 25.0, 20.0, 10.0, 11.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3025517463684082, -1.2696025371551514, -1.2366533279418945, -1.2037042379379272, -1.1707550287246704, -1.1378058195114136, -1.1048566102981567, -1.0719074010849, -1.0389583110809326, -1.0060091018676758, -0.9730599522590637, -0.9401107430458069, -0.9071615934371948, -0.874212384223938, -0.8412631750106812, -0.8083139657974243, -0.7753647565841675, -0.7424155473709106, -0.7094663977622986, -0.6765171885490417, -0.6435680389404297, -0.6106188297271729, -0.577669620513916, -0.5447204113006592, -0.5117712616920471, -0.47882208228111267, -0.4458729028701782, -0.4129236936569214, -0.37997451424598694, -0.3470253348350525, -0.31407612562179565, -0.2811269462108612, -0.2481778860092163, -0.21522870659828186, -0.18227951228618622, -0.14933031797409058, -0.11638113856315613, -0.08343195915222168, -0.05048276484012604, -0.017533570528030396, 0.015415608882904053, 0.0483647957444191, 0.08131398260593414, 0.11426316946744919, 0.14721235632896423, 0.18016153573989868, 0.21311073005199432, 0.24605992436408997, 0.2790091037750244, 0.31195828318595886, 0.3449074625968933, 0.37785667181015015, 0.4108058512210846, 0.44375503063201904, 0.4767042398452759, 0.5096534490585327, 0.5426025986671448, 0.5755518078804016, 0.6085009574890137, 0.6414501667022705, 0.6743993759155273, 0.7073485255241394, 0.7402977347373962, 0.7732468843460083, 0.8061960935592651]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 7.0, 5.0, 14.0, 11.0, 16.0, 27.0, 20.0, 30.0, 19.0, 23.0, 29.0, 30.0, 35.0, 49.0, 46.0, 32.0, 40.0, 44.0, 45.0, 53.0, 36.0, 39.0, 52.0, 40.0, 46.0, 28.0, 18.0, 19.0, 14.0, 17.0, 25.0, 18.0, 12.0, 7.0, 12.0, 7.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5119866728782654, -0.49630919098854065, -0.4806317090988159, -0.4649542570114136, -0.44927677512168884, -0.4335992932319641, -0.41792184114456177, -0.40224435925483704, -0.3865668773651123, -0.3708893954753876, -0.35521191358566284, -0.3395344614982605, -0.32385697960853577, -0.30817949771881104, -0.2925020456314087, -0.27682456374168396, -0.26114708185195923, -0.2454695999622345, -0.22979213297367096, -0.21411466598510742, -0.1984371840953827, -0.18275970220565796, -0.16708223521709442, -0.15140476822853088, -0.13572728633880615, -0.12004981189966202, -0.10437233746051788, -0.08869486302137375, -0.07301738858222961, -0.05733991414308548, -0.041662439703941345, -0.02598496526479721, -0.010307550430297852, 0.005369924008846283, 0.021047398447990417, 0.03672487288713455, 0.052402347326278687, 0.06807982176542282, 0.08375729620456696, 0.09943477064371109, 0.11511224508285522, 0.13078972697257996, 0.1464671939611435, 0.16214466094970703, 0.17782214283943176, 0.1934996247291565, 0.20917709171772003, 0.22485455870628357, 0.2405320405960083, 0.25620952248573303, 0.27188700437545776, 0.2875644564628601, 0.30324193835258484, 0.31891942024230957, 0.3345968723297119, 0.35027435421943665, 0.3659518361091614, 0.3816293179988861, 0.39730679988861084, 0.4129842519760132, 0.4286617338657379, 0.44433921575546265, 0.460016667842865, 0.4756941497325897, 0.49137163162231445]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 8.0, 10.0, 26.0, 37.0, 65.0, 111.0, 172.0, 314.0, 422.0, 814.0, 1410.0, 2691.0, 5175.0, 10372.0, 21409.0, 46179.0, 104629.0, 225853.0, 295772.0, 181743.0, 80579.0, 36095.0, 16982.0, 8356.0, 4206.0, 2260.0, 1201.0, 674.0, 394.0, 240.0, 140.0, 93.0, 52.0, 31.0, 15.0, 10.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1429443359375, -0.1383838653564453, -0.13382339477539062, -0.12926292419433594, -0.12470245361328125, -0.12014198303222656, -0.11558151245117188, -0.11102104187011719, -0.1064605712890625, -0.10190010070800781, -0.09733963012695312, -0.09277915954589844, -0.08821868896484375, -0.08365821838378906, -0.07909774780273438, -0.07453727722167969, -0.069976806640625, -0.06541633605957031, -0.060855865478515625, -0.05629539489746094, -0.05173492431640625, -0.04717445373535156, -0.042613983154296875, -0.03805351257324219, -0.0334930419921875, -0.028932571411132812, -0.024372100830078125, -0.019811630249023438, -0.01525115966796875, -0.010690689086914062, -0.006130218505859375, -0.0015697479248046875, 0.00299072265625, 0.0075511932373046875, 0.012111663818359375, 0.016672134399414062, 0.02123260498046875, 0.025793075561523438, 0.030353546142578125, 0.03491401672363281, 0.0394744873046875, 0.04403495788574219, 0.048595428466796875, 0.05315589904785156, 0.05771636962890625, 0.06227684020996094, 0.06683731079101562, 0.07139778137207031, 0.075958251953125, 0.08051872253417969, 0.08507919311523438, 0.08963966369628906, 0.09420013427734375, 0.09876060485839844, 0.10332107543945312, 0.10788154602050781, 0.1124420166015625, 0.11700248718261719, 0.12156295776367188, 0.12612342834472656, 0.13068389892578125, 0.13524436950683594, 0.13980484008789062, 0.1443653106689453, 0.14892578125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 9.0, 10.0, 11.0, 18.0, 14.0, 16.0, 22.0, 22.0, 35.0, 44.0, 54.0, 47.0, 47.0, 48.0, 52.0, 64.0, 62.0, 47.0, 52.0, 61.0, 47.0, 29.0, 30.0, 28.0, 22.0, 23.0, 16.0, 22.0, 7.0, 9.0, 11.0, 7.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.053253173828125, -0.0514674186706543, -0.049681663513183594, -0.04789590835571289, -0.04611015319824219, -0.044324398040771484, -0.04253864288330078, -0.04075288772583008, -0.038967132568359375, -0.03718137741088867, -0.03539562225341797, -0.033609867095947266, -0.03182411193847656, -0.03003835678100586, -0.028252601623535156, -0.026466846466064453, -0.02468109130859375, -0.022895336151123047, -0.021109580993652344, -0.01932382583618164, -0.017538070678710938, -0.015752315521240234, -0.013966560363769531, -0.012180805206298828, -0.010395050048828125, -0.008609294891357422, -0.006823539733886719, -0.005037784576416016, -0.0032520294189453125, -0.0014662742614746094, 0.00031948089599609375, 0.002105236053466797, 0.0038909912109375, 0.005676746368408203, 0.007462501525878906, 0.00924825668334961, 0.011034011840820312, 0.012819766998291016, 0.014605522155761719, 0.016391277313232422, 0.018177032470703125, 0.019962787628173828, 0.02174854278564453, 0.023534297943115234, 0.025320053100585938, 0.02710580825805664, 0.028891563415527344, 0.030677318572998047, 0.03246307373046875, 0.03424882888793945, 0.036034584045410156, 0.03782033920288086, 0.03960609436035156, 0.041391849517822266, 0.04317760467529297, 0.04496335983276367, 0.046749114990234375, 0.04853487014770508, 0.05032062530517578, 0.052106380462646484, 0.05389213562011719, 0.05567789077758789, 0.057463645935058594, 0.0592494010925293, 0.06103515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 3.0, 5.0, 12.0, 18.0, 11.0, 20.0, 27.0, 34.0, 53.0, 71.0, 118.0, 206.0, 386.0, 593.0, 1374.0, 3443.0, 10386.0, 39918.0, 193196.0, 556755.0, 186670.0, 38916.0, 10153.0, 3300.0, 1325.0, 642.0, 327.0, 209.0, 118.0, 68.0, 53.0, 37.0, 29.0, 10.0, 15.0, 12.0, 3.0, 7.0, 6.0, 9.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2176513671875, -0.2097339630126953, -0.20181655883789062, -0.19389915466308594, -0.18598175048828125, -0.17806434631347656, -0.17014694213867188, -0.1622295379638672, -0.1543121337890625, -0.1463947296142578, -0.13847732543945312, -0.13055992126464844, -0.12264251708984375, -0.11472511291503906, -0.10680770874023438, -0.09889030456542969, -0.090972900390625, -0.08305549621582031, -0.07513809204101562, -0.06722068786621094, -0.05930328369140625, -0.05138587951660156, -0.043468475341796875, -0.03555107116699219, -0.0276336669921875, -0.019716262817382812, -0.011798858642578125, -0.0038814544677734375, 0.00403594970703125, 0.011953353881835938, 0.019870758056640625, 0.027788162231445312, 0.03570556640625, 0.04362297058105469, 0.051540374755859375, 0.05945777893066406, 0.06737518310546875, 0.07529258728027344, 0.08320999145507812, 0.09112739562988281, 0.0990447998046875, 0.10696220397949219, 0.11487960815429688, 0.12279701232910156, 0.13071441650390625, 0.13863182067871094, 0.14654922485351562, 0.1544666290283203, 0.162384033203125, 0.1703014373779297, 0.17821884155273438, 0.18613624572753906, 0.19405364990234375, 0.20197105407714844, 0.20988845825195312, 0.2178058624267578, 0.2257232666015625, 0.2336406707763672, 0.24155807495117188, 0.24947547912597656, 0.25739288330078125, 0.26531028747558594, 0.2732276916503906, 0.2811450958251953, 0.2890625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 13.0, 11.0, 15.0, 15.0, 19.0, 20.0, 21.0, 31.0, 29.0, 31.0, 40.0, 40.0, 49.0, 41.0, 49.0, 42.0, 52.0, 46.0, 39.0, 50.0, 30.0, 36.0, 27.0, 40.0, 33.0, 34.0, 27.0, 18.0, 13.0, 11.0, 12.0, 9.0, 6.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.242919921875, -0.23513412475585938, -0.22734832763671875, -0.21956253051757812, -0.2117767333984375, -0.20399093627929688, -0.19620513916015625, -0.18841934204101562, -0.180633544921875, -0.17284774780273438, -0.16506195068359375, -0.15727615356445312, -0.1494903564453125, -0.14170455932617188, -0.13391876220703125, -0.12613296508789062, -0.11834716796875, -0.11056137084960938, -0.10277557373046875, -0.09498977661132812, -0.0872039794921875, -0.07941818237304688, -0.07163238525390625, -0.06384658813476562, -0.056060791015625, -0.048274993896484375, -0.04048919677734375, -0.032703399658203125, -0.0249176025390625, -0.017131805419921875, -0.00934600830078125, -0.001560211181640625, 0.0062255859375, 0.014011383056640625, 0.02179718017578125, 0.029582977294921875, 0.0373687744140625, 0.045154571533203125, 0.05294036865234375, 0.060726165771484375, 0.068511962890625, 0.07629776000976562, 0.08408355712890625, 0.09186935424804688, 0.0996551513671875, 0.10744094848632812, 0.11522674560546875, 0.12301254272460938, 0.13079833984375, 0.13858413696289062, 0.14636993408203125, 0.15415573120117188, 0.1619415283203125, 0.16972732543945312, 0.17751312255859375, 0.18529891967773438, 0.193084716796875, 0.20087051391601562, 0.20865631103515625, 0.21644210815429688, 0.2242279052734375, 0.23201370239257812, 0.23979949951171875, 0.24758529663085938, 0.25537109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 4.0, 14.0, 30.0, 40.0, 51.0, 116.0, 145.0, 393.0, 753.0, 2008.0, 7241.0, 71258.0, 848331.0, 105513.0, 8549.0, 2347.0, 897.0, 377.0, 204.0, 91.0, 79.0, 50.0, 14.0, 15.0, 12.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294677734375, -0.2839851379394531, -0.27329254150390625, -0.2625999450683594, -0.2519073486328125, -0.24121475219726562, -0.23052215576171875, -0.21982955932617188, -0.209136962890625, -0.19844436645507812, -0.18775177001953125, -0.17705917358398438, -0.1663665771484375, -0.15567398071289062, -0.14498138427734375, -0.13428878784179688, -0.12359619140625, -0.11290359497070312, -0.10221099853515625, -0.09151840209960938, -0.0808258056640625, -0.07013320922851562, -0.05944061279296875, -0.048748016357421875, -0.038055419921875, -0.027362823486328125, -0.01667022705078125, -0.005977630615234375, 0.0047149658203125, 0.015407562255859375, 0.02610015869140625, 0.036792755126953125, 0.0474853515625, 0.058177947998046875, 0.06887054443359375, 0.07956314086914062, 0.0902557373046875, 0.10094833374023438, 0.11164093017578125, 0.12233352661132812, 0.133026123046875, 0.14371871948242188, 0.15441131591796875, 0.16510391235351562, 0.1757965087890625, 0.18648910522460938, 0.19718170166015625, 0.20787429809570312, 0.21856689453125, 0.22925949096679688, 0.23995208740234375, 0.2506446838378906, 0.2613372802734375, 0.2720298767089844, 0.28272247314453125, 0.2934150695800781, 0.304107666015625, 0.3148002624511719, 0.32549285888671875, 0.3361854553222656, 0.3468780517578125, 0.3575706481933594, 0.36826324462890625, 0.3789558410644531, 0.3896484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 5.0, 14.0, 15.0, 32.0, 35.0, 27.0, 51.0, 47.0, 63.0, 75.0, 80.0, 96.0, 87.0, 68.0, 62.0, 52.0, 38.0, 42.0, 23.0, 18.0, 13.0, 8.0, 11.0, 7.0, 3.0, 4.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.060434341430664e-05, -4.932191222906113e-05, -4.803948104381561e-05, -4.67570498585701e-05, -4.5474618673324585e-05, -4.419218748807907e-05, -4.290975630283356e-05, -4.162732511758804e-05, -4.034489393234253e-05, -3.9062462747097015e-05, -3.77800315618515e-05, -3.649760037660599e-05, -3.5215169191360474e-05, -3.393273800611496e-05, -3.2650306820869446e-05, -3.136787563562393e-05, -3.0085444450378418e-05, -2.8803013265132904e-05, -2.752058207988739e-05, -2.6238150894641876e-05, -2.4955719709396362e-05, -2.367328852415085e-05, -2.2390857338905334e-05, -2.110842615365982e-05, -1.9825994968414307e-05, -1.8543563783168793e-05, -1.726113259792328e-05, -1.5978701412677765e-05, -1.4696270227432251e-05, -1.3413839042186737e-05, -1.2131407856941223e-05, -1.084897667169571e-05, -9.566545486450195e-06, -8.284114301204681e-06, -7.0016831159591675e-06, -5.7192519307136536e-06, -4.43682074546814e-06, -3.1543895602226257e-06, -1.8719583749771118e-06, -5.895271897315979e-07, 6.92903995513916e-07, 1.97533518075943e-06, 3.257766366004944e-06, 4.540197551250458e-06, 5.822628736495972e-06, 7.105059921741486e-06, 8.387491106987e-06, 9.669922292232513e-06, 1.0952353477478027e-05, 1.2234784662723541e-05, 1.3517215847969055e-05, 1.4799647033214569e-05, 1.6082078218460083e-05, 1.7364509403705597e-05, 1.864694058895111e-05, 1.9929371774196625e-05, 2.121180295944214e-05, 2.2494234144687653e-05, 2.3776665329933167e-05, 2.505909651517868e-05, 2.6341527700424194e-05, 2.7623958885669708e-05, 2.8906390070915222e-05, 3.0188821256160736e-05, 3.147125244140625e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 12.0, 8.0, 9.0, 17.0, 24.0, 30.0, 31.0, 59.0, 77.0, 109.0, 170.0, 211.0, 322.0, 439.0, 705.0, 1216.0, 1959.0, 3881.0, 10919.0, 56263.0, 503543.0, 406065.0, 44109.0, 9611.0, 3729.0, 1842.0, 1075.0, 690.0, 445.0, 298.0, 195.0, 121.0, 98.0, 72.0, 41.0, 43.0, 28.0, 15.0, 16.0, 16.0, 11.0, 6.0, 5.0, 3.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2283935546875, -0.22124290466308594, -0.21409225463867188, -0.2069416046142578, -0.19979095458984375, -0.1926403045654297, -0.18548965454101562, -0.17833900451660156, -0.1711883544921875, -0.16403770446777344, -0.15688705444335938, -0.1497364044189453, -0.14258575439453125, -0.1354351043701172, -0.12828445434570312, -0.12113380432128906, -0.113983154296875, -0.10683250427246094, -0.09968185424804688, -0.09253120422363281, -0.08538055419921875, -0.07822990417480469, -0.07107925415039062, -0.06392860412597656, -0.0567779541015625, -0.04962730407714844, -0.042476654052734375, -0.03532600402832031, -0.02817535400390625, -0.021024703979492188, -0.013874053955078125, -0.0067234039306640625, 0.00042724609375, 0.0075778961181640625, 0.014728546142578125, 0.021879196166992188, 0.02902984619140625, 0.03618049621582031, 0.043331146240234375, 0.05048179626464844, 0.0576324462890625, 0.06478309631347656, 0.07193374633789062, 0.07908439636230469, 0.08623504638671875, 0.09338569641113281, 0.10053634643554688, 0.10768699645996094, 0.114837646484375, 0.12198829650878906, 0.12913894653320312, 0.1362895965576172, 0.14344024658203125, 0.1505908966064453, 0.15774154663085938, 0.16489219665527344, 0.1720428466796875, 0.17919349670410156, 0.18634414672851562, 0.1934947967529297, 0.20064544677734375, 0.2077960968017578, 0.21494674682617188, 0.22209739685058594, 0.229248046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 12.0, 29.0, 30.0, 36.0, 55.0, 88.0, 106.0, 151.0, 134.0, 122.0, 68.0, 59.0, 33.0, 19.0, 18.0, 12.0, 6.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.176025390625, -0.16943931579589844, -0.16285324096679688, -0.1562671661376953, -0.14968109130859375, -0.1430950164794922, -0.13650894165039062, -0.12992286682128906, -0.1233367919921875, -0.11675071716308594, -0.11016464233398438, -0.10357856750488281, -0.09699249267578125, -0.09040641784667969, -0.08382034301757812, -0.07723426818847656, -0.070648193359375, -0.06406211853027344, -0.057476043701171875, -0.05088996887207031, -0.04430389404296875, -0.03771781921386719, -0.031131744384765625, -0.024545669555664062, -0.0179595947265625, -0.011373519897460938, -0.004787445068359375, 0.0017986297607421875, 0.00838470458984375, 0.014970779418945312, 0.021556854248046875, 0.028142929077148438, 0.03472900390625, 0.04131507873535156, 0.047901153564453125, 0.05448722839355469, 0.06107330322265625, 0.06765937805175781, 0.07424545288085938, 0.08083152770996094, 0.0874176025390625, 0.09400367736816406, 0.10058975219726562, 0.10717582702636719, 0.11376190185546875, 0.12034797668457031, 0.12693405151367188, 0.13352012634277344, 0.140106201171875, 0.14669227600097656, 0.15327835083007812, 0.1598644256591797, 0.16645050048828125, 0.1730365753173828, 0.17962265014648438, 0.18620872497558594, 0.1927947998046875, 0.19938087463378906, 0.20596694946289062, 0.2125530242919922, 0.21913909912109375, 0.2257251739501953, 0.23231124877929688, 0.23889732360839844, 0.2454833984375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 11.0, 43.0, 66.0, 169.0, 262.0, 242.0, 125.0, 50.0, 27.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.215538501739502, -3.074989080429077, -2.9344396591186523, -2.7938902378082275, -2.6533408164978027, -2.512791395187378, -2.372241973876953, -2.2316925525665283, -2.0911431312561035, -1.9505937099456787, -1.810044288635254, -1.669494867324829, -1.5289454460144043, -1.3883960247039795, -1.2478466033935547, -1.1072971820831299, -0.9667477607727051, -0.8261983394622803, -0.6856489181518555, -0.5450994968414307, -0.40455007553100586, -0.26400065422058105, -0.12345123291015625, 0.017098188400268555, 0.15764760971069336, 0.29819703102111816, 0.43874645233154297, 0.5792958736419678, 0.7198452949523926, 0.8603947162628174, 1.0009441375732422, 1.141493558883667, 1.28204345703125, 1.4225928783416748, 1.5631422996520996, 1.7036917209625244, 1.8442411422729492, 1.984790563583374, 2.125339984893799, 2.2658894062042236, 2.4064388275146484, 2.5469882488250732, 2.687537670135498, 2.828087091445923, 2.9686365127563477, 3.1091859340667725, 3.2497353553771973, 3.390284776687622, 3.530834197998047, 3.6713836193084717, 3.8119330406188965, 3.9524824619293213, 4.093031883239746, 4.23358154296875, 4.374130725860596, 4.514679908752441, 4.655229568481445, 4.795779228210449, 4.936328411102295, 5.076877593994141, 5.2174272537231445, 5.357976913452148, 5.498526096343994, 5.63907527923584, 5.779624938964844]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 2.0, 10.0, 5.0, 6.0, 14.0, 13.0, 16.0, 11.0, 24.0, 28.0, 16.0, 21.0, 23.0, 19.0, 30.0, 34.0, 25.0, 26.0, 39.0, 34.0, 46.0, 40.0, 41.0, 40.0, 33.0, 37.0, 47.0, 38.0, 28.0, 31.0, 30.0, 30.0, 25.0, 14.0, 17.0, 13.0, 13.0, 8.0, 14.0, 10.0, 8.0, 8.0, 8.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0228466987609863, -0.9889925718307495, -0.9551385045051575, -0.9212844371795654, -0.8874303102493286, -0.8535761833190918, -0.8197221159934998, -0.7858680486679077, -0.7520139217376709, -0.7181597948074341, -0.684305727481842, -0.65045166015625, -0.6165975332260132, -0.5827434062957764, -0.5488893389701843, -0.5150352716445923, -0.48118114471435547, -0.44732704758644104, -0.4134729504585266, -0.3796188533306122, -0.34576475620269775, -0.3119106590747833, -0.2780565619468689, -0.24420246481895447, -0.21034836769104004, -0.1764942705631256, -0.14264017343521118, -0.10878607630729675, -0.07493197917938232, -0.041077882051467896, -0.007223784923553467, 0.026630312204360962, 0.06048452854156494, 0.09433862566947937, 0.1281927227973938, 0.16204681992530823, 0.19590091705322266, 0.22975501418113708, 0.2636091113090515, 0.29746320843696594, 0.33131730556488037, 0.3651714026927948, 0.39902549982070923, 0.43287959694862366, 0.4667336940765381, 0.5005878210067749, 0.5344418883323669, 0.568295955657959, 0.6021500825881958, 0.6360042095184326, 0.6698582768440247, 0.7037123441696167, 0.7375664710998535, 0.7714205980300903, 0.8052746653556824, 0.8391287326812744, 0.8729828596115112, 0.906836986541748, 0.9406910538673401, 0.9745451211929321, 1.008399248123169, 1.0422533750534058, 1.0761075019836426, 1.1099615097045898, 1.1438156366348267]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 8.0, 7.0, 10.0, 20.0, 20.0, 23.0, 32.0, 30.0, 59.0, 69.0, 90.0, 115.0, 173.0, 214.0, 289.0, 452.0, 635.0, 1102.0, 2431.0, 6842.0, 32377.0, 4075820.0, 57591.0, 9001.0, 3015.0, 1366.0, 734.0, 467.0, 336.0, 224.0, 172.0, 140.0, 103.0, 63.0, 54.0, 49.0, 38.0, 28.0, 12.0, 12.0, 12.0, 12.0, 7.0, 2.0, 8.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.482421875, -0.4671630859375, -0.451904296875, -0.4366455078125, -0.42138671875, -0.4061279296875, -0.390869140625, -0.3756103515625, -0.3603515625, -0.3450927734375, -0.329833984375, -0.3145751953125, -0.29931640625, -0.2840576171875, -0.268798828125, -0.2535400390625, -0.23828125, -0.2230224609375, -0.207763671875, -0.1925048828125, -0.17724609375, -0.1619873046875, -0.146728515625, -0.1314697265625, -0.1162109375, -0.1009521484375, -0.085693359375, -0.0704345703125, -0.05517578125, -0.0399169921875, -0.024658203125, -0.0093994140625, 0.005859375, 0.0211181640625, 0.036376953125, 0.0516357421875, 0.06689453125, 0.0821533203125, 0.097412109375, 0.1126708984375, 0.1279296875, 0.1431884765625, 0.158447265625, 0.1737060546875, 0.18896484375, 0.2042236328125, 0.219482421875, 0.2347412109375, 0.25, 0.2652587890625, 0.280517578125, 0.2957763671875, 0.31103515625, 0.3262939453125, 0.341552734375, 0.3568115234375, 0.3720703125, 0.3873291015625, 0.402587890625, 0.4178466796875, 0.43310546875, 0.4483642578125, 0.463623046875, 0.4788818359375, 0.494140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 7.0, 8.0, 13.0, 12.0, 23.0, 16.0, 22.0, 32.0, 41.0, 50.0, 48.0, 39.0, 55.0, 57.0, 69.0, 55.0, 47.0, 52.0, 53.0, 47.0, 40.0, 26.0, 37.0, 35.0, 16.0, 13.0, 18.0, 16.0, 13.0, 12.0, 4.0, 2.0, 6.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058349609375, -0.0563507080078125, -0.054351806640625, -0.0523529052734375, -0.05035400390625, -0.0483551025390625, -0.046356201171875, -0.0443572998046875, -0.0423583984375, -0.0403594970703125, -0.038360595703125, -0.0363616943359375, -0.03436279296875, -0.0323638916015625, -0.030364990234375, -0.0283660888671875, -0.0263671875, -0.0243682861328125, -0.022369384765625, -0.0203704833984375, -0.01837158203125, -0.0163726806640625, -0.014373779296875, -0.0123748779296875, -0.0103759765625, -0.0083770751953125, -0.006378173828125, -0.0043792724609375, -0.00238037109375, -0.0003814697265625, 0.001617431640625, 0.0036163330078125, 0.005615234375, 0.0076141357421875, 0.009613037109375, 0.0116119384765625, 0.01361083984375, 0.0156097412109375, 0.017608642578125, 0.0196075439453125, 0.0216064453125, 0.0236053466796875, 0.025604248046875, 0.0276031494140625, 0.02960205078125, 0.0316009521484375, 0.033599853515625, 0.0355987548828125, 0.03759765625, 0.0395965576171875, 0.041595458984375, 0.0435943603515625, 0.04559326171875, 0.0475921630859375, 0.049591064453125, 0.0515899658203125, 0.0535888671875, 0.0555877685546875, 0.057586669921875, 0.0595855712890625, 0.06158447265625, 0.0635833740234375, 0.065582275390625, 0.0675811767578125, 0.069580078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 7.0, 6.0, 10.0, 12.0, 12.0, 15.0, 19.0, 24.0, 34.0, 39.0, 52.0, 66.0, 76.0, 131.0, 162.0, 248.0, 382.0, 707.0, 1570.0, 4907.0, 33642.0, 4114129.0, 29877.0, 4634.0, 1429.0, 720.0, 407.0, 265.0, 172.0, 113.0, 109.0, 72.0, 53.0, 37.0, 35.0, 22.0, 24.0, 15.0, 10.0, 15.0, 12.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8603515625, -0.82904052734375, -0.7977294921875, -0.76641845703125, -0.735107421875, -0.70379638671875, -0.6724853515625, -0.64117431640625, -0.60986328125, -0.57855224609375, -0.5472412109375, -0.51593017578125, -0.484619140625, -0.45330810546875, -0.4219970703125, -0.39068603515625, -0.359375, -0.32806396484375, -0.2967529296875, -0.26544189453125, -0.234130859375, -0.20281982421875, -0.1715087890625, -0.14019775390625, -0.10888671875, -0.07757568359375, -0.0462646484375, -0.01495361328125, 0.016357421875, 0.04766845703125, 0.0789794921875, 0.11029052734375, 0.1416015625, 0.17291259765625, 0.2042236328125, 0.23553466796875, 0.266845703125, 0.29815673828125, 0.3294677734375, 0.36077880859375, 0.39208984375, 0.42340087890625, 0.4547119140625, 0.48602294921875, 0.517333984375, 0.54864501953125, 0.5799560546875, 0.61126708984375, 0.642578125, 0.67388916015625, 0.7052001953125, 0.73651123046875, 0.767822265625, 0.79913330078125, 0.8304443359375, 0.86175537109375, 0.89306640625, 0.92437744140625, 0.9556884765625, 0.98699951171875, 1.018310546875, 1.04962158203125, 1.0809326171875, 1.11224365234375, 1.1435546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 14.0, 20.0, 57.0, 383.0, 3450.0, 81.0, 29.0, 15.0, 8.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08343505859375, -0.07790851593017578, -0.07238197326660156, -0.06685543060302734, -0.061328887939453125, -0.055802345275878906, -0.05027580261230469, -0.04474925994873047, -0.03922271728515625, -0.03369617462158203, -0.028169631958007812, -0.022643089294433594, -0.017116546630859375, -0.011590003967285156, -0.0060634613037109375, -0.0005369186401367188, 0.0049896240234375, 0.010516166687011719, 0.016042709350585938, 0.021569252014160156, 0.027095794677734375, 0.032622337341308594, 0.03814888000488281, 0.04367542266845703, 0.04920196533203125, 0.05472850799560547, 0.06025505065917969, 0.0657815933227539, 0.07130813598632812, 0.07683467864990234, 0.08236122131347656, 0.08788776397705078, 0.093414306640625, 0.09894084930419922, 0.10446739196777344, 0.10999393463134766, 0.11552047729492188, 0.1210470199584961, 0.1265735626220703, 0.13210010528564453, 0.13762664794921875, 0.14315319061279297, 0.1486797332763672, 0.1542062759399414, 0.15973281860351562, 0.16525936126708984, 0.17078590393066406, 0.17631244659423828, 0.1818389892578125, 0.18736553192138672, 0.19289207458496094, 0.19841861724853516, 0.20394515991210938, 0.2094717025756836, 0.2149982452392578, 0.22052478790283203, 0.22605133056640625, 0.23157787322998047, 0.2371044158935547, 0.2426309585571289, 0.24815750122070312, 0.25368404388427734, 0.25921058654785156, 0.2647371292114258, 0.270263671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 12.0, 23.0, 35.0, 60.0, 93.0, 115.0, 142.0, 145.0, 100.0, 74.0, 47.0, 39.0, 31.0, 19.0, 12.0, 13.0, 10.0, 9.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5047615766525269, -0.4841006398200989, -0.4634397327899933, -0.4427787959575653, -0.42211785912513733, -0.40145695209503174, -0.38079601526260376, -0.3601350784301758, -0.3394741415977478, -0.3188132047653198, -0.29815229773521423, -0.27749136090278625, -0.2568304240703583, -0.2361695021390915, -0.2155085802078247, -0.19484764337539673, -0.17418673634529114, -0.15352581441402435, -0.13286487758159637, -0.11220395565032959, -0.09154302626848221, -0.07088209688663483, -0.05022117495536804, -0.029560238122940063, -0.008899316191673279, 0.011761611327528954, 0.032422538846731186, 0.05308346450328827, 0.07374439388513565, 0.09440532326698303, 0.11506624519824982, 0.1357271820306778, 0.15638810396194458, 0.17704902589321136, 0.19770996272563934, 0.21837088465690613, 0.2390318214893341, 0.2596927285194397, 0.2803536653518677, 0.30101460218429565, 0.32167553901672363, 0.3423364758491516, 0.3629973828792572, 0.3836583197116852, 0.40431925654411316, 0.42498016357421875, 0.44564110040664673, 0.4663020372390747, 0.4869629442691803, 0.5076238512992859, 0.5282847881317139, 0.5489457249641418, 0.5696066617965698, 0.5902675986289978, 0.6109285354614258, 0.631589412689209, 0.652250349521637, 0.6729112863540649, 0.6935722231864929, 0.7142331600189209, 0.7348940372467041, 0.7555549740791321, 0.7762159109115601, 0.796876847743988, 0.817537784576416]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 9.0, 11.0, 10.0, 11.0, 14.0, 15.0, 15.0, 20.0, 24.0, 23.0, 13.0, 25.0, 35.0, 23.0, 39.0, 28.0, 34.0, 35.0, 48.0, 37.0, 31.0, 37.0, 35.0, 25.0, 33.0, 28.0, 33.0, 30.0, 19.0, 26.0, 30.0, 24.0, 25.0, 26.0, 24.0, 16.0, 15.0, 19.0, 12.0, 9.0, 9.0, 8.0, 7.0, 3.0, 3.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.26647669076919556, -0.2576553225517273, -0.24883392453193665, -0.2400125414133072, -0.23119115829467773, -0.22236977517604828, -0.21354839205741882, -0.20472700893878937, -0.1959056258201599, -0.18708424270153046, -0.178262859582901, -0.16944147646427155, -0.1606200933456421, -0.15179871022701263, -0.14297732710838318, -0.13415594398975372, -0.12533456087112427, -0.11651317775249481, -0.10769179463386536, -0.0988704115152359, -0.09004902839660645, -0.08122764527797699, -0.07240626215934753, -0.06358487904071808, -0.05476349592208862, -0.04594211280345917, -0.03712072968482971, -0.028299346566200256, -0.0194779634475708, -0.010656580328941345, -0.0018351972103118896, 0.006986185908317566, 0.01580756902694702, 0.024628952145576477, 0.03345033526420593, 0.04227171838283539, 0.051093101501464844, 0.0599144846200943, 0.06873586773872375, 0.07755725085735321, 0.08637863397598267, 0.09520001709461212, 0.10402140021324158, 0.11284278333187103, 0.12166416645050049, 0.13048554956912994, 0.1393069326877594, 0.14812831580638885, 0.1569496989250183, 0.16577108204364777, 0.17459246516227722, 0.18341384828090668, 0.19223523139953613, 0.2010566145181656, 0.20987799763679504, 0.2186993807554245, 0.22752076387405396, 0.2363421469926834, 0.24516353011131287, 0.2539849281311035, 0.2628062963485718, 0.27162766456604004, 0.2804490625858307, 0.28927046060562134, 0.2980918288230896]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 8.0, 3.0, 7.0, 6.0, 10.0, 14.0, 16.0, 18.0, 34.0, 41.0, 43.0, 63.0, 101.0, 154.0, 169.0, 218.0, 302.0, 422.0, 567.0, 792.0, 1166.0, 1913.0, 3396.0, 6975.0, 17413.0, 51179.0, 174831.0, 428342.0, 245726.0, 71790.0, 23090.0, 8846.0, 4049.0, 2272.0, 1308.0, 897.0, 634.0, 432.0, 322.0, 266.0, 196.0, 144.0, 91.0, 67.0, 55.0, 44.0, 33.0, 30.0, 18.0, 15.0, 14.0, 6.0, 8.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.24755859375, -0.23947906494140625, -0.2313995361328125, -0.22332000732421875, -0.215240478515625, -0.20716094970703125, -0.1990814208984375, -0.19100189208984375, -0.18292236328125, -0.17484283447265625, -0.1667633056640625, -0.15868377685546875, -0.150604248046875, -0.14252471923828125, -0.1344451904296875, -0.12636566162109375, -0.1182861328125, -0.11020660400390625, -0.1021270751953125, -0.09404754638671875, -0.085968017578125, -0.07788848876953125, -0.0698089599609375, -0.06172943115234375, -0.05364990234375, -0.04557037353515625, -0.0374908447265625, -0.02941131591796875, -0.021331787109375, -0.01325225830078125, -0.0051727294921875, 0.00290679931640625, 0.010986328125, 0.01906585693359375, 0.0271453857421875, 0.03522491455078125, 0.043304443359375, 0.05138397216796875, 0.0594635009765625, 0.06754302978515625, 0.07562255859375, 0.08370208740234375, 0.0917816162109375, 0.09986114501953125, 0.107940673828125, 0.11602020263671875, 0.1240997314453125, 0.13217926025390625, 0.1402587890625, 0.14833831787109375, 0.1564178466796875, 0.16449737548828125, 0.172576904296875, 0.18065643310546875, 0.1887359619140625, 0.19681549072265625, 0.20489501953125, 0.21297454833984375, 0.2210540771484375, 0.22913360595703125, 0.237213134765625, 0.24529266357421875, 0.2533721923828125, 0.26145172119140625, 0.26953125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 7.0, 1.0, 4.0, 10.0, 13.0, 7.0, 8.0, 16.0, 19.0, 24.0, 21.0, 26.0, 29.0, 41.0, 29.0, 52.0, 50.0, 59.0, 49.0, 56.0, 53.0, 46.0, 35.0, 48.0, 41.0, 37.0, 40.0, 39.0, 15.0, 29.0, 21.0, 13.0, 11.0, 11.0, 13.0, 5.0, 11.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06689453125, -0.06449222564697266, -0.06208992004394531, -0.05968761444091797, -0.057285308837890625, -0.05488300323486328, -0.05248069763183594, -0.050078392028808594, -0.04767608642578125, -0.045273780822753906, -0.04287147521972656, -0.04046916961669922, -0.038066864013671875, -0.03566455841064453, -0.03326225280761719, -0.030859947204589844, -0.0284576416015625, -0.026055335998535156, -0.023653030395507812, -0.02125072479248047, -0.018848419189453125, -0.01644611358642578, -0.014043807983398438, -0.011641502380371094, -0.00923919677734375, -0.006836891174316406, -0.0044345855712890625, -0.0020322799682617188, 0.000370025634765625, 0.0027723312377929688, 0.0051746368408203125, 0.007576942443847656, 0.009979248046875, 0.012381553649902344, 0.014783859252929688, 0.01718616485595703, 0.019588470458984375, 0.02199077606201172, 0.024393081665039062, 0.026795387268066406, 0.02919769287109375, 0.031599998474121094, 0.03400230407714844, 0.03640460968017578, 0.038806915283203125, 0.04120922088623047, 0.04361152648925781, 0.046013832092285156, 0.0484161376953125, 0.050818443298339844, 0.05322074890136719, 0.05562305450439453, 0.058025360107421875, 0.06042766571044922, 0.06282997131347656, 0.0652322769165039, 0.06763458251953125, 0.0700368881225586, 0.07243919372558594, 0.07484149932861328, 0.07724380493164062, 0.07964611053466797, 0.08204841613769531, 0.08445072174072266, 0.08685302734375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 8.0, 5.0, 9.0, 10.0, 18.0, 30.0, 33.0, 61.0, 77.0, 114.0, 157.0, 241.0, 387.0, 667.0, 1085.0, 2051.0, 4188.0, 10835.0, 42503.0, 293717.0, 577867.0, 84894.0, 17471.0, 5859.0, 2651.0, 1446.0, 779.0, 467.0, 276.0, 183.0, 134.0, 92.0, 83.0, 50.0, 33.0, 24.0, 11.0, 8.0, 12.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.348388671875, -0.336456298828125, -0.32452392578125, -0.312591552734375, -0.3006591796875, -0.288726806640625, -0.27679443359375, -0.264862060546875, -0.2529296875, -0.240997314453125, -0.22906494140625, -0.217132568359375, -0.2052001953125, -0.193267822265625, -0.18133544921875, -0.169403076171875, -0.157470703125, -0.145538330078125, -0.13360595703125, -0.121673583984375, -0.1097412109375, -0.097808837890625, -0.08587646484375, -0.073944091796875, -0.06201171875, -0.050079345703125, -0.03814697265625, -0.026214599609375, -0.0142822265625, -0.002349853515625, 0.00958251953125, 0.021514892578125, 0.033447265625, 0.045379638671875, 0.05731201171875, 0.069244384765625, 0.0811767578125, 0.093109130859375, 0.10504150390625, 0.116973876953125, 0.12890625, 0.140838623046875, 0.15277099609375, 0.164703369140625, 0.1766357421875, 0.188568115234375, 0.20050048828125, 0.212432861328125, 0.224365234375, 0.236297607421875, 0.24822998046875, 0.260162353515625, 0.2720947265625, 0.284027099609375, 0.29595947265625, 0.307891845703125, 0.31982421875, 0.331756591796875, 0.34368896484375, 0.355621337890625, 0.3675537109375, 0.379486083984375, 0.39141845703125, 0.403350830078125, 0.415283203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 5.0, 1.0, 8.0, 11.0, 10.0, 11.0, 18.0, 22.0, 14.0, 33.0, 36.0, 36.0, 41.0, 49.0, 43.0, 43.0, 45.0, 46.0, 58.0, 56.0, 44.0, 49.0, 52.0, 49.0, 26.0, 39.0, 36.0, 23.0, 22.0, 12.0, 14.0, 8.0, 12.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.40478515625, -0.3912239074707031, -0.37766265869140625, -0.3641014099121094, -0.3505401611328125, -0.3369789123535156, -0.32341766357421875, -0.3098564147949219, -0.296295166015625, -0.2827339172363281, -0.26917266845703125, -0.2556114196777344, -0.2420501708984375, -0.22848892211914062, -0.21492767333984375, -0.20136642456054688, -0.18780517578125, -0.17424392700195312, -0.16068267822265625, -0.14712142944335938, -0.1335601806640625, -0.11999893188476562, -0.10643768310546875, -0.09287643432617188, -0.079315185546875, -0.06575393676757812, -0.05219268798828125, -0.038631439208984375, -0.0250701904296875, -0.011508941650390625, 0.00205230712890625, 0.015613555908203125, 0.0291748046875, 0.042736053466796875, 0.05629730224609375, 0.06985855102539062, 0.0834197998046875, 0.09698104858398438, 0.11054229736328125, 0.12410354614257812, 0.137664794921875, 0.15122604370117188, 0.16478729248046875, 0.17834854125976562, 0.1919097900390625, 0.20547103881835938, 0.21903228759765625, 0.23259353637695312, 0.24615478515625, 0.2597160339355469, 0.27327728271484375, 0.2868385314941406, 0.3003997802734375, 0.3139610290527344, 0.32752227783203125, 0.3410835266113281, 0.354644775390625, 0.3682060241699219, 0.38176727294921875, 0.3953285217285156, 0.4088897705078125, 0.4224510192871094, 0.43601226806640625, 0.4495735168457031, 0.463134765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 12.0, 12.0, 11.0, 22.0, 23.0, 35.0, 51.0, 79.0, 111.0, 188.0, 320.0, 589.0, 1358.0, 3203.0, 11584.0, 122810.0, 836472.0, 58445.0, 8056.0, 2714.0, 1123.0, 533.0, 319.0, 152.0, 92.0, 81.0, 41.0, 26.0, 18.0, 18.0, 8.0, 6.0, 8.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3408203125, -0.3302955627441406, -0.31977081298828125, -0.3092460632324219, -0.2987213134765625, -0.2881965637207031, -0.27767181396484375, -0.2671470642089844, -0.256622314453125, -0.24609756469726562, -0.23557281494140625, -0.22504806518554688, -0.2145233154296875, -0.20399856567382812, -0.19347381591796875, -0.18294906616210938, -0.17242431640625, -0.16189956665039062, -0.15137481689453125, -0.14085006713867188, -0.1303253173828125, -0.11980056762695312, -0.10927581787109375, -0.09875106811523438, -0.088226318359375, -0.07770156860351562, -0.06717681884765625, -0.056652069091796875, -0.0461273193359375, -0.035602569580078125, -0.02507781982421875, -0.014553070068359375, -0.0040283203125, 0.006496429443359375, 0.01702117919921875, 0.027545928955078125, 0.0380706787109375, 0.048595428466796875, 0.05912017822265625, 0.06964492797851562, 0.080169677734375, 0.09069442749023438, 0.10121917724609375, 0.11174392700195312, 0.1222686767578125, 0.13279342651367188, 0.14331817626953125, 0.15384292602539062, 0.16436767578125, 0.17489242553710938, 0.18541717529296875, 0.19594192504882812, 0.2064666748046875, 0.21699142456054688, 0.22751617431640625, 0.23804092407226562, 0.248565673828125, 0.2590904235839844, 0.26961517333984375, 0.2801399230957031, 0.2906646728515625, 0.3011894226074219, 0.31171417236328125, 0.3222389221191406, 0.332763671875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 5.0, 21.0, 46.0, 73.0, 135.0, 167.0, 187.0, 135.0, 102.0, 59.0, 28.0, 24.0, 15.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012093782424926758, -0.00011814013123512268, -0.00011534243822097778, -0.00011254474520683289, -0.00010974705219268799, -0.00010694935917854309, -0.0001041516661643982, -0.0001013539731502533, -9.85562801361084e-05, -9.57585871219635e-05, -9.29608941078186e-05, -9.01632010936737e-05, -8.736550807952881e-05, -8.456781506538391e-05, -8.177012205123901e-05, -7.897242903709412e-05, -7.617473602294922e-05, -7.337704300880432e-05, -7.057934999465942e-05, -6.778165698051453e-05, -6.498396396636963e-05, -6.218627095222473e-05, -5.9388577938079834e-05, -5.6590884923934937e-05, -5.379319190979004e-05, -5.099549889564514e-05, -4.8197805881500244e-05, -4.540011286735535e-05, -4.260241985321045e-05, -3.980472683906555e-05, -3.7007033824920654e-05, -3.420934081077576e-05, -3.141164779663086e-05, -2.8613954782485962e-05, -2.5816261768341064e-05, -2.3018568754196167e-05, -2.022087574005127e-05, -1.7423182725906372e-05, -1.4625489711761475e-05, -1.1827796697616577e-05, -9.03010368347168e-06, -6.232410669326782e-06, -3.4347176551818848e-06, -6.370246410369873e-07, 2.16066837310791e-06, 4.958361387252808e-06, 7.756054401397705e-06, 1.0553747415542603e-05, 1.33514404296875e-05, 1.6149133443832397e-05, 1.8946826457977295e-05, 2.1744519472122192e-05, 2.454221248626709e-05, 2.7339905500411987e-05, 3.0137598514556885e-05, 3.293529152870178e-05, 3.573298454284668e-05, 3.853067755699158e-05, 4.1328370571136475e-05, 4.412606358528137e-05, 4.692375659942627e-05, 4.972144961357117e-05, 5.2519142627716064e-05, 5.531683564186096e-05, 5.811452865600586e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 3.0, 15.0, 11.0, 27.0, 26.0, 45.0, 71.0, 108.0, 178.0, 407.0, 860.0, 2465.0, 10992.0, 242324.0, 764658.0, 20549.0, 3617.0, 1136.0, 489.0, 223.0, 140.0, 72.0, 47.0, 26.0, 24.0, 7.0, 12.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.387451171875, -0.3726387023925781, -0.35782623291015625, -0.3430137634277344, -0.3282012939453125, -0.3133888244628906, -0.29857635498046875, -0.2837638854980469, -0.268951416015625, -0.2541389465332031, -0.23932647705078125, -0.22451400756835938, -0.2097015380859375, -0.19488906860351562, -0.18007659912109375, -0.16526412963867188, -0.15045166015625, -0.13563919067382812, -0.12082672119140625, -0.10601425170898438, -0.0912017822265625, -0.07638931274414062, -0.06157684326171875, -0.046764373779296875, -0.031951904296875, -0.017139434814453125, -0.00232696533203125, 0.012485504150390625, 0.0272979736328125, 0.042110443115234375, 0.05692291259765625, 0.07173538208007812, 0.0865478515625, 0.10136032104492188, 0.11617279052734375, 0.13098526000976562, 0.1457977294921875, 0.16061019897460938, 0.17542266845703125, 0.19023513793945312, 0.205047607421875, 0.21986007690429688, 0.23467254638671875, 0.24948501586914062, 0.2642974853515625, 0.2791099548339844, 0.29392242431640625, 0.3087348937988281, 0.32354736328125, 0.3383598327636719, 0.35317230224609375, 0.3679847717285156, 0.3827972412109375, 0.3976097106933594, 0.41242218017578125, 0.4272346496582031, 0.442047119140625, 0.4568595886230469, 0.47167205810546875, 0.4864845275878906, 0.5012969970703125, 0.5161094665527344, 0.5309219360351562, 0.5457344055175781, 0.560546875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 12.0, 14.0, 23.0, 46.0, 84.0, 149.0, 171.0, 201.0, 129.0, 69.0, 30.0, 17.0, 12.0, 5.0, 5.0, 4.0, 4.0, 5.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2186279296875, -0.2075939178466797, -0.19655990600585938, -0.18552589416503906, -0.17449188232421875, -0.16345787048339844, -0.15242385864257812, -0.1413898468017578, -0.1303558349609375, -0.11932182312011719, -0.10828781127929688, -0.09725379943847656, -0.08621978759765625, -0.07518577575683594, -0.06415176391601562, -0.05311775207519531, -0.042083740234375, -0.031049728393554688, -0.020015716552734375, -0.008981704711914062, 0.00205230712890625, 0.013086318969726562, 0.024120330810546875, 0.03515434265136719, 0.0461883544921875, 0.05722236633300781, 0.06825637817382812, 0.07929039001464844, 0.09032440185546875, 0.10135841369628906, 0.11239242553710938, 0.12342643737792969, 0.13446044921875, 0.1454944610595703, 0.15652847290039062, 0.16756248474121094, 0.17859649658203125, 0.18963050842285156, 0.20066452026367188, 0.2116985321044922, 0.2227325439453125, 0.2337665557861328, 0.24480056762695312, 0.25583457946777344, 0.26686859130859375, 0.27790260314941406, 0.2889366149902344, 0.2999706268310547, 0.311004638671875, 0.3220386505126953, 0.3330726623535156, 0.34410667419433594, 0.35514068603515625, 0.36617469787597656, 0.3772087097167969, 0.3882427215576172, 0.3992767333984375, 0.4103107452392578, 0.4213447570800781, 0.43237876892089844, 0.44341278076171875, 0.45444679260253906, 0.4654808044433594, 0.4765148162841797, 0.487548828125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 7.0, 20.0, 32.0, 62.0, 104.0, 171.0, 180.0, 150.0, 116.0, 49.0, 51.0, 21.0, 17.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.660822868347168, -6.519661903381348, -6.3785014152526855, -6.237340927124023, -6.096179962158203, -5.955018997192383, -5.813858509063721, -5.672698020935059, -5.531537055969238, -5.390376091003418, -5.249215602874756, -5.108055114746094, -4.966894149780273, -4.825733184814453, -4.684572696685791, -4.543412208557129, -4.402251243591309, -4.261090278625488, -4.119929790496826, -3.978769063949585, -3.8376083374023438, -3.6964476108551025, -3.5552868843078613, -3.41412615776062, -3.272965431213379, -3.1318047046661377, -2.9906439781188965, -2.8494832515716553, -2.708322525024414, -2.567161798477173, -2.4260010719299316, -2.2848403453826904, -2.143679141998291, -2.00251841545105, -1.8613576889038086, -1.7201969623565674, -1.5790362358093262, -1.437875509262085, -1.2967147827148438, -1.1555540561676025, -1.0143933296203613, -0.8732326030731201, -0.7320718765258789, -0.5909111499786377, -0.4497504234313965, -0.3085896968841553, -0.16742897033691406, -0.02626824378967285, 0.11489248275756836, 0.25605320930480957, 0.3972139358520508, 0.538374662399292, 0.6795353889465332, 0.8206961154937744, 0.9618568420410156, 1.1030175685882568, 1.244178295135498, 1.3853390216827393, 1.5264997482299805, 1.6676604747772217, 1.808821201324463, 1.949981927871704, 2.0911426544189453, 2.2323033809661865, 2.3734641075134277]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 3.0, 2.0, 6.0, 7.0, 8.0, 8.0, 13.0, 18.0, 8.0, 17.0, 19.0, 33.0, 47.0, 35.0, 31.0, 40.0, 52.0, 58.0, 54.0, 58.0, 64.0, 55.0, 48.0, 51.0, 42.0, 32.0, 30.0, 30.0, 29.0, 18.0, 18.0, 25.0, 10.0, 9.0, 4.0, 5.0, 4.0, 9.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.7773356437683105, -2.6994147300720215, -2.6214938163757324, -2.5435729026794434, -2.4656519889831543, -2.3877310752868652, -2.309810161590576, -2.231889247894287, -2.153968334197998, -2.076047420501709, -1.99812650680542, -1.9202055931091309, -1.8422846794128418, -1.7643637657165527, -1.6864429712295532, -1.6085220575332642, -1.5306012630462646, -1.4526803493499756, -1.3747594356536865, -1.2968385219573975, -1.2189176082611084, -1.1409966945648193, -1.0630759000778198, -0.9851549863815308, -0.9072340726852417, -0.8293131589889526, -0.7513922452926636, -0.6734713912010193, -0.5955504775047302, -0.5176295638084412, -0.4397086799144745, -0.3617877960205078, -0.28386712074279785, -0.20594622194766998, -0.12802532315254211, -0.050104424357414246, 0.027816474437713623, 0.10573738813400269, 0.18365827202796936, 0.26157915592193604, 0.3395000696182251, 0.41742098331451416, 0.49534186720848083, 0.5732627511024475, 0.6511836647987366, 0.7291045784950256, 0.8070254325866699, 0.884946346282959, 0.962867259979248, 1.040788173675537, 1.1187090873718262, 1.1966300010681152, 1.2745509147644043, 1.3524718284606934, 1.4303926229476929, 1.508313536643982, 1.586234450340271, 1.66415536403656, 1.7420762777328491, 1.8199971914291382, 1.8979179859161377, 1.9758388996124268, 2.053759813308716, 2.131680727005005, 2.209601640701294]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 6.0, 4.0, 12.0, 14.0, 27.0, 30.0, 39.0, 51.0, 85.0, 146.0, 232.0, 564.0, 1616.0, 7209.0, 156395.0, 4014860.0, 9607.0, 2000.0, 636.0, 274.0, 157.0, 101.0, 47.0, 40.0, 36.0, 25.0, 13.0, 14.0, 11.0, 4.0, 4.0, 3.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7444839477539062, -0.7179718017578125, -0.6914596557617188, -0.664947509765625, -0.6384353637695312, -0.6119232177734375, -0.5854110717773438, -0.55889892578125, -0.5323867797851562, -0.5058746337890625, -0.47936248779296875, -0.452850341796875, -0.42633819580078125, -0.3998260498046875, -0.37331390380859375, -0.3468017578125, -0.32028961181640625, -0.2937774658203125, -0.26726531982421875, -0.240753173828125, -0.21424102783203125, -0.1877288818359375, -0.16121673583984375, -0.13470458984375, -0.10819244384765625, -0.0816802978515625, -0.05516815185546875, -0.028656005859375, -0.00214385986328125, 0.0243682861328125, 0.05088043212890625, 0.077392578125, 0.10390472412109375, 0.1304168701171875, 0.15692901611328125, 0.183441162109375, 0.20995330810546875, 0.2364654541015625, 0.26297760009765625, 0.28948974609375, 0.31600189208984375, 0.3425140380859375, 0.36902618408203125, 0.395538330078125, 0.42205047607421875, 0.4485626220703125, 0.47507476806640625, 0.5015869140625, 0.5280990600585938, 0.5546112060546875, 0.5811233520507812, 0.607635498046875, 0.6341476440429688, 0.6606597900390625, 0.6871719360351562, 0.71368408203125, 0.7401962280273438, 0.7667083740234375, 0.7932205200195312, 0.819732666015625, 0.8462448120117188, 0.8727569580078125, 0.8992691040039062, 0.92578125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 3.0, 5.0, 0.0, 10.0, 14.0, 10.0, 31.0, 31.0, 57.0, 61.0, 56.0, 77.0, 77.0, 88.0, 68.0, 76.0, 72.0, 56.0, 47.0, 53.0, 33.0, 25.0, 15.0, 8.0, 7.0, 9.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10809326171875, -0.10405254364013672, -0.10001182556152344, -0.09597110748291016, -0.09193038940429688, -0.0878896713256836, -0.08384895324707031, -0.07980823516845703, -0.07576751708984375, -0.07172679901123047, -0.06768608093261719, -0.0636453628540039, -0.059604644775390625, -0.055563926696777344, -0.05152320861816406, -0.04748249053955078, -0.0434417724609375, -0.03940105438232422, -0.03536033630371094, -0.031319618225097656, -0.027278900146484375, -0.023238182067871094, -0.019197463989257812, -0.015156745910644531, -0.01111602783203125, -0.007075309753417969, -0.0030345916748046875, 0.0010061264038085938, 0.005046844482421875, 0.009087562561035156, 0.013128280639648438, 0.01716899871826172, 0.021209716796875, 0.02525043487548828, 0.029291152954101562, 0.033331871032714844, 0.037372589111328125, 0.041413307189941406, 0.04545402526855469, 0.04949474334716797, 0.05353546142578125, 0.05757617950439453, 0.06161689758300781, 0.0656576156616211, 0.06969833374023438, 0.07373905181884766, 0.07777976989746094, 0.08182048797607422, 0.0858612060546875, 0.08990192413330078, 0.09394264221191406, 0.09798336029052734, 0.10202407836914062, 0.1060647964477539, 0.11010551452636719, 0.11414623260498047, 0.11818695068359375, 0.12222766876220703, 0.1262683868408203, 0.1303091049194336, 0.13434982299804688, 0.13839054107666016, 0.14243125915527344, 0.14647197723388672, 0.1505126953125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 11.0, 10.0, 5.0, 12.0, 9.0, 18.0, 17.0, 21.0, 33.0, 41.0, 49.0, 57.0, 69.0, 109.0, 222.0, 658.0, 3168.0, 57981.0, 4121619.0, 8057.0, 1211.0, 366.0, 149.0, 96.0, 57.0, 40.0, 35.0, 33.0, 22.0, 23.0, 18.0, 14.0, 13.0, 5.0, 8.0, 8.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8662109375, -1.811676025390625, -1.75714111328125, -1.702606201171875, -1.6480712890625, -1.593536376953125, -1.53900146484375, -1.484466552734375, -1.429931640625, -1.375396728515625, -1.32086181640625, -1.266326904296875, -1.2117919921875, -1.157257080078125, -1.10272216796875, -1.048187255859375, -0.99365234375, -0.939117431640625, -0.88458251953125, -0.830047607421875, -0.7755126953125, -0.720977783203125, -0.66644287109375, -0.611907958984375, -0.557373046875, -0.502838134765625, -0.44830322265625, -0.393768310546875, -0.3392333984375, -0.284698486328125, -0.23016357421875, -0.175628662109375, -0.12109375, -0.066558837890625, -0.01202392578125, 0.042510986328125, 0.0970458984375, 0.151580810546875, 0.20611572265625, 0.260650634765625, 0.315185546875, 0.369720458984375, 0.42425537109375, 0.478790283203125, 0.5333251953125, 0.587860107421875, 0.64239501953125, 0.696929931640625, 0.75146484375, 0.805999755859375, 0.86053466796875, 0.915069580078125, 0.9696044921875, 1.024139404296875, 1.07867431640625, 1.133209228515625, 1.187744140625, 1.242279052734375, 1.29681396484375, 1.351348876953125, 1.4058837890625, 1.460418701171875, 1.51495361328125, 1.569488525390625, 1.6240234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 14.0, 29.0, 119.0, 3786.0, 94.0, 20.0, 9.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1868896484375, -0.17484474182128906, -0.16279983520507812, -0.1507549285888672, -0.13871002197265625, -0.1266651153564453, -0.11462020874023438, -0.10257530212402344, -0.0905303955078125, -0.07848548889160156, -0.06644058227539062, -0.05439567565917969, -0.04235076904296875, -0.030305862426757812, -0.018260955810546875, -0.0062160491943359375, 0.005828857421875, 0.017873764038085938, 0.029918670654296875, 0.04196357727050781, 0.05400848388671875, 0.06605339050292969, 0.07809829711914062, 0.09014320373535156, 0.1021881103515625, 0.11423301696777344, 0.12627792358398438, 0.1383228302001953, 0.15036773681640625, 0.1624126434326172, 0.17445755004882812, 0.18650245666503906, 0.19854736328125, 0.21059226989746094, 0.22263717651367188, 0.2346820831298828, 0.24672698974609375, 0.2587718963623047, 0.2708168029785156, 0.28286170959472656, 0.2949066162109375, 0.30695152282714844, 0.3189964294433594, 0.3310413360595703, 0.34308624267578125, 0.3551311492919922, 0.3671760559082031, 0.37922096252441406, 0.391265869140625, 0.40331077575683594, 0.4153556823730469, 0.4274005889892578, 0.43944549560546875, 0.4514904022216797, 0.4635353088378906, 0.47558021545410156, 0.4876251220703125, 0.49967002868652344, 0.5117149353027344, 0.5237598419189453, 0.5358047485351562, 0.5478496551513672, 0.5598945617675781, 0.5719394683837891, 0.583984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 11.0, 11.0, 8.0, 11.0, 11.0, 17.0, 40.0, 43.0, 65.0, 98.0, 98.0, 124.0, 108.0, 105.0, 58.0, 51.0, 48.0, 20.0, 27.0, 13.0, 10.0, 2.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6872037649154663, -0.6650705933570862, -0.6429374814033508, -0.6208043098449707, -0.5986711978912354, -0.5765380263328552, -0.5544048547744751, -0.5322717428207397, -0.5101385712623596, -0.4880054295063019, -0.46587228775024414, -0.443739116191864, -0.4216059744358063, -0.39947283267974854, -0.3773396909236908, -0.35520654916763306, -0.3330734074115753, -0.3109402656555176, -0.28880712389945984, -0.2666739821434021, -0.24454081058502197, -0.22240766882896423, -0.2002745270729065, -0.17814137041568756, -0.15600822865962982, -0.13387508690357208, -0.11174193024635315, -0.08960878849029541, -0.06747563928365707, -0.04534249007701874, -0.023209348320961, -0.0010761916637420654, 0.021056950092315674, 0.04319009929895401, 0.06532324850559235, 0.08745639026165009, 0.10958953946828842, 0.13172268867492676, 0.1538558304309845, 0.17598898708820343, 0.19812212884426117, 0.2202552706003189, 0.24238842725753784, 0.2645215690135956, 0.2866547107696533, 0.30878788232803345, 0.3309209942817688, 0.3530541658401489, 0.37518730759620667, 0.3973204493522644, 0.41945359110832214, 0.4415867328643799, 0.46371990442276, 0.48585304617881775, 0.5079861879348755, 0.5301193594932556, 0.552252471446991, 0.5743856430053711, 0.5965187549591064, 0.6186519265174866, 0.6407850384712219, 0.662918210029602, 0.6850513219833374, 0.7071844935417175, 0.7293176651000977]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 6.0, 4.0, 4.0, 7.0, 11.0, 7.0, 14.0, 12.0, 13.0, 13.0, 18.0, 13.0, 22.0, 26.0, 31.0, 30.0, 24.0, 33.0, 40.0, 30.0, 35.0, 42.0, 41.0, 48.0, 31.0, 34.0, 42.0, 37.0, 39.0, 33.0, 22.0, 32.0, 30.0, 23.0, 26.0, 17.0, 16.0, 16.0, 12.0, 11.0, 10.0, 7.0, 2.0, 9.0, 3.0, 7.0, 5.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3262641429901123, -0.3152258098125458, -0.30418750643730164, -0.2931491732597351, -0.28211086988449097, -0.27107253670692444, -0.2600342035293579, -0.24899590015411377, -0.23795756697654724, -0.2269192487001419, -0.21588093042373657, -0.20484259724617004, -0.1938042789697647, -0.18276596069335938, -0.17172764241695404, -0.1606893241405487, -0.14965100586414337, -0.13861268758773804, -0.1275743693113327, -0.11653604358434677, -0.10549771785736084, -0.0944593995809555, -0.08342108130455017, -0.07238275557756424, -0.061344437301158905, -0.05030611529946327, -0.03926779329776764, -0.028229475021362305, -0.017191153019666672, -0.006152831017971039, 0.004885487258434296, 0.015923812985420227, 0.02696213126182556, 0.038000453263521194, 0.04903877526521683, 0.06007709354162216, 0.0711154192686081, 0.08215373754501343, 0.09319205582141876, 0.1042303815484047, 0.11526869982481003, 0.12630702555179596, 0.1373453438282013, 0.14838366210460663, 0.15942198038101196, 0.1704603135585785, 0.18149861693382263, 0.19253695011138916, 0.2035752683877945, 0.21461358666419983, 0.22565190494060516, 0.2366902232170105, 0.24772855639457703, 0.25876688957214355, 0.2698051929473877, 0.2808435261249542, 0.29188182950019836, 0.3029201626777649, 0.31395846605300903, 0.32499679923057556, 0.3360351026058197, 0.34707343578338623, 0.35811173915863037, 0.3691500723361969, 0.3801884055137634]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 1.0, 4.0, 5.0, 11.0, 10.0, 17.0, 24.0, 37.0, 49.0, 99.0, 152.0, 220.0, 387.0, 619.0, 1067.0, 1700.0, 2976.0, 5454.0, 10506.0, 22134.0, 49002.0, 117040.0, 264234.0, 306284.0, 149049.0, 62241.0, 27102.0, 12999.0, 6513.0, 3542.0, 1986.0, 1156.0, 741.0, 423.0, 297.0, 172.0, 105.0, 88.0, 29.0, 28.0, 16.0, 16.0, 6.0, 0.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.224365234375, -0.2181568145751953, -0.21194839477539062, -0.20573997497558594, -0.19953155517578125, -0.19332313537597656, -0.18711471557617188, -0.1809062957763672, -0.1746978759765625, -0.1684894561767578, -0.16228103637695312, -0.15607261657714844, -0.14986419677734375, -0.14365577697753906, -0.13744735717773438, -0.1312389373779297, -0.125030517578125, -0.11882209777832031, -0.11261367797851562, -0.10640525817871094, -0.10019683837890625, -0.09398841857910156, -0.08777999877929688, -0.08157157897949219, -0.0753631591796875, -0.06915473937988281, -0.06294631958007812, -0.05673789978027344, -0.05052947998046875, -0.04432106018066406, -0.038112640380859375, -0.03190422058105469, -0.02569580078125, -0.019487380981445312, -0.013278961181640625, -0.0070705413818359375, -0.00086212158203125, 0.0053462982177734375, 0.011554718017578125, 0.017763137817382812, 0.0239715576171875, 0.030179977416992188, 0.036388397216796875, 0.04259681701660156, 0.04880523681640625, 0.05501365661621094, 0.061222076416015625, 0.06743049621582031, 0.073638916015625, 0.07984733581542969, 0.08605575561523438, 0.09226417541503906, 0.09847259521484375, 0.10468101501464844, 0.11088943481445312, 0.11709785461425781, 0.1233062744140625, 0.1295146942138672, 0.13572311401367188, 0.14193153381347656, 0.14813995361328125, 0.15434837341308594, 0.16055679321289062, 0.1667652130126953, 0.1729736328125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 3.0, 6.0, 7.0, 11.0, 18.0, 24.0, 20.0, 28.0, 38.0, 32.0, 49.0, 43.0, 48.0, 61.0, 48.0, 57.0, 73.0, 73.0, 63.0, 48.0, 52.0, 25.0, 36.0, 26.0, 25.0, 14.0, 14.0, 12.0, 6.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1474609375, -0.14361858367919922, -0.13977622985839844, -0.13593387603759766, -0.13209152221679688, -0.1282491683959961, -0.12440681457519531, -0.12056446075439453, -0.11672210693359375, -0.11287975311279297, -0.10903739929199219, -0.1051950454711914, -0.10135269165039062, -0.09751033782958984, -0.09366798400878906, -0.08982563018798828, -0.0859832763671875, -0.08214092254638672, -0.07829856872558594, -0.07445621490478516, -0.07061386108398438, -0.0667715072631836, -0.06292915344238281, -0.05908679962158203, -0.05524444580078125, -0.05140209197998047, -0.04755973815917969, -0.043717384338378906, -0.039875030517578125, -0.036032676696777344, -0.03219032287597656, -0.02834796905517578, -0.024505615234375, -0.02066326141357422, -0.016820907592773438, -0.012978553771972656, -0.009136199951171875, -0.005293846130371094, -0.0014514923095703125, 0.0023908615112304688, 0.00623321533203125, 0.010075569152832031, 0.013917922973632812, 0.017760276794433594, 0.021602630615234375, 0.025444984436035156, 0.029287338256835938, 0.03312969207763672, 0.0369720458984375, 0.04081439971923828, 0.04465675354003906, 0.048499107360839844, 0.052341461181640625, 0.056183815002441406, 0.06002616882324219, 0.06386852264404297, 0.06771087646484375, 0.07155323028564453, 0.07539558410644531, 0.0792379379272461, 0.08308029174804688, 0.08692264556884766, 0.09076499938964844, 0.09460735321044922, 0.09844970703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 17.0, 14.0, 22.0, 36.0, 48.0, 81.0, 147.0, 185.0, 294.0, 541.0, 1037.0, 2499.0, 7853.0, 40465.0, 405540.0, 524198.0, 50763.0, 9367.0, 2862.0, 1103.0, 564.0, 320.0, 184.0, 126.0, 76.0, 61.0, 36.0, 31.0, 22.0, 15.0, 7.0, 3.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.568359375, -0.5525970458984375, -0.536834716796875, -0.5210723876953125, -0.50531005859375, -0.4895477294921875, -0.473785400390625, -0.4580230712890625, -0.4422607421875, -0.4264984130859375, -0.410736083984375, -0.3949737548828125, -0.37921142578125, -0.3634490966796875, -0.347686767578125, -0.3319244384765625, -0.316162109375, -0.3003997802734375, -0.284637451171875, -0.2688751220703125, -0.25311279296875, -0.2373504638671875, -0.221588134765625, -0.2058258056640625, -0.1900634765625, -0.1743011474609375, -0.158538818359375, -0.1427764892578125, -0.12701416015625, -0.1112518310546875, -0.095489501953125, -0.0797271728515625, -0.06396484375, -0.0482025146484375, -0.032440185546875, -0.0166778564453125, -0.00091552734375, 0.0148468017578125, 0.030609130859375, 0.0463714599609375, 0.0621337890625, 0.0778961181640625, 0.093658447265625, 0.1094207763671875, 0.12518310546875, 0.1409454345703125, 0.156707763671875, 0.1724700927734375, 0.188232421875, 0.2039947509765625, 0.219757080078125, 0.2355194091796875, 0.25128173828125, 0.2670440673828125, 0.282806396484375, 0.2985687255859375, 0.3143310546875, 0.3300933837890625, 0.345855712890625, 0.3616180419921875, 0.37738037109375, 0.3931427001953125, 0.408905029296875, 0.4246673583984375, 0.4404296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 18.0, 8.0, 15.0, 25.0, 27.0, 33.0, 27.0, 32.0, 44.0, 34.0, 38.0, 45.0, 46.0, 53.0, 45.0, 54.0, 47.0, 38.0, 44.0, 38.0, 36.0, 38.0, 32.0, 21.0, 22.0, 20.0, 14.0, 18.0, 18.0, 7.0, 15.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5185546875, -0.5017929077148438, -0.4850311279296875, -0.46826934814453125, -0.451507568359375, -0.43474578857421875, -0.4179840087890625, -0.40122222900390625, -0.38446044921875, -0.36769866943359375, -0.3509368896484375, -0.33417510986328125, -0.317413330078125, -0.30065155029296875, -0.2838897705078125, -0.26712799072265625, -0.2503662109375, -0.23360443115234375, -0.2168426513671875, -0.20008087158203125, -0.183319091796875, -0.16655731201171875, -0.1497955322265625, -0.13303375244140625, -0.11627197265625, -0.09951019287109375, -0.0827484130859375, -0.06598663330078125, -0.049224853515625, -0.03246307373046875, -0.0157012939453125, 0.00106048583984375, 0.017822265625, 0.03458404541015625, 0.0513458251953125, 0.06810760498046875, 0.084869384765625, 0.10163116455078125, 0.1183929443359375, 0.13515472412109375, 0.15191650390625, 0.16867828369140625, 0.1854400634765625, 0.20220184326171875, 0.218963623046875, 0.23572540283203125, 0.2524871826171875, 0.26924896240234375, 0.2860107421875, 0.30277252197265625, 0.3195343017578125, 0.33629608154296875, 0.353057861328125, 0.36981964111328125, 0.3865814208984375, 0.40334320068359375, 0.42010498046875, 0.43686676025390625, 0.4536285400390625, 0.47039031982421875, 0.487152099609375, 0.5039138793945312, 0.5206756591796875, 0.5374374389648438, 0.55419921875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 3.0, 10.0, 14.0, 17.0, 43.0, 55.0, 98.0, 195.0, 330.0, 808.0, 2241.0, 9113.0, 65845.0, 767635.0, 179653.0, 16793.0, 3499.0, 1171.0, 471.0, 231.0, 131.0, 85.0, 40.0, 17.0, 23.0, 10.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.345458984375, -0.3348884582519531, -0.32431793212890625, -0.3137474060058594, -0.3031768798828125, -0.2926063537597656, -0.28203582763671875, -0.2714653015136719, -0.260894775390625, -0.2503242492675781, -0.23975372314453125, -0.22918319702148438, -0.2186126708984375, -0.20804214477539062, -0.19747161865234375, -0.18690109252929688, -0.17633056640625, -0.16576004028320312, -0.15518951416015625, -0.14461898803710938, -0.1340484619140625, -0.12347793579101562, -0.11290740966796875, -0.10233688354492188, -0.091766357421875, -0.08119583129882812, -0.07062530517578125, -0.060054779052734375, -0.0494842529296875, -0.038913726806640625, -0.02834320068359375, -0.017772674560546875, -0.0072021484375, 0.003368377685546875, 0.01393890380859375, 0.024509429931640625, 0.0350799560546875, 0.045650482177734375, 0.05622100830078125, 0.06679153442382812, 0.077362060546875, 0.08793258666992188, 0.09850311279296875, 0.10907363891601562, 0.1196441650390625, 0.13021469116210938, 0.14078521728515625, 0.15135574340820312, 0.16192626953125, 0.17249679565429688, 0.18306732177734375, 0.19363784790039062, 0.2042083740234375, 0.21477890014648438, 0.22534942626953125, 0.23591995239257812, 0.246490478515625, 0.2570610046386719, 0.26763153076171875, 0.2782020568847656, 0.2887725830078125, 0.2993431091308594, 0.30991363525390625, 0.3204841613769531, 0.3310546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 12.0, 6.0, 6.0, 12.0, 9.0, 13.0, 28.0, 34.0, 40.0, 77.0, 66.0, 98.0, 92.0, 84.0, 100.0, 62.0, 66.0, 46.0, 39.0, 30.0, 11.0, 11.0, 18.0, 6.0, 5.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.463029861450195e-05, -3.327615559101105e-05, -3.192201256752014e-05, -3.0567869544029236e-05, -2.921372652053833e-05, -2.7859583497047424e-05, -2.650544047355652e-05, -2.5151297450065613e-05, -2.3797154426574707e-05, -2.24430114030838e-05, -2.1088868379592896e-05, -1.973472535610199e-05, -1.8380582332611084e-05, -1.7026439309120178e-05, -1.5672296285629272e-05, -1.4318153262138367e-05, -1.2964010238647461e-05, -1.1609867215156555e-05, -1.025572419166565e-05, -8.901581168174744e-06, -7.547438144683838e-06, -6.193295121192932e-06, -4.839152097702026e-06, -3.4850090742111206e-06, -2.130866050720215e-06, -7.767230272293091e-07, 5.774199962615967e-07, 1.9315630197525024e-06, 3.285706043243408e-06, 4.639849066734314e-06, 5.99399209022522e-06, 7.3481351137161255e-06, 8.702278137207031e-06, 1.0056421160697937e-05, 1.1410564184188843e-05, 1.2764707207679749e-05, 1.4118850231170654e-05, 1.547299325466156e-05, 1.6827136278152466e-05, 1.818127930164337e-05, 1.9535422325134277e-05, 2.0889565348625183e-05, 2.224370837211609e-05, 2.3597851395606995e-05, 2.49519944190979e-05, 2.6306137442588806e-05, 2.7660280466079712e-05, 2.9014423489570618e-05, 3.0368566513061523e-05, 3.172270953655243e-05, 3.3076852560043335e-05, 3.443099558353424e-05, 3.5785138607025146e-05, 3.713928163051605e-05, 3.849342465400696e-05, 3.9847567677497864e-05, 4.120171070098877e-05, 4.2555853724479675e-05, 4.390999674797058e-05, 4.526413977146149e-05, 4.661828279495239e-05, 4.79724258184433e-05, 4.9326568841934204e-05, 5.068071186542511e-05, 5.2034854888916016e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 9.0, 0.0, 6.0, 10.0, 7.0, 15.0, 22.0, 29.0, 60.0, 102.0, 176.0, 336.0, 736.0, 1810.0, 5548.0, 25670.0, 274539.0, 664772.0, 60126.0, 9707.0, 2792.0, 1018.0, 483.0, 230.0, 127.0, 74.0, 50.0, 36.0, 28.0, 10.0, 12.0, 9.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.23136329650878906, -0.22139358520507812, -0.2114238739013672, -0.20145416259765625, -0.1914844512939453, -0.18151473999023438, -0.17154502868652344, -0.1615753173828125, -0.15160560607910156, -0.14163589477539062, -0.1316661834716797, -0.12169647216796875, -0.11172676086425781, -0.10175704956054688, -0.09178733825683594, -0.081817626953125, -0.07184791564941406, -0.061878204345703125, -0.05190849304199219, -0.04193878173828125, -0.03196907043457031, -0.021999359130859375, -0.012029647827148438, -0.0020599365234375, 0.007909774780273438, 0.017879486083984375, 0.027849197387695312, 0.03781890869140625, 0.04778861999511719, 0.057758331298828125, 0.06772804260253906, 0.07769775390625, 0.08766746520996094, 0.09763717651367188, 0.10760688781738281, 0.11757659912109375, 0.1275463104248047, 0.13751602172851562, 0.14748573303222656, 0.1574554443359375, 0.16742515563964844, 0.17739486694335938, 0.1873645782470703, 0.19733428955078125, 0.2073040008544922, 0.21727371215820312, 0.22724342346191406, 0.237213134765625, 0.24718284606933594, 0.2571525573730469, 0.2671222686767578, 0.27709197998046875, 0.2870616912841797, 0.2970314025878906, 0.30700111389160156, 0.3169708251953125, 0.32694053649902344, 0.3369102478027344, 0.3468799591064453, 0.35684967041015625, 0.3668193817138672, 0.3767890930175781, 0.38675880432128906, 0.396728515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 5.0, 10.0, 14.0, 22.0, 33.0, 42.0, 65.0, 83.0, 113.0, 112.0, 97.0, 94.0, 91.0, 63.0, 32.0, 28.0, 26.0, 17.0, 14.0, 11.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23193359375, -0.22362518310546875, -0.2153167724609375, -0.20700836181640625, -0.198699951171875, -0.19039154052734375, -0.1820831298828125, -0.17377471923828125, -0.16546630859375, -0.15715789794921875, -0.1488494873046875, -0.14054107666015625, -0.132232666015625, -0.12392425537109375, -0.1156158447265625, -0.10730743408203125, -0.0989990234375, -0.09069061279296875, -0.0823822021484375, -0.07407379150390625, -0.065765380859375, -0.05745697021484375, -0.0491485595703125, -0.04084014892578125, -0.03253173828125, -0.02422332763671875, -0.0159149169921875, -0.00760650634765625, 0.000701904296875, 0.00901031494140625, 0.0173187255859375, 0.02562713623046875, 0.033935546875, 0.04224395751953125, 0.0505523681640625, 0.05886077880859375, 0.067169189453125, 0.07547760009765625, 0.0837860107421875, 0.09209442138671875, 0.10040283203125, 0.10871124267578125, 0.1170196533203125, 0.12532806396484375, 0.133636474609375, 0.14194488525390625, 0.1502532958984375, 0.15856170654296875, 0.1668701171875, 0.17517852783203125, 0.1834869384765625, 0.19179534912109375, 0.200103759765625, 0.20841217041015625, 0.2167205810546875, 0.22502899169921875, 0.23333740234375, 0.24164581298828125, 0.2499542236328125, 0.25826263427734375, 0.266571044921875, 0.27487945556640625, 0.2831878662109375, 0.29149627685546875, 0.2998046875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 9.0, 18.0, 25.0, 70.0, 96.0, 146.0, 183.0, 171.0, 124.0, 81.0, 38.0, 18.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.785530090332031, -4.6339921951293945, -4.482454776763916, -4.330916881561279, -4.179378986358643, -4.027841567993164, -3.8763036727905273, -3.7247657775878906, -3.573228120803833, -3.4216904640197754, -3.2701525688171387, -3.118614912033081, -2.9670772552490234, -2.8155393600463867, -2.664001703262329, -2.5124640464782715, -2.3609261512756348, -2.209388494491577, -2.0578505992889404, -1.9063129425048828, -1.7547751665115356, -1.6032373905181885, -1.4516997337341309, -1.3001619577407837, -1.1486241817474365, -0.9970864057540894, -0.845548689365387, -0.6940109729766846, -0.5424731969833374, -0.39093542098999023, -0.23939770460128784, -0.08785998821258545, 0.06367778778076172, 0.2152155339717865, 0.3667532801628113, 0.5182909965515137, 0.6698287725448608, 0.821366548538208, 0.9729042649269104, 1.1244419813156128, 1.27597975730896, 1.4275175333023071, 1.5790553092956543, 1.730592966079712, 1.882130742073059, 2.0336685180664062, 2.185206174850464, 2.3367438316345215, 2.488281726837158, 2.639819383621216, 2.7913572788238525, 2.94289493560791, 3.094432830810547, 3.2459704875946045, 3.397508144378662, 3.549046039581299, 3.7005836963653564, 3.852121353149414, 4.003659248352051, 4.1551971435546875, 4.306734561920166, 4.458272457122803, 4.6098103523254395, 4.761347770690918, 4.912885665893555]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 8.0, 9.0, 8.0, 13.0, 13.0, 13.0, 18.0, 15.0, 20.0, 23.0, 25.0, 21.0, 35.0, 53.0, 44.0, 53.0, 54.0, 51.0, 51.0, 51.0, 43.0, 42.0, 42.0, 33.0, 36.0, 37.0, 24.0, 18.0, 23.0, 15.0, 17.0, 11.0, 16.0, 9.0, 11.0, 8.0, 6.0, 4.0, 7.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.340937376022339, -2.2659387588500977, -2.1909403800964355, -2.1159417629241943, -2.0409433841705322, -1.965944766998291, -1.8909462690353394, -1.8159477710723877, -1.740949273109436, -1.6659507751464844, -1.5909522771835327, -1.515953779220581, -1.4409551620483398, -1.3659567832946777, -1.2909581661224365, -1.2159596681594849, -1.1409611701965332, -1.0659626722335815, -0.9909641742706299, -0.9159656167030334, -0.8409671187400818, -0.7659686207771301, -0.6909700632095337, -0.615971565246582, -0.5409730672836304, -0.4659745693206787, -0.39097604155540466, -0.3159775137901306, -0.24097901582717896, -0.1659805178642273, -0.09098199009895325, -0.0159834623336792, 0.05901527404785156, 0.13401378691196442, 0.20901229977607727, 0.2840108275413513, 0.359009325504303, 0.43400782346725464, 0.5090063810348511, 0.5840048789978027, 0.6590033769607544, 0.734001874923706, 0.8090003728866577, 0.8839989304542542, 0.9589974284172058, 1.0339958667755127, 1.108994483947754, 1.1839929819107056, 1.2589914798736572, 1.3339899778366089, 1.4089884757995605, 1.4839869737625122, 1.5589854717254639, 1.633984088897705, 1.7089825868606567, 1.7839810848236084, 1.85897958278656, 1.9339780807495117, 2.008976697921753, 2.083975076675415, 2.1589736938476562, 2.2339720726013184, 2.3089706897735596, 2.383969306945801, 2.458967685699463]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 20.0, 25.0, 34.0, 30.0, 57.0, 63.0, 89.0, 142.0, 222.0, 280.0, 407.0, 707.0, 1224.0, 2449.0, 6496.0, 33467.0, 4114581.0, 23304.0, 5353.0, 2220.0, 1155.0, 606.0, 419.0, 256.0, 168.0, 132.0, 85.0, 81.0, 58.0, 44.0, 23.0, 26.0, 19.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5263671875, -0.5101318359375, -0.493896484375, -0.4776611328125, -0.46142578125, -0.4451904296875, -0.428955078125, -0.4127197265625, -0.396484375, -0.3802490234375, -0.364013671875, -0.3477783203125, -0.33154296875, -0.3153076171875, -0.299072265625, -0.2828369140625, -0.2666015625, -0.2503662109375, -0.234130859375, -0.2178955078125, -0.20166015625, -0.1854248046875, -0.169189453125, -0.1529541015625, -0.13671875, -0.1204833984375, -0.104248046875, -0.0880126953125, -0.07177734375, -0.0555419921875, -0.039306640625, -0.0230712890625, -0.0068359375, 0.0093994140625, 0.025634765625, 0.0418701171875, 0.05810546875, 0.0743408203125, 0.090576171875, 0.1068115234375, 0.123046875, 0.1392822265625, 0.155517578125, 0.1717529296875, 0.18798828125, 0.2042236328125, 0.220458984375, 0.2366943359375, 0.2529296875, 0.2691650390625, 0.285400390625, 0.3016357421875, 0.31787109375, 0.3341064453125, 0.350341796875, 0.3665771484375, 0.3828125, 0.3990478515625, 0.415283203125, 0.4315185546875, 0.44775390625, 0.4639892578125, 0.480224609375, 0.4964599609375, 0.5126953125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 7.0, 12.0, 13.0, 15.0, 14.0, 29.0, 21.0, 28.0, 31.0, 29.0, 43.0, 69.0, 59.0, 68.0, 64.0, 70.0, 62.0, 61.0, 52.0, 42.0, 44.0, 43.0, 30.0, 35.0, 7.0, 16.0, 4.0, 11.0, 4.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.1522216796875, -0.1479644775390625, -0.143707275390625, -0.1394500732421875, -0.13519287109375, -0.1309356689453125, -0.126678466796875, -0.1224212646484375, -0.1181640625, -0.1139068603515625, -0.109649658203125, -0.1053924560546875, -0.10113525390625, -0.0968780517578125, -0.092620849609375, -0.0883636474609375, -0.0841064453125, -0.0798492431640625, -0.075592041015625, -0.0713348388671875, -0.06707763671875, -0.0628204345703125, -0.058563232421875, -0.0543060302734375, -0.050048828125, -0.0457916259765625, -0.041534423828125, -0.0372772216796875, -0.03302001953125, -0.0287628173828125, -0.024505615234375, -0.0202484130859375, -0.0159912109375, -0.0117340087890625, -0.007476806640625, -0.0032196044921875, 0.00103759765625, 0.0052947998046875, 0.009552001953125, 0.0138092041015625, 0.01806640625, 0.0223236083984375, 0.026580810546875, 0.0308380126953125, 0.03509521484375, 0.0393524169921875, 0.043609619140625, 0.0478668212890625, 0.0521240234375, 0.0563812255859375, 0.060638427734375, 0.0648956298828125, 0.06915283203125, 0.0734100341796875, 0.077667236328125, 0.0819244384765625, 0.086181640625, 0.0904388427734375, 0.094696044921875, 0.0989532470703125, 0.10321044921875, 0.1074676513671875, 0.111724853515625, 0.1159820556640625, 0.1202392578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 7.0, 12.0, 10.0, 29.0, 34.0, 49.0, 64.0, 67.0, 98.0, 158.0, 244.0, 376.0, 667.0, 1408.0, 3572.0, 12472.0, 289997.0, 3864122.0, 13750.0, 3830.0, 1461.0, 695.0, 389.0, 220.0, 161.0, 102.0, 78.0, 59.0, 37.0, 23.0, 28.0, 17.0, 11.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8232421875, -0.7975387573242188, -0.7718353271484375, -0.7461318969726562, -0.720428466796875, -0.6947250366210938, -0.6690216064453125, -0.6433181762695312, -0.61761474609375, -0.5919113159179688, -0.5662078857421875, -0.5405044555664062, -0.514801025390625, -0.48909759521484375, -0.4633941650390625, -0.43769073486328125, -0.4119873046875, -0.38628387451171875, -0.3605804443359375, -0.33487701416015625, -0.309173583984375, -0.28347015380859375, -0.2577667236328125, -0.23206329345703125, -0.20635986328125, -0.18065643310546875, -0.1549530029296875, -0.12924957275390625, -0.103546142578125, -0.07784271240234375, -0.0521392822265625, -0.02643585205078125, -0.000732421875, 0.02497100830078125, 0.0506744384765625, 0.07637786865234375, 0.102081298828125, 0.12778472900390625, 0.1534881591796875, 0.17919158935546875, 0.20489501953125, 0.23059844970703125, 0.2563018798828125, 0.28200531005859375, 0.307708740234375, 0.33341217041015625, 0.3591156005859375, 0.38481903076171875, 0.4105224609375, 0.43622589111328125, 0.4619293212890625, 0.48763275146484375, 0.513336181640625, 0.5390396118164062, 0.5647430419921875, 0.5904464721679688, 0.61614990234375, 0.6418533325195312, 0.6675567626953125, 0.6932601928710938, 0.718963623046875, 0.7446670532226562, 0.7703704833984375, 0.7960739135742188, 0.82177734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 4.0, 4.0, 6.0, 3.0, 8.0, 23.0, 41.0, 423.0, 3468.0, 49.0, 22.0, 13.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2459716796875, -0.23950576782226562, -0.23303985595703125, -0.22657394409179688, -0.2201080322265625, -0.21364212036132812, -0.20717620849609375, -0.20071029663085938, -0.194244384765625, -0.18777847290039062, -0.18131256103515625, -0.17484664916992188, -0.1683807373046875, -0.16191482543945312, -0.15544891357421875, -0.14898300170898438, -0.14251708984375, -0.13605117797851562, -0.12958526611328125, -0.12311935424804688, -0.1166534423828125, -0.11018753051757812, -0.10372161865234375, -0.09725570678710938, -0.090789794921875, -0.08432388305664062, -0.07785797119140625, -0.07139205932617188, -0.0649261474609375, -0.058460235595703125, -0.05199432373046875, -0.045528411865234375, -0.0390625, -0.032596588134765625, -0.02613067626953125, -0.019664764404296875, -0.0131988525390625, -0.006732940673828125, -0.00026702880859375, 0.006198883056640625, 0.012664794921875, 0.019130706787109375, 0.02559661865234375, 0.032062530517578125, 0.0385284423828125, 0.044994354248046875, 0.05146026611328125, 0.057926177978515625, 0.06439208984375, 0.07085800170898438, 0.07732391357421875, 0.08378982543945312, 0.0902557373046875, 0.09672164916992188, 0.10318756103515625, 0.10965347290039062, 0.116119384765625, 0.12258529663085938, 0.12905120849609375, 0.13551712036132812, 0.1419830322265625, 0.14844894409179688, 0.15491485595703125, 0.16138076782226562, 0.1678466796875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 2.0, 8.0, 4.0, 5.0, 9.0, 16.0, 27.0, 40.0, 55.0, 96.0, 109.0, 114.0, 131.0, 121.0, 92.0, 63.0, 28.0, 26.0, 20.0, 16.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5904878377914429, -0.574653148651123, -0.5588184595108032, -0.5429837107658386, -0.5271490216255188, -0.511314332485199, -0.49547961354255676, -0.47964489459991455, -0.4638102054595947, -0.4479755163192749, -0.4321407973766327, -0.4163060784339905, -0.40047138929367065, -0.38463670015335083, -0.3688019812107086, -0.3529672622680664, -0.3371325731277466, -0.32129788398742676, -0.30546316504478455, -0.28962844610214233, -0.2737937569618225, -0.2579590678215027, -0.24212434887886047, -0.22628964483737946, -0.21045494079589844, -0.19462023675441742, -0.1787855327129364, -0.16295082867145538, -0.14711612462997437, -0.13128142058849335, -0.11544671654701233, -0.09961201250553131, -0.08377724885940552, -0.0679425448179245, -0.05210784077644348, -0.03627313673496246, -0.020438432693481445, -0.004603728652000427, 0.01123097538948059, 0.02706567943096161, 0.04290038347244263, 0.058735087513923645, 0.07456979155540466, 0.09040449559688568, 0.1062391996383667, 0.12207390367984772, 0.13790860772132874, 0.15374331176280975, 0.16957801580429077, 0.1854127198457718, 0.2012474238872528, 0.21708212792873383, 0.23291683197021484, 0.24875153601169586, 0.2645862400531769, 0.2804209589958191, 0.2962556481361389, 0.31209033727645874, 0.32792505621910095, 0.34375977516174316, 0.359594464302063, 0.3754291534423828, 0.391263872385025, 0.40709859132766724, 0.42293328046798706]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 2.0, 6.0, 5.0, 7.0, 8.0, 12.0, 13.0, 19.0, 19.0, 16.0, 23.0, 22.0, 32.0, 20.0, 33.0, 33.0, 40.0, 33.0, 48.0, 29.0, 44.0, 41.0, 43.0, 36.0, 28.0, 37.0, 31.0, 45.0, 36.0, 33.0, 15.0, 20.0, 22.0, 17.0, 18.0, 18.0, 13.0, 18.0, 18.0, 8.0, 8.0, 12.0, 5.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22275447845458984, -0.21590979397296906, -0.20906510949134827, -0.20222041010856628, -0.1953757256269455, -0.1885310411453247, -0.18168634176254272, -0.17484165728092194, -0.16799697279930115, -0.16115228831768036, -0.15430760383605957, -0.1474629044532776, -0.1406182199716568, -0.133773535490036, -0.12692883610725403, -0.12008415162563324, -0.11323946714401245, -0.10639478266239166, -0.09955009073019028, -0.09270539879798889, -0.0858607143163681, -0.07901602983474731, -0.07217133790254593, -0.06532664597034454, -0.058481961488723755, -0.05163727328181267, -0.04479258507490158, -0.037947896867990494, -0.031103208661079407, -0.02425852045416832, -0.017413832247257233, -0.010569144040346146, -0.0037244558334350586, 0.0031202323734760284, 0.009964920580387115, 0.016809608787298203, 0.02365429699420929, 0.030498985201120377, 0.037343673408031464, 0.04418836161494255, 0.05103304982185364, 0.057877738028764725, 0.06472242623567581, 0.0715671181678772, 0.07841180264949799, 0.08525648713111877, 0.09210117906332016, 0.09894587099552155, 0.10579055547714233, 0.11263523995876312, 0.11947993189096451, 0.1263246238231659, 0.13316930830478668, 0.14001399278640747, 0.14685869216918945, 0.15370337665081024, 0.16054806113243103, 0.16739274561405182, 0.1742374300956726, 0.1810821294784546, 0.18792681396007538, 0.19477149844169617, 0.20161619782447815, 0.20846088230609894, 0.21530556678771973]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 8.0, 13.0, 14.0, 37.0, 38.0, 61.0, 129.0, 171.0, 272.0, 444.0, 669.0, 1182.0, 1931.0, 3572.0, 6511.0, 12468.0, 24290.0, 49406.0, 100855.0, 199051.0, 279832.0, 183705.0, 91317.0, 44958.0, 22230.0, 11420.0, 5958.0, 3249.0, 1872.0, 1094.0, 639.0, 401.0, 240.0, 172.0, 96.0, 73.0, 53.0, 31.0, 26.0, 20.0, 14.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1552734375, -0.15048599243164062, -0.14569854736328125, -0.14091110229492188, -0.1361236572265625, -0.13133621215820312, -0.12654876708984375, -0.12176132202148438, -0.116973876953125, -0.11218643188476562, -0.10739898681640625, -0.10261154174804688, -0.0978240966796875, -0.09303665161132812, -0.08824920654296875, -0.08346176147460938, -0.07867431640625, -0.07388687133789062, -0.06909942626953125, -0.06431198120117188, -0.0595245361328125, -0.054737091064453125, -0.04994964599609375, -0.045162200927734375, -0.040374755859375, -0.035587310791015625, -0.03079986572265625, -0.026012420654296875, -0.0212249755859375, -0.016437530517578125, -0.01165008544921875, -0.006862640380859375, -0.0020751953125, 0.002712249755859375, 0.00749969482421875, 0.012287139892578125, 0.0170745849609375, 0.021862030029296875, 0.02664947509765625, 0.031436920166015625, 0.036224365234375, 0.041011810302734375, 0.04579925537109375, 0.050586700439453125, 0.0553741455078125, 0.060161590576171875, 0.06494903564453125, 0.06973648071289062, 0.07452392578125, 0.07931137084960938, 0.08409881591796875, 0.08888626098632812, 0.0936737060546875, 0.09846115112304688, 0.10324859619140625, 0.10803604125976562, 0.112823486328125, 0.11761093139648438, 0.12239837646484375, 0.12718582153320312, 0.1319732666015625, 0.13676071166992188, 0.14154815673828125, 0.14633560180664062, 0.151123046875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 13.0, 10.0, 18.0, 16.0, 24.0, 26.0, 35.0, 42.0, 41.0, 38.0, 63.0, 73.0, 72.0, 63.0, 60.0, 67.0, 67.0, 47.0, 48.0, 39.0, 31.0, 22.0, 22.0, 17.0, 10.0, 5.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.15725326538085938, -0.15251922607421875, -0.14778518676757812, -0.1430511474609375, -0.13831710815429688, -0.13358306884765625, -0.12884902954101562, -0.124114990234375, -0.11938095092773438, -0.11464691162109375, -0.10991287231445312, -0.1051788330078125, -0.10044479370117188, -0.09571075439453125, -0.09097671508789062, -0.08624267578125, -0.08150863647460938, -0.07677459716796875, -0.07204055786132812, -0.0673065185546875, -0.06257247924804688, -0.05783843994140625, -0.053104400634765625, -0.048370361328125, -0.043636322021484375, -0.03890228271484375, -0.034168243408203125, -0.0294342041015625, -0.024700164794921875, -0.01996612548828125, -0.015232086181640625, -0.010498046875, -0.005764007568359375, -0.00102996826171875, 0.003704071044921875, 0.0084381103515625, 0.013172149658203125, 0.01790618896484375, 0.022640228271484375, 0.027374267578125, 0.032108306884765625, 0.03684234619140625, 0.041576385498046875, 0.0463104248046875, 0.051044464111328125, 0.05577850341796875, 0.060512542724609375, 0.06524658203125, 0.06998062133789062, 0.07471466064453125, 0.07944869995117188, 0.0841827392578125, 0.08891677856445312, 0.09365081787109375, 0.09838485717773438, 0.103118896484375, 0.10785293579101562, 0.11258697509765625, 0.11732101440429688, 0.1220550537109375, 0.12678909301757812, 0.13152313232421875, 0.13625717163085938, 0.1409912109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 7.0, 9.0, 14.0, 21.0, 9.0, 31.0, 30.0, 43.0, 60.0, 81.0, 75.0, 124.0, 175.0, 249.0, 333.0, 472.0, 740.0, 1428.0, 3172.0, 9614.0, 40706.0, 249322.0, 597281.0, 112280.0, 21213.0, 5680.0, 2170.0, 1099.0, 630.0, 419.0, 255.0, 179.0, 141.0, 114.0, 92.0, 66.0, 55.0, 33.0, 31.0, 20.0, 16.0, 6.0, 11.0, 13.0, 9.0, 2.0, 7.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.283203125, -0.2738533020019531, -0.26450347900390625, -0.2551536560058594, -0.2458038330078125, -0.23645401000976562, -0.22710418701171875, -0.21775436401367188, -0.208404541015625, -0.19905471801757812, -0.18970489501953125, -0.18035507202148438, -0.1710052490234375, -0.16165542602539062, -0.15230560302734375, -0.14295578002929688, -0.13360595703125, -0.12425613403320312, -0.11490631103515625, -0.10555648803710938, -0.0962066650390625, -0.08685684204101562, -0.07750701904296875, -0.06815719604492188, -0.058807373046875, -0.049457550048828125, -0.04010772705078125, -0.030757904052734375, -0.0214080810546875, -0.012058258056640625, -0.00270843505859375, 0.006641387939453125, 0.0159912109375, 0.025341033935546875, 0.03469085693359375, 0.044040679931640625, 0.0533905029296875, 0.06274032592773438, 0.07209014892578125, 0.08143997192382812, 0.090789794921875, 0.10013961791992188, 0.10948944091796875, 0.11883926391601562, 0.1281890869140625, 0.13753890991210938, 0.14688873291015625, 0.15623855590820312, 0.16558837890625, 0.17493820190429688, 0.18428802490234375, 0.19363784790039062, 0.2029876708984375, 0.21233749389648438, 0.22168731689453125, 0.23103713989257812, 0.240386962890625, 0.24973678588867188, 0.25908660888671875, 0.2684364318847656, 0.2777862548828125, 0.2871360778808594, 0.29648590087890625, 0.3058357238769531, 0.315185546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 15.0, 10.0, 5.0, 9.0, 17.0, 21.0, 24.0, 24.0, 28.0, 23.0, 30.0, 24.0, 34.0, 39.0, 41.0, 54.0, 39.0, 60.0, 39.0, 39.0, 38.0, 38.0, 28.0, 29.0, 30.0, 38.0, 36.0, 24.0, 10.0, 24.0, 32.0, 15.0, 15.0, 12.0, 11.0, 8.0, 5.0, 1.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393798828125, -0.3796272277832031, -0.36545562744140625, -0.3512840270996094, -0.3371124267578125, -0.3229408264160156, -0.30876922607421875, -0.2945976257324219, -0.280426025390625, -0.2662544250488281, -0.25208282470703125, -0.23791122436523438, -0.2237396240234375, -0.20956802368164062, -0.19539642333984375, -0.18122482299804688, -0.16705322265625, -0.15288162231445312, -0.13871002197265625, -0.12453842163085938, -0.1103668212890625, -0.09619522094726562, -0.08202362060546875, -0.06785202026367188, -0.053680419921875, -0.039508819580078125, -0.02533721923828125, -0.011165618896484375, 0.0030059814453125, 0.017177581787109375, 0.03134918212890625, 0.045520782470703125, 0.0596923828125, 0.07386398315429688, 0.08803558349609375, 0.10220718383789062, 0.1163787841796875, 0.13055038452148438, 0.14472198486328125, 0.15889358520507812, 0.173065185546875, 0.18723678588867188, 0.20140838623046875, 0.21557998657226562, 0.2297515869140625, 0.24392318725585938, 0.25809478759765625, 0.2722663879394531, 0.28643798828125, 0.3006095886230469, 0.31478118896484375, 0.3289527893066406, 0.3431243896484375, 0.3572959899902344, 0.37146759033203125, 0.3856391906738281, 0.399810791015625, 0.4139823913574219, 0.42815399169921875, 0.4423255920410156, 0.4564971923828125, 0.4706687927246094, 0.48484039306640625, 0.4990119934082031, 0.51318359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 16.0, 22.0, 13.0, 37.0, 38.0, 91.0, 144.0, 261.0, 592.0, 1465.0, 4899.0, 28057.0, 422791.0, 548192.0, 33543.0, 5479.0, 1610.0, 626.0, 281.0, 134.0, 87.0, 44.0, 38.0, 19.0, 19.0, 6.0, 9.0, 7.0, 10.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.288330078125, -0.2803306579589844, -0.27233123779296875, -0.2643318176269531, -0.2563323974609375, -0.24833297729492188, -0.24033355712890625, -0.23233413696289062, -0.224334716796875, -0.21633529663085938, -0.20833587646484375, -0.20033645629882812, -0.1923370361328125, -0.18433761596679688, -0.17633819580078125, -0.16833877563476562, -0.16033935546875, -0.15233993530273438, -0.14434051513671875, -0.13634109497070312, -0.1283416748046875, -0.12034225463867188, -0.11234283447265625, -0.10434341430664062, -0.096343994140625, -0.08834457397460938, -0.08034515380859375, -0.07234573364257812, -0.0643463134765625, -0.056346893310546875, -0.04834747314453125, -0.040348052978515625, -0.0323486328125, -0.024349212646484375, -0.01634979248046875, -0.008350372314453125, -0.0003509521484375, 0.007648468017578125, 0.01564788818359375, 0.023647308349609375, 0.031646728515625, 0.039646148681640625, 0.04764556884765625, 0.055644989013671875, 0.0636444091796875, 0.07164382934570312, 0.07964324951171875, 0.08764266967773438, 0.09564208984375, 0.10364151000976562, 0.11164093017578125, 0.11964035034179688, 0.1276397705078125, 0.13563919067382812, 0.14363861083984375, 0.15163803100585938, 0.159637451171875, 0.16763687133789062, 0.17563629150390625, 0.18363571166992188, 0.1916351318359375, 0.19963455200195312, 0.20763397216796875, 0.21563339233398438, 0.2236328125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 9.0, 13.0, 17.0, 34.0, 34.0, 49.0, 75.0, 124.0, 157.0, 133.0, 103.0, 74.0, 57.0, 29.0, 26.0, 15.0, 17.0, 10.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.667043685913086e-05, -4.479195922613144e-05, -4.291348159313202e-05, -4.10350039601326e-05, -3.915652632713318e-05, -3.727804869413376e-05, -3.539957106113434e-05, -3.352109342813492e-05, -3.16426157951355e-05, -2.9764138162136078e-05, -2.7885660529136658e-05, -2.6007182896137238e-05, -2.4128705263137817e-05, -2.2250227630138397e-05, -2.0371749997138977e-05, -1.8493272364139557e-05, -1.6614794731140137e-05, -1.4736317098140717e-05, -1.2857839465141296e-05, -1.0979361832141876e-05, -9.100884199142456e-06, -7.222406566143036e-06, -5.343928933143616e-06, -3.4654513001441956e-06, -1.5869736671447754e-06, 2.915039658546448e-07, 2.169981598854065e-06, 4.048459231853485e-06, 5.926936864852905e-06, 7.805414497852325e-06, 9.683892130851746e-06, 1.1562369763851166e-05, 1.3440847396850586e-05, 1.5319325029850006e-05, 1.7197802662849426e-05, 1.9076280295848846e-05, 2.0954757928848267e-05, 2.2833235561847687e-05, 2.4711713194847107e-05, 2.6590190827846527e-05, 2.8468668460845947e-05, 3.0347146093845367e-05, 3.222562372684479e-05, 3.410410135984421e-05, 3.598257899284363e-05, 3.786105662584305e-05, 3.973953425884247e-05, 4.161801189184189e-05, 4.349648952484131e-05, 4.537496715784073e-05, 4.725344479084015e-05, 4.913192242383957e-05, 5.101040005683899e-05, 5.288887768983841e-05, 5.476735532283783e-05, 5.664583295583725e-05, 5.852431058883667e-05, 6.040278822183609e-05, 6.228126585483551e-05, 6.415974348783493e-05, 6.603822112083435e-05, 6.791669875383377e-05, 6.979517638683319e-05, 7.167365401983261e-05, 7.355213165283203e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 26.0, 32.0, 61.0, 108.0, 172.0, 332.0, 820.0, 2184.0, 10323.0, 106401.0, 816587.0, 97932.0, 9754.0, 2267.0, 800.0, 326.0, 168.0, 86.0, 52.0, 31.0, 22.0, 13.0, 7.0, 12.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.341552734375, -0.3324413299560547, -0.3233299255371094, -0.31421852111816406, -0.30510711669921875, -0.29599571228027344, -0.2868843078613281, -0.2777729034423828, -0.2686614990234375, -0.2595500946044922, -0.2504386901855469, -0.24132728576660156, -0.23221588134765625, -0.22310447692871094, -0.21399307250976562, -0.2048816680908203, -0.195770263671875, -0.1866588592529297, -0.17754745483398438, -0.16843605041503906, -0.15932464599609375, -0.15021324157714844, -0.14110183715820312, -0.1319904327392578, -0.1228790283203125, -0.11376762390136719, -0.10465621948242188, -0.09554481506347656, -0.08643341064453125, -0.07732200622558594, -0.06821060180664062, -0.05909919738769531, -0.04998779296875, -0.04087638854980469, -0.031764984130859375, -0.022653579711914062, -0.01354217529296875, -0.0044307708740234375, 0.004680633544921875, 0.013792037963867188, 0.0229034423828125, 0.03201484680175781, 0.041126251220703125, 0.05023765563964844, 0.05934906005859375, 0.06846046447753906, 0.07757186889648438, 0.08668327331542969, 0.095794677734375, 0.10490608215332031, 0.11401748657226562, 0.12312889099121094, 0.13224029541015625, 0.14135169982910156, 0.15046310424804688, 0.1595745086669922, 0.1686859130859375, 0.1777973175048828, 0.18690872192382812, 0.19602012634277344, 0.20513153076171875, 0.21424293518066406, 0.22335433959960938, 0.2324657440185547, 0.2415771484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 7.0, 8.0, 15.0, 23.0, 33.0, 48.0, 73.0, 70.0, 119.0, 97.0, 136.0, 91.0, 94.0, 63.0, 41.0, 23.0, 18.0, 14.0, 9.0, 1.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.294189453125, -0.2871742248535156, -0.28015899658203125, -0.2731437683105469, -0.2661285400390625, -0.2591133117675781, -0.25209808349609375, -0.24508285522460938, -0.238067626953125, -0.23105239868164062, -0.22403717041015625, -0.21702194213867188, -0.2100067138671875, -0.20299148559570312, -0.19597625732421875, -0.18896102905273438, -0.18194580078125, -0.17493057250976562, -0.16791534423828125, -0.16090011596679688, -0.1538848876953125, -0.14686965942382812, -0.13985443115234375, -0.13283920288085938, -0.125823974609375, -0.11880874633789062, -0.11179351806640625, -0.10477828979492188, -0.0977630615234375, -0.09074783325195312, -0.08373260498046875, -0.07671737670898438, -0.0697021484375, -0.06268692016601562, -0.05567169189453125, -0.048656463623046875, -0.0416412353515625, -0.034626007080078125, -0.02761077880859375, -0.020595550537109375, -0.013580322265625, -0.006565093994140625, 0.00045013427734375, 0.007465362548828125, 0.0144805908203125, 0.021495819091796875, 0.02851104736328125, 0.035526275634765625, 0.04254150390625, 0.049556732177734375, 0.05657196044921875, 0.06358718872070312, 0.0706024169921875, 0.07761764526367188, 0.08463287353515625, 0.09164810180664062, 0.098663330078125, 0.10567855834960938, 0.11269378662109375, 0.11970901489257812, 0.1267242431640625, 0.13373947143554688, 0.14075469970703125, 0.14776992797851562, 0.15478515625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 8.0, 15.0, 37.0, 75.0, 106.0, 142.0, 178.0, 167.0, 114.0, 66.0, 43.0, 20.0, 8.0, 9.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.119657516479492, -4.010087490081787, -3.900517702102661, -3.790947914123535, -3.681378126144409, -3.571808338165283, -3.462238311767578, -3.352668523788452, -3.243098735809326, -3.1335289478302, -3.023958921432495, -2.914389133453369, -2.804819345474243, -2.695249557495117, -2.585679531097412, -2.476109743118286, -2.366539716720581, -2.256969928741455, -2.14739990234375, -2.037830114364624, -1.928260326385498, -1.8186904191970825, -1.709120512008667, -1.599550724029541, -1.4899808168411255, -1.38041090965271, -1.270841121673584, -1.1612712144851685, -1.051701307296753, -0.942131519317627, -0.8325616121292114, -0.7229917645454407, -0.6134216785430908, -0.5038518309593201, -0.39428195357322693, -0.2847120761871338, -0.17514222860336304, -0.06557238101959229, 0.04399752616882324, 0.153567373752594, 0.26313722133636475, 0.3727070689201355, 0.48227694630622864, 0.5918468236923218, 0.7014166712760925, 0.8109865188598633, 0.9205564260482788, 1.0301263332366943, 1.1396961212158203, 1.2492660284042358, 1.3588358163833618, 1.4684057235717773, 1.5779755115509033, 1.6875454187393188, 1.7971153259277344, 1.9066851139068604, 2.0162549018859863, 2.1258246898651123, 2.2353947162628174, 2.3449645042419434, 2.4545342922210693, 2.5641040802001953, 2.6736741065979004, 2.7832438945770264, 2.8928139209747314]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 1.0, 5.0, 9.0, 9.0, 7.0, 5.0, 16.0, 15.0, 20.0, 22.0, 26.0, 32.0, 40.0, 33.0, 54.0, 43.0, 52.0, 69.0, 74.0, 61.0, 60.0, 46.0, 52.0, 43.0, 31.0, 33.0, 26.0, 21.0, 19.0, 19.0, 13.0, 13.0, 10.0, 3.0, 8.0, 5.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0], "bins": [-3.3458478450775146, -3.259589195251465, -3.173330307006836, -3.087071657180786, -3.0008130073547363, -2.9145543575286865, -2.8282957077026367, -2.742036819458008, -2.655778169631958, -2.569519519805908, -2.4832606315612793, -2.3970019817352295, -2.3107433319091797, -2.22448468208313, -2.13822603225708, -2.051967144012451, -1.9657084941864014, -1.8794498443603516, -1.7931910753250122, -1.7069323062896729, -1.620673656463623, -1.5344150066375732, -1.4481562376022339, -1.3618974685668945, -1.2756388187408447, -1.189380168914795, -1.1031213998794556, -1.0168626308441162, -0.9306039810180664, -0.8443452715873718, -0.7580865621566772, -0.6718278527259827, -0.5855693817138672, -0.4993106722831726, -0.413051962852478, -0.32679325342178345, -0.24053454399108887, -0.1542758345603943, -0.06801712512969971, 0.018241584300994873, 0.10450029373168945, 0.19075900316238403, 0.2770177125930786, 0.3632764220237732, 0.4495351314544678, 0.5357938408851624, 0.6220525503158569, 0.7083112597465515, 0.7945699691772461, 0.8808286786079407, 0.9670873880386353, 1.0533461570739746, 1.1396048069000244, 1.2258634567260742, 1.3121222257614136, 1.398380994796753, 1.4846396446228027, 1.5708982944488525, 1.657157063484192, 1.7434158325195312, 1.829674482345581, 1.9159331321716309, 2.0021920204162598, 2.0884506702423096, 2.1747093200683594]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 2.0, 3.0, 8.0, 6.0, 15.0, 19.0, 35.0, 53.0, 59.0, 100.0, 130.0, 188.0, 325.0, 424.0, 655.0, 1057.0, 1864.0, 3379.0, 7028.0, 18008.0, 94084.0, 3977468.0, 61372.0, 14475.0, 6002.0, 2989.0, 1683.0, 1003.0, 597.0, 406.0, 258.0, 179.0, 119.0, 76.0, 51.0, 46.0, 27.0, 23.0, 15.0, 15.0, 8.0, 4.0, 7.0, 5.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.2844200134277344, -0.27440643310546875, -0.2643928527832031, -0.2543792724609375, -0.24436569213867188, -0.23435211181640625, -0.22433853149414062, -0.214324951171875, -0.20431137084960938, -0.19429779052734375, -0.18428421020507812, -0.1742706298828125, -0.16425704956054688, -0.15424346923828125, -0.14422988891601562, -0.13421630859375, -0.12420272827148438, -0.11418914794921875, -0.10417556762695312, -0.0941619873046875, -0.08414840698242188, -0.07413482666015625, -0.06412124633789062, -0.054107666015625, -0.044094085693359375, -0.03408050537109375, -0.024066925048828125, -0.0140533447265625, -0.004039764404296875, 0.00597381591796875, 0.015987396240234375, 0.0260009765625, 0.036014556884765625, 0.04602813720703125, 0.056041717529296875, 0.0660552978515625, 0.07606887817382812, 0.08608245849609375, 0.09609603881835938, 0.106109619140625, 0.11612319946289062, 0.12613677978515625, 0.13615036010742188, 0.1461639404296875, 0.15617752075195312, 0.16619110107421875, 0.17620468139648438, 0.18621826171875, 0.19623184204101562, 0.20624542236328125, 0.21625900268554688, 0.2262725830078125, 0.23628616333007812, 0.24629974365234375, 0.2563133239746094, 0.266326904296875, 0.2763404846191406, 0.28635406494140625, 0.2963676452636719, 0.3063812255859375, 0.3163948059082031, 0.32640838623046875, 0.3364219665527344, 0.346435546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 7.0, 7.0, 8.0, 14.0, 14.0, 15.0, 19.0, 28.0, 29.0, 34.0, 38.0, 46.0, 50.0, 60.0, 61.0, 65.0, 70.0, 58.0, 57.0, 62.0, 44.0, 38.0, 28.0, 35.0, 23.0, 20.0, 19.0, 15.0, 9.0, 13.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.1629638671875, -0.1585378646850586, -0.1541118621826172, -0.14968585968017578, -0.14525985717773438, -0.14083385467529297, -0.13640785217285156, -0.13198184967041016, -0.12755584716796875, -0.12312984466552734, -0.11870384216308594, -0.11427783966064453, -0.10985183715820312, -0.10542583465576172, -0.10099983215332031, -0.0965738296508789, -0.0921478271484375, -0.0877218246459961, -0.08329582214355469, -0.07886981964111328, -0.07444381713867188, -0.07001781463623047, -0.06559181213378906, -0.061165809631347656, -0.05673980712890625, -0.052313804626464844, -0.04788780212402344, -0.04346179962158203, -0.039035797119140625, -0.03460979461669922, -0.030183792114257812, -0.025757789611816406, -0.021331787109375, -0.016905784606933594, -0.012479782104492188, -0.008053779602050781, -0.003627777099609375, 0.0007982254028320312, 0.0052242279052734375, 0.009650230407714844, 0.01407623291015625, 0.018502235412597656, 0.022928237915039062, 0.02735424041748047, 0.031780242919921875, 0.03620624542236328, 0.04063224792480469, 0.045058250427246094, 0.0494842529296875, 0.053910255432128906, 0.05833625793457031, 0.06276226043701172, 0.06718826293945312, 0.07161426544189453, 0.07604026794433594, 0.08046627044677734, 0.08489227294921875, 0.08931827545166016, 0.09374427795410156, 0.09817028045654297, 0.10259628295898438, 0.10702228546142578, 0.11144828796386719, 0.1158742904663086, 0.12030029296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 7.0, 10.0, 9.0, 10.0, 10.0, 21.0, 20.0, 32.0, 51.0, 78.0, 128.0, 229.0, 444.0, 970.0, 2551.0, 9695.0, 81384.0, 4053118.0, 35802.0, 6255.0, 1817.0, 736.0, 367.0, 198.0, 109.0, 80.0, 32.0, 25.0, 25.0, 15.0, 13.0, 10.0, 10.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.8662109375, -0.840240478515625, -0.81427001953125, -0.788299560546875, -0.7623291015625, -0.736358642578125, -0.71038818359375, -0.684417724609375, -0.658447265625, -0.632476806640625, -0.60650634765625, -0.580535888671875, -0.5545654296875, -0.528594970703125, -0.50262451171875, -0.476654052734375, -0.45068359375, -0.424713134765625, -0.39874267578125, -0.372772216796875, -0.3468017578125, -0.320831298828125, -0.29486083984375, -0.268890380859375, -0.242919921875, -0.216949462890625, -0.19097900390625, -0.165008544921875, -0.1390380859375, -0.113067626953125, -0.08709716796875, -0.061126708984375, -0.03515625, -0.009185791015625, 0.01678466796875, 0.042755126953125, 0.0687255859375, 0.094696044921875, 0.12066650390625, 0.146636962890625, 0.172607421875, 0.198577880859375, 0.22454833984375, 0.250518798828125, 0.2764892578125, 0.302459716796875, 0.32843017578125, 0.354400634765625, 0.38037109375, 0.406341552734375, 0.43231201171875, 0.458282470703125, 0.4842529296875, 0.510223388671875, 0.53619384765625, 0.562164306640625, 0.588134765625, 0.614105224609375, 0.64007568359375, 0.666046142578125, 0.6920166015625, 0.717987060546875, 0.74395751953125, 0.769927978515625, 0.7958984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 8.0, 15.0, 24.0, 39.0, 73.0, 235.0, 3345.0, 188.0, 61.0, 22.0, 17.0, 10.0, 9.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19482421875, -0.18571853637695312, -0.17661285400390625, -0.16750717163085938, -0.1584014892578125, -0.14929580688476562, -0.14019012451171875, -0.13108444213867188, -0.121978759765625, -0.11287307739257812, -0.10376739501953125, -0.09466171264648438, -0.0855560302734375, -0.07645034790039062, -0.06734466552734375, -0.058238983154296875, -0.04913330078125, -0.040027618408203125, -0.03092193603515625, -0.021816253662109375, -0.0127105712890625, -0.003604888916015625, 0.00550079345703125, 0.014606475830078125, 0.023712158203125, 0.032817840576171875, 0.04192352294921875, 0.051029205322265625, 0.0601348876953125, 0.06924057006835938, 0.07834625244140625, 0.08745193481445312, 0.0965576171875, 0.10566329956054688, 0.11476898193359375, 0.12387466430664062, 0.1329803466796875, 0.14208602905273438, 0.15119171142578125, 0.16029739379882812, 0.169403076171875, 0.17850875854492188, 0.18761444091796875, 0.19672012329101562, 0.2058258056640625, 0.21493148803710938, 0.22403717041015625, 0.23314285278320312, 0.24224853515625, 0.2513542175292969, 0.26045989990234375, 0.2695655822753906, 0.2786712646484375, 0.2877769470214844, 0.29688262939453125, 0.3059883117675781, 0.315093994140625, 0.3241996765136719, 0.33330535888671875, 0.3424110412597656, 0.3515167236328125, 0.3606224060058594, 0.36972808837890625, 0.3788337707519531, 0.387939453125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 8.0, 4.0, 9.0, 15.0, 16.0, 19.0, 27.0, 39.0, 38.0, 48.0, 59.0, 65.0, 79.0, 82.0, 70.0, 68.0, 62.0, 59.0, 43.0, 27.0, 36.0, 33.0, 19.0, 9.0, 5.0, 9.0, 12.0, 3.0, 8.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.7346688508987427, -0.7159498929977417, -0.6972309947013855, -0.6785120368003845, -0.6597931385040283, -0.6410741806030273, -0.6223552823066711, -0.6036363244056702, -0.584917426109314, -0.566198468208313, -0.5474795699119568, -0.5287606120109558, -0.5100417137145996, -0.49132275581359863, -0.47260382771492004, -0.45388489961624146, -0.4351659417152405, -0.4164470136165619, -0.3977280855178833, -0.3790091574192047, -0.3602902293205261, -0.34157127141952515, -0.32285234332084656, -0.30413341522216797, -0.2854144871234894, -0.2666955590248108, -0.2479766309261322, -0.22925768792629242, -0.21053875982761383, -0.19181983172893524, -0.17310088872909546, -0.15438196063041687, -0.13566303253173828, -0.11694410443305969, -0.0982251688838005, -0.07950623333454132, -0.06078730523586273, -0.04206837713718414, -0.023349441587924957, -0.0046305060386657715, 0.014088422060012817, 0.032807353883981705, 0.05152628570795059, 0.07024522125720978, 0.08896414935588837, 0.10768307745456696, 0.12640202045440674, 0.14512094855308533, 0.16383987665176392, 0.1825588047504425, 0.2012777328491211, 0.21999667584896088, 0.23871560394763947, 0.25743454694747925, 0.27615347504615784, 0.2948724031448364, 0.313591331243515, 0.3323102593421936, 0.3510291874408722, 0.3697481155395508, 0.38846707344055176, 0.40718597173690796, 0.42590492963790894, 0.4446238577365875, 0.4633427858352661]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 10.0, 13.0, 8.0, 14.0, 14.0, 15.0, 18.0, 23.0, 19.0, 21.0, 23.0, 21.0, 25.0, 43.0, 36.0, 30.0, 42.0, 41.0, 56.0, 32.0, 39.0, 51.0, 42.0, 37.0, 37.0, 35.0, 29.0, 39.0, 14.0, 30.0, 27.0, 17.0, 13.0, 10.0, 16.0, 6.0, 10.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0], "bins": [-0.5365151166915894, -0.5212335586547852, -0.505952000617981, -0.49067047238349915, -0.47538894414901733, -0.46010738611221313, -0.44482582807540894, -0.4295442998409271, -0.4142627716064453, -0.3989812135696411, -0.3836996853351593, -0.3684181272983551, -0.3531365990638733, -0.3378550410270691, -0.3225734829902649, -0.3072919547557831, -0.2920103967189789, -0.2767288386821747, -0.26144731044769287, -0.24616575241088867, -0.23088422417640686, -0.21560266613960266, -0.20032112300395966, -0.18503957986831665, -0.16975803673267365, -0.15447649359703064, -0.13919495046138763, -0.12391339987516403, -0.10863185673952103, -0.09335031360387802, -0.07806876301765442, -0.06278721988201141, -0.04750567674636841, -0.0322241336107254, -0.0169425867497921, -0.0016610398888587952, 0.01362050324678421, 0.028902046382427216, 0.04418359696865082, 0.05946514010429382, 0.07474668323993683, 0.09002822637557983, 0.10530976951122284, 0.12059132009744644, 0.13587287068367004, 0.15115439891815186, 0.16643595695495605, 0.18171750009059906, 0.19699904322624207, 0.21228058636188507, 0.22756212949752808, 0.24284368753433228, 0.2581252157688141, 0.2734067738056183, 0.2886883020401001, 0.3039698600769043, 0.3192514181137085, 0.3345329761505127, 0.3498145043849945, 0.3650960624217987, 0.3803775906562805, 0.3956591486930847, 0.4109407067298889, 0.4262222349643707, 0.44150376319885254]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 11.0, 27.0, 25.0, 47.0, 72.0, 136.0, 201.0, 322.0, 528.0, 950.0, 1597.0, 2941.0, 5454.0, 10732.0, 21836.0, 47791.0, 114419.0, 296047.0, 321363.0, 124025.0, 51936.0, 23394.0, 11521.0, 5825.0, 3258.0, 1681.0, 985.0, 562.0, 322.0, 227.0, 115.0, 63.0, 39.0, 41.0, 22.0, 7.0, 7.0, 11.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.231964111328125, -0.22369384765625, -0.215423583984375, -0.2071533203125, -0.198883056640625, -0.19061279296875, -0.182342529296875, -0.174072265625, -0.165802001953125, -0.15753173828125, -0.149261474609375, -0.1409912109375, -0.132720947265625, -0.12445068359375, -0.116180419921875, -0.10791015625, -0.099639892578125, -0.09136962890625, -0.083099365234375, -0.0748291015625, -0.066558837890625, -0.05828857421875, -0.050018310546875, -0.041748046875, -0.033477783203125, -0.02520751953125, -0.016937255859375, -0.0086669921875, -0.000396728515625, 0.00787353515625, 0.016143798828125, 0.0244140625, 0.032684326171875, 0.04095458984375, 0.049224853515625, 0.0574951171875, 0.065765380859375, 0.07403564453125, 0.082305908203125, 0.090576171875, 0.098846435546875, 0.10711669921875, 0.115386962890625, 0.1236572265625, 0.131927490234375, 0.14019775390625, 0.148468017578125, 0.15673828125, 0.165008544921875, 0.17327880859375, 0.181549072265625, 0.1898193359375, 0.198089599609375, 0.20635986328125, 0.214630126953125, 0.222900390625, 0.231170654296875, 0.23944091796875, 0.247711181640625, 0.2559814453125, 0.264251708984375, 0.27252197265625, 0.280792236328125, 0.2890625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 4.0, 12.0, 9.0, 12.0, 24.0, 13.0, 21.0, 29.0, 37.0, 36.0, 38.0, 44.0, 59.0, 57.0, 58.0, 55.0, 54.0, 60.0, 43.0, 45.0, 41.0, 38.0, 43.0, 27.0, 27.0, 26.0, 13.0, 16.0, 12.0, 6.0, 8.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.154052734375, -0.149688720703125, -0.14532470703125, -0.140960693359375, -0.1365966796875, -0.132232666015625, -0.12786865234375, -0.123504638671875, -0.119140625, -0.114776611328125, -0.11041259765625, -0.106048583984375, -0.1016845703125, -0.097320556640625, -0.09295654296875, -0.088592529296875, -0.084228515625, -0.079864501953125, -0.07550048828125, -0.071136474609375, -0.0667724609375, -0.062408447265625, -0.05804443359375, -0.053680419921875, -0.04931640625, -0.044952392578125, -0.04058837890625, -0.036224365234375, -0.0318603515625, -0.027496337890625, -0.02313232421875, -0.018768310546875, -0.014404296875, -0.010040283203125, -0.00567626953125, -0.001312255859375, 0.0030517578125, 0.007415771484375, 0.01177978515625, 0.016143798828125, 0.0205078125, 0.024871826171875, 0.02923583984375, 0.033599853515625, 0.0379638671875, 0.042327880859375, 0.04669189453125, 0.051055908203125, 0.055419921875, 0.059783935546875, 0.06414794921875, 0.068511962890625, 0.0728759765625, 0.077239990234375, 0.08160400390625, 0.085968017578125, 0.09033203125, 0.094696044921875, 0.09906005859375, 0.103424072265625, 0.1077880859375, 0.112152099609375, 0.11651611328125, 0.120880126953125, 0.125244140625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 14.0, 10.0, 17.0, 21.0, 24.0, 30.0, 41.0, 57.0, 78.0, 134.0, 186.0, 302.0, 445.0, 756.0, 1371.0, 2877.0, 7832.0, 29229.0, 185809.0, 679882.0, 108158.0, 19914.0, 5833.0, 2406.0, 1228.0, 654.0, 430.0, 245.0, 153.0, 120.0, 70.0, 54.0, 54.0, 28.0, 27.0, 13.0, 11.0, 12.0, 2.0, 7.0, 0.0, 5.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.494964599609375, -0.47967529296875, -0.464385986328125, -0.4490966796875, -0.433807373046875, -0.41851806640625, -0.403228759765625, -0.387939453125, -0.372650146484375, -0.35736083984375, -0.342071533203125, -0.3267822265625, -0.311492919921875, -0.29620361328125, -0.280914306640625, -0.265625, -0.250335693359375, -0.23504638671875, -0.219757080078125, -0.2044677734375, -0.189178466796875, -0.17388916015625, -0.158599853515625, -0.143310546875, -0.128021240234375, -0.11273193359375, -0.097442626953125, -0.0821533203125, -0.066864013671875, -0.05157470703125, -0.036285400390625, -0.02099609375, -0.005706787109375, 0.00958251953125, 0.024871826171875, 0.0401611328125, 0.055450439453125, 0.07073974609375, 0.086029052734375, 0.101318359375, 0.116607666015625, 0.13189697265625, 0.147186279296875, 0.1624755859375, 0.177764892578125, 0.19305419921875, 0.208343505859375, 0.2236328125, 0.238922119140625, 0.25421142578125, 0.269500732421875, 0.2847900390625, 0.300079345703125, 0.31536865234375, 0.330657958984375, 0.345947265625, 0.361236572265625, 0.37652587890625, 0.391815185546875, 0.4071044921875, 0.422393798828125, 0.43768310546875, 0.452972412109375, 0.46826171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 7.0, 8.0, 9.0, 6.0, 14.0, 20.0, 18.0, 17.0, 32.0, 24.0, 36.0, 45.0, 45.0, 40.0, 65.0, 51.0, 43.0, 51.0, 51.0, 50.0, 41.0, 48.0, 38.0, 35.0, 37.0, 26.0, 22.0, 18.0, 20.0, 9.0, 13.0, 8.0, 10.0, 7.0, 10.0, 7.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.591796875, -0.5741729736328125, -0.556549072265625, -0.5389251708984375, -0.52130126953125, -0.5036773681640625, -0.486053466796875, -0.4684295654296875, -0.4508056640625, -0.4331817626953125, -0.415557861328125, -0.3979339599609375, -0.38031005859375, -0.3626861572265625, -0.345062255859375, -0.3274383544921875, -0.309814453125, -0.2921905517578125, -0.274566650390625, -0.2569427490234375, -0.23931884765625, -0.2216949462890625, -0.204071044921875, -0.1864471435546875, -0.1688232421875, -0.1511993408203125, -0.133575439453125, -0.1159515380859375, -0.09832763671875, -0.0807037353515625, -0.063079833984375, -0.0454559326171875, -0.02783203125, -0.0102081298828125, 0.007415771484375, 0.0250396728515625, 0.04266357421875, 0.0602874755859375, 0.077911376953125, 0.0955352783203125, 0.1131591796875, 0.1307830810546875, 0.148406982421875, 0.1660308837890625, 0.18365478515625, 0.2012786865234375, 0.218902587890625, 0.2365264892578125, 0.254150390625, 0.2717742919921875, 0.289398193359375, 0.3070220947265625, 0.32464599609375, 0.3422698974609375, 0.359893798828125, 0.3775177001953125, 0.3951416015625, 0.4127655029296875, 0.430389404296875, 0.4480133056640625, 0.46563720703125, 0.4832611083984375, 0.500885009765625, 0.5185089111328125, 0.5361328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 6.0, 11.0, 7.0, 20.0, 32.0, 43.0, 54.0, 79.0, 141.0, 238.0, 419.0, 834.0, 1719.0, 4111.0, 11908.0, 44429.0, 252635.0, 587011.0, 108910.0, 23366.0, 7146.0, 2745.0, 1243.0, 557.0, 326.0, 200.0, 122.0, 62.0, 44.0, 27.0, 27.0, 16.0, 8.0, 13.0, 6.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.172607421875, -0.16725921630859375, -0.1619110107421875, -0.15656280517578125, -0.151214599609375, -0.14586639404296875, -0.1405181884765625, -0.13516998291015625, -0.12982177734375, -0.12447357177734375, -0.1191253662109375, -0.11377716064453125, -0.108428955078125, -0.10308074951171875, -0.0977325439453125, -0.09238433837890625, -0.0870361328125, -0.08168792724609375, -0.0763397216796875, -0.07099151611328125, -0.065643310546875, -0.06029510498046875, -0.0549468994140625, -0.04959869384765625, -0.04425048828125, -0.03890228271484375, -0.0335540771484375, -0.02820587158203125, -0.022857666015625, -0.01750946044921875, -0.0121612548828125, -0.00681304931640625, -0.00146484375, 0.00388336181640625, 0.0092315673828125, 0.01457977294921875, 0.019927978515625, 0.02527618408203125, 0.0306243896484375, 0.03597259521484375, 0.04132080078125, 0.04666900634765625, 0.0520172119140625, 0.05736541748046875, 0.062713623046875, 0.06806182861328125, 0.0734100341796875, 0.07875823974609375, 0.0841064453125, 0.08945465087890625, 0.0948028564453125, 0.10015106201171875, 0.105499267578125, 0.11084747314453125, 0.1161956787109375, 0.12154388427734375, 0.12689208984375, 0.13224029541015625, 0.1375885009765625, 0.14293670654296875, 0.148284912109375, 0.15363311767578125, 0.1589813232421875, 0.16432952880859375, 0.169677734375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 6.0, 10.0, 6.0, 9.0, 16.0, 26.0, 25.0, 21.0, 37.0, 38.0, 47.0, 58.0, 82.0, 111.0, 104.0, 82.0, 70.0, 51.0, 34.0, 34.0, 30.0, 29.0, 14.0, 5.0, 7.0, 10.0, 11.0, 4.0, 7.0, 6.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.805492401123047e-05, -5.653873085975647e-05, -5.502253770828247e-05, -5.350634455680847e-05, -5.199015140533447e-05, -5.0473958253860474e-05, -4.8957765102386475e-05, -4.7441571950912476e-05, -4.5925378799438477e-05, -4.440918564796448e-05, -4.289299249649048e-05, -4.137679934501648e-05, -3.986060619354248e-05, -3.834441304206848e-05, -3.682821989059448e-05, -3.5312026739120483e-05, -3.3795833587646484e-05, -3.2279640436172485e-05, -3.0763447284698486e-05, -2.9247254133224487e-05, -2.7731060981750488e-05, -2.621486783027649e-05, -2.469867467880249e-05, -2.318248152732849e-05, -2.1666288375854492e-05, -2.0150095224380493e-05, -1.8633902072906494e-05, -1.7117708921432495e-05, -1.5601515769958496e-05, -1.4085322618484497e-05, -1.2569129467010498e-05, -1.1052936315536499e-05, -9.5367431640625e-06, -8.020550012588501e-06, -6.504356861114502e-06, -4.988163709640503e-06, -3.471970558166504e-06, -1.955777406692505e-06, -4.3958425521850586e-07, 1.0766088962554932e-06, 2.592802047729492e-06, 4.108995199203491e-06, 5.62518835067749e-06, 7.141381502151489e-06, 8.657574653625488e-06, 1.0173767805099487e-05, 1.1689960956573486e-05, 1.3206154108047485e-05, 1.4722347259521484e-05, 1.6238540410995483e-05, 1.7754733562469482e-05, 1.927092671394348e-05, 2.078711986541748e-05, 2.230331301689148e-05, 2.381950616836548e-05, 2.5335699319839478e-05, 2.6851892471313477e-05, 2.8368085622787476e-05, 2.9884278774261475e-05, 3.1400471925735474e-05, 3.291666507720947e-05, 3.443285822868347e-05, 3.594905138015747e-05, 3.746524453163147e-05, 3.898143768310547e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 3.0, 8.0, 8.0, 7.0, 18.0, 24.0, 26.0, 40.0, 46.0, 83.0, 104.0, 202.0, 290.0, 493.0, 786.0, 1526.0, 3183.0, 7713.0, 24348.0, 112016.0, 566195.0, 261816.0, 47189.0, 12823.0, 4747.0, 2206.0, 1027.0, 587.0, 372.0, 189.0, 137.0, 94.0, 66.0, 51.0, 37.0, 24.0, 22.0, 17.0, 12.0, 5.0, 8.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1822509765625, -0.1770038604736328, -0.17175674438476562, -0.16650962829589844, -0.16126251220703125, -0.15601539611816406, -0.15076828002929688, -0.1455211639404297, -0.1402740478515625, -0.1350269317626953, -0.12977981567382812, -0.12453269958496094, -0.11928558349609375, -0.11403846740722656, -0.10879135131835938, -0.10354423522949219, -0.098297119140625, -0.09305000305175781, -0.08780288696289062, -0.08255577087402344, -0.07730865478515625, -0.07206153869628906, -0.06681442260742188, -0.06156730651855469, -0.0563201904296875, -0.05107307434082031, -0.045825958251953125, -0.04057884216308594, -0.03533172607421875, -0.030084609985351562, -0.024837493896484375, -0.019590377807617188, -0.01434326171875, -0.009096145629882812, -0.003849029541015625, 0.0013980865478515625, 0.00664520263671875, 0.011892318725585938, 0.017139434814453125, 0.022386550903320312, 0.0276336669921875, 0.03288078308105469, 0.038127899169921875, 0.04337501525878906, 0.04862213134765625, 0.05386924743652344, 0.059116363525390625, 0.06436347961425781, 0.069610595703125, 0.07485771179199219, 0.08010482788085938, 0.08535194396972656, 0.09059906005859375, 0.09584617614746094, 0.10109329223632812, 0.10634040832519531, 0.1115875244140625, 0.11683464050292969, 0.12208175659179688, 0.12732887268066406, 0.13257598876953125, 0.13782310485839844, 0.14307022094726562, 0.1483173370361328, 0.153564453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 4.0, 7.0, 4.0, 6.0, 9.0, 11.0, 9.0, 25.0, 17.0, 40.0, 35.0, 54.0, 52.0, 70.0, 73.0, 68.0, 76.0, 78.0, 80.0, 51.0, 50.0, 39.0, 30.0, 20.0, 16.0, 18.0, 13.0, 10.0, 5.0, 7.0, 7.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.147216796875, -0.14231300354003906, -0.13740921020507812, -0.1325054168701172, -0.12760162353515625, -0.12269783020019531, -0.11779403686523438, -0.11289024353027344, -0.1079864501953125, -0.10308265686035156, -0.09817886352539062, -0.09327507019042969, -0.08837127685546875, -0.08346748352050781, -0.07856369018554688, -0.07365989685058594, -0.068756103515625, -0.06385231018066406, -0.058948516845703125, -0.05404472351074219, -0.04914093017578125, -0.04423713684082031, -0.039333343505859375, -0.03442955017089844, -0.0295257568359375, -0.024621963500976562, -0.019718170166015625, -0.014814376831054688, -0.00991058349609375, -0.0050067901611328125, -0.000102996826171875, 0.0048007965087890625, 0.00970458984375, 0.014608383178710938, 0.019512176513671875, 0.024415969848632812, 0.02931976318359375, 0.03422355651855469, 0.039127349853515625, 0.04403114318847656, 0.0489349365234375, 0.05383872985839844, 0.058742523193359375, 0.06364631652832031, 0.06855010986328125, 0.07345390319824219, 0.07835769653320312, 0.08326148986816406, 0.088165283203125, 0.09306907653808594, 0.09797286987304688, 0.10287666320800781, 0.10778045654296875, 0.11268424987792969, 0.11758804321289062, 0.12249183654785156, 0.1273956298828125, 0.13229942321777344, 0.13720321655273438, 0.1421070098876953, 0.14701080322265625, 0.1519145965576172, 0.15681838989257812, 0.16172218322753906, 0.1666259765625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 5.0, 9.0, 8.0, 26.0, 66.0, 94.0, 134.0, 169.0, 170.0, 119.0, 90.0, 51.0, 23.0, 16.0, 12.0, 7.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.531129837036133, -4.384349346160889, -4.2375688552856445, -4.0907883644104, -3.9440078735351562, -3.797227382659912, -3.650447130203247, -3.503666639328003, -3.356886148452759, -3.2101056575775146, -3.0633251667022705, -2.9165446758270264, -2.7697644233703613, -2.622983932495117, -2.476203441619873, -2.329422950744629, -2.1826424598693848, -2.0358619689941406, -1.8890814781188965, -1.742301106452942, -1.5955206155776978, -1.4487401247024536, -1.301959753036499, -1.1551792621612549, -1.0083987712860107, -0.8616182804107666, -0.7148378491401672, -0.5680574178695679, -0.42127692699432373, -0.2744964361190796, -0.12771600484848022, 0.01906442642211914, 0.16584539413452148, 0.31262585520744324, 0.459406316280365, 0.6061867475509644, 0.7529672384262085, 0.8997477293014526, 1.0465281009674072, 1.1933085918426514, 1.3400890827178955, 1.4868695735931396, 1.6336500644683838, 1.7804304361343384, 1.9272109270095825, 2.073991298675537, 2.2207717895507812, 2.3675522804260254, 2.5143327713012695, 2.6611132621765137, 2.807893753051758, 2.954674243927002, 3.101454734802246, 3.2482352256774902, 3.3950154781341553, 3.5417959690093994, 3.6885764598846436, 3.8353569507598877, 3.982137441635132, 4.128917694091797, 4.275698184967041, 4.422478675842285, 4.569259166717529, 4.716039657592773, 4.862820148468018]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 3.0, 10.0, 10.0, 6.0, 6.0, 13.0, 8.0, 6.0, 16.0, 17.0, 27.0, 20.0, 17.0, 21.0, 33.0, 31.0, 40.0, 37.0, 41.0, 48.0, 33.0, 38.0, 37.0, 40.0, 43.0, 49.0, 39.0, 27.0, 40.0, 29.0, 20.0, 35.0, 17.0, 37.0, 20.0, 20.0, 12.0, 10.0, 12.0, 4.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.8938207626342773, -1.8231133222579956, -1.7524058818817139, -1.6816984415054321, -1.6109910011291504, -1.540283441543579, -1.4695760011672974, -1.3988685607910156, -1.3281611204147339, -1.2574536800384521, -1.1867462396621704, -1.1160387992858887, -1.0453312397003174, -0.9746238589286804, -0.9039163589477539, -0.8332089185714722, -0.7625014781951904, -0.6917940378189087, -0.621086597442627, -0.5503790974617004, -0.4796716570854187, -0.40896421670913696, -0.33825674653053284, -0.2675492763519287, -0.19684183597564697, -0.12613438069820404, -0.05542692542076111, 0.015280529856681824, 0.08598798513412476, 0.1566954255104065, 0.22740289568901062, 0.29811036586761475, 0.3688175678253174, 0.4395250082015991, 0.5102324485778809, 0.5809399485588074, 0.6516473889350891, 0.7223548293113708, 0.7930623292922974, 0.8637697696685791, 0.9344772100448608, 1.0051846504211426, 1.0758920907974243, 1.146599531173706, 1.2173070907592773, 1.2880144119262695, 1.3587219715118408, 1.4294294118881226, 1.5001368522644043, 1.570844292640686, 1.6415517330169678, 1.7122591733932495, 1.7829666137695312, 1.8536741733551025, 1.9243816137313843, 1.995089054107666, 2.065796375274658, 2.1365039348602295, 2.2072112560272217, 2.277918815612793, 2.348626136779785, 2.4193336963653564, 2.4900410175323486, 2.56074857711792, 2.631456136703491]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 9.0, 13.0, 16.0, 27.0, 58.0, 60.0, 111.0, 177.0, 268.0, 454.0, 746.0, 1246.0, 2270.0, 4047.0, 8332.0, 18925.0, 54286.0, 308442.0, 3278883.0, 413486.0, 62373.0, 20707.0, 9113.0, 4375.0, 2339.0, 1378.0, 802.0, 495.0, 313.0, 205.0, 132.0, 65.0, 60.0, 25.0, 15.0, 13.0, 5.0, 9.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285888671875, -0.27710723876953125, -0.2683258056640625, -0.25954437255859375, -0.250762939453125, -0.24198150634765625, -0.2332000732421875, -0.22441864013671875, -0.21563720703125, -0.20685577392578125, -0.1980743408203125, -0.18929290771484375, -0.180511474609375, -0.17173004150390625, -0.1629486083984375, -0.15416717529296875, -0.1453857421875, -0.13660430908203125, -0.1278228759765625, -0.11904144287109375, -0.110260009765625, -0.10147857666015625, -0.0926971435546875, -0.08391571044921875, -0.07513427734375, -0.06635284423828125, -0.0575714111328125, -0.04878997802734375, -0.040008544921875, -0.03122711181640625, -0.0224456787109375, -0.01366424560546875, -0.0048828125, 0.00389862060546875, 0.0126800537109375, 0.02146148681640625, 0.030242919921875, 0.03902435302734375, 0.0478057861328125, 0.05658721923828125, 0.06536865234375, 0.07415008544921875, 0.0829315185546875, 0.09171295166015625, 0.100494384765625, 0.10927581787109375, 0.1180572509765625, 0.12683868408203125, 0.1356201171875, 0.14440155029296875, 0.1531829833984375, 0.16196441650390625, 0.170745849609375, 0.17952728271484375, 0.1883087158203125, 0.19709014892578125, 0.20587158203125, 0.21465301513671875, 0.2234344482421875, 0.23221588134765625, 0.240997314453125, 0.24977874755859375, 0.2585601806640625, 0.26734161376953125, 0.276123046875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 12.0, 15.0, 11.0, 22.0, 20.0, 37.0, 27.0, 40.0, 50.0, 68.0, 54.0, 58.0, 56.0, 67.0, 67.0, 66.0, 54.0, 63.0, 33.0, 35.0, 38.0, 23.0, 17.0, 21.0, 13.0, 6.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1602783203125, -0.1556987762451172, -0.15111923217773438, -0.14653968811035156, -0.14196014404296875, -0.13738059997558594, -0.13280105590820312, -0.1282215118408203, -0.1236419677734375, -0.11906242370605469, -0.11448287963867188, -0.10990333557128906, -0.10532379150390625, -0.10074424743652344, -0.09616470336914062, -0.09158515930175781, -0.087005615234375, -0.08242607116699219, -0.07784652709960938, -0.07326698303222656, -0.06868743896484375, -0.06410789489746094, -0.059528350830078125, -0.05494880676269531, -0.0503692626953125, -0.04578971862792969, -0.041210174560546875, -0.03663063049316406, -0.03205108642578125, -0.027471542358398438, -0.022891998291015625, -0.018312454223632812, -0.01373291015625, -0.009153366088867188, -0.004573822021484375, 5.7220458984375e-06, 0.00458526611328125, 0.009164810180664062, 0.013744354248046875, 0.018323898315429688, 0.0229034423828125, 0.027482986450195312, 0.032062530517578125, 0.03664207458496094, 0.04122161865234375, 0.04580116271972656, 0.050380706787109375, 0.05496025085449219, 0.059539794921875, 0.06411933898925781, 0.06869888305664062, 0.07327842712402344, 0.07785797119140625, 0.08243751525878906, 0.08701705932617188, 0.09159660339355469, 0.0961761474609375, 0.10075569152832031, 0.10533523559570312, 0.10991477966308594, 0.11449432373046875, 0.11907386779785156, 0.12365341186523438, 0.1282329559326172, 0.1328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 7.0, 15.0, 10.0, 24.0, 39.0, 46.0, 82.0, 127.0, 192.0, 320.0, 609.0, 1083.0, 2192.0, 5052.0, 12743.0, 39775.0, 213291.0, 3403205.0, 429413.0, 57347.0, 16661.0, 6311.0, 2729.0, 1345.0, 683.0, 390.0, 210.0, 119.0, 65.0, 63.0, 39.0, 23.0, 14.0, 12.0, 7.0, 13.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.3444671630859375, -0.332000732421875, -0.3195343017578125, -0.30706787109375, -0.2946014404296875, -0.282135009765625, -0.2696685791015625, -0.2572021484375, -0.2447357177734375, -0.232269287109375, -0.2198028564453125, -0.20733642578125, -0.1948699951171875, -0.182403564453125, -0.1699371337890625, -0.157470703125, -0.1450042724609375, -0.132537841796875, -0.1200714111328125, -0.10760498046875, -0.0951385498046875, -0.082672119140625, -0.0702056884765625, -0.0577392578125, -0.0452728271484375, -0.032806396484375, -0.0203399658203125, -0.00787353515625, 0.0045928955078125, 0.017059326171875, 0.0295257568359375, 0.0419921875, 0.0544586181640625, 0.066925048828125, 0.0793914794921875, 0.09185791015625, 0.1043243408203125, 0.116790771484375, 0.1292572021484375, 0.1417236328125, 0.1541900634765625, 0.166656494140625, 0.1791229248046875, 0.19158935546875, 0.2040557861328125, 0.216522216796875, 0.2289886474609375, 0.241455078125, 0.2539215087890625, 0.266387939453125, 0.2788543701171875, 0.29132080078125, 0.3037872314453125, 0.316253662109375, 0.3287200927734375, 0.3411865234375, 0.3536529541015625, 0.366119384765625, 0.3785858154296875, 0.39105224609375, 0.4035186767578125, 0.415985107421875, 0.4284515380859375, 0.44091796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 3.0, 8.0, 6.0, 9.0, 10.0, 16.0, 14.0, 21.0, 36.0, 35.0, 55.0, 90.0, 140.0, 269.0, 540.0, 1058.0, 754.0, 384.0, 190.0, 125.0, 75.0, 60.0, 38.0, 28.0, 23.0, 17.0, 12.0, 9.0, 6.0, 6.0, 5.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.321533203125, -0.3099479675292969, -0.29836273193359375, -0.2867774963378906, -0.2751922607421875, -0.2636070251464844, -0.25202178955078125, -0.24043655395507812, -0.228851318359375, -0.21726608276367188, -0.20568084716796875, -0.19409561157226562, -0.1825103759765625, -0.17092514038085938, -0.15933990478515625, -0.14775466918945312, -0.13616943359375, -0.12458419799804688, -0.11299896240234375, -0.10141372680664062, -0.0898284912109375, -0.07824325561523438, -0.06665802001953125, -0.055072784423828125, -0.043487548828125, -0.031902313232421875, -0.02031707763671875, -0.008731842041015625, 0.0028533935546875, 0.014438629150390625, 0.02602386474609375, 0.037609100341796875, 0.0491943359375, 0.060779571533203125, 0.07236480712890625, 0.08395004272460938, 0.0955352783203125, 0.10712051391601562, 0.11870574951171875, 0.13029098510742188, 0.141876220703125, 0.15346145629882812, 0.16504669189453125, 0.17663192749023438, 0.1882171630859375, 0.19980239868164062, 0.21138763427734375, 0.22297286987304688, 0.23455810546875, 0.24614334106445312, 0.25772857666015625, 0.2693138122558594, 0.2808990478515625, 0.2924842834472656, 0.30406951904296875, 0.3156547546386719, 0.327239990234375, 0.3388252258300781, 0.35041046142578125, 0.3619956970214844, 0.3735809326171875, 0.3851661682128906, 0.39675140380859375, 0.4083366394042969, 0.419921875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 1.0, 7.0, 2.0, 11.0, 12.0, 36.0, 93.0, 167.0, 228.0, 204.0, 137.0, 54.0, 21.0, 13.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.369821548461914, -6.2051591873168945, -6.040497303009033, -5.875834941864014, -5.711172580718994, -5.546510696411133, -5.381848335266113, -5.217185974121094, -5.052523612976074, -4.887861251831055, -4.723199367523193, -4.558537006378174, -4.393874645233154, -4.229212760925293, -4.064550399780273, -3.899888038635254, -3.7352261543273926, -3.570564031600952, -3.4059016704559326, -3.241239547729492, -3.0765771865844727, -2.9119150638580322, -2.747252941131592, -2.5825905799865723, -2.417928457260132, -2.2532663345336914, -2.088603973388672, -1.9239418506622314, -1.7592796087265015, -1.5946173667907715, -1.429955244064331, -1.265293002128601, -1.100630760192871, -0.9359685182571411, -0.7713063359260559, -0.6066441535949707, -0.4419819116592407, -0.27731966972351074, -0.11265748739242554, 0.05200469493865967, 0.21666693687438965, 0.38132914900779724, 0.5459913611412048, 0.71065354347229, 0.87531578540802, 1.03997802734375, 1.2046401500701904, 1.3693023920059204, 1.5339646339416504, 1.6986268758773804, 1.8632891178131104, 2.027951240539551, 2.1926136016845703, 2.3572757244110107, 2.521937847137451, 2.6866002082824707, 2.851262331008911, 3.0159244537353516, 3.180586814880371, 3.3452489376068115, 3.509911060333252, 3.6745734214782715, 3.839235544204712, 4.003897666931152, 4.168560028076172]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 11.0, 9.0, 7.0, 12.0, 14.0, 16.0, 21.0, 31.0, 29.0, 31.0, 30.0, 59.0, 43.0, 55.0, 66.0, 65.0, 68.0, 53.0, 45.0, 60.0, 63.0, 37.0, 32.0, 32.0, 32.0, 27.0, 17.0, 13.0, 10.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9480023384094238, -1.8851134777069092, -1.822224497795105, -1.7593356370925903, -1.6964466571807861, -1.6335577964782715, -1.5706689357757568, -1.5077800750732422, -1.444891095161438, -1.3820022344589233, -1.3191132545471191, -1.2562243938446045, -1.1933355331420898, -1.1304465532302856, -1.067557692527771, -1.0046687126159668, -0.9417798519134521, -0.8788909316062927, -0.8160020112991333, -0.7531131505966187, -0.6902242302894592, -0.6273353099822998, -0.5644464492797852, -0.5015575289726257, -0.4386686086654663, -0.3757796883583069, -0.31289079785346985, -0.2500019073486328, -0.1871129870414734, -0.12422406673431396, -0.06133517622947693, 0.0015537142753601074, 0.06444239616394043, 0.12733130156993866, 0.1902202069759369, 0.2531090974807739, 0.31599801778793335, 0.3788869380950928, 0.4417758285999298, 0.5046647191047668, 0.5675536394119263, 0.6304425597190857, 0.6933314800262451, 0.7562203407287598, 0.8191092610359192, 0.8819981813430786, 0.9448870420455933, 1.0077760219573975, 1.070664882659912, 1.1335537433624268, 1.196442723274231, 1.2593315839767456, 1.3222205638885498, 1.3851094245910645, 1.447998285293579, 1.5108871459960938, 1.573776125907898, 1.6366649866104126, 1.6995539665222168, 1.7624428272247314, 1.825331687927246, 1.8882206678390503, 1.951109528541565, 2.013998508453369, 2.076887369155884]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 8.0, 10.0, 13.0, 15.0, 20.0, 28.0, 34.0, 67.0, 89.0, 120.0, 174.0, 222.0, 377.0, 589.0, 883.0, 1521.0, 2230.0, 4061.0, 7310.0, 13714.0, 27852.0, 61135.0, 158589.0, 369731.0, 235416.0, 87143.0, 37386.0, 17786.0, 9177.0, 5140.0, 2820.0, 1737.0, 1030.0, 712.0, 432.0, 284.0, 214.0, 125.0, 101.0, 82.0, 54.0, 32.0, 34.0, 20.0, 14.0, 11.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.234130859375, -0.22624588012695312, -0.21836090087890625, -0.21047592163085938, -0.2025909423828125, -0.19470596313476562, -0.18682098388671875, -0.17893600463867188, -0.171051025390625, -0.16316604614257812, -0.15528106689453125, -0.14739608764648438, -0.1395111083984375, -0.13162612915039062, -0.12374114990234375, -0.11585617065429688, -0.10797119140625, -0.10008621215820312, -0.09220123291015625, -0.08431625366210938, -0.0764312744140625, -0.06854629516601562, -0.06066131591796875, -0.052776336669921875, -0.044891357421875, -0.037006378173828125, -0.02912139892578125, -0.021236419677734375, -0.0133514404296875, -0.005466461181640625, 0.00241851806640625, 0.010303497314453125, 0.0181884765625, 0.026073455810546875, 0.03395843505859375, 0.041843414306640625, 0.0497283935546875, 0.057613372802734375, 0.06549835205078125, 0.07338333129882812, 0.081268310546875, 0.08915328979492188, 0.09703826904296875, 0.10492324829101562, 0.1128082275390625, 0.12069320678710938, 0.12857818603515625, 0.13646316528320312, 0.14434814453125, 0.15223312377929688, 0.16011810302734375, 0.16800308227539062, 0.1758880615234375, 0.18377304077148438, 0.19165802001953125, 0.19954299926757812, 0.207427978515625, 0.21531295776367188, 0.22319793701171875, 0.23108291625976562, 0.2389678955078125, 0.24685287475585938, 0.25473785400390625, 0.2626228332519531, 0.2705078125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 12.0, 11.0, 15.0, 10.0, 15.0, 20.0, 26.0, 34.0, 44.0, 40.0, 40.0, 35.0, 42.0, 40.0, 53.0, 48.0, 50.0, 60.0, 59.0, 42.0, 47.0, 36.0, 38.0, 44.0, 19.0, 23.0, 20.0, 11.0, 15.0, 8.0, 4.0, 5.0, 5.0, 7.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.118408203125, -0.11462688446044922, -0.11084556579589844, -0.10706424713134766, -0.10328292846679688, -0.0995016098022461, -0.09572029113769531, -0.09193897247314453, -0.08815765380859375, -0.08437633514404297, -0.08059501647949219, -0.0768136978149414, -0.07303237915039062, -0.06925106048583984, -0.06546974182128906, -0.06168842315673828, -0.0579071044921875, -0.05412578582763672, -0.05034446716308594, -0.046563148498535156, -0.042781829833984375, -0.039000511169433594, -0.03521919250488281, -0.03143787384033203, -0.02765655517578125, -0.02387523651123047, -0.020093917846679688, -0.016312599182128906, -0.012531280517578125, -0.008749961853027344, -0.0049686431884765625, -0.0011873245239257812, 0.002593994140625, 0.006375312805175781, 0.010156631469726562, 0.013937950134277344, 0.017719268798828125, 0.021500587463378906, 0.025281906127929688, 0.02906322479248047, 0.03284454345703125, 0.03662586212158203, 0.04040718078613281, 0.044188499450683594, 0.047969818115234375, 0.051751136779785156, 0.05553245544433594, 0.05931377410888672, 0.0630950927734375, 0.06687641143798828, 0.07065773010253906, 0.07443904876708984, 0.07822036743164062, 0.0820016860961914, 0.08578300476074219, 0.08956432342529297, 0.09334564208984375, 0.09712696075439453, 0.10090827941894531, 0.1046895980834961, 0.10847091674804688, 0.11225223541259766, 0.11603355407714844, 0.11981487274169922, 0.12359619140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 10.0, 7.0, 20.0, 26.0, 25.0, 40.0, 50.0, 68.0, 115.0, 176.0, 296.0, 440.0, 781.0, 1585.0, 3636.0, 9932.0, 41545.0, 408950.0, 517094.0, 45615.0, 10598.0, 3777.0, 1592.0, 867.0, 470.0, 262.0, 191.0, 110.0, 70.0, 61.0, 37.0, 23.0, 18.0, 12.0, 19.0, 6.0, 2.0, 4.0, 6.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48876953125, -0.47193145751953125, -0.4550933837890625, -0.43825531005859375, -0.421417236328125, -0.40457916259765625, -0.3877410888671875, -0.37090301513671875, -0.35406494140625, -0.33722686767578125, -0.3203887939453125, -0.30355072021484375, -0.286712646484375, -0.26987457275390625, -0.2530364990234375, -0.23619842529296875, -0.2193603515625, -0.20252227783203125, -0.1856842041015625, -0.16884613037109375, -0.152008056640625, -0.13516998291015625, -0.1183319091796875, -0.10149383544921875, -0.08465576171875, -0.06781768798828125, -0.0509796142578125, -0.03414154052734375, -0.017303466796875, -0.00046539306640625, 0.0163726806640625, 0.03321075439453125, 0.050048828125, 0.06688690185546875, 0.0837249755859375, 0.10056304931640625, 0.117401123046875, 0.13423919677734375, 0.1510772705078125, 0.16791534423828125, 0.18475341796875, 0.20159149169921875, 0.2184295654296875, 0.23526763916015625, 0.252105712890625, 0.26894378662109375, 0.2857818603515625, 0.30261993408203125, 0.3194580078125, 0.33629608154296875, 0.3531341552734375, 0.36997222900390625, 0.386810302734375, 0.40364837646484375, 0.4204864501953125, 0.43732452392578125, 0.45416259765625, 0.47100067138671875, 0.4878387451171875, 0.5046768188476562, 0.521514892578125, 0.5383529663085938, 0.5551910400390625, 0.5720291137695312, 0.5888671875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 10.0, 3.0, 7.0, 9.0, 13.0, 11.0, 20.0, 26.0, 33.0, 38.0, 41.0, 39.0, 55.0, 50.0, 57.0, 63.0, 58.0, 59.0, 54.0, 59.0, 53.0, 37.0, 41.0, 33.0, 28.0, 30.0, 23.0, 14.0, 8.0, 11.0, 5.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66796875, -0.6480941772460938, -0.6282196044921875, -0.6083450317382812, -0.588470458984375, -0.5685958862304688, -0.5487213134765625, -0.5288467407226562, -0.50897216796875, -0.48909759521484375, -0.4692230224609375, -0.44934844970703125, -0.429473876953125, -0.40959930419921875, -0.3897247314453125, -0.36985015869140625, -0.3499755859375, -0.33010101318359375, -0.3102264404296875, -0.29035186767578125, -0.270477294921875, -0.25060272216796875, -0.2307281494140625, -0.21085357666015625, -0.19097900390625, -0.17110443115234375, -0.1512298583984375, -0.13135528564453125, -0.111480712890625, -0.09160614013671875, -0.0717315673828125, -0.05185699462890625, -0.031982421875, -0.01210784912109375, 0.0077667236328125, 0.02764129638671875, 0.047515869140625, 0.06739044189453125, 0.0872650146484375, 0.10713958740234375, 0.12701416015625, 0.14688873291015625, 0.1667633056640625, 0.18663787841796875, 0.206512451171875, 0.22638702392578125, 0.2462615966796875, 0.26613616943359375, 0.2860107421875, 0.30588531494140625, 0.3257598876953125, 0.34563446044921875, 0.365509033203125, 0.38538360595703125, 0.4052581787109375, 0.42513275146484375, 0.44500732421875, 0.46488189697265625, 0.4847564697265625, 0.5046310424804688, 0.524505615234375, 0.5443801879882812, 0.5642547607421875, 0.5841293334960938, 0.60400390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 12.0, 14.0, 16.0, 18.0, 34.0, 45.0, 57.0, 116.0, 205.0, 316.0, 643.0, 1180.0, 2778.0, 7044.0, 22480.0, 113065.0, 716136.0, 144543.0, 25970.0, 7936.0, 3055.0, 1351.0, 650.0, 358.0, 195.0, 121.0, 65.0, 41.0, 33.0, 20.0, 20.0, 6.0, 10.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2484130859375, -0.2412242889404297, -0.23403549194335938, -0.22684669494628906, -0.21965789794921875, -0.21246910095214844, -0.20528030395507812, -0.1980915069580078, -0.1909027099609375, -0.1837139129638672, -0.17652511596679688, -0.16933631896972656, -0.16214752197265625, -0.15495872497558594, -0.14776992797851562, -0.1405811309814453, -0.133392333984375, -0.1262035369873047, -0.11901473999023438, -0.11182594299316406, -0.10463714599609375, -0.09744834899902344, -0.09025955200195312, -0.08307075500488281, -0.0758819580078125, -0.06869316101074219, -0.061504364013671875, -0.05431556701660156, -0.04712677001953125, -0.03993797302246094, -0.032749176025390625, -0.025560379028320312, -0.01837158203125, -0.011182785034179688, -0.003993988037109375, 0.0031948089599609375, 0.01038360595703125, 0.017572402954101562, 0.024761199951171875, 0.03194999694824219, 0.0391387939453125, 0.04632759094238281, 0.053516387939453125, 0.06070518493652344, 0.06789398193359375, 0.07508277893066406, 0.08227157592773438, 0.08946037292480469, 0.096649169921875, 0.10383796691894531, 0.11102676391601562, 0.11821556091308594, 0.12540435791015625, 0.13259315490722656, 0.13978195190429688, 0.1469707489013672, 0.1541595458984375, 0.1613483428955078, 0.16853713989257812, 0.17572593688964844, 0.18291473388671875, 0.19010353088378906, 0.19729232788085938, 0.2044811248779297, 0.211669921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 4.0, 3.0, 1.0, 9.0, 11.0, 13.0, 15.0, 23.0, 32.0, 33.0, 57.0, 114.0, 149.0, 131.0, 125.0, 72.0, 59.0, 37.0, 28.0, 25.0, 12.0, 10.0, 8.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.957220077514648e-05, -7.724948227405548e-05, -7.492676377296448e-05, -7.260404527187347e-05, -7.028132677078247e-05, -6.795860826969147e-05, -6.563588976860046e-05, -6.331317126750946e-05, -6.099045276641846e-05, -5.8667734265327454e-05, -5.634501576423645e-05, -5.402229726314545e-05, -5.169957876205444e-05, -4.937686026096344e-05, -4.7054141759872437e-05, -4.473142325878143e-05, -4.240870475769043e-05, -4.0085986256599426e-05, -3.776326775550842e-05, -3.544054925441742e-05, -3.3117830753326416e-05, -3.079511225223541e-05, -2.847239375114441e-05, -2.6149675250053406e-05, -2.3826956748962402e-05, -2.15042382478714e-05, -1.9181519746780396e-05, -1.6858801245689392e-05, -1.4536082744598389e-05, -1.2213364243507385e-05, -9.890645742416382e-06, -7.567927241325378e-06, -5.245208740234375e-06, -2.9224902391433716e-06, -5.997717380523682e-07, 1.7229467630386353e-06, 4.045665264129639e-06, 6.368383765220642e-06, 8.691102266311646e-06, 1.1013820767402649e-05, 1.3336539268493652e-05, 1.5659257769584656e-05, 1.798197627067566e-05, 2.0304694771766663e-05, 2.2627413272857666e-05, 2.495013177394867e-05, 2.7272850275039673e-05, 2.9595568776130676e-05, 3.191828727722168e-05, 3.424100577831268e-05, 3.6563724279403687e-05, 3.888644278049469e-05, 4.120916128158569e-05, 4.35318797826767e-05, 4.58545982837677e-05, 4.8177316784858704e-05, 5.050003528594971e-05, 5.282275378704071e-05, 5.5145472288131714e-05, 5.746819078922272e-05, 5.979090929031372e-05, 6.211362779140472e-05, 6.443634629249573e-05, 6.675906479358673e-05, 6.908178329467773e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 10.0, 12.0, 16.0, 19.0, 31.0, 46.0, 66.0, 118.0, 181.0, 333.0, 621.0, 1247.0, 3229.0, 10143.0, 51304.0, 628873.0, 309141.0, 31158.0, 7334.0, 2414.0, 1030.0, 494.0, 236.0, 160.0, 106.0, 60.0, 42.0, 32.0, 20.0, 19.0, 11.0, 10.0, 8.0, 6.0, 3.0, 3.0, 6.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263671875, -0.2553977966308594, -0.24712371826171875, -0.23884963989257812, -0.2305755615234375, -0.22230148315429688, -0.21402740478515625, -0.20575332641601562, -0.197479248046875, -0.18920516967773438, -0.18093109130859375, -0.17265701293945312, -0.1643829345703125, -0.15610885620117188, -0.14783477783203125, -0.13956069946289062, -0.13128662109375, -0.12301254272460938, -0.11473846435546875, -0.10646438598632812, -0.0981903076171875, -0.08991622924804688, -0.08164215087890625, -0.07336807250976562, -0.065093994140625, -0.056819915771484375, -0.04854583740234375, -0.040271759033203125, -0.0319976806640625, -0.023723602294921875, -0.01544952392578125, -0.007175445556640625, 0.0010986328125, 0.009372711181640625, 0.01764678955078125, 0.025920867919921875, 0.0341949462890625, 0.042469024658203125, 0.05074310302734375, 0.059017181396484375, 0.067291259765625, 0.07556533813476562, 0.08383941650390625, 0.09211349487304688, 0.1003875732421875, 0.10866165161132812, 0.11693572998046875, 0.12520980834960938, 0.13348388671875, 0.14175796508789062, 0.15003204345703125, 0.15830612182617188, 0.1665802001953125, 0.17485427856445312, 0.18312835693359375, 0.19140243530273438, 0.199676513671875, 0.20795059204101562, 0.21622467041015625, 0.22449874877929688, 0.2327728271484375, 0.24104690551757812, 0.24932098388671875, 0.2575950622558594, 0.265869140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 2.0, 8.0, 11.0, 24.0, 27.0, 25.0, 51.0, 40.0, 69.0, 91.0, 85.0, 111.0, 92.0, 72.0, 66.0, 49.0, 34.0, 33.0, 15.0, 18.0, 9.0, 6.0, 10.0, 3.0, 9.0, 8.0, 3.0, 5.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2310791015625, -0.22455596923828125, -0.2180328369140625, -0.21150970458984375, -0.204986572265625, -0.19846343994140625, -0.1919403076171875, -0.18541717529296875, -0.17889404296875, -0.17237091064453125, -0.1658477783203125, -0.15932464599609375, -0.152801513671875, -0.14627838134765625, -0.1397552490234375, -0.13323211669921875, -0.126708984375, -0.12018585205078125, -0.1136627197265625, -0.10713958740234375, -0.100616455078125, -0.09409332275390625, -0.0875701904296875, -0.08104705810546875, -0.07452392578125, -0.06800079345703125, -0.0614776611328125, -0.05495452880859375, -0.048431396484375, -0.04190826416015625, -0.0353851318359375, -0.02886199951171875, -0.0223388671875, -0.01581573486328125, -0.0092926025390625, -0.00276947021484375, 0.003753662109375, 0.01027679443359375, 0.0167999267578125, 0.02332305908203125, 0.02984619140625, 0.03636932373046875, 0.0428924560546875, 0.04941558837890625, 0.055938720703125, 0.06246185302734375, 0.0689849853515625, 0.07550811767578125, 0.08203125, 0.08855438232421875, 0.0950775146484375, 0.10160064697265625, 0.108123779296875, 0.11464691162109375, 0.1211700439453125, 0.12769317626953125, 0.13421630859375, 0.14073944091796875, 0.1472625732421875, 0.15378570556640625, 0.160308837890625, 0.16683197021484375, 0.1733551025390625, 0.17987823486328125, 0.1864013671875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 7.0, 6.0, 11.0, 17.0, 42.0, 75.0, 130.0, 217.0, 185.0, 119.0, 94.0, 41.0, 21.0, 17.0, 8.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6024069786071777, -2.4645769596099854, -2.326746940612793, -2.1889171600341797, -2.0510871410369873, -1.913257122039795, -1.775427222251892, -1.6375973224639893, -1.4997673034667969, -1.3619372844696045, -1.2241073846817017, -1.0862774848937988, -0.9484474658966064, -0.8106175065040588, -0.6727875471115112, -0.5349575877189636, -0.397127628326416, -0.2592976689338684, -0.1214677095413208, 0.016362249851226807, 0.15419220924377441, 0.292022168636322, 0.42985212802886963, 0.5676820874214172, 0.7055120468139648, 0.8433420062065125, 0.9811719655990601, 1.119001865386963, 1.2568318843841553, 1.3946619033813477, 1.5324918031692505, 1.6703217029571533, 1.808152198791504, 1.9459822177886963, 2.0838122367858887, 2.221642017364502, 2.3594720363616943, 2.4973020553588867, 2.6351318359375, 2.7729618549346924, 2.9107918739318848, 3.048621892929077, 3.1864519119262695, 3.324281692504883, 3.462111711502075, 3.5999417304992676, 3.737771511077881, 3.8756015300750732, 4.013431549072266, 4.151261329650879, 4.28909158706665, 4.426921367645264, 4.564751625061035, 4.702581405639648, 4.840411186218262, 4.978241443634033, 5.1160712242126465, 5.25390100479126, 5.391731262207031, 5.5295610427856445, 5.667390823364258, 5.805221080780029, 5.943050861358643, 6.080881118774414, 6.218710899353027]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 9.0, 9.0, 11.0, 16.0, 14.0, 30.0, 27.0, 27.0, 35.0, 38.0, 44.0, 44.0, 54.0, 54.0, 78.0, 61.0, 64.0, 48.0, 47.0, 41.0, 35.0, 39.0, 28.0, 24.0, 18.0, 20.0, 17.0, 16.0, 12.0, 16.0, 7.0, 5.0, 0.0, 10.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.039203643798828, -2.964172840118408, -2.8891422748565674, -2.8141114711761475, -2.7390806674957275, -2.6640501022338867, -2.589019298553467, -2.513988494873047, -2.438957691192627, -2.363926887512207, -2.288896322250366, -2.2138655185699463, -2.1388347148895264, -2.0638041496276855, -1.9887733459472656, -1.9137425422668457, -1.8387119770050049, -1.7636812925338745, -1.6886504888534546, -1.6136198043823242, -1.5385890007019043, -1.463558316230774, -1.3885276317596436, -1.3134968280792236, -1.2384661436080933, -1.163435459136963, -1.088404655456543, -1.0133739709854126, -0.9383432269096375, -0.8633124828338623, -0.7882817983627319, -0.7132510542869568, -0.6382205486297607, -0.5631898045539856, -0.48815909028053284, -0.4131283760070801, -0.33809763193130493, -0.2630668878555298, -0.18803617358207703, -0.11300545930862427, -0.03797471523284912, 0.03705601394176483, 0.11208674311637878, 0.18711747229099274, 0.2621482014656067, 0.33717894554138184, 0.4122096598148346, 0.48724037408828735, 0.5622711181640625, 0.6373018622398376, 0.7123326063156128, 0.7873632907867432, 0.8623940348625183, 0.9374247789382935, 1.0124554634094238, 1.0874862670898438, 1.1625169515609741, 1.2375476360321045, 1.3125784397125244, 1.3876091241836548, 1.4626398086547852, 1.537670612335205, 1.6127012968063354, 1.6877319812774658, 1.7627627849578857]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 16.0, 12.0, 17.0, 24.0, 31.0, 69.0, 100.0, 186.0, 509.0, 1667.0, 8631.0, 130687.0, 4003160.0, 42550.0, 4765.0, 1106.0, 329.0, 143.0, 76.0, 46.0, 32.0, 34.0, 12.0, 14.0, 5.0, 10.0, 12.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.0673828125, -1.040252685546875, -1.01312255859375, -0.985992431640625, -0.9588623046875, -0.931732177734375, -0.90460205078125, -0.877471923828125, -0.850341796875, -0.823211669921875, -0.79608154296875, -0.768951416015625, -0.7418212890625, -0.714691162109375, -0.68756103515625, -0.660430908203125, -0.63330078125, -0.606170654296875, -0.57904052734375, -0.551910400390625, -0.5247802734375, -0.497650146484375, -0.47052001953125, -0.443389892578125, -0.416259765625, -0.389129638671875, -0.36199951171875, -0.334869384765625, -0.3077392578125, -0.280609130859375, -0.25347900390625, -0.226348876953125, -0.19921875, -0.172088623046875, -0.14495849609375, -0.117828369140625, -0.0906982421875, -0.063568115234375, -0.03643798828125, -0.009307861328125, 0.017822265625, 0.044952392578125, 0.07208251953125, 0.099212646484375, 0.1263427734375, 0.153472900390625, 0.18060302734375, 0.207733154296875, 0.23486328125, 0.261993408203125, 0.28912353515625, 0.316253662109375, 0.3433837890625, 0.370513916015625, 0.39764404296875, 0.424774169921875, 0.451904296875, 0.479034423828125, 0.50616455078125, 0.533294677734375, 0.5604248046875, 0.587554931640625, 0.61468505859375, 0.641815185546875, 0.6689453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 10.0, 6.0, 9.0, 18.0, 21.0, 28.0, 50.0, 45.0, 52.0, 68.0, 67.0, 78.0, 68.0, 76.0, 64.0, 83.0, 53.0, 49.0, 42.0, 39.0, 28.0, 11.0, 13.0, 11.0, 12.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.231201171875, -0.2256460189819336, -0.2200908660888672, -0.21453571319580078, -0.20898056030273438, -0.20342540740966797, -0.19787025451660156, -0.19231510162353516, -0.18675994873046875, -0.18120479583740234, -0.17564964294433594, -0.17009449005126953, -0.16453933715820312, -0.15898418426513672, -0.1534290313720703, -0.1478738784790039, -0.1423187255859375, -0.1367635726928711, -0.1312084197998047, -0.12565326690673828, -0.12009811401367188, -0.11454296112060547, -0.10898780822753906, -0.10343265533447266, -0.09787750244140625, -0.09232234954833984, -0.08676719665527344, -0.08121204376220703, -0.07565689086914062, -0.07010173797607422, -0.06454658508300781, -0.058991432189941406, -0.053436279296875, -0.047881126403808594, -0.04232597351074219, -0.03677082061767578, -0.031215667724609375, -0.02566051483154297, -0.020105361938476562, -0.014550209045410156, -0.00899505615234375, -0.0034399032592773438, 0.0021152496337890625, 0.007670402526855469, 0.013225555419921875, 0.01878070831298828, 0.024335861206054688, 0.029891014099121094, 0.0354461669921875, 0.041001319885253906, 0.04655647277832031, 0.05211162567138672, 0.057666778564453125, 0.06322193145751953, 0.06877708435058594, 0.07433223724365234, 0.07988739013671875, 0.08544254302978516, 0.09099769592285156, 0.09655284881591797, 0.10210800170898438, 0.10766315460205078, 0.11321830749511719, 0.1187734603881836, 0.12432861328125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 1.0, 6.0, 8.0, 12.0, 9.0, 19.0, 37.0, 61.0, 112.0, 219.0, 399.0, 955.0, 2148.0, 5832.0, 17944.0, 71740.0, 786245.0, 3109867.0, 152278.0, 30674.0, 9494.0, 3439.0, 1447.0, 635.0, 305.0, 161.0, 90.0, 55.0, 32.0, 15.0, 12.0, 9.0, 6.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33056640625, -0.3169097900390625, -0.303253173828125, -0.2895965576171875, -0.27593994140625, -0.2622833251953125, -0.248626708984375, -0.2349700927734375, -0.2213134765625, -0.2076568603515625, -0.194000244140625, -0.1803436279296875, -0.16668701171875, -0.1530303955078125, -0.139373779296875, -0.1257171630859375, -0.112060546875, -0.0984039306640625, -0.084747314453125, -0.0710906982421875, -0.05743408203125, -0.0437774658203125, -0.030120849609375, -0.0164642333984375, -0.0028076171875, 0.0108489990234375, 0.024505615234375, 0.0381622314453125, 0.05181884765625, 0.0654754638671875, 0.079132080078125, 0.0927886962890625, 0.1064453125, 0.1201019287109375, 0.133758544921875, 0.1474151611328125, 0.16107177734375, 0.1747283935546875, 0.188385009765625, 0.2020416259765625, 0.2156982421875, 0.2293548583984375, 0.243011474609375, 0.2566680908203125, 0.27032470703125, 0.2839813232421875, 0.297637939453125, 0.3112945556640625, 0.324951171875, 0.3386077880859375, 0.352264404296875, 0.3659210205078125, 0.37957763671875, 0.3932342529296875, 0.406890869140625, 0.4205474853515625, 0.4342041015625, 0.4478607177734375, 0.461517333984375, 0.4751739501953125, 0.48883056640625, 0.5024871826171875, 0.516143798828125, 0.5298004150390625, 0.54345703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 7.0, 8.0, 21.0, 14.0, 25.0, 29.0, 53.0, 89.0, 124.0, 183.0, 381.0, 734.0, 1073.0, 515.0, 289.0, 155.0, 93.0, 74.0, 51.0, 33.0, 20.0, 18.0, 11.0, 16.0, 9.0, 6.0, 2.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29443359375, -0.2823333740234375, -0.270233154296875, -0.2581329345703125, -0.24603271484375, -0.2339324951171875, -0.221832275390625, -0.2097320556640625, -0.1976318359375, -0.1855316162109375, -0.173431396484375, -0.1613311767578125, -0.14923095703125, -0.1371307373046875, -0.125030517578125, -0.1129302978515625, -0.100830078125, -0.0887298583984375, -0.076629638671875, -0.0645294189453125, -0.05242919921875, -0.0403289794921875, -0.028228759765625, -0.0161285400390625, -0.0040283203125, 0.0080718994140625, 0.020172119140625, 0.0322723388671875, 0.04437255859375, 0.0564727783203125, 0.068572998046875, 0.0806732177734375, 0.0927734375, 0.1048736572265625, 0.116973876953125, 0.1290740966796875, 0.14117431640625, 0.1532745361328125, 0.165374755859375, 0.1774749755859375, 0.1895751953125, 0.2016754150390625, 0.213775634765625, 0.2258758544921875, 0.23797607421875, 0.2500762939453125, 0.262176513671875, 0.2742767333984375, 0.286376953125, 0.2984771728515625, 0.310577392578125, 0.3226776123046875, 0.33477783203125, 0.3468780517578125, 0.358978271484375, 0.3710784912109375, 0.3831787109375, 0.3952789306640625, 0.407379150390625, 0.4194793701171875, 0.43157958984375, 0.4436798095703125, 0.455780029296875, 0.4678802490234375, 0.47998046875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 21.0, 31.0, 39.0, 70.0, 97.0, 133.0, 117.0, 124.0, 98.0, 73.0, 60.0, 38.0, 23.0, 5.0, 9.0, 5.0, 6.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.598886013031006, -2.520750045776367, -2.4426143169403076, -2.364478349685669, -2.2863426208496094, -2.2082066535949707, -2.130070924758911, -2.0519349575042725, -1.973799228668213, -1.8956633806228638, -1.8175275325775146, -1.7393916845321655, -1.6612558364868164, -1.5831199884414673, -1.5049841403961182, -1.4268481731414795, -1.3487123250961304, -1.2705764770507812, -1.1924406290054321, -1.114304780960083, -1.0361689329147339, -0.9580330848693848, -0.8798971772193909, -0.8017613291740417, -0.7236254811286926, -0.6454896330833435, -0.5673537850379944, -0.4892179071903229, -0.41108205914497375, -0.33294621109962463, -0.2548103332519531, -0.176674485206604, -0.09853863716125488, -0.020402781665325165, 0.05773307383060455, 0.13586893677711487, 0.214004784822464, 0.2921406328678131, 0.3702765107154846, 0.44841235876083374, 0.5265482068061829, 0.604684054851532, 0.6828199028968811, 0.760955810546875, 0.8390916585922241, 0.9172275066375732, 0.9953633546829224, 1.0734992027282715, 1.1516350507736206, 1.2297708988189697, 1.3079067468643188, 1.386042594909668, 1.464178442955017, 1.5423142910003662, 1.6204502582550049, 1.6985859870910645, 1.7767219543457031, 1.8548578023910522, 1.9329936504364014, 2.01112961769104, 2.0892653465270996, 2.1674013137817383, 2.245537042617798, 2.3236730098724365, 2.401808738708496]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 9.0, 7.0, 13.0, 13.0, 10.0, 20.0, 28.0, 15.0, 18.0, 25.0, 35.0, 45.0, 42.0, 50.0, 48.0, 44.0, 49.0, 40.0, 51.0, 51.0, 49.0, 31.0, 26.0, 37.0, 38.0, 34.0, 25.0, 17.0, 21.0, 19.0, 14.0, 17.0, 11.0, 7.0, 10.0, 9.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.406076192855835, -1.3600701093673706, -1.3140639066696167, -1.2680578231811523, -1.222051739692688, -1.176045536994934, -1.1300394535064697, -1.0840332508087158, -1.0380271673202515, -0.9920210242271423, -0.946014940738678, -0.9000087976455688, -0.8540026545524597, -0.8079965114593506, -0.7619904279708862, -0.7159842848777771, -0.6699782013893127, -0.6239720582962036, -0.5779659748077393, -0.5319598317146301, -0.485953688621521, -0.43994757533073425, -0.3939414620399475, -0.3479353189468384, -0.30192920565605164, -0.2559230923652649, -0.20991694927215576, -0.16391083598136902, -0.11790470778942108, -0.07189857959747314, -0.0258924663066864, 0.02011367678642273, 0.06611979007720947, 0.11212591826915741, 0.15813204646110535, 0.2041381597518921, 0.2501443028450012, 0.29615041613578796, 0.3421565294265747, 0.38816267251968384, 0.4341687858104706, 0.4801748991012573, 0.5261810421943665, 0.5721871852874756, 0.6181932687759399, 0.6641994118690491, 0.7102055549621582, 0.7562116384506226, 0.8022177815437317, 0.8482239246368408, 0.8942300081253052, 0.9402361512184143, 0.9862422943115234, 1.0322483777999878, 1.0782544612884521, 1.124260663986206, 1.1702667474746704, 1.2162728309631348, 1.2622790336608887, 1.308285117149353, 1.3542912006378174, 1.4002974033355713, 1.4463034868240356, 1.4923095703125, 1.538315773010254]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 11.0, 14.0, 24.0, 32.0, 29.0, 60.0, 85.0, 98.0, 151.0, 213.0, 335.0, 455.0, 757.0, 1058.0, 1775.0, 2787.0, 4700.0, 8160.0, 14775.0, 29853.0, 68487.0, 190056.0, 403697.0, 187652.0, 67843.0, 29967.0, 14956.0, 8102.0, 4692.0, 2755.0, 1687.0, 1082.0, 738.0, 447.0, 309.0, 205.0, 169.0, 97.0, 60.0, 56.0, 36.0, 25.0, 23.0, 10.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.2474365234375, -0.2395801544189453, -0.23172378540039062, -0.22386741638183594, -0.21601104736328125, -0.20815467834472656, -0.20029830932617188, -0.1924419403076172, -0.1845855712890625, -0.1767292022705078, -0.16887283325195312, -0.16101646423339844, -0.15316009521484375, -0.14530372619628906, -0.13744735717773438, -0.1295909881591797, -0.121734619140625, -0.11387825012207031, -0.10602188110351562, -0.09816551208496094, -0.09030914306640625, -0.08245277404785156, -0.07459640502929688, -0.06674003601074219, -0.0588836669921875, -0.05102729797363281, -0.043170928955078125, -0.03531455993652344, -0.02745819091796875, -0.019601821899414062, -0.011745452880859375, -0.0038890838623046875, 0.00396728515625, 0.011823654174804688, 0.019680023193359375, 0.027536392211914062, 0.03539276123046875, 0.04324913024902344, 0.051105499267578125, 0.05896186828613281, 0.0668182373046875, 0.07467460632324219, 0.08253097534179688, 0.09038734436035156, 0.09824371337890625, 0.10610008239746094, 0.11395645141601562, 0.12181282043457031, 0.129669189453125, 0.1375255584716797, 0.14538192749023438, 0.15323829650878906, 0.16109466552734375, 0.16895103454589844, 0.17680740356445312, 0.1846637725830078, 0.1925201416015625, 0.2003765106201172, 0.20823287963867188, 0.21608924865722656, 0.22394561767578125, 0.23180198669433594, 0.23965835571289062, 0.2475147247314453, 0.25537109375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 15.0, 18.0, 18.0, 18.0, 40.0, 43.0, 50.0, 58.0, 61.0, 65.0, 65.0, 63.0, 74.0, 70.0, 55.0, 59.0, 36.0, 42.0, 37.0, 21.0, 22.0, 20.0, 8.0, 6.0, 9.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.22412109375, -0.21869850158691406, -0.21327590942382812, -0.2078533172607422, -0.20243072509765625, -0.1970081329345703, -0.19158554077148438, -0.18616294860839844, -0.1807403564453125, -0.17531776428222656, -0.16989517211914062, -0.1644725799560547, -0.15904998779296875, -0.1536273956298828, -0.14820480346679688, -0.14278221130371094, -0.137359619140625, -0.13193702697753906, -0.12651443481445312, -0.12109184265136719, -0.11566925048828125, -0.11024665832519531, -0.10482406616210938, -0.09940147399902344, -0.0939788818359375, -0.08855628967285156, -0.08313369750976562, -0.07771110534667969, -0.07228851318359375, -0.06686592102050781, -0.061443328857421875, -0.05602073669433594, -0.05059814453125, -0.04517555236816406, -0.039752960205078125, -0.03433036804199219, -0.02890777587890625, -0.023485183715820312, -0.018062591552734375, -0.012639999389648438, -0.0072174072265625, -0.0017948150634765625, 0.003627777099609375, 0.009050369262695312, 0.01447296142578125, 0.019895553588867188, 0.025318145751953125, 0.030740737915039062, 0.036163330078125, 0.04158592224121094, 0.047008514404296875, 0.05243110656738281, 0.05785369873046875, 0.06327629089355469, 0.06869888305664062, 0.07412147521972656, 0.0795440673828125, 0.08496665954589844, 0.09038925170898438, 0.09581184387207031, 0.10123443603515625, 0.10665702819824219, 0.11207962036132812, 0.11750221252441406, 0.1229248046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 12.0, 9.0, 14.0, 19.0, 31.0, 35.0, 44.0, 71.0, 92.0, 146.0, 188.0, 331.0, 499.0, 869.0, 1621.0, 3403.0, 8548.0, 24844.0, 98805.0, 656414.0, 192052.0, 38542.0, 12223.0, 4744.0, 2105.0, 1111.0, 612.0, 339.0, 252.0, 165.0, 94.0, 79.0, 51.0, 51.0, 38.0, 18.0, 17.0, 14.0, 11.0, 5.0, 2.0, 5.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.431640625, -0.4180145263671875, -0.404388427734375, -0.3907623291015625, -0.37713623046875, -0.3635101318359375, -0.349884033203125, -0.3362579345703125, -0.3226318359375, -0.3090057373046875, -0.295379638671875, -0.2817535400390625, -0.26812744140625, -0.2545013427734375, -0.240875244140625, -0.2272491455078125, -0.213623046875, -0.1999969482421875, -0.186370849609375, -0.1727447509765625, -0.15911865234375, -0.1454925537109375, -0.131866455078125, -0.1182403564453125, -0.1046142578125, -0.0909881591796875, -0.077362060546875, -0.0637359619140625, -0.05010986328125, -0.0364837646484375, -0.022857666015625, -0.0092315673828125, 0.00439453125, 0.0180206298828125, 0.031646728515625, 0.0452728271484375, 0.05889892578125, 0.0725250244140625, 0.086151123046875, 0.0997772216796875, 0.1134033203125, 0.1270294189453125, 0.140655517578125, 0.1542816162109375, 0.16790771484375, 0.1815338134765625, 0.195159912109375, 0.2087860107421875, 0.222412109375, 0.2360382080078125, 0.249664306640625, 0.2632904052734375, 0.27691650390625, 0.2905426025390625, 0.304168701171875, 0.3177947998046875, 0.3314208984375, 0.3450469970703125, 0.358673095703125, 0.3722991943359375, 0.38592529296875, 0.3995513916015625, 0.413177490234375, 0.4268035888671875, 0.4404296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 21.0, 13.0, 15.0, 19.0, 24.0, 30.0, 28.0, 29.0, 38.0, 50.0, 51.0, 58.0, 62.0, 50.0, 47.0, 46.0, 58.0, 61.0, 49.0, 40.0, 41.0, 29.0, 29.0, 16.0, 12.0, 9.0, 8.0, 6.0, 7.0, 8.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.5829925537109375, -0.564910888671875, -0.5468292236328125, -0.52874755859375, -0.5106658935546875, -0.492584228515625, -0.4745025634765625, -0.4564208984375, -0.4383392333984375, -0.420257568359375, -0.4021759033203125, -0.38409423828125, -0.3660125732421875, -0.347930908203125, -0.3298492431640625, -0.311767578125, -0.2936859130859375, -0.275604248046875, -0.2575225830078125, -0.23944091796875, -0.2213592529296875, -0.203277587890625, -0.1851959228515625, -0.1671142578125, -0.1490325927734375, -0.130950927734375, -0.1128692626953125, -0.09478759765625, -0.0767059326171875, -0.058624267578125, -0.0405426025390625, -0.0224609375, -0.0043792724609375, 0.013702392578125, 0.0317840576171875, 0.04986572265625, 0.0679473876953125, 0.086029052734375, 0.1041107177734375, 0.1221923828125, 0.1402740478515625, 0.158355712890625, 0.1764373779296875, 0.19451904296875, 0.2126007080078125, 0.230682373046875, 0.2487640380859375, 0.266845703125, 0.2849273681640625, 0.303009033203125, 0.3210906982421875, 0.33917236328125, 0.3572540283203125, 0.375335693359375, 0.3934173583984375, 0.4114990234375, 0.4295806884765625, 0.447662353515625, 0.4657440185546875, 0.48382568359375, 0.5019073486328125, 0.519989013671875, 0.5380706787109375, 0.55615234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 9.0, 7.0, 13.0, 17.0, 18.0, 42.0, 105.0, 227.0, 552.0, 1737.0, 7587.0, 75188.0, 864464.0, 87383.0, 8246.0, 1856.0, 617.0, 245.0, 101.0, 54.0, 24.0, 21.0, 10.0, 6.0, 6.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40771484375, -0.3939056396484375, -0.380096435546875, -0.3662872314453125, -0.35247802734375, -0.3386688232421875, -0.324859619140625, -0.3110504150390625, -0.2972412109375, -0.2834320068359375, -0.269622802734375, -0.2558135986328125, -0.24200439453125, -0.2281951904296875, -0.214385986328125, -0.2005767822265625, -0.186767578125, -0.1729583740234375, -0.159149169921875, -0.1453399658203125, -0.13153076171875, -0.1177215576171875, -0.103912353515625, -0.0901031494140625, -0.0762939453125, -0.0624847412109375, -0.048675537109375, -0.0348663330078125, -0.02105712890625, -0.0072479248046875, 0.006561279296875, 0.0203704833984375, 0.0341796875, 0.0479888916015625, 0.061798095703125, 0.0756072998046875, 0.08941650390625, 0.1032257080078125, 0.117034912109375, 0.1308441162109375, 0.1446533203125, 0.1584625244140625, 0.172271728515625, 0.1860809326171875, 0.19989013671875, 0.2136993408203125, 0.227508544921875, 0.2413177490234375, 0.255126953125, 0.2689361572265625, 0.282745361328125, 0.2965545654296875, 0.31036376953125, 0.3241729736328125, 0.337982177734375, 0.3517913818359375, 0.3656005859375, 0.3794097900390625, 0.393218994140625, 0.4070281982421875, 0.42083740234375, 0.4346466064453125, 0.448455810546875, 0.4622650146484375, 0.47607421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 7.0, 10.0, 8.0, 9.0, 23.0, 25.0, 41.0, 60.0, 69.0, 93.0, 117.0, 123.0, 102.0, 71.0, 63.0, 43.0, 30.0, 31.0, 19.0, 13.0, 6.0, 4.0, 5.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.900859832763672e-05, -5.699321627616882e-05, -5.497783422470093e-05, -5.296245217323303e-05, -5.094707012176514e-05, -4.893168807029724e-05, -4.6916306018829346e-05, -4.490092396736145e-05, -4.2885541915893555e-05, -4.087015986442566e-05, -3.8854777812957764e-05, -3.683939576148987e-05, -3.482401371002197e-05, -3.280863165855408e-05, -3.079324960708618e-05, -2.8777867555618286e-05, -2.676248550415039e-05, -2.4747103452682495e-05, -2.27317214012146e-05, -2.0716339349746704e-05, -1.870095729827881e-05, -1.6685575246810913e-05, -1.4670193195343018e-05, -1.2654811143875122e-05, -1.0639429092407227e-05, -8.624047040939331e-06, -6.6086649894714355e-06, -4.59328293800354e-06, -2.5779008865356445e-06, -5.62518835067749e-07, 1.4528632164001465e-06, 3.468245267868042e-06, 5.4836273193359375e-06, 7.499009370803833e-06, 9.514391422271729e-06, 1.1529773473739624e-05, 1.354515552520752e-05, 1.5560537576675415e-05, 1.757591962814331e-05, 1.9591301679611206e-05, 2.16066837310791e-05, 2.3622065782546997e-05, 2.5637447834014893e-05, 2.7652829885482788e-05, 2.9668211936950684e-05, 3.168359398841858e-05, 3.3698976039886475e-05, 3.571435809135437e-05, 3.7729740142822266e-05, 3.974512219429016e-05, 4.176050424575806e-05, 4.377588629722595e-05, 4.579126834869385e-05, 4.780665040016174e-05, 4.982203245162964e-05, 5.1837414503097534e-05, 5.385279655456543e-05, 5.5868178606033325e-05, 5.788356065750122e-05, 5.9898942708969116e-05, 6.191432476043701e-05, 6.392970681190491e-05, 6.59450888633728e-05, 6.79604709148407e-05, 6.99758529663086e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 7.0, 6.0, 15.0, 16.0, 30.0, 24.0, 45.0, 68.0, 124.0, 180.0, 271.0, 490.0, 1007.0, 2215.0, 6206.0, 22785.0, 143713.0, 706437.0, 133068.0, 21515.0, 6052.0, 2073.0, 952.0, 486.0, 258.0, 165.0, 100.0, 87.0, 33.0, 35.0, 16.0, 22.0, 14.0, 8.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.283203125, -0.2754402160644531, -0.26767730712890625, -0.2599143981933594, -0.2521514892578125, -0.24438858032226562, -0.23662567138671875, -0.22886276245117188, -0.221099853515625, -0.21333694458007812, -0.20557403564453125, -0.19781112670898438, -0.1900482177734375, -0.18228530883789062, -0.17452239990234375, -0.16675949096679688, -0.15899658203125, -0.15123367309570312, -0.14347076416015625, -0.13570785522460938, -0.1279449462890625, -0.12018203735351562, -0.11241912841796875, -0.10465621948242188, -0.096893310546875, -0.08913040161132812, -0.08136749267578125, -0.07360458374023438, -0.0658416748046875, -0.058078765869140625, -0.05031585693359375, -0.042552947998046875, -0.0347900390625, -0.027027130126953125, -0.01926422119140625, -0.011501312255859375, -0.0037384033203125, 0.004024505615234375, 0.01178741455078125, 0.019550323486328125, 0.027313232421875, 0.035076141357421875, 0.04283905029296875, 0.050601959228515625, 0.0583648681640625, 0.06612777709960938, 0.07389068603515625, 0.08165359497070312, 0.08941650390625, 0.09717941284179688, 0.10494232177734375, 0.11270523071289062, 0.1204681396484375, 0.12823104858398438, 0.13599395751953125, 0.14375686645507812, 0.151519775390625, 0.15928268432617188, 0.16704559326171875, 0.17480850219726562, 0.1825714111328125, 0.19033432006835938, 0.19809722900390625, 0.20586013793945312, 0.213623046875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 3.0, 8.0, 10.0, 18.0, 20.0, 24.0, 40.0, 39.0, 57.0, 47.0, 68.0, 96.0, 88.0, 79.0, 81.0, 59.0, 49.0, 47.0, 34.0, 24.0, 18.0, 12.0, 12.0, 7.0, 9.0, 7.0, 5.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.2423095703125, -0.2360210418701172, -0.22973251342773438, -0.22344398498535156, -0.21715545654296875, -0.21086692810058594, -0.20457839965820312, -0.1982898712158203, -0.1920013427734375, -0.1857128143310547, -0.17942428588867188, -0.17313575744628906, -0.16684722900390625, -0.16055870056152344, -0.15427017211914062, -0.1479816436767578, -0.141693115234375, -0.1354045867919922, -0.12911605834960938, -0.12282752990722656, -0.11653900146484375, -0.11025047302246094, -0.10396194458007812, -0.09767341613769531, -0.0913848876953125, -0.08509635925292969, -0.07880783081054688, -0.07251930236816406, -0.06623077392578125, -0.05994224548339844, -0.053653717041015625, -0.04736518859863281, -0.04107666015625, -0.03478813171386719, -0.028499603271484375, -0.022211074829101562, -0.01592254638671875, -0.009634017944335938, -0.003345489501953125, 0.0029430389404296875, 0.0092315673828125, 0.015520095825195312, 0.021808624267578125, 0.028097152709960938, 0.03438568115234375, 0.04067420959472656, 0.046962738037109375, 0.05325126647949219, 0.059539794921875, 0.06582832336425781, 0.07211685180664062, 0.07840538024902344, 0.08469390869140625, 0.09098243713378906, 0.09727096557617188, 0.10355949401855469, 0.1098480224609375, 0.11613655090332031, 0.12242507934570312, 0.12871360778808594, 0.13500213623046875, 0.14129066467285156, 0.14757919311523438, 0.1538677215576172, 0.16015625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 10.0, 13.0, 20.0, 48.0, 60.0, 96.0, 118.0, 157.0, 140.0, 115.0, 70.0, 55.0, 31.0, 19.0, 15.0, 8.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.539969444274902, -4.439096927642822, -4.338224411010742, -4.237351894378662, -4.136479377746582, -4.035606861114502, -3.934734582901001, -3.833862066268921, -3.732989549636841, -3.6321170330047607, -3.5312445163726807, -3.4303722381591797, -3.3294997215270996, -3.2286272048950195, -3.1277546882629395, -3.0268821716308594, -2.9260096549987793, -2.825137138366699, -2.724264621734619, -2.623392105102539, -2.522519826889038, -2.421647310256958, -2.320774793624878, -2.219902276992798, -2.119029998779297, -2.018157482147217, -1.9172850847244263, -1.8164125680923462, -1.7155400514602661, -1.6146676540374756, -1.5137951374053955, -1.4129226207733154, -1.3120501041412354, -1.2111775875091553, -1.1103051900863647, -1.0094326734542847, -0.9085601568222046, -0.8076876997947693, -0.706815242767334, -0.6059427261352539, -0.5050702691078186, -0.4041977822780609, -0.3033252954483032, -0.20245283842086792, -0.10158035159111023, -0.0007078647613525391, 0.10016459226608276, 0.20103710889816284, 0.30190956592559814, 0.40278205275535583, 0.5036545395851135, 0.6045269966125488, 0.7053995132446289, 0.8062719702720642, 0.9071444272994995, 1.0080169439315796, 1.1088893413543701, 1.2097618579864502, 1.3106342554092407, 1.4115067720413208, 1.5123792886734009, 1.6132516860961914, 1.7141242027282715, 1.8149967193603516, 1.9158692359924316]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 9.0, 9.0, 13.0, 20.0, 19.0, 18.0, 16.0, 22.0, 21.0, 28.0, 26.0, 33.0, 30.0, 38.0, 47.0, 42.0, 49.0, 46.0, 43.0, 41.0, 44.0, 44.0, 31.0, 33.0, 36.0, 26.0, 18.0, 26.0, 31.0, 15.0, 21.0, 17.0, 11.0, 11.0, 12.0, 4.0, 11.0, 3.0, 7.0, 1.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-1.971482753753662, -1.9116636514663696, -1.8518446683883667, -1.7920255661010742, -1.7322065830230713, -1.6723874807357788, -1.6125683784484863, -1.5527493953704834, -1.4929304122924805, -1.433111310005188, -1.373292326927185, -1.3134732246398926, -1.2536542415618896, -1.1938351392745972, -1.1340160369873047, -1.0741970539093018, -1.0143779516220093, -0.9545589089393616, -0.8947398662567139, -0.8349207639694214, -0.7751017808914185, -0.715282678604126, -0.6554636359214783, -0.5956445932388306, -0.5358255505561829, -0.47600650787353516, -0.41618746519088745, -0.35636839270591736, -0.29654935002326965, -0.23673030734062195, -0.17691123485565186, -0.11709219217300415, -0.057273030281066895, 0.0025460198521614075, 0.06236506998538971, 0.12218412756919861, 0.1820031702518463, 0.24182221293449402, 0.3016412854194641, 0.3614603281021118, 0.4212793707847595, 0.4810984134674072, 0.5409174561500549, 0.6007364988327026, 0.6605556011199951, 0.720374584197998, 0.7801936864852905, 0.8400127291679382, 0.8998317718505859, 0.9596508145332336, 1.0194698572158813, 1.0792889595031738, 1.1391079425811768, 1.1989270448684692, 1.2587461471557617, 1.3185651302337646, 1.3783841133117676, 1.43820321559906, 1.498022198677063, 1.5578413009643555, 1.6176602840423584, 1.6774793863296509, 1.7372984886169434, 1.7971174716949463, 1.8569365739822388]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 12.0, 15.0, 22.0, 32.0, 42.0, 76.0, 117.0, 171.0, 319.0, 417.0, 704.0, 1192.0, 1962.0, 3469.0, 6523.0, 12811.0, 29526.0, 84100.0, 374297.0, 2225782.0, 1167311.0, 189165.0, 53749.0, 20990.0, 9645.0, 5053.0, 2709.0, 1534.0, 954.0, 561.0, 374.0, 232.0, 164.0, 91.0, 55.0, 42.0, 27.0, 12.0, 14.0, 4.0, 4.0, 1.0, 3.0], "bins": [-0.26953125, -0.2629241943359375, -0.256317138671875, -0.2497100830078125, -0.24310302734375, -0.2364959716796875, -0.229888916015625, -0.2232818603515625, -0.2166748046875, -0.2100677490234375, -0.203460693359375, -0.1968536376953125, -0.19024658203125, -0.1836395263671875, -0.177032470703125, -0.1704254150390625, -0.163818359375, -0.1572113037109375, -0.150604248046875, -0.1439971923828125, -0.13739013671875, -0.1307830810546875, -0.124176025390625, -0.1175689697265625, -0.1109619140625, -0.1043548583984375, -0.097747802734375, -0.0911407470703125, -0.08453369140625, -0.0779266357421875, -0.071319580078125, -0.0647125244140625, -0.05810546875, -0.0514984130859375, -0.044891357421875, -0.0382843017578125, -0.03167724609375, -0.0250701904296875, -0.018463134765625, -0.0118560791015625, -0.0052490234375, 0.0013580322265625, 0.007965087890625, 0.0145721435546875, 0.02117919921875, 0.0277862548828125, 0.034393310546875, 0.0410003662109375, 0.047607421875, 0.0542144775390625, 0.060821533203125, 0.0674285888671875, 0.07403564453125, 0.0806427001953125, 0.087249755859375, 0.0938568115234375, 0.1004638671875, 0.1070709228515625, 0.113677978515625, 0.1202850341796875, 0.12689208984375, 0.1334991455078125, 0.140106201171875, 0.1467132568359375, 0.1533203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 10.0, 11.0, 13.0, 24.0, 33.0, 22.0, 39.0, 44.0, 51.0, 41.0, 55.0, 60.0, 55.0, 60.0, 53.0, 58.0, 48.0, 39.0, 47.0, 45.0, 32.0, 25.0, 29.0, 15.0, 21.0, 18.0, 12.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1490478515625, -0.14482784271240234, -0.1406078338623047, -0.13638782501220703, -0.13216781616210938, -0.12794780731201172, -0.12372779846191406, -0.1195077896118164, -0.11528778076171875, -0.1110677719116211, -0.10684776306152344, -0.10262775421142578, -0.09840774536132812, -0.09418773651123047, -0.08996772766113281, -0.08574771881103516, -0.0815277099609375, -0.07730770111083984, -0.07308769226074219, -0.06886768341064453, -0.06464767456054688, -0.06042766571044922, -0.05620765686035156, -0.051987648010253906, -0.04776763916015625, -0.043547630310058594, -0.03932762145996094, -0.03510761260986328, -0.030887603759765625, -0.02666759490966797, -0.022447586059570312, -0.018227577209472656, -0.014007568359375, -0.009787559509277344, -0.0055675506591796875, -0.0013475418090820312, 0.002872467041015625, 0.007092475891113281, 0.011312484741210938, 0.015532493591308594, 0.01975250244140625, 0.023972511291503906, 0.028192520141601562, 0.03241252899169922, 0.036632537841796875, 0.04085254669189453, 0.04507255554199219, 0.049292564392089844, 0.0535125732421875, 0.057732582092285156, 0.06195259094238281, 0.06617259979248047, 0.07039260864257812, 0.07461261749267578, 0.07883262634277344, 0.0830526351928711, 0.08727264404296875, 0.0914926528930664, 0.09571266174316406, 0.09993267059326172, 0.10415267944335938, 0.10837268829345703, 0.11259269714355469, 0.11681270599365234, 0.12103271484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 11.0, 6.0, 8.0, 20.0, 21.0, 40.0, 75.0, 117.0, 226.0, 417.0, 980.0, 2549.0, 7829.0, 31170.0, 184446.0, 2961484.0, 898544.0, 81404.0, 16999.0, 4849.0, 1732.0, 665.0, 287.0, 143.0, 96.0, 54.0, 34.0, 22.0, 11.0, 8.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.515625, -0.5016098022460938, -0.4875946044921875, -0.47357940673828125, -0.459564208984375, -0.44554901123046875, -0.4315338134765625, -0.41751861572265625, -0.40350341796875, -0.38948822021484375, -0.3754730224609375, -0.36145782470703125, -0.347442626953125, -0.33342742919921875, -0.3194122314453125, -0.30539703369140625, -0.2913818359375, -0.27736663818359375, -0.2633514404296875, -0.24933624267578125, -0.235321044921875, -0.22130584716796875, -0.2072906494140625, -0.19327545166015625, -0.17926025390625, -0.16524505615234375, -0.1512298583984375, -0.13721466064453125, -0.123199462890625, -0.10918426513671875, -0.0951690673828125, -0.08115386962890625, -0.067138671875, -0.05312347412109375, -0.0391082763671875, -0.02509307861328125, -0.011077880859375, 0.00293731689453125, 0.0169525146484375, 0.03096771240234375, 0.04498291015625, 0.05899810791015625, 0.0730133056640625, 0.08702850341796875, 0.101043701171875, 0.11505889892578125, 0.1290740966796875, 0.14308929443359375, 0.1571044921875, 0.17111968994140625, 0.1851348876953125, 0.19915008544921875, 0.213165283203125, 0.22718048095703125, 0.2411956787109375, 0.25521087646484375, 0.26922607421875, 0.28324127197265625, 0.2972564697265625, 0.31127166748046875, 0.325286865234375, 0.33930206298828125, 0.3533172607421875, 0.36733245849609375, 0.38134765625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 9.0, 10.0, 10.0, 20.0, 27.0, 30.0, 34.0, 44.0, 60.0, 83.0, 124.0, 182.0, 277.0, 476.0, 666.0, 668.0, 453.0, 271.0, 187.0, 114.0, 83.0, 61.0, 42.0, 31.0, 27.0, 11.0, 16.0, 8.0, 12.0, 7.0, 5.0, 7.0, 5.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37744140625, -0.36522674560546875, -0.3530120849609375, -0.34079742431640625, -0.328582763671875, -0.31636810302734375, -0.3041534423828125, -0.29193878173828125, -0.27972412109375, -0.26750946044921875, -0.2552947998046875, -0.24308013916015625, -0.230865478515625, -0.21865081787109375, -0.2064361572265625, -0.19422149658203125, -0.1820068359375, -0.16979217529296875, -0.1575775146484375, -0.14536285400390625, -0.133148193359375, -0.12093353271484375, -0.1087188720703125, -0.09650421142578125, -0.08428955078125, -0.07207489013671875, -0.0598602294921875, -0.04764556884765625, -0.035430908203125, -0.02321624755859375, -0.0110015869140625, 0.00121307373046875, 0.013427734375, 0.02564239501953125, 0.0378570556640625, 0.05007171630859375, 0.062286376953125, 0.07450103759765625, 0.0867156982421875, 0.09893035888671875, 0.11114501953125, 0.12335968017578125, 0.1355743408203125, 0.14778900146484375, 0.160003662109375, 0.17221832275390625, 0.1844329833984375, 0.19664764404296875, 0.2088623046875, 0.22107696533203125, 0.2332916259765625, 0.24550628662109375, 0.257720947265625, 0.26993560791015625, 0.2821502685546875, 0.29436492919921875, 0.30657958984375, 0.31879425048828125, 0.3310089111328125, 0.34322357177734375, 0.355438232421875, 0.36765289306640625, 0.3798675537109375, 0.39208221435546875, 0.404296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 10.0, 16.0, 12.0, 64.0, 123.0, 236.0, 244.0, 151.0, 66.0, 41.0, 13.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.866659164428711, -7.679159164428711, -7.491659641265869, -7.304160118103027, -7.116660118103027, -6.929160118103027, -6.7416605949401855, -6.554161071777344, -6.366661071777344, -6.179161071777344, -5.991661548614502, -5.80416202545166, -5.61666202545166, -5.42916202545166, -5.241662502288818, -5.054162979125977, -4.866662979125977, -4.679162979125977, -4.491663455963135, -4.304163932800293, -4.116663932800293, -3.929164171218872, -3.741664409637451, -3.5541646480560303, -3.3666648864746094, -3.1791651248931885, -2.9916653633117676, -2.8041656017303467, -2.616665840148926, -2.429166078567505, -2.241666316986084, -2.054166555404663, -1.8666667938232422, -1.6791670322418213, -1.4916672706604004, -1.3041675090789795, -1.1166677474975586, -0.9291679859161377, -0.7416682243347168, -0.5541684627532959, -0.366668701171875, -0.1791689395904541, 0.008330821990966797, 0.1958305835723877, 0.3833303451538086, 0.5708301067352295, 0.7583298683166504, 0.9458296298980713, 1.1333293914794922, 1.320829153060913, 1.508328914642334, 1.6958286762237549, 1.8833284378051758, 2.0708281993865967, 2.2583279609680176, 2.4458277225494385, 2.6333274841308594, 2.8208272457122803, 3.008327007293701, 3.195826768875122, 3.383326530456543, 3.570826292037964, 3.7583260536193848, 3.9458258152008057, 4.133325576782227]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 12.0, 15.0, 16.0, 22.0, 23.0, 26.0, 26.0, 33.0, 32.0, 40.0, 45.0, 42.0, 42.0, 52.0, 49.0, 45.0, 49.0, 50.0, 53.0, 52.0, 37.0, 31.0, 28.0, 38.0, 24.0, 29.0, 13.0, 16.0, 9.0, 14.0, 9.0, 4.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.54189133644104, -2.473738670349121, -2.405586004257202, -2.337433338165283, -2.2692806720733643, -2.2011280059814453, -2.1329753398895264, -2.0648226737976074, -1.996670126914978, -1.928517460823059, -1.8603647947311401, -1.7922121286392212, -1.7240595817565918, -1.6559069156646729, -1.587754249572754, -1.519601583480835, -1.451448917388916, -1.383296251296997, -1.3151435852050781, -1.2469909191131592, -1.1788382530212402, -1.1106855869293213, -1.042533040046692, -0.974380373954773, -0.906227707862854, -0.8380750417709351, -0.7699223756790161, -0.7017697691917419, -0.633617103099823, -0.565464437007904, -0.4973118007183075, -0.42915916442871094, -0.3610062599182129, -0.29285359382629395, -0.2247009575366974, -0.15654830634593964, -0.08839565515518188, -0.02024298906326294, 0.04790964722633362, 0.11606228351593018, 0.18421494960784912, 0.25236761569976807, 0.3205202519893646, 0.3886728882789612, 0.4568255543708801, 0.5249782204627991, 0.5931308269500732, 0.6612834930419922, 0.7294361591339111, 0.7975888252258301, 0.865741491317749, 0.9338940978050232, 1.002046823501587, 1.0701994895935059, 1.1383520364761353, 1.2065047025680542, 1.2746573686599731, 1.342810034751892, 1.410962700843811, 1.47911536693573, 1.5472679138183594, 1.6154205799102783, 1.6835732460021973, 1.7517259120941162, 1.8198785781860352]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 5.0, 16.0, 20.0, 30.0, 32.0, 62.0, 90.0, 136.0, 193.0, 252.0, 409.0, 681.0, 966.0, 1451.0, 2437.0, 3995.0, 6966.0, 11797.0, 21835.0, 41057.0, 80007.0, 167887.0, 312523.0, 197987.0, 92835.0, 46604.0, 25000.0, 13607.0, 7663.0, 4436.0, 2740.0, 1681.0, 1066.0, 714.0, 451.0, 301.0, 212.0, 143.0, 68.0, 54.0, 42.0, 29.0, 27.0, 15.0, 13.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.220947265625, -0.2137279510498047, -0.20650863647460938, -0.19928932189941406, -0.19207000732421875, -0.18485069274902344, -0.17763137817382812, -0.1704120635986328, -0.1631927490234375, -0.1559734344482422, -0.14875411987304688, -0.14153480529785156, -0.13431549072265625, -0.12709617614746094, -0.11987686157226562, -0.11265754699707031, -0.105438232421875, -0.09821891784667969, -0.09099960327148438, -0.08378028869628906, -0.07656097412109375, -0.06934165954589844, -0.062122344970703125, -0.05490303039550781, -0.0476837158203125, -0.04046440124511719, -0.033245086669921875, -0.026025772094726562, -0.01880645751953125, -0.011587142944335938, -0.004367828369140625, 0.0028514862060546875, 0.01007080078125, 0.017290115356445312, 0.024509429931640625, 0.03172874450683594, 0.03894805908203125, 0.04616737365722656, 0.053386688232421875, 0.06060600280761719, 0.0678253173828125, 0.07504463195800781, 0.08226394653320312, 0.08948326110839844, 0.09670257568359375, 0.10392189025878906, 0.11114120483398438, 0.11836051940917969, 0.125579833984375, 0.1327991485595703, 0.14001846313476562, 0.14723777770996094, 0.15445709228515625, 0.16167640686035156, 0.16889572143554688, 0.1761150360107422, 0.1833343505859375, 0.1905536651611328, 0.19777297973632812, 0.20499229431152344, 0.21221160888671875, 0.21943092346191406, 0.22665023803710938, 0.2338695526123047, 0.2410888671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 10.0, 13.0, 12.0, 12.0, 14.0, 18.0, 17.0, 28.0, 32.0, 35.0, 43.0, 41.0, 45.0, 50.0, 58.0, 48.0, 39.0, 65.0, 35.0, 41.0, 48.0, 51.0, 57.0, 43.0, 20.0, 16.0, 22.0, 22.0, 13.0, 15.0, 11.0, 11.0, 5.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11138916015625, -0.10715198516845703, -0.10291481018066406, -0.0986776351928711, -0.09444046020507812, -0.09020328521728516, -0.08596611022949219, -0.08172893524169922, -0.07749176025390625, -0.07325458526611328, -0.06901741027832031, -0.06478023529052734, -0.060543060302734375, -0.056305885314941406, -0.05206871032714844, -0.04783153533935547, -0.0435943603515625, -0.03935718536376953, -0.03512001037597656, -0.030882835388183594, -0.026645660400390625, -0.022408485412597656, -0.018171310424804688, -0.013934135437011719, -0.00969696044921875, -0.005459785461425781, -0.0012226104736328125, 0.0030145645141601562, 0.007251739501953125, 0.011488914489746094, 0.015726089477539062, 0.01996326446533203, 0.024200439453125, 0.02843761444091797, 0.03267478942871094, 0.036911964416503906, 0.041149139404296875, 0.045386314392089844, 0.04962348937988281, 0.05386066436767578, 0.05809783935546875, 0.06233501434326172, 0.06657218933105469, 0.07080936431884766, 0.07504653930664062, 0.0792837142944336, 0.08352088928222656, 0.08775806427001953, 0.0919952392578125, 0.09623241424560547, 0.10046958923339844, 0.1047067642211914, 0.10894393920898438, 0.11318111419677734, 0.11741828918457031, 0.12165546417236328, 0.12589263916015625, 0.13012981414794922, 0.1343669891357422, 0.13860416412353516, 0.14284133911132812, 0.1470785140991211, 0.15131568908691406, 0.15555286407470703, 0.1597900390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 8.0, 4.0, 20.0, 17.0, 22.0, 38.0, 36.0, 39.0, 64.0, 87.0, 130.0, 172.0, 240.0, 320.0, 537.0, 839.0, 1409.0, 2575.0, 5433.0, 15115.0, 58780.0, 491457.0, 389110.0, 55641.0, 14581.0, 5482.0, 2491.0, 1378.0, 766.0, 554.0, 310.0, 258.0, 179.0, 122.0, 89.0, 75.0, 44.0, 31.0, 33.0, 19.0, 8.0, 12.0, 14.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0], "bins": [-0.58349609375, -0.567718505859375, -0.55194091796875, -0.536163330078125, -0.5203857421875, -0.504608154296875, -0.48883056640625, -0.473052978515625, -0.457275390625, -0.441497802734375, -0.42572021484375, -0.409942626953125, -0.3941650390625, -0.378387451171875, -0.36260986328125, -0.346832275390625, -0.3310546875, -0.315277099609375, -0.29949951171875, -0.283721923828125, -0.2679443359375, -0.252166748046875, -0.23638916015625, -0.220611572265625, -0.204833984375, -0.189056396484375, -0.17327880859375, -0.157501220703125, -0.1417236328125, -0.125946044921875, -0.11016845703125, -0.094390869140625, -0.07861328125, -0.062835693359375, -0.04705810546875, -0.031280517578125, -0.0155029296875, 0.000274658203125, 0.01605224609375, 0.031829833984375, 0.047607421875, 0.063385009765625, 0.07916259765625, 0.094940185546875, 0.1107177734375, 0.126495361328125, 0.14227294921875, 0.158050537109375, 0.173828125, 0.189605712890625, 0.20538330078125, 0.221160888671875, 0.2369384765625, 0.252716064453125, 0.26849365234375, 0.284271240234375, 0.300048828125, 0.315826416015625, 0.33160400390625, 0.347381591796875, 0.3631591796875, 0.378936767578125, 0.39471435546875, 0.410491943359375, 0.42626953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 10.0, 7.0, 9.0, 14.0, 7.0, 23.0, 20.0, 21.0, 25.0, 35.0, 37.0, 48.0, 44.0, 31.0, 40.0, 38.0, 55.0, 48.0, 49.0, 40.0, 46.0, 40.0, 48.0, 40.0, 37.0, 28.0, 26.0, 29.0, 19.0, 16.0, 12.0, 9.0, 8.0, 12.0, 4.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59033203125, -0.5719680786132812, -0.5536041259765625, -0.5352401733398438, -0.516876220703125, -0.49851226806640625, -0.4801483154296875, -0.46178436279296875, -0.44342041015625, -0.42505645751953125, -0.4066925048828125, -0.38832855224609375, -0.369964599609375, -0.35160064697265625, -0.3332366943359375, -0.31487274169921875, -0.2965087890625, -0.27814483642578125, -0.2597808837890625, -0.24141693115234375, -0.223052978515625, -0.20468902587890625, -0.1863250732421875, -0.16796112060546875, -0.14959716796875, -0.13123321533203125, -0.1128692626953125, -0.09450531005859375, -0.076141357421875, -0.05777740478515625, -0.0394134521484375, -0.02104949951171875, -0.002685546875, 0.01567840576171875, 0.0340423583984375, 0.05240631103515625, 0.070770263671875, 0.08913421630859375, 0.1074981689453125, 0.12586212158203125, 0.14422607421875, 0.16259002685546875, 0.1809539794921875, 0.19931793212890625, 0.217681884765625, 0.23604583740234375, 0.2544097900390625, 0.27277374267578125, 0.2911376953125, 0.30950164794921875, 0.3278656005859375, 0.34622955322265625, 0.364593505859375, 0.38295745849609375, 0.4013214111328125, 0.41968536376953125, 0.43804931640625, 0.45641326904296875, 0.4747772216796875, 0.49314117431640625, 0.511505126953125, 0.5298690795898438, 0.5482330322265625, 0.5665969848632812, 0.5849609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 11.0, 10.0, 7.0, 17.0, 42.0, 51.0, 104.0, 146.0, 329.0, 652.0, 1443.0, 4244.0, 16462.0, 88921.0, 657308.0, 230269.0, 36202.0, 8079.0, 2436.0, 939.0, 392.0, 201.0, 106.0, 57.0, 45.0, 15.0, 18.0, 16.0, 7.0, 4.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2216796875, -0.21511077880859375, -0.2085418701171875, -0.20197296142578125, -0.195404052734375, -0.18883514404296875, -0.1822662353515625, -0.17569732666015625, -0.16912841796875, -0.16255950927734375, -0.1559906005859375, -0.14942169189453125, -0.142852783203125, -0.13628387451171875, -0.1297149658203125, -0.12314605712890625, -0.1165771484375, -0.11000823974609375, -0.1034393310546875, -0.09687042236328125, -0.090301513671875, -0.08373260498046875, -0.0771636962890625, -0.07059478759765625, -0.06402587890625, -0.05745697021484375, -0.0508880615234375, -0.04431915283203125, -0.037750244140625, -0.03118133544921875, -0.0246124267578125, -0.01804351806640625, -0.011474609375, -0.00490570068359375, 0.0016632080078125, 0.00823211669921875, 0.014801025390625, 0.02136993408203125, 0.0279388427734375, 0.03450775146484375, 0.04107666015625, 0.04764556884765625, 0.0542144775390625, 0.06078338623046875, 0.067352294921875, 0.07392120361328125, 0.0804901123046875, 0.08705902099609375, 0.0936279296875, 0.10019683837890625, 0.1067657470703125, 0.11333465576171875, 0.119903564453125, 0.12647247314453125, 0.1330413818359375, 0.13961029052734375, 0.14617919921875, 0.15274810791015625, 0.1593170166015625, 0.16588592529296875, 0.172454833984375, 0.17902374267578125, 0.1855926513671875, 0.19216156005859375, 0.19873046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 7.0, 10.0, 7.0, 10.0, 5.0, 15.0, 15.0, 15.0, 28.0, 21.0, 31.0, 39.0, 47.0, 57.0, 68.0, 77.0, 100.0, 70.0, 61.0, 49.0, 46.0, 33.0, 36.0, 32.0, 18.0, 16.0, 15.0, 13.0, 8.0, 13.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.857778549194336e-05, -4.704948514699936e-05, -4.552118480205536e-05, -4.399288445711136e-05, -4.246458411216736e-05, -4.093628376722336e-05, -3.940798342227936e-05, -3.787968307733536e-05, -3.635138273239136e-05, -3.482308238744736e-05, -3.329478204250336e-05, -3.176648169755936e-05, -3.0238181352615356e-05, -2.8709881007671356e-05, -2.7181580662727356e-05, -2.5653280317783356e-05, -2.4124979972839355e-05, -2.2596679627895355e-05, -2.1068379282951355e-05, -1.9540078938007355e-05, -1.8011778593063354e-05, -1.6483478248119354e-05, -1.4955177903175354e-05, -1.3426877558231354e-05, -1.1898577213287354e-05, -1.0370276868343353e-05, -8.841976523399353e-06, -7.313676178455353e-06, -5.7853758335113525e-06, -4.257075488567352e-06, -2.728775143623352e-06, -1.2004747986793518e-06, 3.2782554626464844e-07, 1.8561258912086487e-06, 3.384426236152649e-06, 4.912726581096649e-06, 6.441026926040649e-06, 7.96932727098465e-06, 9.49762761592865e-06, 1.102592796087265e-05, 1.255422830581665e-05, 1.408252865076065e-05, 1.561082899570465e-05, 1.713912934064865e-05, 1.866742968559265e-05, 2.019573003053665e-05, 2.1724030375480652e-05, 2.3252330720424652e-05, 2.4780631065368652e-05, 2.6308931410312653e-05, 2.7837231755256653e-05, 2.9365532100200653e-05, 3.089383244514465e-05, 3.2422132790088654e-05, 3.3950433135032654e-05, 3.5478733479976654e-05, 3.7007033824920654e-05, 3.8535334169864655e-05, 4.0063634514808655e-05, 4.1591934859752655e-05, 4.3120235204696655e-05, 4.4648535549640656e-05, 4.6176835894584656e-05, 4.7705136239528656e-05, 4.9233436584472656e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 11.0, 18.0, 30.0, 52.0, 95.0, 185.0, 332.0, 769.0, 1861.0, 5715.0, 29937.0, 367690.0, 593314.0, 37961.0, 6715.0, 2160.0, 865.0, 414.0, 224.0, 99.0, 45.0, 35.0, 13.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.184326171875, -0.17633056640625, -0.1683349609375, -0.16033935546875, -0.15234375, -0.14434814453125, -0.1363525390625, -0.12835693359375, -0.120361328125, -0.11236572265625, -0.1043701171875, -0.09637451171875, -0.08837890625, -0.08038330078125, -0.0723876953125, -0.06439208984375, -0.056396484375, -0.04840087890625, -0.0404052734375, -0.03240966796875, -0.0244140625, -0.01641845703125, -0.0084228515625, -0.00042724609375, 0.007568359375, 0.01556396484375, 0.0235595703125, 0.03155517578125, 0.03955078125, 0.04754638671875, 0.0555419921875, 0.06353759765625, 0.071533203125, 0.07952880859375, 0.0875244140625, 0.09552001953125, 0.103515625, 0.11151123046875, 0.1195068359375, 0.12750244140625, 0.135498046875, 0.14349365234375, 0.1514892578125, 0.15948486328125, 0.16748046875, 0.17547607421875, 0.1834716796875, 0.19146728515625, 0.199462890625, 0.20745849609375, 0.2154541015625, 0.22344970703125, 0.2314453125, 0.23944091796875, 0.2474365234375, 0.25543212890625, 0.263427734375, 0.27142333984375, 0.2794189453125, 0.28741455078125, 0.29541015625, 0.30340576171875, 0.3114013671875, 0.31939697265625, 0.327392578125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 7.0, 3.0, 7.0, 6.0, 7.0, 15.0, 13.0, 14.0, 8.0, 16.0, 20.0, 25.0, 33.0, 31.0, 38.0, 39.0, 44.0, 54.0, 65.0, 62.0, 53.0, 57.0, 46.0, 45.0, 46.0, 44.0, 27.0, 30.0, 21.0, 25.0, 17.0, 16.0, 19.0, 14.0, 8.0, 3.0, 5.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1414794921875, -0.13768291473388672, -0.13388633728027344, -0.13008975982666016, -0.12629318237304688, -0.1224966049194336, -0.11870002746582031, -0.11490345001220703, -0.11110687255859375, -0.10731029510498047, -0.10351371765136719, -0.0997171401977539, -0.09592056274414062, -0.09212398529052734, -0.08832740783691406, -0.08453083038330078, -0.0807342529296875, -0.07693767547607422, -0.07314109802246094, -0.06934452056884766, -0.06554794311523438, -0.061751365661621094, -0.05795478820800781, -0.05415821075439453, -0.05036163330078125, -0.04656505584716797, -0.04276847839355469, -0.038971900939941406, -0.035175323486328125, -0.031378746032714844, -0.027582168579101562, -0.02378559112548828, -0.019989013671875, -0.01619243621826172, -0.012395858764648438, -0.008599281311035156, -0.004802703857421875, -0.0010061264038085938, 0.0027904510498046875, 0.006587028503417969, 0.01038360595703125, 0.014180183410644531, 0.017976760864257812, 0.021773338317871094, 0.025569915771484375, 0.029366493225097656, 0.03316307067871094, 0.03695964813232422, 0.0407562255859375, 0.04455280303955078, 0.04834938049316406, 0.052145957946777344, 0.055942535400390625, 0.059739112854003906, 0.06353569030761719, 0.06733226776123047, 0.07112884521484375, 0.07492542266845703, 0.07872200012207031, 0.0825185775756836, 0.08631515502929688, 0.09011173248291016, 0.09390830993652344, 0.09770488739013672, 0.10150146484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 12.0, 11.0, 17.0, 43.0, 70.0, 80.0, 142.0, 246.0, 145.0, 97.0, 60.0, 24.0, 16.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6263699531555176, -3.50262713432312, -3.3788843154907227, -3.255141496658325, -3.1313986778259277, -3.0076558589935303, -2.883913040161133, -2.7601704597473145, -2.636427402496338, -2.5126845836639404, -2.388941764831543, -2.2651989459991455, -2.141456127166748, -2.0177133083343506, -1.8939706087112427, -1.7702277898788452, -1.6464850902557373, -1.5227422714233398, -1.3989994525909424, -1.275256633758545, -1.1515138149261475, -1.02777099609375, -0.9040282964706421, -0.7802854776382446, -0.6565426588058472, -0.5327998399734497, -0.40905705094337463, -0.28531426191329956, -0.1615714430809021, -0.03782862424850464, 0.08591413497924805, 0.2096569538116455, 0.33339977264404297, 0.45714259147644043, 0.5808854103088379, 0.7046281695365906, 0.828370988368988, 0.9521138072013855, 1.0758565664291382, 1.1995993852615356, 1.323342204093933, 1.4470850229263306, 1.570827841758728, 1.694570541381836, 1.8183133602142334, 1.9420561790466309, 2.0657989978790283, 2.189541816711426, 2.3132846355438232, 2.4370274543762207, 2.560770273208618, 2.6845130920410156, 2.808255910873413, 2.9319987297058105, 3.055741310119629, 3.1794843673706055, 3.303226947784424, 3.4269697666168213, 3.5507125854492188, 3.674455404281616, 3.7981982231140137, 3.921941041946411, 4.045683860778809, 4.169426441192627, 4.2931694984436035]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 8.0, 9.0, 13.0, 14.0, 21.0, 10.0, 22.0, 26.0, 30.0, 27.0, 34.0, 36.0, 37.0, 53.0, 54.0, 59.0, 76.0, 73.0, 55.0, 39.0, 41.0, 35.0, 30.0, 31.0, 24.0, 23.0, 18.0, 18.0, 11.0, 11.0, 11.0, 7.0, 12.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5546655654907227, -2.4808285236358643, -2.406991481781006, -2.3331542015075684, -2.25931715965271, -2.1854801177978516, -2.111642837524414, -2.0378057956695557, -1.9639687538146973, -1.8901317119598389, -1.816294550895691, -1.742457389831543, -1.6686203479766846, -1.5947833061218262, -1.5209461450576782, -1.4471089839935303, -1.3732719421386719, -1.2994349002838135, -1.2255977392196655, -1.1517605781555176, -1.0779235363006592, -1.0040864944458008, -0.9302493333816528, -0.8564122319221497, -0.7825751304626465, -0.7087380290031433, -0.6349009275436401, -0.561063826084137, -0.4872267246246338, -0.4133896231651306, -0.33955252170562744, -0.26571542024612427, -0.191878080368042, -0.11804097890853882, -0.044203877449035645, 0.02963322401046753, 0.1034703254699707, 0.17730742692947388, 0.25114452838897705, 0.3249816298484802, 0.3988187313079834, 0.4726558327674866, 0.5464929342269897, 0.6203300356864929, 0.6941671371459961, 0.7680042386054993, 0.8418413400650024, 0.9156784415245056, 0.9895155429840088, 1.0633525848388672, 1.1371897459030151, 1.211026906967163, 1.2848639488220215, 1.3587009906768799, 1.4325381517410278, 1.5063753128051758, 1.5802123546600342, 1.6540493965148926, 1.7278865575790405, 1.8017237186431885, 1.8755607604980469, 1.9493978023529053, 2.0232348442077637, 2.097072124481201, 2.1709091663360596]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 12.0, 13.0, 35.0, 48.0, 75.0, 140.0, 226.0, 386.0, 668.0, 1412.0, 2940.0, 7077.0, 18012.0, 55475.0, 245241.0, 1584984.0, 1889823.0, 292761.0, 61198.0, 19378.0, 7568.0, 3226.0, 1510.0, 872.0, 456.0, 264.0, 167.0, 106.0, 77.0, 42.0, 19.0, 24.0, 14.0, 10.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2103271484375, -0.2039642333984375, -0.197601318359375, -0.1912384033203125, -0.18487548828125, -0.1785125732421875, -0.172149658203125, -0.1657867431640625, -0.159423828125, -0.1530609130859375, -0.146697998046875, -0.1403350830078125, -0.13397216796875, -0.1276092529296875, -0.121246337890625, -0.1148834228515625, -0.1085205078125, -0.1021575927734375, -0.095794677734375, -0.0894317626953125, -0.08306884765625, -0.0767059326171875, -0.070343017578125, -0.0639801025390625, -0.0576171875, -0.0512542724609375, -0.044891357421875, -0.0385284423828125, -0.03216552734375, -0.0258026123046875, -0.019439697265625, -0.0130767822265625, -0.0067138671875, -0.0003509521484375, 0.006011962890625, 0.0123748779296875, 0.01873779296875, 0.0251007080078125, 0.031463623046875, 0.0378265380859375, 0.044189453125, 0.0505523681640625, 0.056915283203125, 0.0632781982421875, 0.06964111328125, 0.0760040283203125, 0.082366943359375, 0.0887298583984375, 0.0950927734375, 0.1014556884765625, 0.107818603515625, 0.1141815185546875, 0.12054443359375, 0.1269073486328125, 0.133270263671875, 0.1396331787109375, 0.14599609375, 0.1523590087890625, 0.158721923828125, 0.1650848388671875, 0.17144775390625, 0.1778106689453125, 0.184173583984375, 0.1905364990234375, 0.1968994140625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 9.0, 12.0, 10.0, 12.0, 14.0, 21.0, 33.0, 30.0, 33.0, 46.0, 48.0, 54.0, 65.0, 67.0, 77.0, 60.0, 59.0, 59.0, 43.0, 39.0, 30.0, 32.0, 27.0, 21.0, 22.0, 20.0, 16.0, 15.0, 11.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11224365234375, -0.10732555389404297, -0.10240745544433594, -0.0974893569946289, -0.09257125854492188, -0.08765316009521484, -0.08273506164550781, -0.07781696319580078, -0.07289886474609375, -0.06798076629638672, -0.06306266784667969, -0.058144569396972656, -0.053226470947265625, -0.048308372497558594, -0.04339027404785156, -0.03847217559814453, -0.0335540771484375, -0.02863597869873047, -0.023717880249023438, -0.018799781799316406, -0.013881683349609375, -0.008963584899902344, -0.0040454864501953125, 0.0008726119995117188, 0.00579071044921875, 0.010708808898925781, 0.015626907348632812, 0.020545005798339844, 0.025463104248046875, 0.030381202697753906, 0.03529930114746094, 0.04021739959716797, 0.045135498046875, 0.05005359649658203, 0.05497169494628906, 0.059889793395996094, 0.06480789184570312, 0.06972599029541016, 0.07464408874511719, 0.07956218719482422, 0.08448028564453125, 0.08939838409423828, 0.09431648254394531, 0.09923458099365234, 0.10415267944335938, 0.1090707778930664, 0.11398887634277344, 0.11890697479248047, 0.1238250732421875, 0.12874317169189453, 0.13366127014160156, 0.1385793685913086, 0.14349746704101562, 0.14841556549072266, 0.1533336639404297, 0.15825176239013672, 0.16316986083984375, 0.16808795928955078, 0.1730060577392578, 0.17792415618896484, 0.18284225463867188, 0.1877603530883789, 0.19267845153808594, 0.19759654998779297, 0.2025146484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 13.0, 12.0, 31.0, 54.0, 64.0, 112.0, 238.0, 492.0, 1437.0, 4415.0, 16917.0, 88505.0, 1210431.0, 2684663.0, 154346.0, 23710.0, 5707.0, 1808.0, 680.0, 276.0, 114.0, 97.0, 48.0, 30.0, 17.0, 13.0, 10.0, 8.0, 7.0, 2.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.400146484375, -0.3876991271972656, -0.37525177001953125, -0.3628044128417969, -0.3503570556640625, -0.3379096984863281, -0.32546234130859375, -0.3130149841308594, -0.300567626953125, -0.2881202697753906, -0.27567291259765625, -0.2632255554199219, -0.2507781982421875, -0.23833084106445312, -0.22588348388671875, -0.21343612670898438, -0.20098876953125, -0.18854141235351562, -0.17609405517578125, -0.16364669799804688, -0.1511993408203125, -0.13875198364257812, -0.12630462646484375, -0.11385726928710938, -0.101409912109375, -0.08896255493164062, -0.07651519775390625, -0.06406784057617188, -0.0516204833984375, -0.039173126220703125, -0.02672576904296875, -0.014278411865234375, -0.0018310546875, 0.010616302490234375, 0.02306365966796875, 0.035511016845703125, 0.0479583740234375, 0.060405731201171875, 0.07285308837890625, 0.08530044555664062, 0.097747802734375, 0.11019515991210938, 0.12264251708984375, 0.13508987426757812, 0.1475372314453125, 0.15998458862304688, 0.17243194580078125, 0.18487930297851562, 0.19732666015625, 0.20977401733398438, 0.22222137451171875, 0.23466873168945312, 0.2471160888671875, 0.2595634460449219, 0.27201080322265625, 0.2844581604003906, 0.296905517578125, 0.3093528747558594, 0.32180023193359375, 0.3342475891113281, 0.3466949462890625, 0.3591423034667969, 0.37158966064453125, 0.3840370178222656, 0.396484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 6.0, 7.0, 10.0, 4.0, 12.0, 9.0, 13.0, 16.0, 29.0, 36.0, 41.0, 69.0, 90.0, 126.0, 159.0, 243.0, 336.0, 494.0, 585.0, 537.0, 362.0, 272.0, 192.0, 117.0, 92.0, 55.0, 30.0, 35.0, 18.0, 19.0, 12.0, 12.0, 10.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27783203125, -0.2677803039550781, -0.25772857666015625, -0.24767684936523438, -0.2376251220703125, -0.22757339477539062, -0.21752166748046875, -0.20746994018554688, -0.197418212890625, -0.18736648559570312, -0.17731475830078125, -0.16726303100585938, -0.1572113037109375, -0.14715957641601562, -0.13710784912109375, -0.12705612182617188, -0.11700439453125, -0.10695266723632812, -0.09690093994140625, -0.08684921264648438, -0.0767974853515625, -0.06674575805664062, -0.05669403076171875, -0.046642303466796875, -0.036590576171875, -0.026538848876953125, -0.01648712158203125, -0.006435394287109375, 0.0036163330078125, 0.013668060302734375, 0.02371978759765625, 0.033771514892578125, 0.0438232421875, 0.053874969482421875, 0.06392669677734375, 0.07397842407226562, 0.0840301513671875, 0.09408187866210938, 0.10413360595703125, 0.11418533325195312, 0.124237060546875, 0.13428878784179688, 0.14434051513671875, 0.15439224243164062, 0.1644439697265625, 0.17449569702148438, 0.18454742431640625, 0.19459915161132812, 0.20465087890625, 0.21470260620117188, 0.22475433349609375, 0.23480606079101562, 0.2448577880859375, 0.2549095153808594, 0.26496124267578125, 0.2750129699707031, 0.285064697265625, 0.2951164245605469, 0.30516815185546875, 0.3152198791503906, 0.3252716064453125, 0.3353233337402344, 0.34537506103515625, 0.3554267883300781, 0.365478515625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 14.0, 23.0, 38.0, 81.0, 147.0, 195.0, 207.0, 138.0, 72.0, 28.0, 15.0, 7.0, 8.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.727634906768799, -3.5950684547424316, -3.4625022411346436, -3.3299360275268555, -3.1973695755004883, -3.064803123474121, -2.932236909866333, -2.799670696258545, -2.6671042442321777, -2.5345377922058105, -2.4019715785980225, -2.2694053649902344, -2.136838912963867, -2.0042724609375, -1.871706247329712, -1.7391399145126343, -1.6065735816955566, -1.474007248878479, -1.3414409160614014, -1.2088745832443237, -1.076308250427246, -0.9437419176101685, -0.8111755847930908, -0.6786092519760132, -0.5460429191589355, -0.4134765863418579, -0.2809102535247803, -0.14834392070770264, -0.015777587890625, 0.11678874492645264, 0.24935507774353027, 0.3819214105606079, 0.5144882202148438, 0.6470545530319214, 0.779620885848999, 0.9121872186660767, 1.0447535514831543, 1.177319884300232, 1.3098862171173096, 1.4424525499343872, 1.5750188827514648, 1.7075852155685425, 1.8401515483856201, 1.9727178812026978, 2.1052842140197754, 2.2378506660461426, 2.3704168796539307, 2.5029830932617188, 2.635549545288086, 2.768115997314453, 2.900682210922241, 3.0332484245300293, 3.1658148765563965, 3.2983813285827637, 3.4309475421905518, 3.56351375579834, 3.696080207824707, 3.828646659851074, 3.9612128734588623, 4.09377908706665, 4.226345539093018, 4.358911991119385, 4.491477966308594, 4.624044418334961, 4.756610870361328]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 12.0, 8.0, 11.0, 14.0, 11.0, 11.0, 19.0, 21.0, 24.0, 27.0, 36.0, 39.0, 53.0, 36.0, 60.0, 53.0, 37.0, 42.0, 49.0, 64.0, 50.0, 41.0, 26.0, 43.0, 44.0, 29.0, 29.0, 19.0, 19.0, 10.0, 13.0, 12.0, 10.0, 8.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.666301965713501, -1.609972596168518, -1.5536432266235352, -1.4973138570785522, -1.4409844875335693, -1.384655237197876, -1.328325867652893, -1.2719964981079102, -1.2156671285629272, -1.1593377590179443, -1.1030083894729614, -1.0466790199279785, -0.9903497099876404, -0.9340203404426575, -0.8776910305023193, -0.8213616609573364, -0.7650322914123535, -0.7087029218673706, -0.6523735523223877, -0.5960442423820496, -0.5397148728370667, -0.48338550329208374, -0.4270561635494232, -0.3707268238067627, -0.3143974542617798, -0.2580680847167969, -0.20173874497413635, -0.14540939033031464, -0.08908003568649292, -0.03275066614151001, 0.023578673601150513, 0.07990801334381104, 0.13623738288879395, 0.19256673753261566, 0.24889609217643738, 0.3052254319190979, 0.3615548014640808, 0.4178841710090637, 0.47421351075172424, 0.5305428504943848, 0.5868722200393677, 0.6432015895843506, 0.6995309591293335, 0.7558602690696716, 0.8121896386146545, 0.8685190081596375, 0.9248483180999756, 0.9811776876449585, 1.0375070571899414, 1.0938364267349243, 1.1501657962799072, 1.2064951658248901, 1.262824535369873, 1.3191537857055664, 1.3754831552505493, 1.4318125247955322, 1.4881418943405151, 1.544471263885498, 1.600800633430481, 1.6571300029754639, 1.7134592533111572, 1.7697887420654297, 1.826117992401123, 1.882447361946106, 1.9387767314910889]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 11.0, 11.0, 15.0, 20.0, 23.0, 50.0, 44.0, 56.0, 128.0, 144.0, 221.0, 353.0, 544.0, 881.0, 1341.0, 2262.0, 3728.0, 7031.0, 14129.0, 30714.0, 76185.0, 224629.0, 417329.0, 159960.0, 58179.0, 24651.0, 11326.0, 5928.0, 3328.0, 1870.0, 1193.0, 703.0, 506.0, 339.0, 226.0, 152.0, 105.0, 78.0, 39.0, 38.0, 23.0, 21.0, 9.0, 9.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.248046875, -0.23987579345703125, -0.2317047119140625, -0.22353363037109375, -0.215362548828125, -0.20719146728515625, -0.1990203857421875, -0.19084930419921875, -0.18267822265625, -0.17450714111328125, -0.1663360595703125, -0.15816497802734375, -0.149993896484375, -0.14182281494140625, -0.1336517333984375, -0.12548065185546875, -0.1173095703125, -0.10913848876953125, -0.1009674072265625, -0.09279632568359375, -0.084625244140625, -0.07645416259765625, -0.0682830810546875, -0.06011199951171875, -0.05194091796875, -0.04376983642578125, -0.0355987548828125, -0.02742767333984375, -0.019256591796875, -0.01108551025390625, -0.0029144287109375, 0.00525665283203125, 0.013427734375, 0.02159881591796875, 0.0297698974609375, 0.03794097900390625, 0.046112060546875, 0.05428314208984375, 0.0624542236328125, 0.07062530517578125, 0.07879638671875, 0.08696746826171875, 0.0951385498046875, 0.10330963134765625, 0.111480712890625, 0.11965179443359375, 0.1278228759765625, 0.13599395751953125, 0.1441650390625, 0.15233612060546875, 0.1605072021484375, 0.16867828369140625, 0.176849365234375, 0.18502044677734375, 0.1931915283203125, 0.20136260986328125, 0.20953369140625, 0.21770477294921875, 0.2258758544921875, 0.23404693603515625, 0.242218017578125, 0.25038909912109375, 0.2585601806640625, 0.26673126220703125, 0.27490234375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 4.0, 3.0, 9.0, 9.0, 9.0, 12.0, 16.0, 18.0, 18.0, 24.0, 30.0, 40.0, 38.0, 60.0, 39.0, 57.0, 48.0, 55.0, 60.0, 60.0, 45.0, 48.0, 30.0, 42.0, 43.0, 27.0, 28.0, 25.0, 20.0, 22.0, 15.0, 19.0, 10.0, 5.0, 6.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1268310546875, -0.12234115600585938, -0.11785125732421875, -0.11336135864257812, -0.1088714599609375, -0.10438156127929688, -0.09989166259765625, -0.09540176391601562, -0.090911865234375, -0.08642196655273438, -0.08193206787109375, -0.07744216918945312, -0.0729522705078125, -0.06846237182617188, -0.06397247314453125, -0.059482574462890625, -0.05499267578125, -0.050502777099609375, -0.04601287841796875, -0.041522979736328125, -0.0370330810546875, -0.032543182373046875, -0.02805328369140625, -0.023563385009765625, -0.019073486328125, -0.014583587646484375, -0.01009368896484375, -0.005603790283203125, -0.0011138916015625, 0.003376007080078125, 0.00786590576171875, 0.012355804443359375, 0.016845703125, 0.021335601806640625, 0.02582550048828125, 0.030315399169921875, 0.0348052978515625, 0.039295196533203125, 0.04378509521484375, 0.048274993896484375, 0.052764892578125, 0.057254791259765625, 0.06174468994140625, 0.06623458862304688, 0.0707244873046875, 0.07521438598632812, 0.07970428466796875, 0.08419418334960938, 0.08868408203125, 0.09317398071289062, 0.09766387939453125, 0.10215377807617188, 0.1066436767578125, 0.11113357543945312, 0.11562347412109375, 0.12011337280273438, 0.124603271484375, 0.12909317016601562, 0.13358306884765625, 0.13807296752929688, 0.1425628662109375, 0.14705276489257812, 0.15154266357421875, 0.15603256225585938, 0.1605224609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 1.0, 10.0, 12.0, 17.0, 14.0, 22.0, 32.0, 35.0, 61.0, 73.0, 102.0, 129.0, 185.0, 257.0, 361.0, 620.0, 1052.0, 1832.0, 3929.0, 9715.0, 32124.0, 166642.0, 702983.0, 92613.0, 21187.0, 7250.0, 3041.0, 1502.0, 903.0, 565.0, 375.0, 243.0, 167.0, 119.0, 97.0, 60.0, 60.0, 43.0, 26.0, 22.0, 17.0, 14.0, 7.0, 10.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4150390625, -0.4008979797363281, -0.38675689697265625, -0.3726158142089844, -0.3584747314453125, -0.3443336486816406, -0.33019256591796875, -0.3160514831542969, -0.301910400390625, -0.2877693176269531, -0.27362823486328125, -0.2594871520996094, -0.2453460693359375, -0.23120498657226562, -0.21706390380859375, -0.20292282104492188, -0.18878173828125, -0.17464065551757812, -0.16049957275390625, -0.14635848999023438, -0.1322174072265625, -0.11807632446289062, -0.10393524169921875, -0.08979415893554688, -0.075653076171875, -0.061511993408203125, -0.04737091064453125, -0.033229827880859375, -0.0190887451171875, -0.004947662353515625, 0.00919342041015625, 0.023334503173828125, 0.0374755859375, 0.051616668701171875, 0.06575775146484375, 0.07989883422851562, 0.0940399169921875, 0.10818099975585938, 0.12232208251953125, 0.13646316528320312, 0.150604248046875, 0.16474533081054688, 0.17888641357421875, 0.19302749633789062, 0.2071685791015625, 0.22130966186523438, 0.23545074462890625, 0.24959182739257812, 0.26373291015625, 0.2778739929199219, 0.29201507568359375, 0.3061561584472656, 0.3202972412109375, 0.3344383239746094, 0.34857940673828125, 0.3627204895019531, 0.376861572265625, 0.3910026550292969, 0.40514373779296875, 0.4192848205566406, 0.4334259033203125, 0.4475669860839844, 0.46170806884765625, 0.4758491516113281, 0.489990234375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 13.0, 17.0, 11.0, 17.0, 21.0, 31.0, 35.0, 28.0, 37.0, 25.0, 39.0, 50.0, 55.0, 49.0, 53.0, 69.0, 46.0, 49.0, 36.0, 39.0, 42.0, 33.0, 31.0, 21.0, 22.0, 16.0, 16.0, 16.0, 15.0, 11.0, 9.0, 10.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.63525390625, -0.61700439453125, -0.5987548828125, -0.58050537109375, -0.562255859375, -0.54400634765625, -0.5257568359375, -0.50750732421875, -0.4892578125, -0.47100830078125, -0.4527587890625, -0.43450927734375, -0.416259765625, -0.39801025390625, -0.3797607421875, -0.36151123046875, -0.34326171875, -0.32501220703125, -0.3067626953125, -0.28851318359375, -0.270263671875, -0.25201416015625, -0.2337646484375, -0.21551513671875, -0.197265625, -0.17901611328125, -0.1607666015625, -0.14251708984375, -0.124267578125, -0.10601806640625, -0.0877685546875, -0.06951904296875, -0.05126953125, -0.03302001953125, -0.0147705078125, 0.00347900390625, 0.021728515625, 0.03997802734375, 0.0582275390625, 0.07647705078125, 0.0947265625, 0.11297607421875, 0.1312255859375, 0.14947509765625, 0.167724609375, 0.18597412109375, 0.2042236328125, 0.22247314453125, 0.24072265625, 0.25897216796875, 0.2772216796875, 0.29547119140625, 0.313720703125, 0.33197021484375, 0.3502197265625, 0.36846923828125, 0.38671875, 0.40496826171875, 0.4232177734375, 0.44146728515625, 0.459716796875, 0.47796630859375, 0.4962158203125, 0.51446533203125, 0.53271484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 6.0, 15.0, 10.0, 22.0, 22.0, 36.0, 42.0, 80.0, 96.0, 138.0, 295.0, 454.0, 878.0, 1852.0, 4548.0, 14288.0, 57714.0, 332995.0, 540610.0, 68509.0, 16520.0, 5128.0, 1996.0, 930.0, 508.0, 322.0, 169.0, 124.0, 64.0, 48.0, 32.0, 22.0, 19.0, 8.0, 9.0, 3.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1895751953125, -0.1838397979736328, -0.17810440063476562, -0.17236900329589844, -0.16663360595703125, -0.16089820861816406, -0.15516281127929688, -0.1494274139404297, -0.1436920166015625, -0.1379566192626953, -0.13222122192382812, -0.12648582458496094, -0.12075042724609375, -0.11501502990722656, -0.10927963256835938, -0.10354423522949219, -0.097808837890625, -0.09207344055175781, -0.08633804321289062, -0.08060264587402344, -0.07486724853515625, -0.06913185119628906, -0.06339645385742188, -0.05766105651855469, -0.0519256591796875, -0.04619026184082031, -0.040454864501953125, -0.03471946716308594, -0.02898406982421875, -0.023248672485351562, -0.017513275146484375, -0.011777877807617188, -0.00604248046875, -0.0003070831298828125, 0.005428314208984375, 0.011163711547851562, 0.01689910888671875, 0.022634506225585938, 0.028369903564453125, 0.03410530090332031, 0.0398406982421875, 0.04557609558105469, 0.051311492919921875, 0.05704689025878906, 0.06278228759765625, 0.06851768493652344, 0.07425308227539062, 0.07998847961425781, 0.085723876953125, 0.09145927429199219, 0.09719467163085938, 0.10293006896972656, 0.10866546630859375, 0.11440086364746094, 0.12013626098632812, 0.1258716583251953, 0.1316070556640625, 0.1373424530029297, 0.14307785034179688, 0.14881324768066406, 0.15454864501953125, 0.16028404235839844, 0.16601943969726562, 0.1717548370361328, 0.177490234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 4.0, 10.0, 3.0, 13.0, 10.0, 17.0, 20.0, 32.0, 23.0, 22.0, 26.0, 44.0, 51.0, 72.0, 92.0, 81.0, 86.0, 78.0, 59.0, 49.0, 35.0, 30.0, 23.0, 16.0, 17.0, 17.0, 12.0, 9.0, 11.0, 6.0, 6.0, 2.0, 1.0, 6.0, 3.0, 0.0, 1.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.792213439941406e-05, -4.640687257051468e-05, -4.4891610741615295e-05, -4.337634891271591e-05, -4.186108708381653e-05, -4.0345825254917145e-05, -3.883056342601776e-05, -3.731530159711838e-05, -3.5800039768218994e-05, -3.428477793931961e-05, -3.276951611042023e-05, -3.1254254281520844e-05, -2.973899245262146e-05, -2.8223730623722076e-05, -2.6708468794822693e-05, -2.519320696592331e-05, -2.3677945137023926e-05, -2.2162683308124542e-05, -2.064742147922516e-05, -1.9132159650325775e-05, -1.761689782142639e-05, -1.6101635992527008e-05, -1.4586374163627625e-05, -1.3071112334728241e-05, -1.1555850505828857e-05, -1.0040588676929474e-05, -8.52532684803009e-06, -7.010065019130707e-06, -5.494803190231323e-06, -3.97954136133194e-06, -2.464279532432556e-06, -9.490177035331726e-07, 5.662441253662109e-07, 2.0815059542655945e-06, 3.596767783164978e-06, 5.1120296120643616e-06, 6.627291440963745e-06, 8.142553269863129e-06, 9.657815098762512e-06, 1.1173076927661896e-05, 1.268833875656128e-05, 1.4203600585460663e-05, 1.5718862414360046e-05, 1.723412424325943e-05, 1.8749386072158813e-05, 2.0264647901058197e-05, 2.177990972995758e-05, 2.3295171558856964e-05, 2.4810433387756348e-05, 2.632569521665573e-05, 2.7840957045555115e-05, 2.9356218874454498e-05, 3.087148070335388e-05, 3.2386742532253265e-05, 3.390200436115265e-05, 3.541726619005203e-05, 3.6932528018951416e-05, 3.84477898478508e-05, 3.996305167675018e-05, 4.147831350564957e-05, 4.299357533454895e-05, 4.4508837163448334e-05, 4.602409899234772e-05, 4.75393608212471e-05, 4.9054622650146484e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 12.0, 7.0, 14.0, 15.0, 34.0, 49.0, 75.0, 148.0, 251.0, 530.0, 1123.0, 2807.0, 9899.0, 67518.0, 765898.0, 174414.0, 18267.0, 4308.0, 1622.0, 728.0, 358.0, 199.0, 106.0, 73.0, 46.0, 14.0, 6.0, 12.0, 6.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.274658203125, -0.26696205139160156, -0.2592658996582031, -0.2515697479248047, -0.24387359619140625, -0.2361774444580078, -0.22848129272460938, -0.22078514099121094, -0.2130889892578125, -0.20539283752441406, -0.19769668579101562, -0.1900005340576172, -0.18230438232421875, -0.1746082305908203, -0.16691207885742188, -0.15921592712402344, -0.151519775390625, -0.14382362365722656, -0.13612747192382812, -0.1284313201904297, -0.12073516845703125, -0.11303901672363281, -0.10534286499023438, -0.09764671325683594, -0.0899505615234375, -0.08225440979003906, -0.07455825805664062, -0.06686210632324219, -0.05916595458984375, -0.05146980285644531, -0.043773651123046875, -0.03607749938964844, -0.02838134765625, -0.020685195922851562, -0.012989044189453125, -0.0052928924560546875, 0.00240325927734375, 0.010099411010742188, 0.017795562744140625, 0.025491714477539062, 0.0331878662109375, 0.04088401794433594, 0.048580169677734375, 0.05627632141113281, 0.06397247314453125, 0.07166862487792969, 0.07936477661132812, 0.08706092834472656, 0.094757080078125, 0.10245323181152344, 0.11014938354492188, 0.11784553527832031, 0.12554168701171875, 0.1332378387451172, 0.14093399047851562, 0.14863014221191406, 0.1563262939453125, 0.16402244567871094, 0.17171859741210938, 0.1794147491455078, 0.18711090087890625, 0.1948070526123047, 0.20250320434570312, 0.21019935607910156, 0.2178955078125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 11.0, 15.0, 13.0, 16.0, 24.0, 37.0, 52.0, 49.0, 94.0, 96.0, 107.0, 92.0, 82.0, 58.0, 48.0, 54.0, 28.0, 34.0, 28.0, 13.0, 15.0, 5.0, 11.0, 7.0, 5.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.24586868286132812, -0.23954010009765625, -0.23321151733398438, -0.2268829345703125, -0.22055435180664062, -0.21422576904296875, -0.20789718627929688, -0.201568603515625, -0.19524002075195312, -0.18891143798828125, -0.18258285522460938, -0.1762542724609375, -0.16992568969726562, -0.16359710693359375, -0.15726852416992188, -0.15093994140625, -0.14461135864257812, -0.13828277587890625, -0.13195419311523438, -0.1256256103515625, -0.11929702758789062, -0.11296844482421875, -0.10663986206054688, -0.100311279296875, -0.09398269653320312, -0.08765411376953125, -0.08132553100585938, -0.0749969482421875, -0.06866836547851562, -0.06233978271484375, -0.056011199951171875, -0.0496826171875, -0.043354034423828125, -0.03702545166015625, -0.030696868896484375, -0.0243682861328125, -0.018039703369140625, -0.01171112060546875, -0.005382537841796875, 0.000946044921875, 0.007274627685546875, 0.01360321044921875, 0.019931793212890625, 0.0262603759765625, 0.032588958740234375, 0.03891754150390625, 0.045246124267578125, 0.05157470703125, 0.057903289794921875, 0.06423187255859375, 0.07056045532226562, 0.0768890380859375, 0.08321762084960938, 0.08954620361328125, 0.09587478637695312, 0.102203369140625, 0.10853195190429688, 0.11486053466796875, 0.12118911743164062, 0.1275177001953125, 0.13384628295898438, 0.14017486572265625, 0.14650344848632812, 0.15283203125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 9.0, 11.0, 54.0, 93.0, 216.0, 302.0, 139.0, 82.0, 34.0, 11.0, 14.0, 5.0, 3.0, 2.0, 1.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9421443939208984, -3.7858171463012695, -3.6294896602630615, -3.4731624126434326, -3.3168351650238037, -3.1605076789855957, -3.004180431365967, -2.847853183746338, -2.691525936126709, -2.53519868850708, -2.378871202468872, -2.222543954849243, -2.0662167072296143, -1.9098893404006958, -1.7535619735717773, -1.5972347259521484, -1.4409072399139404, -1.284579873085022, -1.128252625465393, -0.9719252586364746, -0.8155979514122009, -0.6592706441879272, -0.5029432773590088, -0.3466160297393799, -0.19028866291046143, -0.03396134078502655, 0.12236598134040833, 0.2786933183670044, 0.4350206255912781, 0.5913479328155518, 0.7476752996444702, 0.9040025472640991, 1.0603299140930176, 1.216657280921936, 1.372984528541565, 1.5293118953704834, 1.6856391429901123, 1.8419665098190308, 1.9982938766479492, 2.154621124267578, 2.310948371887207, 2.467275619506836, 2.623603105545044, 2.779930353164673, 2.9362576007843018, 3.0925850868225098, 3.2489123344421387, 3.4052395820617676, 3.5615670680999756, 3.7178943157196045, 3.8742218017578125, 4.030549049377441, 4.18687629699707, 4.343203544616699, 4.499530792236328, 4.655858039855957, 4.812185764312744, 4.968513011932373, 5.124840259552002, 5.281167984008789, 5.437495231628418, 5.593822479248047, 5.750149726867676, 5.906476974487305, 6.062804222106934]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 3.0, 8.0, 9.0, 10.0, 11.0, 10.0, 21.0, 17.0, 19.0, 22.0, 20.0, 21.0, 21.0, 31.0, 21.0, 23.0, 36.0, 42.0, 61.0, 66.0, 72.0, 67.0, 52.0, 38.0, 29.0, 29.0, 28.0, 33.0, 30.0, 22.0, 16.0, 15.0, 11.0, 8.0, 11.0, 9.0, 6.0, 7.0, 7.0, 5.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.110687255859375, -2.04278564453125, -1.9748839139938354, -1.906982183456421, -1.839080572128296, -1.7711788415908813, -1.7032771110534668, -1.6353754997253418, -1.5674738883972168, -1.4995721578598022, -1.4316705465316772, -1.3637688159942627, -1.2958672046661377, -1.2279654741287231, -1.1600637435913086, -1.0921621322631836, -1.024260401725769, -0.9563587307929993, -0.8884570598602295, -0.8205553293228149, -0.7526537179946899, -0.6847519874572754, -0.6168503165245056, -0.5489486455917358, -0.48104697465896606, -0.4131453037261963, -0.3452436327934265, -0.27734193205833435, -0.20944026112556458, -0.1415385901927948, -0.07363688945770264, -0.005735218524932861, 0.062166452407836914, 0.1300681233406067, 0.19796980917453766, 0.26587149500846863, 0.3337731659412384, 0.4016748368740082, 0.46957653760910034, 0.5374782085418701, 0.6053798794746399, 0.6732815504074097, 0.7411832213401794, 0.8090848922729492, 0.8769866228103638, 0.9448882341384888, 1.0127899646759033, 1.0806915760040283, 1.1485933065414429, 1.2164950370788574, 1.2843966484069824, 1.352298378944397, 1.420199990272522, 1.4881017208099365, 1.5560033321380615, 1.623905062675476, 1.6918067932128906, 1.7597085237503052, 1.8276101350784302, 1.8955118656158447, 1.9634134769439697, 2.0313150882720947, 2.099216938018799, 2.167118549346924, 2.235020160675049]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 6.0, 2.0, 6.0, 15.0, 12.0, 18.0, 22.0, 38.0, 50.0, 77.0, 111.0, 155.0, 256.0, 358.0, 487.0, 786.0, 1268.0, 2067.0, 3427.0, 6115.0, 11941.0, 26535.0, 71113.0, 251183.0, 1056670.0, 1943632.0, 586790.0, 145980.0, 45999.0, 18379.0, 8929.0, 4590.0, 2716.0, 1604.0, 966.0, 627.0, 436.0, 286.0, 188.0, 147.0, 87.0, 62.0, 42.0, 33.0, 27.0, 16.0, 7.0, 7.0, 7.0, 8.0, 2.0, 2.0, 3.0], "bins": [-0.15380859375, -0.14957046508789062, -0.14533233642578125, -0.14109420776367188, -0.1368560791015625, -0.13261795043945312, -0.12837982177734375, -0.12414169311523438, -0.119903564453125, -0.11566543579101562, -0.11142730712890625, -0.10718917846679688, -0.1029510498046875, -0.09871292114257812, -0.09447479248046875, -0.09023666381835938, -0.08599853515625, -0.08176040649414062, -0.07752227783203125, -0.07328414916992188, -0.0690460205078125, -0.06480789184570312, -0.06056976318359375, -0.056331634521484375, -0.052093505859375, -0.047855377197265625, -0.04361724853515625, -0.039379119873046875, -0.0351409912109375, -0.030902862548828125, -0.02666473388671875, -0.022426605224609375, -0.0181884765625, -0.013950347900390625, -0.00971221923828125, -0.005474090576171875, -0.0012359619140625, 0.003002166748046875, 0.00724029541015625, 0.011478424072265625, 0.015716552734375, 0.019954681396484375, 0.02419281005859375, 0.028430938720703125, 0.0326690673828125, 0.036907196044921875, 0.04114532470703125, 0.045383453369140625, 0.04962158203125, 0.053859710693359375, 0.05809783935546875, 0.062335968017578125, 0.0665740966796875, 0.07081222534179688, 0.07505035400390625, 0.07928848266601562, 0.083526611328125, 0.08776473999023438, 0.09200286865234375, 0.09624099731445312, 0.1004791259765625, 0.10471725463867188, 0.10895538330078125, 0.11319351196289062, 0.117431640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 1.0, 9.0, 3.0, 10.0, 12.0, 16.0, 12.0, 11.0, 22.0, 17.0, 30.0, 36.0, 40.0, 45.0, 46.0, 55.0, 75.0, 56.0, 59.0, 72.0, 47.0, 54.0, 39.0, 36.0, 33.0, 33.0, 24.0, 29.0, 16.0, 13.0, 13.0, 15.0, 13.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11724853515625, -0.11259746551513672, -0.10794639587402344, -0.10329532623291016, -0.09864425659179688, -0.0939931869506836, -0.08934211730957031, -0.08469104766845703, -0.08003997802734375, -0.07538890838623047, -0.07073783874511719, -0.0660867691040039, -0.061435699462890625, -0.056784629821777344, -0.05213356018066406, -0.04748249053955078, -0.0428314208984375, -0.03818035125732422, -0.03352928161621094, -0.028878211975097656, -0.024227142333984375, -0.019576072692871094, -0.014925003051757812, -0.010273933410644531, -0.00562286376953125, -0.0009717941284179688, 0.0036792755126953125, 0.008330345153808594, 0.012981414794921875, 0.017632484436035156, 0.022283554077148438, 0.02693462371826172, 0.031585693359375, 0.03623676300048828, 0.04088783264160156, 0.045538902282714844, 0.050189971923828125, 0.054841041564941406, 0.05949211120605469, 0.06414318084716797, 0.06879425048828125, 0.07344532012939453, 0.07809638977050781, 0.0827474594116211, 0.08739852905273438, 0.09204959869384766, 0.09670066833496094, 0.10135173797607422, 0.1060028076171875, 0.11065387725830078, 0.11530494689941406, 0.11995601654052734, 0.12460708618164062, 0.1292581558227539, 0.1339092254638672, 0.13856029510498047, 0.14321136474609375, 0.14786243438720703, 0.1525135040283203, 0.1571645736694336, 0.16181564331054688, 0.16646671295166016, 0.17111778259277344, 0.17576885223388672, 0.180419921875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 5.0, 13.0, 11.0, 26.0, 52.0, 75.0, 153.0, 294.0, 909.0, 3242.0, 16298.0, 193329.0, 3755111.0, 204587.0, 15798.0, 2954.0, 821.0, 307.0, 121.0, 67.0, 44.0, 23.0, 18.0, 7.0, 5.0, 7.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60693359375, -0.58984375, -0.57275390625, -0.5556640625, -0.53857421875, -0.521484375, -0.50439453125, -0.4873046875, -0.47021484375, -0.453125, -0.43603515625, -0.4189453125, -0.40185546875, -0.384765625, -0.36767578125, -0.3505859375, -0.33349609375, -0.31640625, -0.29931640625, -0.2822265625, -0.26513671875, -0.248046875, -0.23095703125, -0.2138671875, -0.19677734375, -0.1796875, -0.16259765625, -0.1455078125, -0.12841796875, -0.111328125, -0.09423828125, -0.0771484375, -0.06005859375, -0.04296875, -0.02587890625, -0.0087890625, 0.00830078125, 0.025390625, 0.04248046875, 0.0595703125, 0.07666015625, 0.09375, 0.11083984375, 0.1279296875, 0.14501953125, 0.162109375, 0.17919921875, 0.1962890625, 0.21337890625, 0.23046875, 0.24755859375, 0.2646484375, 0.28173828125, 0.298828125, 0.31591796875, 0.3330078125, 0.35009765625, 0.3671875, 0.38427734375, 0.4013671875, 0.41845703125, 0.435546875, 0.45263671875, 0.4697265625, 0.48681640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 5.0, 3.0, 11.0, 6.0, 9.0, 9.0, 20.0, 27.0, 29.0, 38.0, 39.0, 70.0, 118.0, 154.0, 224.0, 358.0, 562.0, 682.0, 558.0, 400.0, 236.0, 165.0, 89.0, 80.0, 50.0, 28.0, 30.0, 17.0, 9.0, 15.0, 8.0, 11.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27783203125, -0.26811981201171875, -0.2584075927734375, -0.24869537353515625, -0.238983154296875, -0.22927093505859375, -0.2195587158203125, -0.20984649658203125, -0.20013427734375, -0.19042205810546875, -0.1807098388671875, -0.17099761962890625, -0.161285400390625, -0.15157318115234375, -0.1418609619140625, -0.13214874267578125, -0.1224365234375, -0.11272430419921875, -0.1030120849609375, -0.09329986572265625, -0.083587646484375, -0.07387542724609375, -0.0641632080078125, -0.05445098876953125, -0.04473876953125, -0.03502655029296875, -0.0253143310546875, -0.01560211181640625, -0.005889892578125, 0.00382232666015625, 0.0135345458984375, 0.02324676513671875, 0.032958984375, 0.04267120361328125, 0.0523834228515625, 0.06209564208984375, 0.071807861328125, 0.08152008056640625, 0.0912322998046875, 0.10094451904296875, 0.11065673828125, 0.12036895751953125, 0.1300811767578125, 0.13979339599609375, 0.149505615234375, 0.15921783447265625, 0.1689300537109375, 0.17864227294921875, 0.1883544921875, 0.19806671142578125, 0.2077789306640625, 0.21749114990234375, 0.227203369140625, 0.23691558837890625, 0.2466278076171875, 0.25634002685546875, 0.26605224609375, 0.27576446533203125, 0.2854766845703125, 0.29518890380859375, 0.304901123046875, 0.31461334228515625, 0.3243255615234375, 0.33403778076171875, 0.34375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 6.0, 12.0, 29.0, 51.0, 129.0, 235.0, 273.0, 154.0, 60.0, 22.0, 12.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.281395435333252, -7.127960205078125, -6.97452449798584, -6.821089267730713, -6.667653560638428, -6.514218330383301, -6.360782623291016, -6.207347393035889, -6.053912162780762, -5.900476932525635, -5.74704122543335, -5.593605995178223, -5.4401702880859375, -5.2867350578308105, -5.133299350738525, -4.979864120483398, -4.826428413391113, -4.672993183135986, -4.519557476043701, -4.366122245788574, -4.212686538696289, -4.059251308441162, -3.905815839767456, -3.75238037109375, -3.598944902420044, -3.445509433746338, -3.292073965072632, -3.138638496398926, -2.985203266143799, -2.8317675590515137, -2.6783323287963867, -2.5248968601226807, -2.371461868286133, -2.2180263996124268, -2.0645909309387207, -1.9111555814743042, -1.7577201128005981, -1.604284644126892, -1.4508492946624756, -1.2974138259887695, -1.1439783573150635, -0.9905428886413574, -0.8371074795722961, -0.6836720705032349, -0.5302366018295288, -0.37680113315582275, -0.22336572408676147, -0.0699303150177002, 0.08350515365600586, 0.23694059252738953, 0.3903760313987732, 0.5438114404678345, 0.6972469091415405, 0.8506823778152466, 1.004117727279663, 1.1575531959533691, 1.3109886646270752, 1.4644241333007812, 1.6178596019744873, 1.7712949514389038, 1.9247304201126099, 2.0781660079956055, 2.2316012382507324, 2.3850367069244385, 2.5384721755981445]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 12.0, 9.0, 10.0, 16.0, 18.0, 10.0, 18.0, 19.0, 25.0, 30.0, 31.0, 34.0, 39.0, 42.0, 37.0, 39.0, 36.0, 48.0, 45.0, 30.0, 46.0, 35.0, 47.0, 39.0, 32.0, 30.0, 24.0, 20.0, 31.0, 20.0, 26.0, 18.0, 22.0, 12.0, 16.0, 7.0, 6.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2125723361968994, -1.1690690517425537, -1.1255658864974976, -1.0820626020431519, -1.0385594367980957, -0.99505615234375, -0.9515529274940491, -0.9080497026443481, -0.8645464777946472, -0.8210432529449463, -0.7775400280952454, -0.7340368032455444, -0.6905335187911987, -0.6470303535461426, -0.6035270690917969, -0.560023844242096, -0.516520619392395, -0.4730173945426941, -0.42951416969299316, -0.38601091504096985, -0.3425076901912689, -0.299004465341568, -0.2555012106895447, -0.21199798583984375, -0.16849476099014282, -0.1249915286898613, -0.08148829638957977, -0.03798505663871765, 0.005518168210983276, 0.049021393060684204, 0.09252464771270752, 0.13602787256240845, 0.17953097820281982, 0.22303420305252075, 0.2665374279022217, 0.310040682554245, 0.3535439074039459, 0.39704713225364685, 0.44055038690567017, 0.4840536117553711, 0.527556836605072, 0.571060061454773, 0.6145632863044739, 0.6580665111541748, 0.7015697956085205, 0.7450729608535767, 0.7885762453079224, 0.8320794701576233, 0.8755826950073242, 0.9190859198570251, 0.9625891447067261, 1.0060924291610718, 1.049595594406128, 1.0930988788604736, 1.1366021633148193, 1.1801053285598755, 1.2236084938049316, 1.2671117782592773, 1.3106149435043335, 1.3541182279586792, 1.3976213932037354, 1.441124677658081, 1.4846279621124268, 1.528131127357483, 1.5716344118118286]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 12.0, 7.0, 10.0, 25.0, 39.0, 39.0, 72.0, 100.0, 164.0, 265.0, 371.0, 725.0, 1342.0, 2562.0, 5363.0, 12978.0, 34533.0, 112433.0, 351184.0, 353834.0, 113225.0, 35234.0, 12751.0, 5577.0, 2580.0, 1275.0, 740.0, 418.0, 254.0, 150.0, 95.0, 70.0, 44.0, 17.0, 22.0, 21.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.180908203125, -0.17444801330566406, -0.16798782348632812, -0.1615276336669922, -0.15506744384765625, -0.1486072540283203, -0.14214706420898438, -0.13568687438964844, -0.1292266845703125, -0.12276649475097656, -0.11630630493164062, -0.10984611511230469, -0.10338592529296875, -0.09692573547363281, -0.09046554565429688, -0.08400535583496094, -0.077545166015625, -0.07108497619628906, -0.06462478637695312, -0.05816459655761719, -0.05170440673828125, -0.04524421691894531, -0.038784027099609375, -0.03232383728027344, -0.0258636474609375, -0.019403457641601562, -0.012943267822265625, -0.0064830780029296875, -2.288818359375e-05, 0.0064373016357421875, 0.012897491455078125, 0.019357681274414062, 0.02581787109375, 0.03227806091308594, 0.038738250732421875, 0.04519844055175781, 0.05165863037109375, 0.05811882019042969, 0.06457901000976562, 0.07103919982910156, 0.0774993896484375, 0.08395957946777344, 0.09041976928710938, 0.09687995910644531, 0.10334014892578125, 0.10980033874511719, 0.11626052856445312, 0.12272071838378906, 0.129180908203125, 0.13564109802246094, 0.14210128784179688, 0.1485614776611328, 0.15502166748046875, 0.1614818572998047, 0.16794204711914062, 0.17440223693847656, 0.1808624267578125, 0.18732261657714844, 0.19378280639648438, 0.2002429962158203, 0.20670318603515625, 0.2131633758544922, 0.21962356567382812, 0.22608375549316406, 0.2325439453125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 7.0, 10.0, 17.0, 23.0, 15.0, 29.0, 21.0, 42.0, 48.0, 29.0, 45.0, 52.0, 58.0, 70.0, 52.0, 51.0, 46.0, 44.0, 36.0, 33.0, 50.0, 35.0, 30.0, 29.0, 23.0, 24.0, 17.0, 13.0, 12.0, 8.0, 6.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12353515625, -0.11874961853027344, -0.11396408081054688, -0.10917854309082031, -0.10439300537109375, -0.09960746765136719, -0.09482192993164062, -0.09003639221191406, -0.0852508544921875, -0.08046531677246094, -0.07567977905273438, -0.07089424133300781, -0.06610870361328125, -0.06132316589355469, -0.056537628173828125, -0.05175209045410156, -0.046966552734375, -0.04218101501464844, -0.037395477294921875, -0.03260993957519531, -0.02782440185546875, -0.023038864135742188, -0.018253326416015625, -0.013467788696289062, -0.0086822509765625, -0.0038967132568359375, 0.000888824462890625, 0.0056743621826171875, 0.01045989990234375, 0.015245437622070312, 0.020030975341796875, 0.024816513061523438, 0.02960205078125, 0.03438758850097656, 0.039173126220703125, 0.04395866394042969, 0.04874420166015625, 0.05352973937988281, 0.058315277099609375, 0.06310081481933594, 0.0678863525390625, 0.07267189025878906, 0.07745742797851562, 0.08224296569824219, 0.08702850341796875, 0.09181404113769531, 0.09659957885742188, 0.10138511657714844, 0.106170654296875, 0.11095619201660156, 0.11574172973632812, 0.12052726745605469, 0.12531280517578125, 0.1300983428955078, 0.13488388061523438, 0.13966941833496094, 0.1444549560546875, 0.14924049377441406, 0.15402603149414062, 0.1588115692138672, 0.16359710693359375, 0.1683826446533203, 0.17316818237304688, 0.17795372009277344, 0.1827392578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 10.0, 11.0, 7.0, 10.0, 15.0, 19.0, 32.0, 41.0, 52.0, 102.0, 180.0, 232.0, 474.0, 916.0, 2150.0, 6616.0, 27152.0, 191785.0, 701539.0, 93598.0, 15810.0, 4303.0, 1684.0, 796.0, 379.0, 197.0, 139.0, 81.0, 44.0, 42.0, 25.0, 25.0, 17.0, 18.0, 7.0, 10.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3466796875, -0.3359565734863281, -0.32523345947265625, -0.3145103454589844, -0.3037872314453125, -0.2930641174316406, -0.28234100341796875, -0.2716178894042969, -0.260894775390625, -0.2501716613769531, -0.23944854736328125, -0.22872543334960938, -0.2180023193359375, -0.20727920532226562, -0.19655609130859375, -0.18583297729492188, -0.17510986328125, -0.16438674926757812, -0.15366363525390625, -0.14294052124023438, -0.1322174072265625, -0.12149429321289062, -0.11077117919921875, -0.10004806518554688, -0.089324951171875, -0.07860183715820312, -0.06787872314453125, -0.057155609130859375, -0.0464324951171875, -0.035709381103515625, -0.02498626708984375, -0.014263153076171875, -0.0035400390625, 0.007183074951171875, 0.01790618896484375, 0.028629302978515625, 0.0393524169921875, 0.050075531005859375, 0.06079864501953125, 0.07152175903320312, 0.082244873046875, 0.09296798706054688, 0.10369110107421875, 0.11441421508789062, 0.1251373291015625, 0.13586044311523438, 0.14658355712890625, 0.15730667114257812, 0.16802978515625, 0.17875289916992188, 0.18947601318359375, 0.20019912719726562, 0.2109222412109375, 0.22164535522460938, 0.23236846923828125, 0.24309158325195312, 0.253814697265625, 0.2645378112792969, 0.27526092529296875, 0.2859840393066406, 0.2967071533203125, 0.3074302673339844, 0.31815338134765625, 0.3288764953613281, 0.339599609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 8.0, 5.0, 12.0, 17.0, 23.0, 32.0, 36.0, 55.0, 66.0, 53.0, 64.0, 71.0, 71.0, 56.0, 65.0, 56.0, 48.0, 57.0, 40.0, 39.0, 25.0, 31.0, 16.0, 11.0, 8.0, 13.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6650238037109375, -0.642059326171875, -0.6190948486328125, -0.59613037109375, -0.5731658935546875, -0.550201416015625, -0.5272369384765625, -0.5042724609375, -0.4813079833984375, -0.458343505859375, -0.4353790283203125, -0.41241455078125, -0.3894500732421875, -0.366485595703125, -0.3435211181640625, -0.320556640625, -0.2975921630859375, -0.274627685546875, -0.2516632080078125, -0.22869873046875, -0.2057342529296875, -0.182769775390625, -0.1598052978515625, -0.1368408203125, -0.1138763427734375, -0.090911865234375, -0.0679473876953125, -0.04498291015625, -0.0220184326171875, 0.000946044921875, 0.0239105224609375, 0.046875, 0.0698394775390625, 0.092803955078125, 0.1157684326171875, 0.13873291015625, 0.1616973876953125, 0.184661865234375, 0.2076263427734375, 0.2305908203125, 0.2535552978515625, 0.276519775390625, 0.2994842529296875, 0.32244873046875, 0.3454132080078125, 0.368377685546875, 0.3913421630859375, 0.414306640625, 0.4372711181640625, 0.460235595703125, 0.4832000732421875, 0.50616455078125, 0.5291290283203125, 0.552093505859375, 0.5750579833984375, 0.5980224609375, 0.6209869384765625, 0.643951416015625, 0.6669158935546875, 0.68988037109375, 0.7128448486328125, 0.735809326171875, 0.7587738037109375, 0.78173828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 17.0, 10.0, 25.0, 35.0, 54.0, 92.0, 183.0, 309.0, 589.0, 1342.0, 3235.0, 9808.0, 39119.0, 229742.0, 649985.0, 86234.0, 18584.0, 5380.0, 1969.0, 894.0, 375.0, 237.0, 127.0, 75.0, 44.0, 23.0, 22.0, 16.0, 4.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15771484375, -0.1531085968017578, -0.14850234985351562, -0.14389610290527344, -0.13928985595703125, -0.13468360900878906, -0.13007736206054688, -0.1254711151123047, -0.1208648681640625, -0.11625862121582031, -0.11165237426757812, -0.10704612731933594, -0.10243988037109375, -0.09783363342285156, -0.09322738647460938, -0.08862113952636719, -0.084014892578125, -0.07940864562988281, -0.07480239868164062, -0.07019615173339844, -0.06558990478515625, -0.06098365783691406, -0.056377410888671875, -0.05177116394042969, -0.0471649169921875, -0.04255867004394531, -0.037952423095703125, -0.03334617614746094, -0.02873992919921875, -0.024133682250976562, -0.019527435302734375, -0.014921188354492188, -0.01031494140625, -0.0057086944580078125, -0.001102447509765625, 0.0035037994384765625, 0.00811004638671875, 0.012716293334960938, 0.017322540283203125, 0.021928787231445312, 0.0265350341796875, 0.031141281127929688, 0.035747528076171875, 0.04035377502441406, 0.04496002197265625, 0.04956626892089844, 0.054172515869140625, 0.05877876281738281, 0.063385009765625, 0.06799125671386719, 0.07259750366210938, 0.07720375061035156, 0.08180999755859375, 0.08641624450683594, 0.09102249145507812, 0.09562873840332031, 0.1002349853515625, 0.10484123229980469, 0.10944747924804688, 0.11405372619628906, 0.11865997314453125, 0.12326622009277344, 0.12787246704101562, 0.1324787139892578, 0.1370849609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 7.0, 8.0, 12.0, 7.0, 15.0, 23.0, 23.0, 42.0, 55.0, 67.0, 102.0, 104.0, 103.0, 103.0, 74.0, 74.0, 47.0, 28.0, 25.0, 17.0, 22.0, 16.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.13060188293457e-05, -3.999192267656326e-05, -3.867782652378082e-05, -3.736373037099838e-05, -3.604963421821594e-05, -3.47355380654335e-05, -3.342144191265106e-05, -3.210734575986862e-05, -3.079324960708618e-05, -2.947915345430374e-05, -2.81650573015213e-05, -2.685096114873886e-05, -2.553686499595642e-05, -2.422276884317398e-05, -2.290867269039154e-05, -2.15945765376091e-05, -2.028048038482666e-05, -1.896638423204422e-05, -1.765228807926178e-05, -1.633819192647934e-05, -1.50240957736969e-05, -1.370999962091446e-05, -1.2395903468132019e-05, -1.1081807315349579e-05, -9.767711162567139e-06, -8.453615009784698e-06, -7.139518857002258e-06, -5.825422704219818e-06, -4.511326551437378e-06, -3.1972303986549377e-06, -1.8831342458724976e-06, -5.690380930900574e-07, 7.450580596923828e-07, 2.059154212474823e-06, 3.373250365257263e-06, 4.687346518039703e-06, 6.0014426708221436e-06, 7.315538823604584e-06, 8.629634976387024e-06, 9.943731129169464e-06, 1.1257827281951904e-05, 1.2571923434734344e-05, 1.3886019587516785e-05, 1.5200115740299225e-05, 1.6514211893081665e-05, 1.7828308045864105e-05, 1.9142404198646545e-05, 2.0456500351428986e-05, 2.1770596504211426e-05, 2.3084692656993866e-05, 2.4398788809776306e-05, 2.5712884962558746e-05, 2.7026981115341187e-05, 2.8341077268123627e-05, 2.9655173420906067e-05, 3.096926957368851e-05, 3.228336572647095e-05, 3.359746187925339e-05, 3.491155803203583e-05, 3.622565418481827e-05, 3.753975033760071e-05, 3.885384649038315e-05, 4.016794264316559e-05, 4.148203879594803e-05, 4.279613494873047e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 5.0, 9.0, 20.0, 27.0, 38.0, 58.0, 102.0, 186.0, 327.0, 661.0, 1336.0, 3280.0, 10837.0, 54130.0, 529903.0, 381067.0, 50328.0, 10320.0, 3151.0, 1315.0, 625.0, 323.0, 197.0, 114.0, 69.0, 36.0, 28.0, 13.0, 12.0, 11.0, 10.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12005615234375, -0.1150503158569336, -0.11004447937011719, -0.10503864288330078, -0.10003280639648438, -0.09502696990966797, -0.09002113342285156, -0.08501529693603516, -0.08000946044921875, -0.07500362396240234, -0.06999778747558594, -0.06499195098876953, -0.059986114501953125, -0.05498027801513672, -0.04997444152832031, -0.044968605041503906, -0.0399627685546875, -0.034956932067871094, -0.029951095581054688, -0.02494525909423828, -0.019939422607421875, -0.014933586120605469, -0.009927749633789062, -0.004921913146972656, 8.392333984375e-05, 0.005089759826660156, 0.010095596313476562, 0.015101432800292969, 0.020107269287109375, 0.02511310577392578, 0.030118942260742188, 0.035124778747558594, 0.040130615234375, 0.045136451721191406, 0.05014228820800781, 0.05514812469482422, 0.060153961181640625, 0.06515979766845703, 0.07016563415527344, 0.07517147064208984, 0.08017730712890625, 0.08518314361572266, 0.09018898010253906, 0.09519481658935547, 0.10020065307617188, 0.10520648956298828, 0.11021232604980469, 0.1152181625366211, 0.1202239990234375, 0.1252298355102539, 0.1302356719970703, 0.13524150848388672, 0.14024734497070312, 0.14525318145751953, 0.15025901794433594, 0.15526485443115234, 0.16027069091796875, 0.16527652740478516, 0.17028236389160156, 0.17528820037841797, 0.18029403686523438, 0.18529987335205078, 0.1903057098388672, 0.1953115463256836, 0.2003173828125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 6.0, 13.0, 14.0, 18.0, 28.0, 43.0, 62.0, 77.0, 90.0, 102.0, 106.0, 97.0, 76.0, 69.0, 52.0, 46.0, 27.0, 20.0, 13.0, 12.0, 12.0, 7.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1422119140625, -0.13680076599121094, -0.13138961791992188, -0.1259784698486328, -0.12056732177734375, -0.11515617370605469, -0.10974502563476562, -0.10433387756347656, -0.0989227294921875, -0.09351158142089844, -0.08810043334960938, -0.08268928527832031, -0.07727813720703125, -0.07186698913574219, -0.06645584106445312, -0.06104469299316406, -0.055633544921875, -0.05022239685058594, -0.044811248779296875, -0.03940010070800781, -0.03398895263671875, -0.028577804565429688, -0.023166656494140625, -0.017755508422851562, -0.0123443603515625, -0.0069332122802734375, -0.001522064208984375, 0.0038890838623046875, 0.00930023193359375, 0.014711380004882812, 0.020122528076171875, 0.025533676147460938, 0.03094482421875, 0.03635597229003906, 0.041767120361328125, 0.04717826843261719, 0.05258941650390625, 0.05800056457519531, 0.06341171264648438, 0.06882286071777344, 0.0742340087890625, 0.07964515686035156, 0.08505630493164062, 0.09046745300292969, 0.09587860107421875, 0.10128974914550781, 0.10670089721679688, 0.11211204528808594, 0.117523193359375, 0.12293434143066406, 0.12834548950195312, 0.1337566375732422, 0.13916778564453125, 0.1445789337158203, 0.14999008178710938, 0.15540122985839844, 0.1608123779296875, 0.16622352600097656, 0.17163467407226562, 0.1770458221435547, 0.18245697021484375, 0.1878681182861328, 0.19327926635742188, 0.19869041442871094, 0.2041015625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 11.0, 15.0, 53.0, 138.0, 368.0, 226.0, 98.0, 42.0, 22.0, 11.0, 3.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.138543128967285, -4.003957271575928, -3.869371175765991, -3.7347850799560547, -3.6001992225646973, -3.4656131267547607, -3.331027030944824, -3.196441173553467, -3.0618550777435303, -2.9272689819335938, -2.7926831245422363, -2.6580970287323, -2.5235109329223633, -2.388925075531006, -2.2543389797210693, -2.119752883911133, -1.9851670265197754, -1.8505810499191284, -1.7159950733184814, -1.581408977508545, -1.446823000907898, -1.312237024307251, -1.1776509284973145, -1.0430649518966675, -0.9084789752960205, -0.7738929986953735, -0.6393069624900818, -0.50472092628479, -0.37013494968414307, -0.2355489730834961, -0.10096293687820435, 0.0336230993270874, 0.16820955276489258, 0.30279555916786194, 0.4373815655708313, 0.571967601776123, 0.70655357837677, 0.841139554977417, 0.9757255911827087, 1.1103116273880005, 1.2448976039886475, 1.3794835805892944, 1.5140695571899414, 1.648655652999878, 1.783241629600525, 1.9178276062011719, 2.0524137020111084, 2.186999797821045, 2.3215856552124023, 2.456171751022339, 2.5907576084136963, 2.725343704223633, 2.8599295616149902, 2.9945156574249268, 3.1291017532348633, 3.2636876106262207, 3.3982737064361572, 3.5328598022460938, 3.667445659637451, 3.8020317554473877, 3.936617851257324, 4.071203708648682, 4.205789566040039, 4.340375900268555, 4.474961757659912]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 4.0, 9.0, 2.0, 7.0, 11.0, 9.0, 6.0, 18.0, 18.0, 6.0, 22.0, 18.0, 15.0, 18.0, 21.0, 25.0, 27.0, 34.0, 41.0, 58.0, 57.0, 69.0, 82.0, 69.0, 38.0, 29.0, 41.0, 23.0, 36.0, 27.0, 17.0, 20.0, 25.0, 13.0, 8.0, 12.0, 14.0, 10.0, 4.0, 5.0, 5.0, 5.0, 4.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.6017582416534424, -1.5445072650909424, -1.4872561693191528, -1.4300051927566528, -1.3727542161941528, -1.3155031204223633, -1.2582521438598633, -1.2010011672973633, -1.1437501907348633, -1.0864992141723633, -1.0292481184005737, -0.9719971418380737, -0.9147461652755737, -0.857495129108429, -0.8002440929412842, -0.7429931163787842, -0.6857420802116394, -0.6284910440444946, -0.5712400674819946, -0.5139890313148499, -0.45673805475234985, -0.3994870185852051, -0.3422360122203827, -0.2849850058555603, -0.22773399949073792, -0.17048299312591553, -0.11323197931051254, -0.05598096549510956, 0.0012700408697128296, 0.05852106213569641, 0.1157720685005188, 0.1730230748653412, 0.23027408123016357, 0.28752508759498596, 0.34477609395980835, 0.4020271301269531, 0.4592781066894531, 0.5165291428565979, 0.5737801790237427, 0.6310311555862427, 0.6882821321487427, 0.7455331683158875, 0.8027841448783875, 0.8600351810455322, 0.9172861576080322, 0.974537193775177, 1.0317882299423218, 1.0890392065048218, 1.1462903022766113, 1.2035412788391113, 1.2607923746109009, 1.3180433511734009, 1.3752943277359009, 1.4325454235076904, 1.4897964000701904, 1.5470473766326904, 1.6042983531951904, 1.6615493297576904, 1.71880042552948, 1.77605140209198, 1.83330237865448, 1.8905534744262695, 1.9478044509887695, 2.0050554275512695, 2.0623064041137695]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 4.0, 2.0, 5.0, 12.0, 24.0, 31.0, 32.0, 69.0, 108.0, 172.0, 280.0, 438.0, 675.0, 1161.0, 1893.0, 3447.0, 6629.0, 13700.0, 33753.0, 103302.0, 402006.0, 1646387.0, 1482275.0, 350428.0, 91498.0, 29836.0, 12356.0, 5959.0, 3134.0, 1875.0, 1073.0, 653.0, 408.0, 267.0, 150.0, 69.0, 59.0, 35.0, 27.0, 18.0, 14.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14013671875, -0.13600921630859375, -0.1318817138671875, -0.12775421142578125, -0.123626708984375, -0.11949920654296875, -0.1153717041015625, -0.11124420166015625, -0.10711669921875, -0.10298919677734375, -0.0988616943359375, -0.09473419189453125, -0.090606689453125, -0.08647918701171875, -0.0823516845703125, -0.07822418212890625, -0.0740966796875, -0.06996917724609375, -0.0658416748046875, -0.06171417236328125, -0.057586669921875, -0.05345916748046875, -0.0493316650390625, -0.04520416259765625, -0.04107666015625, -0.03694915771484375, -0.0328216552734375, -0.02869415283203125, -0.024566650390625, -0.02043914794921875, -0.0163116455078125, -0.01218414306640625, -0.008056640625, -0.00392913818359375, 0.0001983642578125, 0.00432586669921875, 0.008453369140625, 0.01258087158203125, 0.0167083740234375, 0.02083587646484375, 0.02496337890625, 0.02909088134765625, 0.0332183837890625, 0.03734588623046875, 0.041473388671875, 0.04560089111328125, 0.0497283935546875, 0.05385589599609375, 0.0579833984375, 0.06211090087890625, 0.0662384033203125, 0.07036590576171875, 0.074493408203125, 0.07862091064453125, 0.0827484130859375, 0.08687591552734375, 0.09100341796875, 0.09513092041015625, 0.0992584228515625, 0.10338592529296875, 0.107513427734375, 0.11164093017578125, 0.1157684326171875, 0.11989593505859375, 0.1240234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 6.0, 5.0, 7.0, 11.0, 14.0, 20.0, 23.0, 29.0, 22.0, 38.0, 36.0, 63.0, 51.0, 60.0, 61.0, 54.0, 53.0, 62.0, 59.0, 50.0, 51.0, 45.0, 35.0, 37.0, 22.0, 18.0, 18.0, 12.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.123931884765625, -0.11895751953125, -0.113983154296875, -0.1090087890625, -0.104034423828125, -0.09906005859375, -0.094085693359375, -0.089111328125, -0.084136962890625, -0.07916259765625, -0.074188232421875, -0.0692138671875, -0.064239501953125, -0.05926513671875, -0.054290771484375, -0.04931640625, -0.044342041015625, -0.03936767578125, -0.034393310546875, -0.0294189453125, -0.024444580078125, -0.01947021484375, -0.014495849609375, -0.009521484375, -0.004547119140625, 0.00042724609375, 0.005401611328125, 0.0103759765625, 0.015350341796875, 0.02032470703125, 0.025299072265625, 0.0302734375, 0.035247802734375, 0.04022216796875, 0.045196533203125, 0.0501708984375, 0.055145263671875, 0.06011962890625, 0.065093994140625, 0.070068359375, 0.075042724609375, 0.08001708984375, 0.084991455078125, 0.0899658203125, 0.094940185546875, 0.09991455078125, 0.104888916015625, 0.10986328125, 0.114837646484375, 0.11981201171875, 0.124786376953125, 0.1297607421875, 0.134735107421875, 0.13970947265625, 0.144683837890625, 0.149658203125, 0.154632568359375, 0.15960693359375, 0.164581298828125, 0.1695556640625, 0.174530029296875, 0.17950439453125, 0.184478759765625, 0.189453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 2.0, 2.0, 10.0, 14.0, 15.0, 28.0, 38.0, 43.0, 70.0, 129.0, 333.0, 940.0, 3906.0, 24059.0, 455195.0, 3603635.0, 92717.0, 10125.0, 1950.0, 569.0, 226.0, 105.0, 52.0, 42.0, 16.0, 21.0, 14.0, 11.0, 9.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.383544921875, -0.3677482604980469, -0.35195159912109375, -0.3361549377441406, -0.3203582763671875, -0.3045616149902344, -0.28876495361328125, -0.2729682922363281, -0.257171630859375, -0.24137496948242188, -0.22557830810546875, -0.20978164672851562, -0.1939849853515625, -0.17818832397460938, -0.16239166259765625, -0.14659500122070312, -0.13079833984375, -0.11500167846679688, -0.09920501708984375, -0.08340835571289062, -0.0676116943359375, -0.051815032958984375, -0.03601837158203125, -0.020221710205078125, -0.004425048828125, 0.011371612548828125, 0.02716827392578125, 0.042964935302734375, 0.0587615966796875, 0.07455825805664062, 0.09035491943359375, 0.10615158081054688, 0.1219482421875, 0.13774490356445312, 0.15354156494140625, 0.16933822631835938, 0.1851348876953125, 0.20093154907226562, 0.21672821044921875, 0.23252487182617188, 0.248321533203125, 0.2641181945800781, 0.27991485595703125, 0.2957115173339844, 0.3115081787109375, 0.3273048400878906, 0.34310150146484375, 0.3588981628417969, 0.37469482421875, 0.3904914855957031, 0.40628814697265625, 0.4220848083496094, 0.4378814697265625, 0.4536781311035156, 0.46947479248046875, 0.4852714538574219, 0.501068115234375, 0.5168647766113281, 0.5326614379882812, 0.5484580993652344, 0.5642547607421875, 0.5800514221191406, 0.5958480834960938, 0.6116447448730469, 0.62744140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 8.0, 2.0, 6.0, 12.0, 10.0, 19.0, 19.0, 32.0, 42.0, 58.0, 100.0, 171.0, 275.0, 437.0, 746.0, 810.0, 524.0, 287.0, 167.0, 104.0, 64.0, 41.0, 34.0, 33.0, 17.0, 10.0, 10.0, 13.0, 5.0, 7.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3916015625, -0.3810615539550781, -0.37052154541015625, -0.3599815368652344, -0.3494415283203125, -0.3389015197753906, -0.32836151123046875, -0.3178215026855469, -0.307281494140625, -0.2967414855957031, -0.28620147705078125, -0.2756614685058594, -0.2651214599609375, -0.2545814514160156, -0.24404144287109375, -0.23350143432617188, -0.22296142578125, -0.21242141723632812, -0.20188140869140625, -0.19134140014648438, -0.1808013916015625, -0.17026138305664062, -0.15972137451171875, -0.14918136596679688, -0.138641357421875, -0.12810134887695312, -0.11756134033203125, -0.10702133178710938, -0.0964813232421875, -0.08594131469726562, -0.07540130615234375, -0.06486129760742188, -0.0543212890625, -0.043781280517578125, -0.03324127197265625, -0.022701263427734375, -0.0121612548828125, -0.001621246337890625, 0.00891876220703125, 0.019458770751953125, 0.029998779296875, 0.040538787841796875, 0.05107879638671875, 0.061618804931640625, 0.0721588134765625, 0.08269882202148438, 0.09323883056640625, 0.10377883911132812, 0.11431884765625, 0.12485885620117188, 0.13539886474609375, 0.14593887329101562, 0.1564788818359375, 0.16701889038085938, 0.17755889892578125, 0.18809890747070312, 0.198638916015625, 0.20917892456054688, 0.21971893310546875, 0.23025894165039062, 0.2407989501953125, 0.2513389587402344, 0.26187896728515625, 0.2724189758300781, 0.282958984375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 5.0, 3.0, 10.0, 24.0, 64.0, 145.0, 249.0, 246.0, 146.0, 69.0, 27.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0440897941589355, -4.911666393280029, -4.779242515563965, -4.646819114685059, -4.514395236968994, -4.381971836090088, -4.249547958374023, -4.117124557495117, -3.984700918197632, -3.8522772789001465, -3.719853639602661, -3.587430000305176, -3.4550065994262695, -3.322582721710205, -3.190159320831299, -3.0577356815338135, -2.925312042236328, -2.7928884029388428, -2.6604647636413574, -2.528041124343872, -2.3956174850463867, -2.2631940841674805, -2.130770444869995, -1.9983468055725098, -1.8659231662750244, -1.733499526977539, -1.6010758876800537, -1.468652367591858, -1.3362287282943726, -1.2038050889968872, -1.0713815689086914, -0.938957929611206, -0.8065338134765625, -0.6741101741790771, -0.5416865944862366, -0.4092629849910736, -0.27683937549591064, -0.1444157361984253, -0.011992156505584717, 0.12043142318725586, 0.2528550624847412, 0.3852786719799042, 0.5177022814750671, 0.6501258611679077, 0.7825495004653931, 0.9149731397628784, 1.0473966598510742, 1.1798202991485596, 1.312243938446045, 1.4446675777435303, 1.5770912170410156, 1.7095147371292114, 1.8419383764266968, 1.9743620157241821, 2.106785535812378, 2.2392091751098633, 2.3716328144073486, 2.504056453704834, 2.6364800930023193, 2.7689037322998047, 2.901327133178711, 3.0337510108947754, 3.1661744117736816, 3.298598051071167, 3.4310216903686523]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 11.0, 6.0, 8.0, 9.0, 17.0, 17.0, 15.0, 25.0, 34.0, 31.0, 37.0, 46.0, 47.0, 49.0, 33.0, 54.0, 46.0, 53.0, 44.0, 46.0, 44.0, 52.0, 53.0, 33.0, 30.0, 29.0, 30.0, 25.0, 16.0, 16.0, 13.0, 6.0, 4.0, 2.0, 4.0, 7.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3673722743988037, -1.3215018510818481, -1.2756314277648926, -1.229761004447937, -1.1838905811309814, -1.1380200386047363, -1.0921496152877808, -1.0462791919708252, -1.0004087686538696, -0.9545383453369141, -0.9086679220199585, -0.8627974390983582, -0.8169270157814026, -0.771056592464447, -0.7251861095428467, -0.6793156862258911, -0.6334452629089355, -0.58757483959198, -0.5417044162750244, -0.4958339333534241, -0.4499635100364685, -0.40409308671951294, -0.358222633600235, -0.31235218048095703, -0.26648175716400146, -0.2206113189458847, -0.17474088072776794, -0.12887044250965118, -0.08300000429153442, -0.037129566073417664, 0.008740872144699097, 0.05461132526397705, 0.10048174858093262, 0.14635218679904938, 0.19222262501716614, 0.2380930632352829, 0.28396350145339966, 0.3298339247703552, 0.3757043778896332, 0.42157483100891113, 0.4674452543258667, 0.5133156776428223, 0.5591861009597778, 0.6050565838813782, 0.6509270071983337, 0.6967974305152893, 0.7426679134368896, 0.7885383367538452, 0.8344087600708008, 0.8802791833877563, 0.9261496067047119, 0.9720200896263123, 1.017890453338623, 1.0637609958648682, 1.1096314191818237, 1.1555018424987793, 1.2013722658157349, 1.2472426891326904, 1.293113112449646, 1.3389835357666016, 1.3848540782928467, 1.4307245016098022, 1.4765949249267578, 1.5224653482437134, 1.568335771560669]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 9.0, 16.0, 13.0, 24.0, 38.0, 45.0, 36.0, 69.0, 129.0, 173.0, 230.0, 398.0, 610.0, 1126.0, 2025.0, 4449.0, 10884.0, 30482.0, 105444.0, 432839.0, 338181.0, 79935.0, 24216.0, 8927.0, 3840.0, 1819.0, 969.0, 542.0, 338.0, 208.0, 145.0, 92.0, 80.0, 62.0, 39.0, 29.0, 33.0, 14.0, 12.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.239990234375, -0.23291015625, -0.225830078125, -0.21875, -0.211669921875, -0.20458984375, -0.197509765625, -0.1904296875, -0.183349609375, -0.17626953125, -0.169189453125, -0.162109375, -0.155029296875, -0.14794921875, -0.140869140625, -0.1337890625, -0.126708984375, -0.11962890625, -0.112548828125, -0.10546875, -0.098388671875, -0.09130859375, -0.084228515625, -0.0771484375, -0.070068359375, -0.06298828125, -0.055908203125, -0.048828125, -0.041748046875, -0.03466796875, -0.027587890625, -0.0205078125, -0.013427734375, -0.00634765625, 0.000732421875, 0.0078125, 0.014892578125, 0.02197265625, 0.029052734375, 0.0361328125, 0.043212890625, 0.05029296875, 0.057373046875, 0.064453125, 0.071533203125, 0.07861328125, 0.085693359375, 0.0927734375, 0.099853515625, 0.10693359375, 0.114013671875, 0.12109375, 0.128173828125, 0.13525390625, 0.142333984375, 0.1494140625, 0.156494140625, 0.16357421875, 0.170654296875, 0.177734375, 0.184814453125, 0.19189453125, 0.198974609375, 0.2060546875, 0.213134765625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 9.0, 12.0, 10.0, 14.0, 27.0, 15.0, 19.0, 28.0, 33.0, 46.0, 25.0, 37.0, 36.0, 46.0, 49.0, 50.0, 50.0, 38.0, 52.0, 63.0, 38.0, 39.0, 30.0, 35.0, 27.0, 29.0, 24.0, 16.0, 13.0, 15.0, 16.0, 15.0, 10.0, 5.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11859130859375, -0.11428546905517578, -0.10997962951660156, -0.10567378997802734, -0.10136795043945312, -0.0970621109008789, -0.09275627136230469, -0.08845043182373047, -0.08414459228515625, -0.07983875274658203, -0.07553291320800781, -0.0712270736694336, -0.06692123413085938, -0.06261539459228516, -0.05830955505371094, -0.05400371551513672, -0.0496978759765625, -0.04539203643798828, -0.04108619689941406, -0.036780357360839844, -0.032474517822265625, -0.028168678283691406, -0.023862838745117188, -0.01955699920654297, -0.01525115966796875, -0.010945320129394531, -0.0066394805908203125, -0.0023336410522460938, 0.001972198486328125, 0.006278038024902344, 0.010583877563476562, 0.014889717102050781, 0.019195556640625, 0.02350139617919922, 0.027807235717773438, 0.032113075256347656, 0.036418914794921875, 0.040724754333496094, 0.04503059387207031, 0.04933643341064453, 0.05364227294921875, 0.05794811248779297, 0.06225395202636719, 0.0665597915649414, 0.07086563110351562, 0.07517147064208984, 0.07947731018066406, 0.08378314971923828, 0.0880889892578125, 0.09239482879638672, 0.09670066833496094, 0.10100650787353516, 0.10531234741210938, 0.1096181869506836, 0.11392402648925781, 0.11822986602783203, 0.12253570556640625, 0.12684154510498047, 0.1311473846435547, 0.1354532241821289, 0.13975906372070312, 0.14406490325927734, 0.14837074279785156, 0.15267658233642578, 0.156982421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 6.0, 11.0, 9.0, 18.0, 28.0, 51.0, 64.0, 101.0, 153.0, 262.0, 496.0, 1004.0, 2531.0, 8028.0, 42743.0, 671849.0, 282905.0, 28249.0, 6195.0, 1935.0, 865.0, 433.0, 221.0, 137.0, 78.0, 48.0, 42.0, 34.0, 22.0, 14.0, 8.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28564453125, -0.27368927001953125, -0.2617340087890625, -0.24977874755859375, -0.237823486328125, -0.22586822509765625, -0.2139129638671875, -0.20195770263671875, -0.19000244140625, -0.17804718017578125, -0.1660919189453125, -0.15413665771484375, -0.142181396484375, -0.13022613525390625, -0.1182708740234375, -0.10631561279296875, -0.0943603515625, -0.08240509033203125, -0.0704498291015625, -0.05849456787109375, -0.046539306640625, -0.03458404541015625, -0.0226287841796875, -0.01067352294921875, 0.00128173828125, 0.01323699951171875, 0.0251922607421875, 0.03714752197265625, 0.049102783203125, 0.06105804443359375, 0.0730133056640625, 0.08496856689453125, 0.096923828125, 0.10887908935546875, 0.1208343505859375, 0.13278961181640625, 0.144744873046875, 0.15670013427734375, 0.1686553955078125, 0.18061065673828125, 0.19256591796875, 0.20452117919921875, 0.2164764404296875, 0.22843170166015625, 0.240386962890625, 0.25234222412109375, 0.2642974853515625, 0.27625274658203125, 0.2882080078125, 0.30016326904296875, 0.3121185302734375, 0.32407379150390625, 0.336029052734375, 0.34798431396484375, 0.3599395751953125, 0.37189483642578125, 0.38385009765625, 0.39580535888671875, 0.4077606201171875, 0.41971588134765625, 0.431671142578125, 0.44362640380859375, 0.4555816650390625, 0.46753692626953125, 0.4794921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 3.0, 10.0, 22.0, 13.0, 19.0, 23.0, 30.0, 38.0, 50.0, 32.0, 65.0, 50.0, 62.0, 61.0, 58.0, 52.0, 59.0, 52.0, 46.0, 44.0, 38.0, 26.0, 19.0, 17.0, 24.0, 14.0, 8.0, 12.0, 7.0, 10.0, 8.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5231170654296875, -0.504730224609375, -0.4863433837890625, -0.46795654296875, -0.4495697021484375, -0.431182861328125, -0.4127960205078125, -0.3944091796875, -0.3760223388671875, -0.357635498046875, -0.3392486572265625, -0.32086181640625, -0.3024749755859375, -0.284088134765625, -0.2657012939453125, -0.247314453125, -0.2289276123046875, -0.210540771484375, -0.1921539306640625, -0.17376708984375, -0.1553802490234375, -0.136993408203125, -0.1186065673828125, -0.1002197265625, -0.0818328857421875, -0.063446044921875, -0.0450592041015625, -0.02667236328125, -0.0082855224609375, 0.010101318359375, 0.0284881591796875, 0.046875, 0.0652618408203125, 0.083648681640625, 0.1020355224609375, 0.12042236328125, 0.1388092041015625, 0.157196044921875, 0.1755828857421875, 0.1939697265625, 0.2123565673828125, 0.230743408203125, 0.2491302490234375, 0.26751708984375, 0.2859039306640625, 0.304290771484375, 0.3226776123046875, 0.341064453125, 0.3594512939453125, 0.377838134765625, 0.3962249755859375, 0.41461181640625, 0.4329986572265625, 0.451385498046875, 0.4697723388671875, 0.4881591796875, 0.5065460205078125, 0.524932861328125, 0.5433197021484375, 0.56170654296875, 0.5800933837890625, 0.598480224609375, 0.6168670654296875, 0.63525390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 9.0, 2.0, 6.0, 11.0, 14.0, 30.0, 28.0, 33.0, 44.0, 59.0, 100.0, 145.0, 196.0, 303.0, 529.0, 829.0, 1454.0, 2780.0, 5724.0, 12783.0, 31947.0, 99060.0, 586230.0, 209806.0, 57592.0, 20768.0, 8862.0, 4106.0, 2084.0, 1148.0, 673.0, 420.0, 249.0, 160.0, 107.0, 80.0, 46.0, 32.0, 23.0, 13.0, 8.0, 10.0, 7.0, 5.0, 7.0, 4.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 4.0], "bins": [-0.08319091796875, -0.08065223693847656, -0.07811355590820312, -0.07557487487792969, -0.07303619384765625, -0.07049751281738281, -0.06795883178710938, -0.06542015075683594, -0.0628814697265625, -0.06034278869628906, -0.057804107666015625, -0.05526542663574219, -0.05272674560546875, -0.05018806457519531, -0.047649383544921875, -0.04511070251464844, -0.042572021484375, -0.04003334045410156, -0.037494659423828125, -0.03495597839355469, -0.03241729736328125, -0.029878616333007812, -0.027339935302734375, -0.024801254272460938, -0.0222625732421875, -0.019723892211914062, -0.017185211181640625, -0.014646530151367188, -0.01210784912109375, -0.009569168090820312, -0.007030487060546875, -0.0044918060302734375, -0.001953125, 0.0005855560302734375, 0.003124237060546875, 0.0056629180908203125, 0.00820159912109375, 0.010740280151367188, 0.013278961181640625, 0.015817642211914062, 0.0183563232421875, 0.020895004272460938, 0.023433685302734375, 0.025972366333007812, 0.02851104736328125, 0.031049728393554688, 0.033588409423828125, 0.03612709045410156, 0.038665771484375, 0.04120445251464844, 0.043743133544921875, 0.04628181457519531, 0.04882049560546875, 0.05135917663574219, 0.053897857666015625, 0.05643653869628906, 0.0589752197265625, 0.06151390075683594, 0.06405258178710938, 0.06659126281738281, 0.06912994384765625, 0.07166862487792969, 0.07420730590820312, 0.07674598693847656, 0.07928466796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 10.0, 6.0, 11.0, 10.0, 22.0, 24.0, 35.0, 39.0, 73.0, 83.0, 104.0, 117.0, 117.0, 100.0, 70.0, 46.0, 36.0, 23.0, 15.0, 16.0, 15.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.279613494873047e-05, -4.148110747337341e-05, -4.016607999801636e-05, -3.88510525226593e-05, -3.7536025047302246e-05, -3.622099757194519e-05, -3.4905970096588135e-05, -3.359094262123108e-05, -3.2275915145874023e-05, -3.096088767051697e-05, -2.9645860195159912e-05, -2.8330832719802856e-05, -2.70158052444458e-05, -2.5700777769088745e-05, -2.438575029373169e-05, -2.3070722818374634e-05, -2.1755695343017578e-05, -2.0440667867660522e-05, -1.9125640392303467e-05, -1.781061291694641e-05, -1.6495585441589355e-05, -1.51805579662323e-05, -1.3865530490875244e-05, -1.2550503015518188e-05, -1.1235475540161133e-05, -9.920448064804077e-06, -8.605420589447021e-06, -7.290393114089966e-06, -5.97536563873291e-06, -4.6603381633758545e-06, -3.345310688018799e-06, -2.030283212661743e-06, -7.152557373046875e-07, 5.997717380523682e-07, 1.914799213409424e-06, 3.2298266887664795e-06, 4.544854164123535e-06, 5.859881639480591e-06, 7.1749091148376465e-06, 8.489936590194702e-06, 9.804964065551758e-06, 1.1119991540908813e-05, 1.2435019016265869e-05, 1.3750046491622925e-05, 1.506507396697998e-05, 1.6380101442337036e-05, 1.7695128917694092e-05, 1.9010156393051147e-05, 2.0325183868408203e-05, 2.164021134376526e-05, 2.2955238819122314e-05, 2.427026629447937e-05, 2.5585293769836426e-05, 2.690032124519348e-05, 2.8215348720550537e-05, 2.9530376195907593e-05, 3.084540367126465e-05, 3.2160431146621704e-05, 3.347545862197876e-05, 3.4790486097335815e-05, 3.610551357269287e-05, 3.742054104804993e-05, 3.873556852340698e-05, 4.005059599876404e-05, 4.1365623474121094e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 10.0, 9.0, 11.0, 15.0, 25.0, 46.0, 51.0, 95.0, 140.0, 179.0, 314.0, 582.0, 1192.0, 2235.0, 4990.0, 12902.0, 39959.0, 177229.0, 657557.0, 106219.0, 27575.0, 9382.0, 3827.0, 1788.0, 896.0, 475.0, 317.0, 184.0, 116.0, 55.0, 51.0, 46.0, 27.0, 14.0, 15.0, 7.0, 6.0, 4.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11260986328125, -0.10942363739013672, -0.10623741149902344, -0.10305118560791016, -0.09986495971679688, -0.0966787338256836, -0.09349250793457031, -0.09030628204345703, -0.08712005615234375, -0.08393383026123047, -0.08074760437011719, -0.0775613784790039, -0.07437515258789062, -0.07118892669677734, -0.06800270080566406, -0.06481647491455078, -0.0616302490234375, -0.05844402313232422, -0.05525779724121094, -0.052071571350097656, -0.048885345458984375, -0.045699119567871094, -0.04251289367675781, -0.03932666778564453, -0.03614044189453125, -0.03295421600341797, -0.029767990112304688, -0.026581764221191406, -0.023395538330078125, -0.020209312438964844, -0.017023086547851562, -0.013836860656738281, -0.010650634765625, -0.007464408874511719, -0.0042781829833984375, -0.0010919570922851562, 0.002094268798828125, 0.005280494689941406, 0.008466720581054688, 0.011652946472167969, 0.01483917236328125, 0.01802539825439453, 0.021211624145507812, 0.024397850036621094, 0.027584075927734375, 0.030770301818847656, 0.03395652770996094, 0.03714275360107422, 0.0403289794921875, 0.04351520538330078, 0.04670143127441406, 0.049887657165527344, 0.053073883056640625, 0.056260108947753906, 0.05944633483886719, 0.06263256072998047, 0.06581878662109375, 0.06900501251220703, 0.07219123840332031, 0.0753774642944336, 0.07856369018554688, 0.08174991607666016, 0.08493614196777344, 0.08812236785888672, 0.09130859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 14.0, 19.0, 17.0, 24.0, 39.0, 50.0, 54.0, 76.0, 89.0, 101.0, 87.0, 86.0, 60.0, 73.0, 53.0, 24.0, 22.0, 22.0, 14.0, 11.0, 8.0, 7.0, 10.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.112060546875, -0.10832786560058594, -0.10459518432617188, -0.10086250305175781, -0.09712982177734375, -0.09339714050292969, -0.08966445922851562, -0.08593177795410156, -0.0821990966796875, -0.07846641540527344, -0.07473373413085938, -0.07100105285644531, -0.06726837158203125, -0.06353569030761719, -0.059803009033203125, -0.05607032775878906, -0.052337646484375, -0.04860496520996094, -0.044872283935546875, -0.04113960266113281, -0.03740692138671875, -0.03367424011230469, -0.029941558837890625, -0.026208877563476562, -0.0224761962890625, -0.018743515014648438, -0.015010833740234375, -0.011278152465820312, -0.00754547119140625, -0.0038127899169921875, -8.0108642578125e-05, 0.0036525726318359375, 0.00738525390625, 0.011117935180664062, 0.014850616455078125, 0.018583297729492188, 0.02231597900390625, 0.026048660278320312, 0.029781341552734375, 0.03351402282714844, 0.0372467041015625, 0.04097938537597656, 0.044712066650390625, 0.04844474792480469, 0.05217742919921875, 0.05591011047363281, 0.059642791748046875, 0.06337547302246094, 0.067108154296875, 0.07084083557128906, 0.07457351684570312, 0.07830619812011719, 0.08203887939453125, 0.08577156066894531, 0.08950424194335938, 0.09323692321777344, 0.0969696044921875, 0.10070228576660156, 0.10443496704101562, 0.10816764831542969, 0.11190032958984375, 0.11563301086425781, 0.11936569213867188, 0.12309837341308594, 0.1268310546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 10.0, 17.0, 69.0, 148.0, 346.0, 197.0, 100.0, 42.0, 29.0, 11.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.927361011505127, -3.8200178146362305, -3.712674617767334, -3.6053314208984375, -3.497988224029541, -3.3906450271606445, -3.283301830291748, -3.1759586334228516, -3.068615436553955, -2.9612722396850586, -2.853929042816162, -2.7465858459472656, -2.639242649078369, -2.5318994522094727, -2.424556255340576, -2.3172130584716797, -2.209869861602783, -2.1025266647338867, -1.9951834678649902, -1.8878402709960938, -1.7804970741271973, -1.6731538772583008, -1.5658106803894043, -1.4584674835205078, -1.3511242866516113, -1.2437810897827148, -1.1364378929138184, -1.0290946960449219, -0.9217514991760254, -0.8144083023071289, -0.7070651054382324, -0.5997219085693359, -0.49237847328186035, -0.38503527641296387, -0.2776920795440674, -0.1703488826751709, -0.06300568580627441, 0.04433751106262207, 0.15168070793151855, 0.25902390480041504, 0.3663671016693115, 0.473710298538208, 0.5810534954071045, 0.688396692276001, 0.7957398891448975, 0.903083086013794, 1.0104262828826904, 1.117769479751587, 1.2251126766204834, 1.3324558734893799, 1.4397990703582764, 1.5471422672271729, 1.6544854640960693, 1.7618286609649658, 1.8691718578338623, 1.9765150547027588, 2.0838582515716553, 2.1912014484405518, 2.2985446453094482, 2.4058878421783447, 2.513231039047241, 2.6205742359161377, 2.727917432785034, 2.8352606296539307, 2.942603826522827]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 5.0, 6.0, 5.0, 10.0, 13.0, 18.0, 8.0, 24.0, 12.0, 20.0, 26.0, 27.0, 32.0, 27.0, 41.0, 40.0, 88.0, 98.0, 86.0, 71.0, 51.0, 31.0, 36.0, 33.0, 30.0, 36.0, 18.0, 19.0, 17.0, 13.0, 8.0, 8.0, 12.0, 6.0, 3.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.4488959312438965, -2.380946159362793, -2.3129966259002686, -2.245047092437744, -2.1770973205566406, -2.109147548675537, -2.0411980152130127, -1.9732483625411987, -1.9052987098693848, -1.8373490571975708, -1.7693994045257568, -1.7014497518539429, -1.633500099182129, -1.565550446510315, -1.497600793838501, -1.429651141166687, -1.361701488494873, -1.293751835823059, -1.2258021831512451, -1.1578525304794312, -1.0899028778076172, -1.0219532251358032, -0.9540035724639893, -0.8860539197921753, -0.8181042671203613, -0.7501546144485474, -0.6822049617767334, -0.6142553091049194, -0.5463056564331055, -0.4783560037612915, -0.41040635108947754, -0.3424566984176636, -0.2745072841644287, -0.20655763149261475, -0.13860797882080078, -0.07065832614898682, -0.0027086734771728516, 0.06524097919464111, 0.13319063186645508, 0.20114028453826904, 0.269089937210083, 0.337039589881897, 0.40498924255371094, 0.4729388952255249, 0.5408885478973389, 0.6088382005691528, 0.6767878532409668, 0.7447375059127808, 0.8126871585845947, 0.8806368112564087, 0.9485864639282227, 1.0165361166000366, 1.0844857692718506, 1.1524354219436646, 1.2203850746154785, 1.2883347272872925, 1.3562843799591064, 1.4242340326309204, 1.4921836853027344, 1.5601333379745483, 1.6280829906463623, 1.6960326433181763, 1.7639822959899902, 1.8319319486618042, 1.8998816013336182]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 5.0, 16.0, 4.0, 12.0, 13.0, 27.0, 38.0, 47.0, 68.0, 116.0, 162.0, 260.0, 405.0, 569.0, 1023.0, 1918.0, 3807.0, 9282.0, 26173.0, 100880.0, 550573.0, 2311126.0, 965677.0, 163309.0, 36321.0, 11928.0, 5015.0, 2350.0, 1246.0, 679.0, 424.0, 247.0, 174.0, 114.0, 97.0, 59.0, 35.0, 23.0, 23.0, 11.0, 8.0, 9.0, 6.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.183349609375, -0.1782073974609375, -0.173065185546875, -0.1679229736328125, -0.16278076171875, -0.1576385498046875, -0.152496337890625, -0.1473541259765625, -0.1422119140625, -0.1370697021484375, -0.131927490234375, -0.1267852783203125, -0.12164306640625, -0.1165008544921875, -0.111358642578125, -0.1062164306640625, -0.10107421875, -0.0959320068359375, -0.090789794921875, -0.0856475830078125, -0.08050537109375, -0.0753631591796875, -0.070220947265625, -0.0650787353515625, -0.0599365234375, -0.0547943115234375, -0.049652099609375, -0.0445098876953125, -0.03936767578125, -0.0342254638671875, -0.029083251953125, -0.0239410400390625, -0.018798828125, -0.0136566162109375, -0.008514404296875, -0.0033721923828125, 0.00177001953125, 0.0069122314453125, 0.012054443359375, 0.0171966552734375, 0.0223388671875, 0.0274810791015625, 0.032623291015625, 0.0377655029296875, 0.04290771484375, 0.0480499267578125, 0.053192138671875, 0.0583343505859375, 0.0634765625, 0.0686187744140625, 0.073760986328125, 0.0789031982421875, 0.08404541015625, 0.0891876220703125, 0.094329833984375, 0.0994720458984375, 0.1046142578125, 0.1097564697265625, 0.114898681640625, 0.1200408935546875, 0.12518310546875, 0.1303253173828125, 0.135467529296875, 0.1406097412109375, 0.145751953125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 8.0, 13.0, 17.0, 16.0, 24.0, 31.0, 36.0, 40.0, 35.0, 47.0, 46.0, 49.0, 55.0, 60.0, 52.0, 50.0, 50.0, 50.0, 46.0, 41.0, 39.0, 34.0, 29.0, 19.0, 22.0, 29.0, 11.0, 14.0, 9.0, 10.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1396484375, -0.13487815856933594, -0.13010787963867188, -0.1253376007080078, -0.12056732177734375, -0.11579704284667969, -0.11102676391601562, -0.10625648498535156, -0.1014862060546875, -0.09671592712402344, -0.09194564819335938, -0.08717536926269531, -0.08240509033203125, -0.07763481140136719, -0.07286453247070312, -0.06809425354003906, -0.063323974609375, -0.05855369567871094, -0.053783416748046875, -0.04901313781738281, -0.04424285888671875, -0.03947257995605469, -0.034702301025390625, -0.029932022094726562, -0.0251617431640625, -0.020391464233398438, -0.015621185302734375, -0.010850906372070312, -0.00608062744140625, -0.0013103485107421875, 0.003459930419921875, 0.008230209350585938, 0.01300048828125, 0.017770767211914062, 0.022541046142578125, 0.027311325073242188, 0.03208160400390625, 0.03685188293457031, 0.041622161865234375, 0.04639244079589844, 0.0511627197265625, 0.05593299865722656, 0.060703277587890625, 0.06547355651855469, 0.07024383544921875, 0.07501411437988281, 0.07978439331054688, 0.08455467224121094, 0.089324951171875, 0.09409523010253906, 0.09886550903320312, 0.10363578796386719, 0.10840606689453125, 0.11317634582519531, 0.11794662475585938, 0.12271690368652344, 0.1274871826171875, 0.13225746154785156, 0.13702774047851562, 0.1417980194091797, 0.14656829833984375, 0.1513385772705078, 0.15610885620117188, 0.16087913513183594, 0.1656494140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 1.0, 3.0, 7.0, 4.0, 15.0, 7.0, 20.0, 30.0, 28.0, 62.0, 87.0, 159.0, 379.0, 927.0, 3276.0, 15552.0, 157508.0, 3681146.0, 307217.0, 21876.0, 4076.0, 1067.0, 364.0, 176.0, 95.0, 57.0, 34.0, 24.0, 20.0, 18.0, 8.0, 6.0, 9.0, 7.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.437744140625, -0.424713134765625, -0.41168212890625, -0.398651123046875, -0.3856201171875, -0.372589111328125, -0.35955810546875, -0.346527099609375, -0.33349609375, -0.320465087890625, -0.30743408203125, -0.294403076171875, -0.2813720703125, -0.268341064453125, -0.25531005859375, -0.242279052734375, -0.229248046875, -0.216217041015625, -0.20318603515625, -0.190155029296875, -0.1771240234375, -0.164093017578125, -0.15106201171875, -0.138031005859375, -0.125, -0.111968994140625, -0.09893798828125, -0.085906982421875, -0.0728759765625, -0.059844970703125, -0.04681396484375, -0.033782958984375, -0.020751953125, -0.007720947265625, 0.00531005859375, 0.018341064453125, 0.0313720703125, 0.044403076171875, 0.05743408203125, 0.070465087890625, 0.08349609375, 0.096527099609375, 0.10955810546875, 0.122589111328125, 0.1356201171875, 0.148651123046875, 0.16168212890625, 0.174713134765625, 0.187744140625, 0.200775146484375, 0.21380615234375, 0.226837158203125, 0.2398681640625, 0.252899169921875, 0.26593017578125, 0.278961181640625, 0.2919921875, 0.305023193359375, 0.31805419921875, 0.331085205078125, 0.3441162109375, 0.357147216796875, 0.37017822265625, 0.383209228515625, 0.396240234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 1.0, 6.0, 8.0, 14.0, 16.0, 21.0, 24.0, 33.0, 59.0, 86.0, 141.0, 222.0, 367.0, 613.0, 753.0, 627.0, 400.0, 252.0, 143.0, 89.0, 59.0, 33.0, 27.0, 11.0, 15.0, 7.0, 12.0, 8.0, 4.0, 5.0, 4.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2664604187011719, -0.25679779052734375, -0.24713516235351562, -0.2374725341796875, -0.22780990600585938, -0.21814727783203125, -0.20848464965820312, -0.198822021484375, -0.18915939331054688, -0.17949676513671875, -0.16983413696289062, -0.1601715087890625, -0.15050888061523438, -0.14084625244140625, -0.13118362426757812, -0.12152099609375, -0.11185836791992188, -0.10219573974609375, -0.09253311157226562, -0.0828704833984375, -0.07320785522460938, -0.06354522705078125, -0.053882598876953125, -0.044219970703125, -0.034557342529296875, -0.02489471435546875, -0.015232086181640625, -0.0055694580078125, 0.004093170166015625, 0.01375579833984375, 0.023418426513671875, 0.0330810546875, 0.042743682861328125, 0.05240631103515625, 0.062068939208984375, 0.0717315673828125, 0.08139419555664062, 0.09105682373046875, 0.10071945190429688, 0.110382080078125, 0.12004470825195312, 0.12970733642578125, 0.13936996459960938, 0.1490325927734375, 0.15869522094726562, 0.16835784912109375, 0.17802047729492188, 0.18768310546875, 0.19734573364257812, 0.20700836181640625, 0.21667098999023438, 0.2263336181640625, 0.23599624633789062, 0.24565887451171875, 0.2553215026855469, 0.264984130859375, 0.2746467590332031, 0.28430938720703125, 0.2939720153808594, 0.3036346435546875, 0.3132972717285156, 0.32295989990234375, 0.3326225280761719, 0.34228515625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 10.0, 17.0, 26.0, 35.0, 80.0, 148.0, 194.0, 168.0, 143.0, 79.0, 42.0, 17.0, 6.0, 7.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.446486234664917, -3.3627686500549316, -3.2790513038635254, -3.19533371925354, -3.1116161346435547, -3.0278987884521484, -2.944181203842163, -2.8604636192321777, -2.7767462730407715, -2.693028688430786, -2.60931134223938, -2.5255937576293945, -2.4418764114379883, -2.358158826828003, -2.2744412422180176, -2.1907238960266113, -2.107006311416626, -2.0232887268066406, -1.9395713806152344, -1.855853796005249, -1.7721363306045532, -1.6884188652038574, -1.604701280593872, -1.5209838151931763, -1.4372663497924805, -1.3535488843917847, -1.2698314189910889, -1.1861138343811035, -1.1023963689804077, -1.018678903579712, -0.9349613785743713, -0.8512438535690308, -0.7675262689590454, -0.6838088035583496, -0.600091278553009, -0.5163737535476685, -0.43265628814697266, -0.34893879294395447, -0.2652212977409363, -0.1815037727355957, -0.0977863073348999, -0.014068812131881714, 0.06964868307113647, 0.15336617827415466, 0.23708367347717285, 0.32080116868019104, 0.40451866388320923, 0.4882361888885498, 0.5719536542892456, 0.6556711196899414, 0.739388644695282, 0.8231061697006226, 0.9068236351013184, 0.9905411005020142, 1.07425856590271, 1.1579761505126953, 1.2416936159133911, 1.325411081314087, 1.4091286659240723, 1.492846131324768, 1.5765635967254639, 1.6602810621261597, 1.7439985275268555, 1.8277161121368408, 1.9114335775375366]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 6.0, 3.0, 6.0, 5.0, 6.0, 8.0, 6.0, 9.0, 15.0, 7.0, 13.0, 23.0, 23.0, 14.0, 21.0, 25.0, 35.0, 33.0, 30.0, 38.0, 49.0, 50.0, 43.0, 60.0, 45.0, 41.0, 43.0, 35.0, 28.0, 37.0, 34.0, 34.0, 18.0, 33.0, 20.0, 16.0, 14.0, 11.0, 11.0, 13.0, 7.0, 6.0, 10.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.135279655456543, -1.0982357263565063, -1.0611919164657593, -1.0241479873657227, -0.9871041774749756, -0.950060248374939, -0.9130163788795471, -0.8759725093841553, -0.8389286398887634, -0.8018847703933716, -0.7648409008979797, -0.7277970314025879, -0.6907531023025513, -0.6537092924118042, -0.6166653633117676, -0.5796214938163757, -0.5425776243209839, -0.505533754825592, -0.4684898853302002, -0.43144598603248596, -0.3944021165370941, -0.35735824704170227, -0.32031434774398804, -0.2832704782485962, -0.24622660875320435, -0.2091827392578125, -0.17213885486125946, -0.13509497046470642, -0.09805110096931458, -0.06100723147392273, -0.02396334707736969, 0.01308053731918335, 0.050124406814575195, 0.08716828376054764, 0.12421216070652008, 0.16125604510307312, 0.19829991459846497, 0.2353437840938568, 0.27238768339157104, 0.3094315528869629, 0.34647542238235474, 0.3835192918777466, 0.4205631613731384, 0.45760706067085266, 0.4946509301662445, 0.531694769859314, 0.5687386989593506, 0.6057825684547424, 0.6428264379501343, 0.6798703074455261, 0.716914176940918, 0.7539580464363098, 0.7910019159317017, 0.8280458450317383, 0.8650897145271301, 0.902133584022522, 0.9391774535179138, 0.9762213230133057, 1.0132652521133423, 1.0503090620040894, 1.087352991104126, 1.124396800994873, 1.1614407300949097, 1.1984846591949463, 1.2355284690856934]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 3.0, 5.0, 5.0, 11.0, 5.0, 17.0, 28.0, 29.0, 43.0, 43.0, 69.0, 105.0, 188.0, 250.0, 439.0, 774.0, 1364.0, 2631.0, 5794.0, 13820.0, 37773.0, 131265.0, 478820.0, 268692.0, 67010.0, 22275.0, 8767.0, 3848.0, 1929.0, 928.0, 561.0, 382.0, 203.0, 140.0, 91.0, 66.0, 51.0, 29.0, 34.0, 17.0, 14.0, 8.0, 10.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.2301025390625, -0.2232837677001953, -0.21646499633789062, -0.20964622497558594, -0.20282745361328125, -0.19600868225097656, -0.18918991088867188, -0.1823711395263672, -0.1755523681640625, -0.1687335968017578, -0.16191482543945312, -0.15509605407714844, -0.14827728271484375, -0.14145851135253906, -0.13463973999023438, -0.1278209686279297, -0.121002197265625, -0.11418342590332031, -0.10736465454101562, -0.10054588317871094, -0.09372711181640625, -0.08690834045410156, -0.08008956909179688, -0.07327079772949219, -0.0664520263671875, -0.05963325500488281, -0.052814483642578125, -0.04599571228027344, -0.03917694091796875, -0.03235816955566406, -0.025539398193359375, -0.018720626831054688, -0.01190185546875, -0.0050830841064453125, 0.001735687255859375, 0.008554458618164062, 0.01537322998046875, 0.022192001342773438, 0.029010772705078125, 0.03582954406738281, 0.0426483154296875, 0.04946708679199219, 0.056285858154296875, 0.06310462951660156, 0.06992340087890625, 0.07674217224121094, 0.08356094360351562, 0.09037971496582031, 0.097198486328125, 0.10401725769042969, 0.11083602905273438, 0.11765480041503906, 0.12447357177734375, 0.13129234313964844, 0.13811111450195312, 0.1449298858642578, 0.1517486572265625, 0.1585674285888672, 0.16538619995117188, 0.17220497131347656, 0.17902374267578125, 0.18584251403808594, 0.19266128540039062, 0.1994800567626953, 0.206298828125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 3.0, 10.0, 21.0, 18.0, 19.0, 27.0, 32.0, 49.0, 49.0, 51.0, 59.0, 57.0, 58.0, 56.0, 64.0, 58.0, 46.0, 52.0, 55.0, 44.0, 20.0, 26.0, 31.0, 24.0, 21.0, 16.0, 9.0, 7.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1602783203125, -0.1547107696533203, -0.14914321899414062, -0.14357566833496094, -0.13800811767578125, -0.13244056701660156, -0.12687301635742188, -0.12130546569824219, -0.1157379150390625, -0.11017036437988281, -0.10460281372070312, -0.09903526306152344, -0.09346771240234375, -0.08790016174316406, -0.08233261108398438, -0.07676506042480469, -0.071197509765625, -0.06562995910644531, -0.060062408447265625, -0.05449485778808594, -0.04892730712890625, -0.04335975646972656, -0.037792205810546875, -0.03222465515136719, -0.0266571044921875, -0.021089553833007812, -0.015522003173828125, -0.009954452514648438, -0.00438690185546875, 0.0011806488037109375, 0.006748199462890625, 0.012315750122070312, 0.01788330078125, 0.023450851440429688, 0.029018402099609375, 0.03458595275878906, 0.04015350341796875, 0.04572105407714844, 0.051288604736328125, 0.05685615539550781, 0.0624237060546875, 0.06799125671386719, 0.07355880737304688, 0.07912635803222656, 0.08469390869140625, 0.09026145935058594, 0.09582901000976562, 0.10139656066894531, 0.106964111328125, 0.11253166198730469, 0.11809921264648438, 0.12366676330566406, 0.12923431396484375, 0.13480186462402344, 0.14036941528320312, 0.1459369659423828, 0.1515045166015625, 0.1570720672607422, 0.16263961791992188, 0.16820716857910156, 0.17377471923828125, 0.17934226989746094, 0.18490982055664062, 0.1904773712158203, 0.196044921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 6.0, 3.0, 3.0, 7.0, 17.0, 27.0, 31.0, 40.0, 47.0, 92.0, 161.0, 276.0, 560.0, 1135.0, 2895.0, 10171.0, 66972.0, 845876.0, 101087.0, 13074.0, 3431.0, 1265.0, 583.0, 326.0, 167.0, 102.0, 68.0, 39.0, 39.0, 17.0, 18.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.46459197998046875, -0.4511566162109375, -0.43772125244140625, -0.424285888671875, -0.41085052490234375, -0.3974151611328125, -0.38397979736328125, -0.37054443359375, -0.35710906982421875, -0.3436737060546875, -0.33023834228515625, -0.316802978515625, -0.30336761474609375, -0.2899322509765625, -0.27649688720703125, -0.2630615234375, -0.24962615966796875, -0.2361907958984375, -0.22275543212890625, -0.209320068359375, -0.19588470458984375, -0.1824493408203125, -0.16901397705078125, -0.15557861328125, -0.14214324951171875, -0.1287078857421875, -0.11527252197265625, -0.101837158203125, -0.08840179443359375, -0.0749664306640625, -0.06153106689453125, -0.048095703125, -0.03466033935546875, -0.0212249755859375, -0.00778961181640625, 0.005645751953125, 0.01908111572265625, 0.0325164794921875, 0.04595184326171875, 0.05938720703125, 0.07282257080078125, 0.0862579345703125, 0.09969329833984375, 0.113128662109375, 0.12656402587890625, 0.1399993896484375, 0.15343475341796875, 0.1668701171875, 0.18030548095703125, 0.1937408447265625, 0.20717620849609375, 0.220611572265625, 0.23404693603515625, 0.2474822998046875, 0.26091766357421875, 0.27435302734375, 0.28778839111328125, 0.3012237548828125, 0.31465911865234375, 0.328094482421875, 0.34152984619140625, 0.3549652099609375, 0.36840057373046875, 0.3818359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 12.0, 14.0, 22.0, 14.0, 20.0, 26.0, 30.0, 43.0, 39.0, 40.0, 35.0, 51.0, 56.0, 61.0, 52.0, 54.0, 63.0, 47.0, 47.0, 50.0, 37.0, 30.0, 27.0, 19.0, 19.0, 17.0, 12.0, 13.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6171875, -0.5996780395507812, -0.5821685791015625, -0.5646591186523438, -0.547149658203125, -0.5296401977539062, -0.5121307373046875, -0.49462127685546875, -0.47711181640625, -0.45960235595703125, -0.4420928955078125, -0.42458343505859375, -0.407073974609375, -0.38956451416015625, -0.3720550537109375, -0.35454559326171875, -0.3370361328125, -0.31952667236328125, -0.3020172119140625, -0.28450775146484375, -0.266998291015625, -0.24948883056640625, -0.2319793701171875, -0.21446990966796875, -0.19696044921875, -0.17945098876953125, -0.1619415283203125, -0.14443206787109375, -0.126922607421875, -0.10941314697265625, -0.0919036865234375, -0.07439422607421875, -0.056884765625, -0.03937530517578125, -0.0218658447265625, -0.00435638427734375, 0.013153076171875, 0.03066253662109375, 0.0481719970703125, 0.06568145751953125, 0.08319091796875, 0.10070037841796875, 0.1182098388671875, 0.13571929931640625, 0.153228759765625, 0.17073822021484375, 0.1882476806640625, 0.20575714111328125, 0.2232666015625, 0.24077606201171875, 0.2582855224609375, 0.27579498291015625, 0.293304443359375, 0.31081390380859375, 0.3283233642578125, 0.34583282470703125, 0.36334228515625, 0.38085174560546875, 0.3983612060546875, 0.41587066650390625, 0.433380126953125, 0.45088958740234375, 0.4683990478515625, 0.48590850830078125, 0.50341796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 2.0, 15.0, 15.0, 19.0, 21.0, 31.0, 48.0, 61.0, 90.0, 126.0, 219.0, 361.0, 722.0, 1392.0, 2931.0, 7089.0, 19007.0, 65566.0, 578260.0, 286714.0, 56531.0, 17409.0, 6269.0, 2716.0, 1278.0, 622.0, 356.0, 250.0, 120.0, 92.0, 68.0, 44.0, 28.0, 16.0, 19.0, 15.0, 15.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07635498046875, -0.07396507263183594, -0.07157516479492188, -0.06918525695800781, -0.06679534912109375, -0.06440544128417969, -0.062015533447265625, -0.05962562561035156, -0.0572357177734375, -0.05484580993652344, -0.052455902099609375, -0.05006599426269531, -0.04767608642578125, -0.04528617858886719, -0.042896270751953125, -0.04050636291503906, -0.038116455078125, -0.03572654724121094, -0.033336639404296875, -0.030946731567382812, -0.02855682373046875, -0.026166915893554688, -0.023777008056640625, -0.021387100219726562, -0.0189971923828125, -0.016607284545898438, -0.014217376708984375, -0.011827468872070312, -0.00943756103515625, -0.0070476531982421875, -0.004657745361328125, -0.0022678375244140625, 0.0001220703125, 0.0025119781494140625, 0.004901885986328125, 0.0072917938232421875, 0.00968170166015625, 0.012071609497070312, 0.014461517333984375, 0.016851425170898438, 0.0192413330078125, 0.021631240844726562, 0.024021148681640625, 0.026411056518554688, 0.02880096435546875, 0.031190872192382812, 0.033580780029296875, 0.03597068786621094, 0.038360595703125, 0.04075050354003906, 0.043140411376953125, 0.04553031921386719, 0.04792022705078125, 0.05031013488769531, 0.052700042724609375, 0.05508995056152344, 0.0574798583984375, 0.05986976623535156, 0.062259674072265625, 0.06464958190917969, 0.06703948974609375, 0.06942939758300781, 0.07181930541992188, 0.07420921325683594, 0.07659912109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 12.0, 16.0, 19.0, 39.0, 50.0, 91.0, 132.0, 164.0, 161.0, 114.0, 80.0, 49.0, 31.0, 17.0, 8.0, 10.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7610530853271484e-05, -3.6094337701797485e-05, -3.4578144550323486e-05, -3.306195139884949e-05, -3.154575824737549e-05, -3.002956509590149e-05, -2.851337194442749e-05, -2.699717879295349e-05, -2.5480985641479492e-05, -2.3964792490005493e-05, -2.2448599338531494e-05, -2.0932406187057495e-05, -1.9416213035583496e-05, -1.7900019884109497e-05, -1.6383826732635498e-05, -1.4867633581161499e-05, -1.33514404296875e-05, -1.1835247278213501e-05, -1.0319054126739502e-05, -8.802860975265503e-06, -7.286667823791504e-06, -5.770474672317505e-06, -4.254281520843506e-06, -2.738088369369507e-06, -1.2218952178955078e-06, 2.942979335784912e-07, 1.8104910850524902e-06, 3.3266842365264893e-06, 4.842877388000488e-06, 6.359070539474487e-06, 7.875263690948486e-06, 9.391456842422485e-06, 1.0907649993896484e-05, 1.2423843145370483e-05, 1.3940036296844482e-05, 1.545622944831848e-05, 1.697242259979248e-05, 1.848861575126648e-05, 2.000480890274048e-05, 2.1521002054214478e-05, 2.3037195205688477e-05, 2.4553388357162476e-05, 2.6069581508636475e-05, 2.7585774660110474e-05, 2.9101967811584473e-05, 3.061816096305847e-05, 3.213435411453247e-05, 3.365054726600647e-05, 3.516674041748047e-05, 3.668293356895447e-05, 3.819912672042847e-05, 3.9715319871902466e-05, 4.1231513023376465e-05, 4.2747706174850464e-05, 4.426389932632446e-05, 4.578009247779846e-05, 4.729628562927246e-05, 4.881247878074646e-05, 5.032867193222046e-05, 5.184486508369446e-05, 5.336105823516846e-05, 5.4877251386642456e-05, 5.6393444538116455e-05, 5.7909637689590454e-05, 5.942583084106445e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 10.0, 7.0, 5.0, 22.0, 13.0, 37.0, 46.0, 63.0, 101.0, 136.0, 216.0, 322.0, 567.0, 914.0, 1822.0, 3689.0, 8857.0, 24360.0, 77773.0, 555502.0, 270513.0, 66546.0, 21721.0, 7971.0, 3484.0, 1611.0, 865.0, 474.0, 299.0, 192.0, 140.0, 75.0, 69.0, 33.0, 24.0, 18.0, 12.0, 14.0, 12.0, 5.0, 5.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06024169921875, -0.058005332946777344, -0.05576896667480469, -0.05353260040283203, -0.051296234130859375, -0.04905986785888672, -0.04682350158691406, -0.044587135314941406, -0.04235076904296875, -0.040114402770996094, -0.03787803649902344, -0.03564167022705078, -0.033405303955078125, -0.03116893768310547, -0.028932571411132812, -0.026696205139160156, -0.0244598388671875, -0.022223472595214844, -0.019987106323242188, -0.01775074005126953, -0.015514373779296875, -0.013278007507324219, -0.011041641235351562, -0.008805274963378906, -0.00656890869140625, -0.004332542419433594, -0.0020961761474609375, 0.00014019012451171875, 0.002376556396484375, 0.004612922668457031, 0.0068492889404296875, 0.009085655212402344, 0.011322021484375, 0.013558387756347656, 0.015794754028320312, 0.01803112030029297, 0.020267486572265625, 0.02250385284423828, 0.024740219116210938, 0.026976585388183594, 0.02921295166015625, 0.031449317932128906, 0.03368568420410156, 0.03592205047607422, 0.038158416748046875, 0.04039478302001953, 0.04263114929199219, 0.044867515563964844, 0.0471038818359375, 0.049340248107910156, 0.05157661437988281, 0.05381298065185547, 0.056049346923828125, 0.05828571319580078, 0.06052207946777344, 0.0627584457397461, 0.06499481201171875, 0.0672311782836914, 0.06946754455566406, 0.07170391082763672, 0.07394027709960938, 0.07617664337158203, 0.07841300964355469, 0.08064937591552734, 0.0828857421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 9.0, 2.0, 6.0, 5.0, 12.0, 27.0, 24.0, 29.0, 37.0, 58.0, 49.0, 71.0, 99.0, 96.0, 90.0, 85.0, 76.0, 55.0, 44.0, 28.0, 23.0, 20.0, 12.0, 10.0, 14.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1109619140625, -0.10774707794189453, -0.10453224182128906, -0.1013174057006836, -0.09810256958007812, -0.09488773345947266, -0.09167289733886719, -0.08845806121826172, -0.08524322509765625, -0.08202838897705078, -0.07881355285644531, -0.07559871673583984, -0.07238388061523438, -0.0691690444946289, -0.06595420837402344, -0.06273937225341797, -0.0595245361328125, -0.05630970001220703, -0.05309486389160156, -0.049880027770996094, -0.046665191650390625, -0.043450355529785156, -0.04023551940917969, -0.03702068328857422, -0.03380584716796875, -0.03059101104736328, -0.027376174926757812, -0.024161338806152344, -0.020946502685546875, -0.017731666564941406, -0.014516830444335938, -0.011301994323730469, -0.008087158203125, -0.004872322082519531, -0.0016574859619140625, 0.0015573501586914062, 0.004772186279296875, 0.007987022399902344, 0.011201858520507812, 0.014416694641113281, 0.01763153076171875, 0.02084636688232422, 0.024061203002929688, 0.027276039123535156, 0.030490875244140625, 0.033705711364746094, 0.03692054748535156, 0.04013538360595703, 0.0433502197265625, 0.04656505584716797, 0.04977989196777344, 0.052994728088378906, 0.056209564208984375, 0.059424400329589844, 0.06263923645019531, 0.06585407257080078, 0.06906890869140625, 0.07228374481201172, 0.07549858093261719, 0.07871341705322266, 0.08192825317382812, 0.0851430892944336, 0.08835792541503906, 0.09157276153564453, 0.09478759765625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 13.0, 30.0, 52.0, 145.0, 395.0, 190.0, 94.0, 38.0, 18.0, 8.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1198501586914062, -3.0021679401397705, -2.8844857215881348, -2.76680326461792, -2.649121046066284, -2.5314388275146484, -2.4137563705444336, -2.296074151992798, -2.178391933441162, -2.0607097148895264, -1.943027377128601, -1.8253450393676758, -1.70766282081604, -1.5899806022644043, -1.472298264503479, -1.3546159267425537, -1.236933708190918, -1.1192514896392822, -1.001569151878357, -0.8838868737220764, -0.7662045955657959, -0.6485223174095154, -0.5308400392532349, -0.41315776109695435, -0.29547548294067383, -0.1777932047843933, -0.06011092662811279, 0.057571351528167725, 0.17525362968444824, 0.29293590784072876, 0.4106181859970093, 0.5283004641532898, 0.6459827423095703, 0.7636650204658508, 0.8813472986221313, 0.9990295767784119, 1.1167118549346924, 1.2343940734863281, 1.3520764112472534, 1.4697587490081787, 1.5874409675598145, 1.7051231861114502, 1.8228055238723755, 1.9404878616333008, 2.0581700801849365, 2.1758522987365723, 2.293534755706787, 2.411216974258423, 2.5288991928100586, 2.6465814113616943, 2.76426362991333, 2.881946086883545, 2.9996283054351807, 3.1173105239868164, 3.2349929809570312, 3.352675199508667, 3.4703574180603027, 3.5880396366119385, 3.705721855163574, 3.823404312133789, 3.941086530685425, 4.0587687492370605, 4.176451206207275, 4.294133186340332, 4.411815643310547]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 1.0, 8.0, 9.0, 8.0, 7.0, 9.0, 13.0, 20.0, 24.0, 21.0, 24.0, 30.0, 33.0, 53.0, 41.0, 95.0, 111.0, 123.0, 78.0, 45.0, 36.0, 23.0, 26.0, 40.0, 24.0, 17.0, 16.0, 16.0, 7.0, 6.0, 9.0, 4.0, 6.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9430243968963623, -1.8712377548217773, -1.7994511127471924, -1.7276644706726074, -1.6558778285980225, -1.5840911865234375, -1.512304425239563, -1.440517783164978, -1.368731141090393, -1.296944499015808, -1.2251578569412231, -1.1533712148666382, -1.0815844535827637, -1.0097978115081787, -0.9380111694335938, -0.8662245273590088, -0.7944378852844238, -0.7226512432098389, -0.6508646011352539, -0.5790778994560242, -0.5072912573814392, -0.43550461530685425, -0.3637179434299469, -0.29193127155303955, -0.2201446294784546, -0.14835797250270844, -0.07657131552696228, -0.0047846585512161255, 0.06700199842453003, 0.138788640499115, 0.21057531237602234, 0.2823619842529297, 0.35414886474609375, 0.4259355068206787, 0.49772217869758606, 0.5695088505744934, 0.6412954926490784, 0.7130821347236633, 0.7848688364028931, 0.856655478477478, 0.928442120552063, 1.000228762626648, 1.072015404701233, 1.1438020467758179, 1.2155888080596924, 1.2873754501342773, 1.3591620922088623, 1.4309487342834473, 1.5027353763580322, 1.5745220184326172, 1.6463086605072021, 1.718095302581787, 1.789881944656372, 1.861668586730957, 1.9334553480148315, 2.005241870880127, 2.077028751373291, 2.148815393447876, 2.220602035522461, 2.292388677597046, 2.364175319671631, 2.435961961746216, 2.507748603820801, 2.579535484313965, 2.6513218879699707]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 7.0, 9.0, 12.0, 18.0, 29.0, 44.0, 69.0, 109.0, 219.0, 326.0, 577.0, 931.0, 1560.0, 2929.0, 5842.0, 11608.0, 25967.0, 67381.0, 209872.0, 718566.0, 1725985.0, 977459.0, 292639.0, 88269.0, 33125.0, 14784.0, 7118.0, 3802.0, 2064.0, 1191.0, 665.0, 391.0, 267.0, 176.0, 103.0, 68.0, 47.0, 19.0, 14.0, 10.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15789222717285156, -0.15196609497070312, -0.1460399627685547, -0.14011383056640625, -0.1341876983642578, -0.12826156616210938, -0.12233543395996094, -0.1164093017578125, -0.11048316955566406, -0.10455703735351562, -0.09863090515136719, -0.09270477294921875, -0.08677864074707031, -0.08085250854492188, -0.07492637634277344, -0.069000244140625, -0.06307411193847656, -0.057147979736328125, -0.05122184753417969, -0.04529571533203125, -0.03936958312988281, -0.033443450927734375, -0.027517318725585938, -0.0215911865234375, -0.015665054321289062, -0.009738922119140625, -0.0038127899169921875, 0.00211334228515625, 0.008039474487304688, 0.013965606689453125, 0.019891738891601562, 0.02581787109375, 0.03174400329589844, 0.037670135498046875, 0.04359626770019531, 0.04952239990234375, 0.05544853210449219, 0.061374664306640625, 0.06730079650878906, 0.0732269287109375, 0.07915306091308594, 0.08507919311523438, 0.09100532531738281, 0.09693145751953125, 0.10285758972167969, 0.10878372192382812, 0.11470985412597656, 0.120635986328125, 0.12656211853027344, 0.13248825073242188, 0.1384143829345703, 0.14434051513671875, 0.1502666473388672, 0.15619277954101562, 0.16211891174316406, 0.1680450439453125, 0.17397117614746094, 0.17989730834960938, 0.1858234405517578, 0.19174957275390625, 0.1976757049560547, 0.20360183715820312, 0.20952796936035156, 0.2154541015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 3.0, 4.0, 7.0, 7.0, 8.0, 15.0, 15.0, 27.0, 22.0, 28.0, 37.0, 45.0, 48.0, 51.0, 43.0, 64.0, 49.0, 46.0, 48.0, 54.0, 43.0, 46.0, 43.0, 32.0, 44.0, 30.0, 33.0, 27.0, 13.0, 18.0, 11.0, 16.0, 9.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1119384765625, -0.10716056823730469, -0.10238265991210938, -0.09760475158691406, -0.09282684326171875, -0.08804893493652344, -0.08327102661132812, -0.07849311828613281, -0.0737152099609375, -0.06893730163574219, -0.06415939331054688, -0.05938148498535156, -0.05460357666015625, -0.04982566833496094, -0.045047760009765625, -0.04026985168457031, -0.035491943359375, -0.030714035034179688, -0.025936126708984375, -0.021158218383789062, -0.01638031005859375, -0.011602401733398438, -0.006824493408203125, -0.0020465850830078125, 0.0027313232421875, 0.0075092315673828125, 0.012287139892578125, 0.017065048217773438, 0.02184295654296875, 0.026620864868164062, 0.031398773193359375, 0.03617668151855469, 0.04095458984375, 0.04573249816894531, 0.050510406494140625, 0.05528831481933594, 0.06006622314453125, 0.06484413146972656, 0.06962203979492188, 0.07439994812011719, 0.0791778564453125, 0.08395576477050781, 0.08873367309570312, 0.09351158142089844, 0.09828948974609375, 0.10306739807128906, 0.10784530639648438, 0.11262321472167969, 0.117401123046875, 0.12217903137207031, 0.12695693969726562, 0.13173484802246094, 0.13651275634765625, 0.14129066467285156, 0.14606857299804688, 0.1508464813232422, 0.1556243896484375, 0.1604022979736328, 0.16518020629882812, 0.16995811462402344, 0.17473602294921875, 0.17951393127441406, 0.18429183959960938, 0.1890697479248047, 0.19384765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 11.0, 18.0, 22.0, 37.0, 63.0, 104.0, 241.0, 506.0, 1368.0, 8017.0, 2181553.0, 1992035.0, 8033.0, 1276.0, 484.0, 221.0, 131.0, 69.0, 37.0, 19.0, 15.0, 1.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.8212890625, -1.7789306640625, -1.736572265625, -1.6942138671875, -1.65185546875, -1.6094970703125, -1.567138671875, -1.5247802734375, -1.482421875, -1.4400634765625, -1.397705078125, -1.3553466796875, -1.31298828125, -1.2706298828125, -1.228271484375, -1.1859130859375, -1.1435546875, -1.1011962890625, -1.058837890625, -1.0164794921875, -0.97412109375, -0.9317626953125, -0.889404296875, -0.8470458984375, -0.8046875, -0.7623291015625, -0.719970703125, -0.6776123046875, -0.63525390625, -0.5928955078125, -0.550537109375, -0.5081787109375, -0.4658203125, -0.4234619140625, -0.381103515625, -0.3387451171875, -0.29638671875, -0.2540283203125, -0.211669921875, -0.1693115234375, -0.126953125, -0.0845947265625, -0.042236328125, 0.0001220703125, 0.04248046875, 0.0848388671875, 0.127197265625, 0.1695556640625, 0.2119140625, 0.2542724609375, 0.296630859375, 0.3389892578125, 0.38134765625, 0.4237060546875, 0.466064453125, 0.5084228515625, 0.55078125, 0.5931396484375, 0.635498046875, 0.6778564453125, 0.72021484375, 0.7625732421875, 0.804931640625, 0.8472900390625, 0.8896484375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 13.0, 9.0, 26.0, 18.0, 33.0, 49.0, 69.0, 94.0, 131.0, 209.0, 313.0, 476.0, 700.0, 601.0, 405.0, 251.0, 200.0, 135.0, 104.0, 74.0, 47.0, 33.0, 26.0, 20.0, 15.0, 10.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5709953308105469, -0.5550765991210938, -0.5391578674316406, -0.5232391357421875, -0.5073204040527344, -0.49140167236328125, -0.4754829406738281, -0.459564208984375, -0.4436454772949219, -0.42772674560546875, -0.4118080139160156, -0.3958892822265625, -0.3799705505371094, -0.36405181884765625, -0.3481330871582031, -0.33221435546875, -0.3162956237792969, -0.30037689208984375, -0.2844581604003906, -0.2685394287109375, -0.2526206970214844, -0.23670196533203125, -0.22078323364257812, -0.204864501953125, -0.18894577026367188, -0.17302703857421875, -0.15710830688476562, -0.1411895751953125, -0.12527084350585938, -0.10935211181640625, -0.09343338012695312, -0.0775146484375, -0.061595916748046875, -0.04567718505859375, -0.029758453369140625, -0.0138397216796875, 0.002079010009765625, 0.01799774169921875, 0.033916473388671875, 0.049835205078125, 0.06575393676757812, 0.08167266845703125, 0.09759140014648438, 0.1135101318359375, 0.12942886352539062, 0.14534759521484375, 0.16126632690429688, 0.17718505859375, 0.19310379028320312, 0.20902252197265625, 0.22494125366210938, 0.2408599853515625, 0.2567787170410156, 0.27269744873046875, 0.2886161804199219, 0.304534912109375, 0.3204536437988281, 0.33637237548828125, 0.3522911071777344, 0.3682098388671875, 0.3841285705566406, 0.40004730224609375, 0.4159660339355469, 0.431884765625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 6.0, 6.0, 6.0, 19.0, 37.0, 70.0, 166.0, 283.0, 213.0, 99.0, 51.0, 19.0, 14.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.26026725769043, -11.991594314575195, -11.722922325134277, -11.454249382019043, -11.185577392578125, -10.91690444946289, -10.648231506347656, -10.379559516906738, -10.110886573791504, -9.84221363067627, -9.573541641235352, -9.304868698120117, -9.036195755004883, -8.767523765563965, -8.49885082244873, -8.230178833007812, -7.961505889892578, -7.692833423614502, -7.424160957336426, -7.155488014221191, -6.886815547943115, -6.618143081665039, -6.349470138549805, -6.0807976722717285, -5.812125205993652, -5.543452739715576, -5.2747802734375, -5.006107330322266, -4.7374348640441895, -4.468762397766113, -4.200089454650879, -3.9314169883728027, -3.6627445220947266, -3.3940720558166504, -3.125399351119995, -2.85672664642334, -2.5880541801452637, -2.3193817138671875, -2.0507090091705322, -1.7820364236831665, -1.5133638381958008, -1.244691252708435, -0.9760186672210693, -0.7073460817337036, -0.4386734962463379, -0.17000091075897217, 0.09867167472839355, 0.3673442602157593, 0.636016845703125, 0.9046894311904907, 1.1733620166778564, 1.4420346021652222, 1.710707187652588, 1.9793797731399536, 2.2480523586273193, 2.5167250633239746, 2.785397529602051, 3.054069995880127, 3.3227427005767822, 3.5914154052734375, 3.8600878715515137, 4.12876033782959, 4.397433280944824, 4.6661057472229, 4.934778213500977]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 1.0, 4.0, 8.0, 9.0, 14.0, 16.0, 24.0, 17.0, 23.0, 27.0, 31.0, 38.0, 33.0, 37.0, 62.0, 61.0, 76.0, 70.0, 66.0, 55.0, 45.0, 38.0, 46.0, 32.0, 21.0, 16.0, 19.0, 15.0, 26.0, 17.0, 12.0, 10.0, 11.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.313432455062866, -2.2276346683502197, -2.1418368816375732, -2.0560390949249268, -1.9702411890029907, -1.8844434022903442, -1.7986454963684082, -1.7128477096557617, -1.6270499229431152, -1.5412521362304688, -1.4554543495178223, -1.3696564435958862, -1.2838586568832397, -1.1980608701705933, -1.1122629642486572, -1.0264651775360107, -0.9406673908233643, -0.8548696041107178, -0.7690717577934265, -0.6832739114761353, -0.5974761247634888, -0.5116783380508423, -0.425880491733551, -0.34008264541625977, -0.2542848587036133, -0.1684870421886444, -0.08268922567367554, 0.003108590841293335, 0.08890640735626221, 0.17470422387123108, 0.26050204038619995, 0.3462998867034912, 0.4320974349975586, 0.5178952217102051, 0.6036930680274963, 0.6894909143447876, 0.7752887010574341, 0.8610864877700806, 0.9468843340873718, 1.032682180404663, 1.1184799671173096, 1.204277753829956, 1.2900755405426025, 1.3758734464645386, 1.461671233177185, 1.5474690198898315, 1.6332669258117676, 1.719064712524414, 1.8048624992370605, 1.890660285949707, 1.9764580726623535, 2.062255859375, 2.1480536460876465, 2.233851671218872, 2.3196494579315186, 2.405447244644165, 2.4912450313568115, 2.577042818069458, 2.6628406047821045, 2.748638391494751, 2.8344364166259766, 2.920234203338623, 3.0060319900512695, 3.091829776763916, 3.1776275634765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 5.0, 7.0, 11.0, 15.0, 18.0, 18.0, 47.0, 64.0, 105.0, 118.0, 228.0, 433.0, 857.0, 2091.0, 5885.0, 18699.0, 84983.0, 676636.0, 208585.0, 34354.0, 9437.0, 3298.0, 1316.0, 538.0, 326.0, 155.0, 98.0, 60.0, 34.0, 36.0, 28.0, 18.0, 12.0, 11.0, 9.0, 10.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348876953125, -0.33882904052734375, -0.3287811279296875, -0.31873321533203125, -0.308685302734375, -0.29863739013671875, -0.2885894775390625, -0.27854156494140625, -0.26849365234375, -0.25844573974609375, -0.2483978271484375, -0.23834991455078125, -0.228302001953125, -0.21825408935546875, -0.2082061767578125, -0.19815826416015625, -0.1881103515625, -0.17806243896484375, -0.1680145263671875, -0.15796661376953125, -0.147918701171875, -0.13787078857421875, -0.1278228759765625, -0.11777496337890625, -0.10772705078125, -0.09767913818359375, -0.0876312255859375, -0.07758331298828125, -0.067535400390625, -0.05748748779296875, -0.0474395751953125, -0.03739166259765625, -0.02734375, -0.01729583740234375, -0.0072479248046875, 0.00279998779296875, 0.012847900390625, 0.02289581298828125, 0.0329437255859375, 0.04299163818359375, 0.05303955078125, 0.06308746337890625, 0.0731353759765625, 0.08318328857421875, 0.093231201171875, 0.10327911376953125, 0.1133270263671875, 0.12337493896484375, 0.1334228515625, 0.14347076416015625, 0.1535186767578125, 0.16356658935546875, 0.173614501953125, 0.18366241455078125, 0.1937103271484375, 0.20375823974609375, 0.21380615234375, 0.22385406494140625, 0.2339019775390625, 0.24394989013671875, 0.253997802734375, 0.26404571533203125, 0.2740936279296875, 0.28414154052734375, 0.294189453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 6.0, 10.0, 10.0, 11.0, 15.0, 20.0, 18.0, 22.0, 38.0, 24.0, 28.0, 44.0, 49.0, 58.0, 67.0, 45.0, 49.0, 44.0, 49.0, 53.0, 47.0, 41.0, 35.0, 39.0, 30.0, 29.0, 25.0, 15.0, 14.0, 7.0, 11.0, 7.0, 12.0, 2.0, 7.0, 1.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19921875, -0.19310760498046875, -0.1869964599609375, -0.18088531494140625, -0.174774169921875, -0.16866302490234375, -0.1625518798828125, -0.15644073486328125, -0.15032958984375, -0.14421844482421875, -0.1381072998046875, -0.13199615478515625, -0.125885009765625, -0.11977386474609375, -0.1136627197265625, -0.10755157470703125, -0.1014404296875, -0.09532928466796875, -0.0892181396484375, -0.08310699462890625, -0.076995849609375, -0.07088470458984375, -0.0647735595703125, -0.05866241455078125, -0.05255126953125, -0.04644012451171875, -0.0403289794921875, -0.03421783447265625, -0.028106689453125, -0.02199554443359375, -0.0158843994140625, -0.00977325439453125, -0.003662109375, 0.00244903564453125, 0.0085601806640625, 0.01467132568359375, 0.020782470703125, 0.02689361572265625, 0.0330047607421875, 0.03911590576171875, 0.04522705078125, 0.05133819580078125, 0.0574493408203125, 0.06356048583984375, 0.069671630859375, 0.07578277587890625, 0.0818939208984375, 0.08800506591796875, 0.0941162109375, 0.10022735595703125, 0.1063385009765625, 0.11244964599609375, 0.118560791015625, 0.12467193603515625, 0.1307830810546875, 0.13689422607421875, 0.14300537109375, 0.14911651611328125, 0.1552276611328125, 0.16133880615234375, 0.167449951171875, 0.17356109619140625, 0.1796722412109375, 0.18578338623046875, 0.19189453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 15.0, 7.0, 12.0, 22.0, 32.0, 57.0, 72.0, 126.0, 225.0, 483.0, 1171.0, 3884.0, 25038.0, 883539.0, 118919.0, 10877.0, 2361.0, 815.0, 382.0, 203.0, 117.0, 60.0, 37.0, 25.0, 16.0, 18.0, 8.0, 7.0, 9.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.433837890625, -0.41927337646484375, -0.4047088623046875, -0.39014434814453125, -0.375579833984375, -0.36101531982421875, -0.3464508056640625, -0.33188629150390625, -0.31732177734375, -0.30275726318359375, -0.2881927490234375, -0.27362823486328125, -0.259063720703125, -0.24449920654296875, -0.2299346923828125, -0.21537017822265625, -0.2008056640625, -0.18624114990234375, -0.1716766357421875, -0.15711212158203125, -0.142547607421875, -0.12798309326171875, -0.1134185791015625, -0.09885406494140625, -0.08428955078125, -0.06972503662109375, -0.0551605224609375, -0.04059600830078125, -0.026031494140625, -0.01146697998046875, 0.0030975341796875, 0.01766204833984375, 0.0322265625, 0.04679107666015625, 0.0613555908203125, 0.07592010498046875, 0.090484619140625, 0.10504913330078125, 0.1196136474609375, 0.13417816162109375, 0.14874267578125, 0.16330718994140625, 0.1778717041015625, 0.19243621826171875, 0.207000732421875, 0.22156524658203125, 0.2361297607421875, 0.25069427490234375, 0.2652587890625, 0.27982330322265625, 0.2943878173828125, 0.30895233154296875, 0.323516845703125, 0.33808135986328125, 0.3526458740234375, 0.36721038818359375, 0.38177490234375, 0.39633941650390625, 0.4109039306640625, 0.42546844482421875, 0.440032958984375, 0.45459747314453125, 0.4691619873046875, 0.48372650146484375, 0.498291015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 6.0, 8.0, 7.0, 6.0, 7.0, 10.0, 11.0, 18.0, 12.0, 12.0, 30.0, 25.0, 36.0, 41.0, 58.0, 73.0, 78.0, 97.0, 72.0, 56.0, 50.0, 40.0, 37.0, 35.0, 31.0, 25.0, 23.0, 14.0, 16.0, 18.0, 8.0, 5.0, 13.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.748046875, -0.7234573364257812, -0.6988677978515625, -0.6742782592773438, -0.649688720703125, -0.6250991821289062, -0.6005096435546875, -0.5759201049804688, -0.55133056640625, -0.5267410278320312, -0.5021514892578125, -0.47756195068359375, -0.452972412109375, -0.42838287353515625, -0.4037933349609375, -0.37920379638671875, -0.3546142578125, -0.33002471923828125, -0.3054351806640625, -0.28084564208984375, -0.256256103515625, -0.23166656494140625, -0.2070770263671875, -0.18248748779296875, -0.15789794921875, -0.13330841064453125, -0.1087188720703125, -0.08412933349609375, -0.059539794921875, -0.03495025634765625, -0.0103607177734375, 0.01422882080078125, 0.038818359375, 0.06340789794921875, 0.0879974365234375, 0.11258697509765625, 0.137176513671875, 0.16176605224609375, 0.1863555908203125, 0.21094512939453125, 0.23553466796875, 0.26012420654296875, 0.2847137451171875, 0.30930328369140625, 0.333892822265625, 0.35848236083984375, 0.3830718994140625, 0.40766143798828125, 0.4322509765625, 0.45684051513671875, 0.4814300537109375, 0.5060195922851562, 0.530609130859375, 0.5551986694335938, 0.5797882080078125, 0.6043777465820312, 0.62896728515625, 0.6535568237304688, 0.6781463623046875, 0.7027359008789062, 0.727325439453125, 0.7519149780273438, 0.7765045166015625, 0.8010940551757812, 0.82568359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 9.0, 6.0, 3.0, 7.0, 4.0, 11.0, 13.0, 9.0, 15.0, 20.0, 28.0, 39.0, 45.0, 64.0, 83.0, 127.0, 167.0, 316.0, 487.0, 787.0, 1327.0, 2666.0, 5718.0, 13841.0, 42385.0, 233341.0, 673081.0, 46450.0, 14892.0, 6161.0, 2779.0, 1397.0, 832.0, 469.0, 331.0, 187.0, 118.0, 92.0, 62.0, 44.0, 22.0, 22.0, 21.0, 10.0, 12.0, 10.0, 12.0, 13.0, 7.0, 7.0, 4.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.047393798828125, -0.045866966247558594, -0.04434013366699219, -0.04281330108642578, -0.041286468505859375, -0.03975963592529297, -0.03823280334472656, -0.036705970764160156, -0.03517913818359375, -0.033652305603027344, -0.03212547302246094, -0.03059864044189453, -0.029071807861328125, -0.02754497528076172, -0.026018142700195312, -0.024491310119628906, -0.0229644775390625, -0.021437644958496094, -0.019910812377929688, -0.01838397979736328, -0.016857147216796875, -0.015330314636230469, -0.013803482055664062, -0.012276649475097656, -0.01074981689453125, -0.009222984313964844, -0.0076961517333984375, -0.006169319152832031, -0.004642486572265625, -0.0031156539916992188, -0.0015888214111328125, -6.198883056640625e-05, 0.00146484375, 0.0029916763305664062, 0.0045185089111328125, 0.006045341491699219, 0.007572174072265625, 0.009099006652832031, 0.010625839233398438, 0.012152671813964844, 0.01367950439453125, 0.015206336975097656, 0.016733169555664062, 0.01826000213623047, 0.019786834716796875, 0.02131366729736328, 0.022840499877929688, 0.024367332458496094, 0.0258941650390625, 0.027420997619628906, 0.028947830200195312, 0.03047466278076172, 0.032001495361328125, 0.03352832794189453, 0.03505516052246094, 0.036581993103027344, 0.03810882568359375, 0.039635658264160156, 0.04116249084472656, 0.04268932342529297, 0.044216156005859375, 0.04574298858642578, 0.04726982116699219, 0.048796653747558594, 0.050323486328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 12.0, 14.0, 12.0, 17.0, 19.0, 38.0, 44.0, 96.0, 108.0, 115.0, 117.0, 114.0, 71.0, 55.0, 37.0, 25.0, 24.0, 18.0, 12.0, 17.0, 9.0, 5.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.24249267578125e-05, -3.141164779663086e-05, -3.039836883544922e-05, -2.9385089874267578e-05, -2.8371810913085938e-05, -2.7358531951904297e-05, -2.6345252990722656e-05, -2.5331974029541016e-05, -2.4318695068359375e-05, -2.3305416107177734e-05, -2.2292137145996094e-05, -2.1278858184814453e-05, -2.0265579223632812e-05, -1.9252300262451172e-05, -1.823902130126953e-05, -1.722574234008789e-05, -1.621246337890625e-05, -1.519918441772461e-05, -1.4185905456542969e-05, -1.3172626495361328e-05, -1.2159347534179688e-05, -1.1146068572998047e-05, -1.0132789611816406e-05, -9.119510650634766e-06, -8.106231689453125e-06, -7.092952728271484e-06, -6.079673767089844e-06, -5.066394805908203e-06, -4.0531158447265625e-06, -3.039836883544922e-06, -2.0265579223632812e-06, -1.0132789611816406e-06, 0.0, 1.0132789611816406e-06, 2.0265579223632812e-06, 3.039836883544922e-06, 4.0531158447265625e-06, 5.066394805908203e-06, 6.079673767089844e-06, 7.092952728271484e-06, 8.106231689453125e-06, 9.119510650634766e-06, 1.0132789611816406e-05, 1.1146068572998047e-05, 1.2159347534179688e-05, 1.3172626495361328e-05, 1.4185905456542969e-05, 1.519918441772461e-05, 1.621246337890625e-05, 1.722574234008789e-05, 1.823902130126953e-05, 1.9252300262451172e-05, 2.0265579223632812e-05, 2.1278858184814453e-05, 2.2292137145996094e-05, 2.3305416107177734e-05, 2.4318695068359375e-05, 2.5331974029541016e-05, 2.6345252990722656e-05, 2.7358531951904297e-05, 2.8371810913085938e-05, 2.9385089874267578e-05, 3.039836883544922e-05, 3.141164779663086e-05, 3.24249267578125e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 7.0, 2.0, 1.0, 3.0, 4.0, 7.0, 8.0, 13.0, 16.0, 23.0, 61.0, 75.0, 99.0, 173.0, 277.0, 459.0, 890.0, 1632.0, 3374.0, 7893.0, 21603.0, 80445.0, 781310.0, 107366.0, 25591.0, 9090.0, 3901.0, 1879.0, 963.0, 517.0, 339.0, 177.0, 109.0, 86.0, 57.0, 35.0, 15.0, 13.0, 12.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05322265625, -0.051482200622558594, -0.04974174499511719, -0.04800128936767578, -0.046260833740234375, -0.04452037811279297, -0.04277992248535156, -0.041039466857910156, -0.03929901123046875, -0.037558555603027344, -0.03581809997558594, -0.03407764434814453, -0.032337188720703125, -0.03059673309326172, -0.028856277465820312, -0.027115821838378906, -0.0253753662109375, -0.023634910583496094, -0.021894454956054688, -0.02015399932861328, -0.018413543701171875, -0.01667308807373047, -0.014932632446289062, -0.013192176818847656, -0.01145172119140625, -0.009711265563964844, -0.007970809936523438, -0.006230354309082031, -0.004489898681640625, -0.0027494430541992188, -0.0010089874267578125, 0.0007314682006835938, 0.002471923828125, 0.004212379455566406, 0.0059528350830078125, 0.007693290710449219, 0.009433746337890625, 0.011174201965332031, 0.012914657592773438, 0.014655113220214844, 0.01639556884765625, 0.018136024475097656, 0.019876480102539062, 0.02161693572998047, 0.023357391357421875, 0.02509784698486328, 0.026838302612304688, 0.028578758239746094, 0.0303192138671875, 0.032059669494628906, 0.03380012512207031, 0.03554058074951172, 0.037281036376953125, 0.03902149200439453, 0.04076194763183594, 0.042502403259277344, 0.04424285888671875, 0.045983314514160156, 0.04772377014160156, 0.04946422576904297, 0.051204681396484375, 0.05294513702392578, 0.05468559265136719, 0.056426048278808594, 0.05816650390625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 10.0, 7.0, 13.0, 12.0, 21.0, 28.0, 34.0, 49.0, 99.0, 169.0, 189.0, 127.0, 72.0, 51.0, 19.0, 17.0, 21.0, 19.0, 9.0, 10.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.146484375, -0.14219284057617188, -0.13790130615234375, -0.13360977172851562, -0.1293182373046875, -0.12502670288085938, -0.12073516845703125, -0.11644363403320312, -0.112152099609375, -0.10786056518554688, -0.10356903076171875, -0.09927749633789062, -0.0949859619140625, -0.09069442749023438, -0.08640289306640625, -0.08211135864257812, -0.07781982421875, -0.07352828979492188, -0.06923675537109375, -0.06494522094726562, -0.0606536865234375, -0.056362152099609375, -0.05207061767578125, -0.047779083251953125, -0.043487548828125, -0.039196014404296875, -0.03490447998046875, -0.030612945556640625, -0.0263214111328125, -0.022029876708984375, -0.01773834228515625, -0.013446807861328125, -0.0091552734375, -0.004863739013671875, -0.00057220458984375, 0.003719329833984375, 0.0080108642578125, 0.012302398681640625, 0.01659393310546875, 0.020885467529296875, 0.025177001953125, 0.029468536376953125, 0.03376007080078125, 0.038051605224609375, 0.0423431396484375, 0.046634674072265625, 0.05092620849609375, 0.055217742919921875, 0.05950927734375, 0.06380081176757812, 0.06809234619140625, 0.07238388061523438, 0.0766754150390625, 0.08096694946289062, 0.08525848388671875, 0.08955001831054688, 0.093841552734375, 0.09813308715820312, 0.10242462158203125, 0.10671615600585938, 0.1110076904296875, 0.11529922485351562, 0.11959075927734375, 0.12388229370117188, 0.128173828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 11.0, 10.0, 34.0, 74.0, 316.0, 400.0, 94.0, 37.0, 14.0, 4.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525306224822998, -2.3678910732269287, -2.2104761600494385, -2.053061008453369, -1.8956459760665894, -1.7382309436798096, -1.5808157920837402, -1.4234007596969604, -1.2659857273101807, -1.1085706949234009, -0.9511556029319763, -0.7937405109405518, -0.636325478553772, -0.4789104461669922, -0.3214953541755676, -0.16408026218414307, -0.006665229797363281, 0.1507498323917389, 0.30816489458084106, 0.46557995676994324, 0.6229950189590454, 0.7804100513458252, 0.9378251433372498, 1.0952402353286743, 1.252655267715454, 1.4100703001022339, 1.5674853324890137, 1.724900484085083, 1.8823155164718628, 2.0397305488586426, 2.197145700454712, 2.3545608520507812, 2.5119762420654297, 2.669391393661499, 2.8268063068389893, 2.9842214584350586, 3.141636371612549, 3.299051523208618, 3.4564666748046875, 3.6138815879821777, 3.771296739578247, 3.9287118911743164, 4.086126804351807, 4.243541717529297, 4.400957107543945, 4.5583720207214355, 4.715786933898926, 4.873202323913574, 5.0306172370910645, 5.188032150268555, 5.345447540283203, 5.502862453460693, 5.660277366638184, 5.817692756652832, 5.975107669830322, 6.1325225830078125, 6.289937973022461, 6.447352886199951, 6.6047682762146, 6.76218318939209, 6.91959810256958, 7.07701301574707, 7.234428405761719, 7.391843318939209, 7.549258232116699]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 10.0, 3.0, 2.0, 6.0, 6.0, 5.0, 12.0, 5.0, 16.0, 12.0, 14.0, 22.0, 27.0, 18.0, 37.0, 58.0, 96.0, 106.0, 97.0, 96.0, 88.0, 51.0, 24.0, 25.0, 19.0, 18.0, 18.0, 20.0, 9.0, 14.0, 6.0, 10.0, 7.0, 7.0, 7.0, 1.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0], "bins": [-2.1506664752960205, -2.091336488723755, -2.0320067405700684, -1.9726767539978027, -1.913346767425537, -1.854016900062561, -1.794687032699585, -1.7353570461273193, -1.6760271787643433, -1.6166973114013672, -1.5573673248291016, -1.4980374574661255, -1.4387074708938599, -1.3793776035308838, -1.3200476169586182, -1.260717749595642, -1.201387882232666, -1.14205801486969, -1.0827280282974243, -1.0233981609344482, -0.9640682339668274, -0.9047383069992065, -0.8454083800315857, -0.7860784530639648, -0.7267484664916992, -0.6674185395240784, -0.6080886125564575, -0.5487587451934814, -0.4894288182258606, -0.43009889125823975, -0.3707689642906189, -0.31143906712532043, -0.252109169960022, -0.19277925789356232, -0.13344934582710266, -0.07411941885948181, -0.014789506793022156, 0.0445404052734375, 0.10387033224105835, 0.1632002294063568, 0.22253015637397766, 0.2818600833415985, 0.341189980506897, 0.4005199074745178, 0.45984983444213867, 0.5191797018051147, 0.5785096883773804, 0.6378395557403564, 0.6971694827079773, 0.7564994096755981, 0.815829336643219, 0.8751592636108398, 0.9344891309738159, 0.9938190579414368, 1.0531489849090576, 1.1124788522720337, 1.1718088388442993, 1.2311387062072754, 1.290468692779541, 1.349798560142517, 1.4091285467147827, 1.4684584140777588, 1.5277884006500244, 1.5871182680130005, 1.6464481353759766]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 3.0, 5.0, 5.0, 9.0, 9.0, 25.0, 21.0, 24.0, 24.0, 25.0, 35.0, 36.0, 36.0, 43.0, 75.0, 178.0, 122.0, 37.0, 38.0, 28.0, 35.0, 28.0, 14.0, 21.0, 18.0, 14.0, 12.0, 12.0, 10.0, 11.0, 9.0, 4.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.17202186584472656, -0.16643142700195312, -0.1608409881591797, -0.15525054931640625, -0.1496601104736328, -0.14406967163085938, -0.13847923278808594, -0.1328887939453125, -0.12729835510253906, -0.12170791625976562, -0.11611747741699219, -0.11052703857421875, -0.10493659973144531, -0.09934616088867188, -0.09375572204589844, -0.088165283203125, -0.08257484436035156, -0.07698440551757812, -0.07139396667480469, -0.06580352783203125, -0.06021308898925781, -0.054622650146484375, -0.04903221130371094, -0.0434417724609375, -0.03785133361816406, -0.032260894775390625, -0.026670455932617188, -0.02108001708984375, -0.015489578247070312, -0.009899139404296875, -0.0043087005615234375, 0.00128173828125, 0.0068721771240234375, 0.012462615966796875, 0.018053054809570312, 0.02364349365234375, 0.029233932495117188, 0.034824371337890625, 0.04041481018066406, 0.0460052490234375, 0.05159568786621094, 0.057186126708984375, 0.06277656555175781, 0.06836700439453125, 0.07395744323730469, 0.07954788208007812, 0.08513832092285156, 0.090728759765625, 0.09631919860839844, 0.10190963745117188, 0.10750007629394531, 0.11309051513671875, 0.11868095397949219, 0.12427139282226562, 0.12986183166503906, 0.1354522705078125, 0.14104270935058594, 0.14663314819335938, 0.1522235870361328, 0.15781402587890625, 0.1634044647216797, 0.16899490356445312, 0.17458534240722656, 0.18017578125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 6.0, 7.0, 4.0, 7.0, 3.0, 2.0, 7.0, 4.0, 9.0, 16.0, 35.0, 44.0, 46.0, 92.0, 125.0, 221.0, 619.0, 1842.0, 7046.0, 775399.0, 7592187.0, 7675.0, 1837.0, 650.0, 255.0, 160.0, 71.0, 53.0, 30.0, 41.0, 19.0, 16.0, 12.0, 10.0, 10.0, 6.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-1.56608247756958, -1.5213700532913208, -1.476657509803772, -1.4319450855255127, -1.3872326612472534, -1.3425201177597046, -1.2978076934814453, -1.2530951499938965, -1.2083827257156372, -1.163670301437378, -1.118957757949829, -1.0742453336715698, -1.0295329093933105, -0.9848203659057617, -0.9401079416275024, -0.8953954577445984, -0.8506830334663391, -0.8059705495834351, -0.7612581253051758, -0.7165456414222717, -0.6718331575393677, -0.6271207332611084, -0.5824082493782043, -0.5376957654953003, -0.49298331141471863, -0.44827085733413696, -0.4035583734512329, -0.35884591937065125, -0.3141334652900696, -0.2694209814071655, -0.22470852732658386, -0.1799960434436798, -0.13528358936309814, -0.09057112038135529, -0.045858658850193024, -0.0011461973190307617, 0.0435662716627121, 0.08827874064445496, 0.13299119472503662, 0.17770367860794067, 0.22241613268852234, 0.267128586769104, 0.31184107065200806, 0.3565535247325897, 0.4012659788131714, 0.44597846269607544, 0.4906909167766571, 0.5354033708572388, 0.5801158547401428, 0.6248283386230469, 0.6695407629013062, 0.7142532467842102, 0.7589657306671143, 0.8036781549453735, 0.8483906388282776, 0.8931031227111816, 0.9378155469894409, 0.982528030872345, 1.027240514755249, 1.0719529390335083, 1.1166653633117676, 1.1613779067993164, 1.2060903310775757, 1.250802755355835, 1.2955152988433838]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 8.0, 4.0, 6.0, 9.0, 5.0, 4.0, 3.0, 4.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.898141384124756, -2.814516544342041, -2.730891704559326, -2.6472666263580322, -2.5636417865753174, -2.4800169467926025, -2.3963918685913086, -2.3127670288085938, -2.229142189025879, -2.145517349243164, -2.061892509460449, -1.9782674312591553, -1.8946425914764404, -1.8110177516937256, -1.7273927927017212, -1.6437678337097168, -1.560142993927002, -1.476518154144287, -1.3928931951522827, -1.3092682361602783, -1.2256433963775635, -1.1420185565948486, -1.0583935976028442, -0.9747686982154846, -0.891143798828125, -0.8075188994407654, -0.7238940000534058, -0.6402691006660461, -0.5566442012786865, -0.4730193018913269, -0.3893944025039673, -0.30576950311660767, -0.22214460372924805, -0.13851970434188843, -0.05489480495452881, 0.02873009443283081, 0.11235499382019043, 0.19597989320755005, 0.27960479259490967, 0.3632296919822693, 0.4468545913696289, 0.5304794907569885, 0.6141043901443481, 0.6977292895317078, 0.7813541889190674, 0.864979088306427, 0.9486039876937866, 1.032228946685791, 1.1158537864685059, 1.1994786262512207, 1.283103585243225, 1.3667285442352295, 1.4503533840179443, 1.5339782238006592, 1.6176031827926636, 1.701228141784668, 1.7848529815673828, 1.8684778213500977, 1.952102780342102, 2.0357277393341064, 2.1193525791168213, 2.202977418899536, 2.28660249710083, 2.370227336883545, 2.4538521766662598]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 13.0, 18.0, 14.0, 18.0, 20.0, 27.0, 30.0, 29.0, 35.0, 35.0, 42.0, 45.0, 63.0, 51.0, 59.0, 53.0, 49.0, 48.0, 43.0, 33.0, 30.0, 23.0, 16.0, 36.0, 23.0, 25.0, 18.0, 14.0, 9.0, 10.0, 9.0, 11.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.135498046875, -0.13158798217773438, -0.12767791748046875, -0.12376785278320312, -0.1198577880859375, -0.11594772338867188, -0.11203765869140625, -0.10812759399414062, -0.104217529296875, -0.10030746459960938, -0.09639739990234375, -0.09248733520507812, -0.0885772705078125, -0.08466720581054688, -0.08075714111328125, -0.07684707641601562, -0.07293701171875, -0.06902694702148438, -0.06511688232421875, -0.061206817626953125, -0.0572967529296875, -0.053386688232421875, -0.04947662353515625, -0.045566558837890625, -0.041656494140625, -0.037746429443359375, -0.03383636474609375, -0.029926300048828125, -0.0260162353515625, -0.022106170654296875, -0.01819610595703125, -0.014286041259765625, -0.0103759765625, -0.006465911865234375, -0.00255584716796875, 0.001354217529296875, 0.0052642822265625, 0.009174346923828125, 0.01308441162109375, 0.016994476318359375, 0.020904541015625, 0.024814605712890625, 0.02872467041015625, 0.032634735107421875, 0.0365447998046875, 0.040454864501953125, 0.04436492919921875, 0.048274993896484375, 0.05218505859375, 0.056095123291015625, 0.06000518798828125, 0.06391525268554688, 0.0678253173828125, 0.07173538208007812, 0.07564544677734375, 0.07955551147460938, 0.083465576171875, 0.08737564086914062, 0.09128570556640625, 0.09519577026367188, 0.0991058349609375, 0.10301589965820312, 0.10692596435546875, 0.11083602905273438, 0.11474609375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 10.0, 6.0, 3.0, 7.0, 4.0, 13.0, 18.0, 15.0, 31.0, 45.0, 74.0, 125.0, 224.0, 380.0, 686.0, 1298.0, 2816.0, 5900.0, 13840.0, 34008.0, 86404.0, 173172.0, 121570.0, 48901.0, 19288.0, 8168.0, 3634.0, 1723.0, 865.0, 418.0, 224.0, 126.0, 97.0, 52.0, 35.0, 24.0, 16.0, 20.0, 11.0, 8.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.109375, -1.0774002075195312, -1.0454254150390625, -1.0134506225585938, -0.981475830078125, -0.9495010375976562, -0.9175262451171875, -0.8855514526367188, -0.85357666015625, -0.8216018676757812, -0.7896270751953125, -0.7576522827148438, -0.725677490234375, -0.6937026977539062, -0.6617279052734375, -0.6297531127929688, -0.5977783203125, -0.5658035278320312, -0.5338287353515625, -0.5018539428710938, -0.469879150390625, -0.43790435791015625, -0.4059295654296875, -0.37395477294921875, -0.34197998046875, -0.31000518798828125, -0.2780303955078125, -0.24605560302734375, -0.214080810546875, -0.18210601806640625, -0.1501312255859375, -0.11815643310546875, -0.086181640625, -0.05420684814453125, -0.0222320556640625, 0.00974273681640625, 0.041717529296875, 0.07369232177734375, 0.1056671142578125, 0.13764190673828125, 0.16961669921875, 0.20159149169921875, 0.2335662841796875, 0.26554107666015625, 0.297515869140625, 0.32949066162109375, 0.3614654541015625, 0.39344024658203125, 0.4254150390625, 0.45738983154296875, 0.4893646240234375, 0.5213394165039062, 0.553314208984375, 0.5852890014648438, 0.6172637939453125, 0.6492385864257812, 0.68121337890625, 0.7131881713867188, 0.7451629638671875, 0.7771377563476562, 0.809112548828125, 0.8410873413085938, 0.8730621337890625, 0.9050369262695312, 0.93701171875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 6.0, 9.0, 12.0, 14.0, 16.0, 22.0, 30.0, 21.0, 32.0, 29.0, 33.0, 57.0, 44.0, 67.0, 52.0, 60.0, 52.0, 65.0, 46.0, 39.0, 32.0, 43.0, 32.0, 25.0, 22.0, 25.0, 19.0, 9.0, 12.0, 12.0, 6.0, 9.0, 7.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.187744140625, -0.182769775390625, -0.17779541015625, -0.172821044921875, -0.1678466796875, -0.162872314453125, -0.15789794921875, -0.152923583984375, -0.14794921875, -0.142974853515625, -0.13800048828125, -0.133026123046875, -0.1280517578125, -0.123077392578125, -0.11810302734375, -0.113128662109375, -0.108154296875, -0.103179931640625, -0.09820556640625, -0.093231201171875, -0.0882568359375, -0.083282470703125, -0.07830810546875, -0.073333740234375, -0.068359375, -0.063385009765625, -0.05841064453125, -0.053436279296875, -0.0484619140625, -0.043487548828125, -0.03851318359375, -0.033538818359375, -0.028564453125, -0.023590087890625, -0.01861572265625, -0.013641357421875, -0.0086669921875, -0.003692626953125, 0.00128173828125, 0.006256103515625, 0.01123046875, 0.016204833984375, 0.02117919921875, 0.026153564453125, 0.0311279296875, 0.036102294921875, 0.04107666015625, 0.046051025390625, 0.051025390625, 0.055999755859375, 0.06097412109375, 0.065948486328125, 0.0709228515625, 0.075897216796875, 0.08087158203125, 0.085845947265625, 0.0908203125, 0.095794677734375, 0.10076904296875, 0.105743408203125, 0.1107177734375, 0.115692138671875, 0.12066650390625, 0.125640869140625, 0.130615234375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 4.0, 6.0, 8.0, 13.0, 25.0, 53.0, 96.0, 90.0, 69.0, 49.0, 18.0, 8.0, 7.0, 6.0, 3.0, 6.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.331541895866394, -1.2872164249420166, -1.2428910732269287, -1.1985657215118408, -1.1542402505874634, -1.109914779663086, -1.065589427947998, -1.0212640762329102, -0.9769386053085327, -0.9326131939888, -0.8882877826690674, -0.8439623713493347, -0.799636960029602, -0.7553115487098694, -0.7109861373901367, -0.666660726070404, -0.6223353147506714, -0.5780099034309387, -0.533684492111206, -0.4893590807914734, -0.4450336694717407, -0.40070825815200806, -0.3563828468322754, -0.3120574355125427, -0.26773202419281006, -0.2234066128730774, -0.17908120155334473, -0.13475579023361206, -0.0904303789138794, -0.04610496759414673, -0.0017795562744140625, 0.042545855045318604, 0.08687114715576172, 0.13119655847549438, 0.17552196979522705, 0.21984738111495972, 0.2641727924346924, 0.30849820375442505, 0.3528236150741577, 0.3971490263938904, 0.44147443771362305, 0.4857998490333557, 0.5301252603530884, 0.574450671672821, 0.6187760829925537, 0.6631014943122864, 0.707426905632019, 0.7517523169517517, 0.7960777282714844, 0.840403139591217, 0.8847285509109497, 0.9290539622306824, 0.973379373550415, 1.017704725265503, 1.0620301961898804, 1.1063556671142578, 1.1506810188293457, 1.1950063705444336, 1.239331841468811, 1.2836573123931885, 1.3279826641082764, 1.3723080158233643, 1.4166334867477417, 1.4609589576721191, 1.505284309387207]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 8.0, 7.0, 17.0, 22.0, 57.0, 71.0, 94.0, 70.0, 42.0, 19.0, 14.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1043403148651123, -1.0688014030456543, -1.0332624912261963, -0.9977235794067383, -0.9621846675872803, -0.9266457557678223, -0.8911067843437195, -0.8555678725242615, -0.8200289607048035, -0.7844900488853455, -0.7489511370658875, -0.7134122252464294, -0.6778732538223267, -0.6423343420028687, -0.6067954301834106, -0.5712565183639526, -0.5357176065444946, -0.5001786947250366, -0.4646397829055786, -0.4291008412837982, -0.3935619294643402, -0.3580230176448822, -0.3224840760231018, -0.2869451642036438, -0.2514062523841858, -0.21586734056472778, -0.18032841384410858, -0.14478948712348938, -0.10925057530403137, -0.07371166348457336, -0.03817273676395416, -0.002633810043334961, 0.03290510177612305, 0.06844402104616165, 0.10398294031620026, 0.13952186703681946, 0.17506077885627747, 0.21059969067573547, 0.24613861739635468, 0.2816775441169739, 0.3172164559364319, 0.3527553677558899, 0.3882942795753479, 0.4238332211971283, 0.4593721330165863, 0.4949110448360443, 0.5304499864578247, 0.5659888982772827, 0.6015278100967407, 0.6370667219161987, 0.6726056337356567, 0.7081445455551147, 0.7436834573745728, 0.7792223691940308, 0.8147613406181335, 0.8503002524375916, 0.8858391642570496, 0.9213780760765076, 0.9569169878959656, 0.9924558997154236, 1.0279948711395264, 1.0635337829589844, 1.0990726947784424, 1.1346116065979004, 1.1701505184173584]}, "eval/loss": 0.36502909660339355, "eval/wer": 0.11207854026180088, "eval/runtime": 567.0865, "eval/samples_per_second": 4.659, "eval/steps_per_second": 0.584, "train/train_runtime": 25980.5507, "train/train_samples_per_second": 5.492, "train/train_steps_per_second": 0.043, "train/total_flos": 0.0, "train/train_loss": 2.498668275362574} \ No newline at end of file